diff --git "a/wandb/run-20220322_102142-3iwtcnsp/files/wandb-summary.json" "b/wandb/run-20220322_102142-3iwtcnsp/files/wandb-summary.json" --- "a/wandb/run-20220322_102142-3iwtcnsp/files/wandb-summary.json" +++ "b/wandb/run-20220322_102142-3iwtcnsp/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 6.169, "train/learning_rate": 2.9295774647887323e-05, "train/epoch": 1.68, "train/global_step": 1500, "_runtime": 8917, "_timestamp": 1647953419, "_step": 1500, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 2.0, 7.0, 7.0, 9.0, 9.0, 11.0, 15.0, 19.0, 21.0, 28.0, 38.0, 39.0, 52.0, 40.0, 55.0, 46.0, 59.0, 44.0, 60.0, 47.0, 53.0, 44.0, 40.0, 47.0, 38.0, 22.0, 23.0, 25.0, 20.0, 17.0, 12.0, 13.0, 14.0, 8.0, 4.0, 8.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.31623077392578, -72.91283416748047, -70.50942993164062, -68.10603332519531, -65.70263671875, -63.29923629760742, -60.895835876464844, -58.49243927001953, -56.08903884887695, -53.685638427734375, -51.28224182128906, -48.878841400146484, -46.475440979003906, -44.072044372558594, -41.668643951416016, -39.26524353027344, -36.861846923828125, -34.45844650268555, -32.055049896240234, -29.651649475097656, -27.24825096130371, -24.844852447509766, -22.441452026367188, -20.038053512573242, -17.634654998779297, -15.231256484985352, -12.82785701751709, -10.424457550048828, -8.021059036254883, -5.6176605224609375, -3.214261054992676, -0.8108615875244141, 1.5925369262695312, 3.9959359169006348, 6.399334907531738, 8.802734375, 11.206132888793945, 13.60953140258789, 16.01293182373047, 18.416330337524414, 20.81972885131836, 23.223127365112305, 25.62652587890625, 28.029926300048828, 30.433324813842773, 32.83672332763672, 35.2401237487793, 37.643524169921875, 40.04692077636719, 42.450321197509766, 44.85371780395508, 47.257118225097656, 49.66051483154297, 52.06391525268555, 54.467315673828125, 56.87071228027344, 59.274112701416016, 61.677513122558594, 64.0809097290039, 66.48430633544922, 68.88771057128906, 71.29110717773438, 73.69450378417969, 76.09790802001953, 78.50130462646484]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 5.0, 3.0, 4.0, 5.0, 2.0, 4.0, 6.0, 7.0, 10.0, 11.0, 19.0, 18.0, 21.0, 20.0, 24.0, 35.0, 21.0, 32.0, 28.0, 42.0, 41.0, 34.0, 38.0, 33.0, 43.0, 43.0, 33.0, 49.0, 35.0, 38.0, 41.0, 26.0, 31.0, 34.0, 30.0, 23.0, 25.0, 16.0, 5.0, 14.0, 8.0, 8.0, 9.0, 8.0, 8.0, 2.0, 8.0, 4.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-70.98054504394531, -68.85433197021484, -66.72811889648438, -64.60191345214844, -62.47570037841797, -60.3494873046875, -58.2232780456543, -56.097068786621094, -53.970855712890625, -51.844642639160156, -49.71843338012695, -47.59222412109375, -45.46601104736328, -43.33979797363281, -41.21358871459961, -39.087379455566406, -36.96116638183594, -34.83495330810547, -32.708744049072266, -30.58253288269043, -28.456321716308594, -26.330110549926758, -24.203899383544922, -22.077688217163086, -19.95147705078125, -17.825265884399414, -15.699054718017578, -13.572843551635742, -11.446632385253906, -9.32042121887207, -7.194210052490234, -5.067998886108398, -2.9417877197265625, -0.8155765533447266, 1.3106346130371094, 3.4368457794189453, 5.563056945800781, 7.689268112182617, 9.815479278564453, 11.941690444946289, 14.067901611328125, 16.19411277770996, 18.320323944091797, 20.446535110473633, 22.57274627685547, 24.698957443237305, 26.82516860961914, 28.951379776000977, 31.077590942382812, 33.20380401611328, 35.330013275146484, 37.45622253417969, 39.582435607910156, 41.708648681640625, 43.83485794067383, 45.96106719970703, 48.0872802734375, 50.21349334716797, 52.33970260620117, 54.465911865234375, 56.592124938964844, 58.71833801269531, 60.844547271728516, 62.97075653076172, 65.09696960449219]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 11.0, 21.0, 22.0, 32.0, 61.0, 74.0, 111.0, 170.0, 235.0, 347.0, 544.0, 812.0, 1235.0, 1852.0, 2936.0, 4699.0, 7550.0, 12381.0, 20737.0, 35593.0, 62323.0, 116794.0, 233638.0, 457231.0, 760199.0, 900650.0, 714252.0, 410371.0, 204565.0, 103984.0, 57030.0, 32374.0, 19208.0, 11567.0, 7362.0, 4627.0, 2838.0, 1970.0, 1307.0, 829.0, 578.0, 378.0, 267.0, 181.0, 120.0, 78.0, 50.0, 32.0, 25.0, 7.0, 12.0, 8.0, 6.0, 2.0, 5.0, 0.0, 0.0, 1.0], "bins": [-50.625, -49.013671875, -47.40234375, -45.791015625, -44.1796875, -42.568359375, -40.95703125, -39.345703125, -37.734375, -36.123046875, -34.51171875, -32.900390625, -31.2890625, -29.677734375, -28.06640625, -26.455078125, -24.84375, -23.232421875, -21.62109375, -20.009765625, -18.3984375, -16.787109375, -15.17578125, -13.564453125, -11.953125, -10.341796875, -8.73046875, -7.119140625, -5.5078125, -3.896484375, -2.28515625, -0.673828125, 0.9375, 2.548828125, 4.16015625, 5.771484375, 7.3828125, 8.994140625, 10.60546875, 12.216796875, 13.828125, 15.439453125, 17.05078125, 18.662109375, 20.2734375, 21.884765625, 23.49609375, 25.107421875, 26.71875, 28.330078125, 29.94140625, 31.552734375, 33.1640625, 34.775390625, 36.38671875, 37.998046875, 39.609375, 41.220703125, 42.83203125, 44.443359375, 46.0546875, 47.666015625, 49.27734375, 50.888671875, 52.5]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 8.0, 4.0, 10.0, 7.0, 5.0, 7.0, 15.0, 12.0, 22.0, 17.0, 22.0, 28.0, 31.0, 26.0, 36.0, 22.0, 35.0, 38.0, 32.0, 46.0, 44.0, 39.0, 34.0, 39.0, 44.0, 51.0, 39.0, 35.0, 27.0, 28.0, 24.0, 25.0, 28.0, 13.0, 19.0, 10.0, 10.0, 13.0, 12.0, 9.0, 10.0, 8.0, 5.0, 2.0, 6.0, 6.0, 1.0, 3.0, 2.0, 0.0, 4.0], "bins": [-48.46875, -47.07861328125, -45.6884765625, -44.29833984375, -42.908203125, -41.51806640625, -40.1279296875, -38.73779296875, -37.34765625, -35.95751953125, -34.5673828125, -33.17724609375, -31.787109375, -30.39697265625, -29.0068359375, -27.61669921875, -26.2265625, -24.83642578125, -23.4462890625, -22.05615234375, -20.666015625, -19.27587890625, -17.8857421875, -16.49560546875, -15.10546875, -13.71533203125, -12.3251953125, -10.93505859375, -9.544921875, -8.15478515625, -6.7646484375, -5.37451171875, -3.984375, -2.59423828125, -1.2041015625, 0.18603515625, 1.576171875, 2.96630859375, 4.3564453125, 5.74658203125, 7.13671875, 8.52685546875, 9.9169921875, 11.30712890625, 12.697265625, 14.08740234375, 15.4775390625, 16.86767578125, 18.2578125, 19.64794921875, 21.0380859375, 22.42822265625, 23.818359375, 25.20849609375, 26.5986328125, 27.98876953125, 29.37890625, 30.76904296875, 32.1591796875, 33.54931640625, 34.939453125, 36.32958984375, 37.7197265625, 39.10986328125, 40.5]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 18.0, 26.0, 57.0, 57.0, 117.0, 179.0, 261.0, 399.0, 648.0, 1013.0, 1450.0, 2147.0, 3262.0, 5037.0, 7592.0, 11320.0, 17636.0, 26513.0, 40841.0, 62307.0, 94929.0, 143500.0, 218067.0, 325364.0, 479356.0, 643684.0, 648074.0, 485396.0, 329809.0, 220582.0, 146055.0, 95567.0, 62778.0, 41024.0, 27097.0, 17538.0, 11528.0, 7852.0, 5070.0, 3463.0, 2253.0, 1487.0, 981.0, 639.0, 503.0, 290.0, 185.0, 142.0, 89.0, 31.0, 33.0, 26.0, 8.0, 6.0, 4.0, 3.0], "bins": [-42.71875, -41.462890625, -40.20703125, -38.951171875, -37.6953125, -36.439453125, -35.18359375, -33.927734375, -32.671875, -31.416015625, -30.16015625, -28.904296875, -27.6484375, -26.392578125, -25.13671875, -23.880859375, -22.625, -21.369140625, -20.11328125, -18.857421875, -17.6015625, -16.345703125, -15.08984375, -13.833984375, -12.578125, -11.322265625, -10.06640625, -8.810546875, -7.5546875, -6.298828125, -5.04296875, -3.787109375, -2.53125, -1.275390625, -0.01953125, 1.236328125, 2.4921875, 3.748046875, 5.00390625, 6.259765625, 7.515625, 8.771484375, 10.02734375, 11.283203125, 12.5390625, 13.794921875, 15.05078125, 16.306640625, 17.5625, 18.818359375, 20.07421875, 21.330078125, 22.5859375, 23.841796875, 25.09765625, 26.353515625, 27.609375, 28.865234375, 30.12109375, 31.376953125, 32.6328125, 33.888671875, 35.14453125, 36.400390625, 37.65625]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 2.0, 2.0, 5.0, 7.0, 8.0, 3.0, 9.0, 8.0, 27.0, 17.0, 31.0, 22.0, 34.0, 35.0, 49.0, 63.0, 79.0, 88.0, 114.0, 124.0, 145.0, 177.0, 235.0, 255.0, 297.0, 288.0, 286.0, 296.0, 232.0, 200.0, 189.0, 126.0, 113.0, 101.0, 86.0, 68.0, 50.0, 41.0, 43.0, 25.0, 23.0, 20.0, 13.0, 11.0, 8.0, 6.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-20.71875, -20.089111328125, -19.45947265625, -18.829833984375, -18.2001953125, -17.570556640625, -16.94091796875, -16.311279296875, -15.681640625, -15.052001953125, -14.42236328125, -13.792724609375, -13.1630859375, -12.533447265625, -11.90380859375, -11.274169921875, -10.64453125, -10.014892578125, -9.38525390625, -8.755615234375, -8.1259765625, -7.496337890625, -6.86669921875, -6.237060546875, -5.607421875, -4.977783203125, -4.34814453125, -3.718505859375, -3.0888671875, -2.459228515625, -1.82958984375, -1.199951171875, -0.5703125, 0.059326171875, 0.68896484375, 1.318603515625, 1.9482421875, 2.577880859375, 3.20751953125, 3.837158203125, 4.466796875, 5.096435546875, 5.72607421875, 6.355712890625, 6.9853515625, 7.614990234375, 8.24462890625, 8.874267578125, 9.50390625, 10.133544921875, 10.76318359375, 11.392822265625, 12.0224609375, 12.652099609375, 13.28173828125, 13.911376953125, 14.541015625, 15.170654296875, 15.80029296875, 16.429931640625, 17.0595703125, 17.689208984375, 18.31884765625, 18.948486328125, 19.578125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 9.0, 7.0, 6.0, 11.0, 9.0, 17.0, 24.0, 25.0, 26.0, 27.0, 31.0, 35.0, 47.0, 56.0, 41.0, 42.0, 37.0, 50.0, 38.0, 52.0, 54.0, 50.0, 50.0, 42.0, 32.0, 31.0, 23.0, 33.0, 17.0, 13.0, 12.0, 12.0, 10.0, 8.0, 6.0, 9.0, 3.0, 1.0, 4.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.76505661010742, -42.194217681884766, -40.62337875366211, -39.05253982543945, -37.4817008972168, -35.91086196899414, -34.34001922607422, -32.76918029785156, -31.19834327697754, -29.627504348754883, -28.056665420532227, -26.485824584960938, -24.91498565673828, -23.344146728515625, -21.77330780029297, -20.202468872070312, -18.631629943847656, -17.060791015625, -15.489952087402344, -13.919112205505371, -12.348273277282715, -10.777434349060059, -9.206594467163086, -7.63575553894043, -6.064916610717773, -4.494077682495117, -2.9232382774353027, -1.3523988723754883, 0.21844005584716797, 1.7892789840698242, 3.360118865966797, 4.930957794189453, 6.501792907714844, 8.0726318359375, 9.643470764160156, 11.214310646057129, 12.785149574279785, 14.355988502502441, 15.926828384399414, 17.49766731262207, 19.068506240844727, 20.639345169067383, 22.21018409729004, 23.781024932861328, 25.351863861083984, 26.92270278930664, 28.493541717529297, 30.064380645751953, 31.63521957397461, 33.206058502197266, 34.77689743041992, 36.34773635864258, 37.918575286865234, 39.48941421508789, 41.06025695800781, 42.63109588623047, 44.201934814453125, 45.77277374267578, 47.34361267089844, 48.914451599121094, 50.48529052734375, 52.056129455566406, 53.62696838378906, 55.19780731201172, 56.768646240234375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 8.0, 7.0, 4.0, 2.0, 12.0, 10.0, 14.0, 15.0, 14.0, 17.0, 19.0, 28.0, 25.0, 31.0, 34.0, 32.0, 49.0, 51.0, 50.0, 36.0, 35.0, 45.0, 45.0, 43.0, 40.0, 34.0, 32.0, 40.0, 42.0, 38.0, 23.0, 27.0, 28.0, 14.0, 12.0, 13.0, 8.0, 6.0, 6.0, 2.0, 5.0, 3.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-56.3577880859375, -54.805931091308594, -53.25407791137695, -51.70222091674805, -50.150367736816406, -48.5985107421875, -47.046653747558594, -45.49479675292969, -43.94294357299805, -42.39108657836914, -40.8392333984375, -39.287376403808594, -37.73551940917969, -36.18366622924805, -34.63180923461914, -33.0799560546875, -31.528099060058594, -29.97624397277832, -28.424388885498047, -26.87253189086914, -25.320676803588867, -23.768821716308594, -22.216964721679688, -20.665109634399414, -19.11325454711914, -17.561399459838867, -16.009544372558594, -14.457687377929688, -12.905832290649414, -11.35397720336914, -9.80212116241455, -8.250265121459961, -6.6984100341796875, -5.146554470062256, -3.594698905944824, -2.0428433418273926, -0.49098777770996094, 1.0608677864074707, 2.6127233505249023, 4.164579391479492, 5.716434478759766, 7.268290042877197, 8.820145606994629, 10.372001647949219, 11.923856735229492, 13.475711822509766, 15.027567863464355, 16.579423904418945, 18.13127899169922, 19.683134078979492, 21.234989166259766, 22.786846160888672, 24.338701248168945, 25.89055633544922, 27.442413330078125, 28.9942684173584, 30.546123504638672, 32.09798049926758, 33.64983367919922, 35.201690673828125, 36.75354766845703, 38.30540084838867, 39.85725784301758, 41.40911102294922, 42.960968017578125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 6.0, 6.0, 14.0, 15.0, 19.0, 37.0, 43.0, 82.0, 89.0, 150.0, 219.0, 279.0, 396.0, 587.0, 800.0, 1201.0, 1728.0, 2422.0, 3635.0, 5337.0, 8070.0, 11717.0, 17851.0, 27499.0, 42145.0, 64786.0, 101494.0, 161766.0, 204647.0, 139423.0, 87544.0, 56166.0, 36372.0, 23882.0, 15657.0, 10412.0, 6979.0, 4686.0, 3141.0, 2261.0, 1512.0, 1029.0, 771.0, 527.0, 346.0, 254.0, 159.0, 126.0, 95.0, 61.0, 46.0, 28.0, 17.0, 13.0, 10.0, 5.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-12.875, -12.4361572265625, -11.997314453125, -11.5584716796875, -11.11962890625, -10.6807861328125, -10.241943359375, -9.8031005859375, -9.3642578125, -8.9254150390625, -8.486572265625, -8.0477294921875, -7.60888671875, -7.1700439453125, -6.731201171875, -6.2923583984375, -5.853515625, -5.4146728515625, -4.975830078125, -4.5369873046875, -4.09814453125, -3.6593017578125, -3.220458984375, -2.7816162109375, -2.3427734375, -1.9039306640625, -1.465087890625, -1.0262451171875, -0.58740234375, -0.1485595703125, 0.290283203125, 0.7291259765625, 1.16796875, 1.6068115234375, 2.045654296875, 2.4844970703125, 2.92333984375, 3.3621826171875, 3.801025390625, 4.2398681640625, 4.6787109375, 5.1175537109375, 5.556396484375, 5.9952392578125, 6.43408203125, 6.8729248046875, 7.311767578125, 7.7506103515625, 8.189453125, 8.6282958984375, 9.067138671875, 9.5059814453125, 9.94482421875, 10.3836669921875, 10.822509765625, 11.2613525390625, 11.7001953125, 12.1390380859375, 12.577880859375, 13.0167236328125, 13.45556640625, 13.8944091796875, 14.333251953125, 14.7720947265625, 15.2109375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 7.0, 2.0, 2.0, 3.0, 5.0, 8.0, 8.0, 14.0, 9.0, 12.0, 11.0, 16.0, 26.0, 35.0, 18.0, 26.0, 49.0, 28.0, 39.0, 37.0, 30.0, 40.0, 42.0, 47.0, 37.0, 41.0, 32.0, 36.0, 39.0, 44.0, 37.0, 31.0, 28.0, 29.0, 20.0, 18.0, 27.0, 14.0, 8.0, 10.0, 9.0, 10.0, 4.0, 2.0, 5.0, 4.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 1.0], "bins": [-47.375, -45.9765625, -44.578125, -43.1796875, -41.78125, -40.3828125, -38.984375, -37.5859375, -36.1875, -34.7890625, -33.390625, -31.9921875, -30.59375, -29.1953125, -27.796875, -26.3984375, -25.0, -23.6015625, -22.203125, -20.8046875, -19.40625, -18.0078125, -16.609375, -15.2109375, -13.8125, -12.4140625, -11.015625, -9.6171875, -8.21875, -6.8203125, -5.421875, -4.0234375, -2.625, -1.2265625, 0.171875, 1.5703125, 2.96875, 4.3671875, 5.765625, 7.1640625, 8.5625, 9.9609375, 11.359375, 12.7578125, 14.15625, 15.5546875, 16.953125, 18.3515625, 19.75, 21.1484375, 22.546875, 23.9453125, 25.34375, 26.7421875, 28.140625, 29.5390625, 30.9375, 32.3359375, 33.734375, 35.1328125, 36.53125, 37.9296875, 39.328125, 40.7265625, 42.125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 4.0, 9.0, 13.0, 5.0, 22.0, 24.0, 28.0, 42.0, 71.0, 96.0, 157.0, 229.0, 340.0, 512.0, 803.0, 1260.0, 1827.0, 3040.0, 5206.0, 8331.0, 14128.0, 24135.0, 42999.0, 80122.0, 160577.0, 285147.0, 199519.0, 97655.0, 51306.0, 28735.0, 16631.0, 9890.0, 5842.0, 3563.0, 2220.0, 1419.0, 866.0, 582.0, 383.0, 235.0, 203.0, 136.0, 71.0, 52.0, 36.0, 24.0, 20.0, 12.0, 12.0, 7.0, 5.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.546875, -10.213623046875, -9.88037109375, -9.547119140625, -9.2138671875, -8.880615234375, -8.54736328125, -8.214111328125, -7.880859375, -7.547607421875, -7.21435546875, -6.881103515625, -6.5478515625, -6.214599609375, -5.88134765625, -5.548095703125, -5.21484375, -4.881591796875, -4.54833984375, -4.215087890625, -3.8818359375, -3.548583984375, -3.21533203125, -2.882080078125, -2.548828125, -2.215576171875, -1.88232421875, -1.549072265625, -1.2158203125, -0.882568359375, -0.54931640625, -0.216064453125, 0.1171875, 0.450439453125, 0.78369140625, 1.116943359375, 1.4501953125, 1.783447265625, 2.11669921875, 2.449951171875, 2.783203125, 3.116455078125, 3.44970703125, 3.782958984375, 4.1162109375, 4.449462890625, 4.78271484375, 5.115966796875, 5.44921875, 5.782470703125, 6.11572265625, 6.448974609375, 6.7822265625, 7.115478515625, 7.44873046875, 7.781982421875, 8.115234375, 8.448486328125, 8.78173828125, 9.114990234375, 9.4482421875, 9.781494140625, 10.11474609375, 10.447998046875, 10.78125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 4.0, 7.0, 10.0, 6.0, 8.0, 14.0, 8.0, 19.0, 19.0, 27.0, 17.0, 33.0, 24.0, 28.0, 27.0, 31.0, 48.0, 31.0, 29.0, 30.0, 31.0, 43.0, 42.0, 39.0, 35.0, 37.0, 42.0, 25.0, 31.0, 22.0, 33.0, 20.0, 25.0, 27.0, 17.0, 16.0, 23.0, 10.0, 14.0, 14.0, 8.0, 5.0, 5.0, 3.0, 6.0, 5.0, 8.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-30.96875, -30.056640625, -29.14453125, -28.232421875, -27.3203125, -26.408203125, -25.49609375, -24.583984375, -23.671875, -22.759765625, -21.84765625, -20.935546875, -20.0234375, -19.111328125, -18.19921875, -17.287109375, -16.375, -15.462890625, -14.55078125, -13.638671875, -12.7265625, -11.814453125, -10.90234375, -9.990234375, -9.078125, -8.166015625, -7.25390625, -6.341796875, -5.4296875, -4.517578125, -3.60546875, -2.693359375, -1.78125, -0.869140625, 0.04296875, 0.955078125, 1.8671875, 2.779296875, 3.69140625, 4.603515625, 5.515625, 6.427734375, 7.33984375, 8.251953125, 9.1640625, 10.076171875, 10.98828125, 11.900390625, 12.8125, 13.724609375, 14.63671875, 15.548828125, 16.4609375, 17.373046875, 18.28515625, 19.197265625, 20.109375, 21.021484375, 21.93359375, 22.845703125, 23.7578125, 24.669921875, 25.58203125, 26.494140625, 27.40625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 1.0, 4.0, 6.0, 3.0, 11.0, 19.0, 39.0, 48.0, 78.0, 97.0, 188.0, 271.0, 442.0, 698.0, 1014.0, 1591.0, 2639.0, 4110.0, 6676.0, 10869.0, 17702.0, 29504.0, 49901.0, 86776.0, 151075.0, 253556.0, 180731.0, 102937.0, 59112.0, 34479.0, 20681.0, 12530.0, 7654.0, 4867.0, 2977.0, 1942.0, 1200.0, 757.0, 459.0, 326.0, 222.0, 129.0, 79.0, 50.0, 23.0, 31.0, 20.0, 15.0, 10.0, 7.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.76904296875, -0.7422027587890625, -0.715362548828125, -0.6885223388671875, -0.66168212890625, -0.6348419189453125, -0.608001708984375, -0.5811614990234375, -0.5543212890625, -0.5274810791015625, -0.500640869140625, -0.4738006591796875, -0.44696044921875, -0.4201202392578125, -0.393280029296875, -0.3664398193359375, -0.339599609375, -0.3127593994140625, -0.285919189453125, -0.2590789794921875, -0.23223876953125, -0.2053985595703125, -0.178558349609375, -0.1517181396484375, -0.1248779296875, -0.0980377197265625, -0.071197509765625, -0.0443572998046875, -0.01751708984375, 0.0093231201171875, 0.036163330078125, 0.0630035400390625, 0.08984375, 0.1166839599609375, 0.143524169921875, 0.1703643798828125, 0.19720458984375, 0.2240447998046875, 0.250885009765625, 0.2777252197265625, 0.3045654296875, 0.3314056396484375, 0.358245849609375, 0.3850860595703125, 0.41192626953125, 0.4387664794921875, 0.465606689453125, 0.4924468994140625, 0.519287109375, 0.5461273193359375, 0.572967529296875, 0.5998077392578125, 0.62664794921875, 0.6534881591796875, 0.680328369140625, 0.7071685791015625, 0.7340087890625, 0.7608489990234375, 0.787689208984375, 0.8145294189453125, 0.84136962890625, 0.8682098388671875, 0.895050048828125, 0.9218902587890625, 0.94873046875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 2.0, 2.0, 3.0, 2.0, 7.0, 10.0, 6.0, 4.0, 7.0, 10.0, 15.0, 13.0, 29.0, 20.0, 28.0, 35.0, 39.0, 48.0, 64.0, 58.0, 83.0, 81.0, 62.0, 55.0, 42.0, 40.0, 36.0, 34.0, 29.0, 17.0, 17.0, 18.0, 20.0, 21.0, 12.0, 5.0, 6.0, 7.0, 1.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0002512931823730469, -0.0002432689070701599, -0.00023524463176727295, -0.00022722035646438599, -0.00021919608116149902, -0.00021117180585861206, -0.0002031475305557251, -0.00019512325525283813, -0.00018709897994995117, -0.0001790747046470642, -0.00017105042934417725, -0.00016302615404129028, -0.00015500187873840332, -0.00014697760343551636, -0.0001389533281326294, -0.00013092905282974243, -0.00012290477752685547, -0.0001148805022239685, -0.00010685622692108154, -9.883195161819458e-05, -9.080767631530762e-05, -8.278340101242065e-05, -7.475912570953369e-05, -6.673485040664673e-05, -5.8710575103759766e-05, -5.06862998008728e-05, -4.266202449798584e-05, -3.463774919509888e-05, -2.6613473892211914e-05, -1.858919858932495e-05, -1.0564923286437988e-05, -2.5406479835510254e-06, 5.4836273193359375e-06, 1.35079026222229e-05, 2.1532177925109863e-05, 2.9556453227996826e-05, 3.758072853088379e-05, 4.560500383377075e-05, 5.3629279136657715e-05, 6.165355443954468e-05, 6.967782974243164e-05, 7.77021050453186e-05, 8.572638034820557e-05, 9.375065565109253e-05, 0.00010177493095397949, 0.00010979920625686646, 0.00011782348155975342, 0.00012584775686264038, 0.00013387203216552734, 0.0001418963074684143, 0.00014992058277130127, 0.00015794485807418823, 0.0001659691333770752, 0.00017399340867996216, 0.00018201768398284912, 0.00019004195928573608, 0.00019806623458862305, 0.00020609050989151, 0.00021411478519439697, 0.00022213906049728394, 0.0002301633358001709, 0.00023818761110305786, 0.0002462118864059448, 0.0002542361617088318, 0.00026226043701171875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 15.0, 17.0, 17.0, 29.0, 43.0, 62.0, 88.0, 133.0, 160.0, 208.0, 335.0, 523.0, 818.0, 1361.0, 2089.0, 3534.0, 5807.0, 9754.0, 16264.0, 26988.0, 45080.0, 73361.0, 116678.0, 182328.0, 205922.0, 136279.0, 85920.0, 53430.0, 32129.0, 19426.0, 11573.0, 7051.0, 4150.0, 2530.0, 1541.0, 971.0, 612.0, 399.0, 270.0, 185.0, 134.0, 122.0, 61.0, 49.0, 32.0, 31.0, 14.0, 12.0, 12.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.2998046875, -1.2606201171875, -1.221435546875, -1.1822509765625, -1.14306640625, -1.1038818359375, -1.064697265625, -1.0255126953125, -0.986328125, -0.9471435546875, -0.907958984375, -0.8687744140625, -0.82958984375, -0.7904052734375, -0.751220703125, -0.7120361328125, -0.6728515625, -0.6336669921875, -0.594482421875, -0.5552978515625, -0.51611328125, -0.4769287109375, -0.437744140625, -0.3985595703125, -0.359375, -0.3201904296875, -0.281005859375, -0.2418212890625, -0.20263671875, -0.1634521484375, -0.124267578125, -0.0850830078125, -0.0458984375, -0.0067138671875, 0.032470703125, 0.0716552734375, 0.11083984375, 0.1500244140625, 0.189208984375, 0.2283935546875, 0.267578125, 0.3067626953125, 0.345947265625, 0.3851318359375, 0.42431640625, 0.4635009765625, 0.502685546875, 0.5418701171875, 0.5810546875, 0.6202392578125, 0.659423828125, 0.6986083984375, 0.73779296875, 0.7769775390625, 0.816162109375, 0.8553466796875, 0.89453125, 0.9337158203125, 0.972900390625, 1.0120849609375, 1.05126953125, 1.0904541015625, 1.129638671875, 1.1688232421875, 1.2080078125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 5.0, 1.0, 1.0, 1.0, 5.0, 5.0, 4.0, 5.0, 16.0, 13.0, 17.0, 16.0, 15.0, 21.0, 25.0, 32.0, 21.0, 24.0, 46.0, 41.0, 43.0, 44.0, 42.0, 52.0, 49.0, 52.0, 53.0, 39.0, 52.0, 31.0, 37.0, 29.0, 16.0, 24.0, 19.0, 21.0, 20.0, 16.0, 12.0, 8.0, 5.0, 6.0, 9.0, 3.0, 4.0, 1.0, 2.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.371337890625, -0.3581695556640625, -0.345001220703125, -0.3318328857421875, -0.31866455078125, -0.3054962158203125, -0.292327880859375, -0.2791595458984375, -0.2659912109375, -0.2528228759765625, -0.239654541015625, -0.2264862060546875, -0.21331787109375, -0.2001495361328125, -0.186981201171875, -0.1738128662109375, -0.16064453125, -0.1474761962890625, -0.134307861328125, -0.1211395263671875, -0.10797119140625, -0.0948028564453125, -0.081634521484375, -0.0684661865234375, -0.0552978515625, -0.0421295166015625, -0.028961181640625, -0.0157928466796875, -0.00262451171875, 0.0105438232421875, 0.023712158203125, 0.0368804931640625, 0.050048828125, 0.0632171630859375, 0.076385498046875, 0.0895538330078125, 0.10272216796875, 0.1158905029296875, 0.129058837890625, 0.1422271728515625, 0.1553955078125, 0.1685638427734375, 0.181732177734375, 0.1949005126953125, 0.20806884765625, 0.2212371826171875, 0.234405517578125, 0.2475738525390625, 0.2607421875, 0.2739105224609375, 0.287078857421875, 0.3002471923828125, 0.31341552734375, 0.3265838623046875, 0.339752197265625, 0.3529205322265625, 0.3660888671875, 0.3792572021484375, 0.392425537109375, 0.4055938720703125, 0.41876220703125, 0.4319305419921875, 0.445098876953125, 0.4582672119140625, 0.471435546875]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 8.0, 7.0, 5.0, 9.0, 10.0, 19.0, 22.0, 22.0, 23.0, 26.0, 30.0, 36.0, 34.0, 46.0, 49.0, 40.0, 44.0, 48.0, 45.0, 50.0, 43.0, 58.0, 48.0, 49.0, 29.0, 35.0, 27.0, 26.0, 25.0, 21.0, 15.0, 10.0, 9.0, 8.0, 8.0, 7.0, 2.0, 4.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-41.78710174560547, -40.31550598144531, -38.843910217285156, -37.372310638427734, -35.90071487426758, -34.42911911010742, -32.957523345947266, -31.485925674438477, -30.014328002929688, -28.54273223876953, -27.071134567260742, -25.599538803100586, -24.127941131591797, -22.65634536743164, -21.184749603271484, -19.713151931762695, -18.24155616760254, -16.769960403442383, -15.298362731933594, -13.826766967773438, -12.355169296264648, -10.883573532104492, -9.41197681427002, -7.940380096435547, -6.468783378601074, -4.997186660766602, -3.525590181350708, -2.0539937019348145, -0.5823969841003418, 0.8891997337341309, 2.3607959747314453, 3.832392692565918, 5.303989410400391, 6.775586128234863, 8.247182846069336, 9.718778610229492, 11.190376281738281, 12.661972045898438, 14.13356876373291, 15.605165481567383, 17.076763153076172, 18.548358917236328, 20.019956588745117, 21.491552352905273, 22.963150024414062, 24.43474578857422, 25.906341552734375, 27.377939224243164, 28.84953498840332, 30.321130752563477, 31.792728424072266, 33.26432418823242, 34.73591995239258, 36.20751953125, 37.679115295410156, 39.15071105957031, 40.62230682373047, 42.093902587890625, 43.56549835205078, 45.0370979309082, 46.50869369506836, 47.980289459228516, 49.45188522338867, 50.923484802246094, 52.39508056640625]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 8.0, 5.0, 1.0, 15.0, 8.0, 14.0, 17.0, 11.0, 17.0, 26.0, 22.0, 34.0, 26.0, 36.0, 35.0, 52.0, 42.0, 50.0, 37.0, 40.0, 43.0, 36.0, 57.0, 30.0, 35.0, 33.0, 40.0, 48.0, 32.0, 27.0, 23.0, 26.0, 11.0, 15.0, 13.0, 5.0, 8.0, 4.0, 3.0, 5.0, 1.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-52.87858581542969, -51.40857696533203, -49.938568115234375, -48.46855926513672, -46.99855041503906, -45.528541564941406, -44.05853271484375, -42.588523864746094, -41.11851501464844, -39.64850616455078, -38.178497314453125, -36.70848846435547, -35.23847961425781, -33.768470764160156, -32.2984619140625, -30.828453063964844, -29.358442306518555, -27.8884334564209, -26.418424606323242, -24.948415756225586, -23.47840690612793, -22.008398056030273, -20.538387298583984, -19.068378448486328, -17.598369598388672, -16.128360748291016, -14.65835189819336, -13.188343048095703, -11.718334197998047, -10.24832534790039, -8.778315544128418, -7.308306694030762, -5.838298797607422, -4.368289947509766, -2.8982808589935303, -1.428271770477295, 0.04173707962036133, 1.5117459297180176, 2.981755256652832, 4.451764106750488, 5.9217729568481445, 7.391781806945801, 8.861790657043457, 10.33180046081543, 11.801809310913086, 13.271818161010742, 14.741827011108398, 16.211835861206055, 17.68184471130371, 19.151853561401367, 20.621862411499023, 22.09187126159668, 23.561880111694336, 25.031888961791992, 26.50189971923828, 27.971908569335938, 29.441917419433594, 30.91192626953125, 32.381935119628906, 33.85194396972656, 35.32195281982422, 36.791961669921875, 38.26197052001953, 39.73197937011719, 41.201988220214844]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 7.0, 1.0, 6.0, 12.0, 33.0, 27.0, 48.0, 67.0, 145.0, 178.0, 281.0, 485.0, 746.0, 1203.0, 2110.0, 3331.0, 5638.0, 9705.0, 17129.0, 29746.0, 50874.0, 83627.0, 125590.0, 161567.0, 168764.0, 141216.0, 98099.0, 61708.0, 36370.0, 20993.0, 11799.0, 6883.0, 4041.0, 2328.0, 1467.0, 880.0, 499.0, 355.0, 233.0, 128.0, 82.0, 56.0, 39.0, 22.0, 17.0, 11.0, 9.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-51.75, -50.1904296875, -48.630859375, -47.0712890625, -45.51171875, -43.9521484375, -42.392578125, -40.8330078125, -39.2734375, -37.7138671875, -36.154296875, -34.5947265625, -33.03515625, -31.4755859375, -29.916015625, -28.3564453125, -26.796875, -25.2373046875, -23.677734375, -22.1181640625, -20.55859375, -18.9990234375, -17.439453125, -15.8798828125, -14.3203125, -12.7607421875, -11.201171875, -9.6416015625, -8.08203125, -6.5224609375, -4.962890625, -3.4033203125, -1.84375, -0.2841796875, 1.275390625, 2.8349609375, 4.39453125, 5.9541015625, 7.513671875, 9.0732421875, 10.6328125, 12.1923828125, 13.751953125, 15.3115234375, 16.87109375, 18.4306640625, 19.990234375, 21.5498046875, 23.109375, 24.6689453125, 26.228515625, 27.7880859375, 29.34765625, 30.9072265625, 32.466796875, 34.0263671875, 35.5859375, 37.1455078125, 38.705078125, 40.2646484375, 41.82421875, 43.3837890625, 44.943359375, 46.5029296875, 48.0625]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 5.0, 7.0, 6.0, 9.0, 12.0, 9.0, 17.0, 11.0, 16.0, 19.0, 31.0, 22.0, 32.0, 34.0, 35.0, 37.0, 42.0, 47.0, 31.0, 50.0, 45.0, 44.0, 37.0, 46.0, 33.0, 39.0, 44.0, 30.0, 40.0, 35.0, 29.0, 31.0, 19.0, 16.0, 8.0, 10.0, 3.0, 3.0, 3.0, 4.0, 5.0, 4.0, 3.0, 4.0, 3.0, 0.0, 2.0], "bins": [-49.5, -48.18212890625, -46.8642578125, -45.54638671875, -44.228515625, -42.91064453125, -41.5927734375, -40.27490234375, -38.95703125, -37.63916015625, -36.3212890625, -35.00341796875, -33.685546875, -32.36767578125, -31.0498046875, -29.73193359375, -28.4140625, -27.09619140625, -25.7783203125, -24.46044921875, -23.142578125, -21.82470703125, -20.5068359375, -19.18896484375, -17.87109375, -16.55322265625, -15.2353515625, -13.91748046875, -12.599609375, -11.28173828125, -9.9638671875, -8.64599609375, -7.328125, -6.01025390625, -4.6923828125, -3.37451171875, -2.056640625, -0.73876953125, 0.5791015625, 1.89697265625, 3.21484375, 4.53271484375, 5.8505859375, 7.16845703125, 8.486328125, 9.80419921875, 11.1220703125, 12.43994140625, 13.7578125, 15.07568359375, 16.3935546875, 17.71142578125, 19.029296875, 20.34716796875, 21.6650390625, 22.98291015625, 24.30078125, 25.61865234375, 26.9365234375, 28.25439453125, 29.572265625, 30.89013671875, 32.2080078125, 33.52587890625, 34.84375]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [5.0, 7.0, 7.0, 11.0, 20.0, 27.0, 52.0, 62.0, 93.0, 199.0, 279.0, 350.0, 556.0, 711.0, 1065.0, 1510.0, 2170.0, 3022.0, 4463.0, 6121.0, 8562.0, 12091.0, 16459.0, 22345.0, 30106.0, 39125.0, 51536.0, 64031.0, 76914.0, 87622.0, 93421.0, 93716.0, 88141.0, 77077.0, 63913.0, 51309.0, 39856.0, 30300.0, 22603.0, 16681.0, 12130.0, 8731.0, 6345.0, 4503.0, 3125.0, 2192.0, 1584.0, 1122.0, 756.0, 507.0, 338.0, 233.0, 168.0, 98.0, 89.0, 38.0, 36.0, 20.0, 9.0, 8.0, 2.0, 1.0, 1.0, 2.0], "bins": [-28.796875, -27.868408203125, -26.93994140625, -26.011474609375, -25.0830078125, -24.154541015625, -23.22607421875, -22.297607421875, -21.369140625, -20.440673828125, -19.51220703125, -18.583740234375, -17.6552734375, -16.726806640625, -15.79833984375, -14.869873046875, -13.94140625, -13.012939453125, -12.08447265625, -11.156005859375, -10.2275390625, -9.299072265625, -8.37060546875, -7.442138671875, -6.513671875, -5.585205078125, -4.65673828125, -3.728271484375, -2.7998046875, -1.871337890625, -0.94287109375, -0.014404296875, 0.9140625, 1.842529296875, 2.77099609375, 3.699462890625, 4.6279296875, 5.556396484375, 6.48486328125, 7.413330078125, 8.341796875, 9.270263671875, 10.19873046875, 11.127197265625, 12.0556640625, 12.984130859375, 13.91259765625, 14.841064453125, 15.76953125, 16.697998046875, 17.62646484375, 18.554931640625, 19.4833984375, 20.411865234375, 21.34033203125, 22.268798828125, 23.197265625, 24.125732421875, 25.05419921875, 25.982666015625, 26.9111328125, 27.839599609375, 28.76806640625, 29.696533203125, 30.625]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 9.0, 3.0, 6.0, 11.0, 7.0, 8.0, 19.0, 13.0, 18.0, 20.0, 19.0, 23.0, 25.0, 21.0, 23.0, 33.0, 27.0, 32.0, 30.0, 41.0, 32.0, 36.0, 39.0, 27.0, 26.0, 35.0, 37.0, 29.0, 33.0, 30.0, 37.0, 30.0, 13.0, 20.0, 19.0, 22.0, 16.0, 15.0, 16.0, 14.0, 14.0, 10.0, 14.0, 15.0, 7.0, 9.0, 5.0, 6.0, 4.0, 0.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-21.03125, -20.325439453125, -19.61962890625, -18.913818359375, -18.2080078125, -17.502197265625, -16.79638671875, -16.090576171875, -15.384765625, -14.678955078125, -13.97314453125, -13.267333984375, -12.5615234375, -11.855712890625, -11.14990234375, -10.444091796875, -9.73828125, -9.032470703125, -8.32666015625, -7.620849609375, -6.9150390625, -6.209228515625, -5.50341796875, -4.797607421875, -4.091796875, -3.385986328125, -2.68017578125, -1.974365234375, -1.2685546875, -0.562744140625, 0.14306640625, 0.848876953125, 1.5546875, 2.260498046875, 2.96630859375, 3.672119140625, 4.3779296875, 5.083740234375, 5.78955078125, 6.495361328125, 7.201171875, 7.906982421875, 8.61279296875, 9.318603515625, 10.0244140625, 10.730224609375, 11.43603515625, 12.141845703125, 12.84765625, 13.553466796875, 14.25927734375, 14.965087890625, 15.6708984375, 16.376708984375, 17.08251953125, 17.788330078125, 18.494140625, 19.199951171875, 19.90576171875, 20.611572265625, 21.3173828125, 22.023193359375, 22.72900390625, 23.434814453125, 24.140625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 10.0, 3.0, 11.0, 12.0, 20.0, 42.0, 33.0, 86.0, 124.0, 179.0, 250.0, 406.0, 570.0, 920.0, 1392.0, 1980.0, 2987.0, 4702.0, 7187.0, 10660.0, 15976.0, 24155.0, 36271.0, 51727.0, 72775.0, 95998.0, 115627.0, 125433.0, 119687.0, 102229.0, 79298.0, 57381.0, 39963.0, 26931.0, 18021.0, 11852.0, 8108.0, 5355.0, 3461.0, 2194.0, 1528.0, 1004.0, 662.0, 452.0, 279.0, 218.0, 161.0, 93.0, 52.0, 40.0, 29.0, 11.0, 7.0, 8.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.21484375, -6.98681640625, -6.7587890625, -6.53076171875, -6.302734375, -6.07470703125, -5.8466796875, -5.61865234375, -5.390625, -5.16259765625, -4.9345703125, -4.70654296875, -4.478515625, -4.25048828125, -4.0224609375, -3.79443359375, -3.56640625, -3.33837890625, -3.1103515625, -2.88232421875, -2.654296875, -2.42626953125, -2.1982421875, -1.97021484375, -1.7421875, -1.51416015625, -1.2861328125, -1.05810546875, -0.830078125, -0.60205078125, -0.3740234375, -0.14599609375, 0.08203125, 0.31005859375, 0.5380859375, 0.76611328125, 0.994140625, 1.22216796875, 1.4501953125, 1.67822265625, 1.90625, 2.13427734375, 2.3623046875, 2.59033203125, 2.818359375, 3.04638671875, 3.2744140625, 3.50244140625, 3.73046875, 3.95849609375, 4.1865234375, 4.41455078125, 4.642578125, 4.87060546875, 5.0986328125, 5.32666015625, 5.5546875, 5.78271484375, 6.0107421875, 6.23876953125, 6.466796875, 6.69482421875, 6.9228515625, 7.15087890625, 7.37890625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 3.0, 2.0, 3.0, 3.0, 5.0, 11.0, 3.0, 5.0, 12.0, 7.0, 9.0, 10.0, 18.0, 20.0, 23.0, 24.0, 22.0, 27.0, 32.0, 44.0, 31.0, 45.0, 46.0, 40.0, 44.0, 59.0, 55.0, 47.0, 40.0, 43.0, 28.0, 35.0, 26.0, 23.0, 28.0, 19.0, 12.0, 16.0, 21.0, 15.0, 8.0, 8.0, 9.0, 5.0, 9.0, 3.0, 1.0, 5.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006685256958007812, -0.0006450265645980835, -0.0006215274333953857, -0.000598028302192688, -0.0005745291709899902, -0.0005510300397872925, -0.0005275309085845947, -0.000504031777381897, -0.0004805326461791992, -0.00045703351497650146, -0.0004335343837738037, -0.00041003525257110596, -0.0003865361213684082, -0.00036303699016571045, -0.0003395378589630127, -0.00031603872776031494, -0.0002925395965576172, -0.00026904046535491943, -0.0002455413341522217, -0.00022204220294952393, -0.00019854307174682617, -0.00017504394054412842, -0.00015154480934143066, -0.0001280456781387329, -0.00010454654693603516, -8.10474157333374e-05, -5.754828453063965e-05, -3.4049153327941895e-05, -1.055002212524414e-05, 1.2949109077453613e-05, 3.644824028015137e-05, 5.994737148284912e-05, 8.344650268554688e-05, 0.00010694563388824463, 0.00013044476509094238, 0.00015394389629364014, 0.0001774430274963379, 0.00020094215869903564, 0.0002244412899017334, 0.00024794042110443115, 0.0002714395523071289, 0.00029493868350982666, 0.0003184378147125244, 0.00034193694591522217, 0.0003654360771179199, 0.0003889352083206177, 0.00041243433952331543, 0.0004359334707260132, 0.00045943260192871094, 0.0004829317331314087, 0.0005064308643341064, 0.0005299299955368042, 0.000553429126739502, 0.0005769282579421997, 0.0006004273891448975, 0.0006239265203475952, 0.000647425651550293, 0.0006709247827529907, 0.0006944239139556885, 0.0007179230451583862, 0.000741422176361084, 0.0007649213075637817, 0.0007884204387664795, 0.0008119195699691772, 0.000835418701171875]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 3.0, 1.0, 1.0, 5.0, 5.0, 13.0, 12.0, 24.0, 38.0, 44.0, 67.0, 109.0, 162.0, 228.0, 374.0, 534.0, 823.0, 1270.0, 2102.0, 3312.0, 5503.0, 8907.0, 14634.0, 24363.0, 39060.0, 61832.0, 90645.0, 123907.0, 146160.0, 147265.0, 122911.0, 90659.0, 61566.0, 39039.0, 24544.0, 14940.0, 8777.0, 5515.0, 3410.0, 2097.0, 1287.0, 805.0, 540.0, 358.0, 229.0, 155.0, 109.0, 67.0, 49.0, 42.0, 28.0, 11.0, 15.0, 9.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-8.9375, -8.658203125, -8.37890625, -8.099609375, -7.8203125, -7.541015625, -7.26171875, -6.982421875, -6.703125, -6.423828125, -6.14453125, -5.865234375, -5.5859375, -5.306640625, -5.02734375, -4.748046875, -4.46875, -4.189453125, -3.91015625, -3.630859375, -3.3515625, -3.072265625, -2.79296875, -2.513671875, -2.234375, -1.955078125, -1.67578125, -1.396484375, -1.1171875, -0.837890625, -0.55859375, -0.279296875, 0.0, 0.279296875, 0.55859375, 0.837890625, 1.1171875, 1.396484375, 1.67578125, 1.955078125, 2.234375, 2.513671875, 2.79296875, 3.072265625, 3.3515625, 3.630859375, 3.91015625, 4.189453125, 4.46875, 4.748046875, 5.02734375, 5.306640625, 5.5859375, 5.865234375, 6.14453125, 6.423828125, 6.703125, 6.982421875, 7.26171875, 7.541015625, 7.8203125, 8.099609375, 8.37890625, 8.658203125, 8.9375]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 4.0, 8.0, 3.0, 6.0, 8.0, 14.0, 15.0, 26.0, 22.0, 23.0, 26.0, 31.0, 50.0, 44.0, 68.0, 47.0, 39.0, 62.0, 64.0, 68.0, 45.0, 53.0, 42.0, 43.0, 36.0, 28.0, 22.0, 19.0, 18.0, 17.0, 19.0, 8.0, 5.0, 6.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-4.359375, -4.2379150390625, -4.116455078125, -3.9949951171875, -3.87353515625, -3.7520751953125, -3.630615234375, -3.5091552734375, -3.3876953125, -3.2662353515625, -3.144775390625, -3.0233154296875, -2.90185546875, -2.7803955078125, -2.658935546875, -2.5374755859375, -2.416015625, -2.2945556640625, -2.173095703125, -2.0516357421875, -1.93017578125, -1.8087158203125, -1.687255859375, -1.5657958984375, -1.4443359375, -1.3228759765625, -1.201416015625, -1.0799560546875, -0.95849609375, -0.8370361328125, -0.715576171875, -0.5941162109375, -0.47265625, -0.3511962890625, -0.229736328125, -0.1082763671875, 0.01318359375, 0.1346435546875, 0.256103515625, 0.3775634765625, 0.4990234375, 0.6204833984375, 0.741943359375, 0.8634033203125, 0.98486328125, 1.1063232421875, 1.227783203125, 1.3492431640625, 1.470703125, 1.5921630859375, 1.713623046875, 1.8350830078125, 1.95654296875, 2.0780029296875, 2.199462890625, 2.3209228515625, 2.4423828125, 2.5638427734375, 2.685302734375, 2.8067626953125, 2.92822265625, 3.0496826171875, 3.171142578125, 3.2926025390625, 3.4140625]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 9.0, 5.0, 3.0, 15.0, 20.0, 17.0, 26.0, 24.0, 33.0, 23.0, 33.0, 42.0, 53.0, 49.0, 61.0, 53.0, 50.0, 63.0, 63.0, 57.0, 45.0, 37.0, 43.0, 26.0, 37.0, 22.0, 16.0, 18.0, 17.0, 13.0, 2.0, 3.0, 9.0, 4.0, 2.0, 0.0, 8.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-37.36299133300781, -35.89435958862305, -34.42573165893555, -32.95709991455078, -31.48847198486328, -30.019840240478516, -28.551210403442383, -27.08258056640625, -25.613950729370117, -24.145320892333984, -22.67669105529785, -21.20806121826172, -19.739429473876953, -18.270801544189453, -16.802169799804688, -15.333539962768555, -13.864910125732422, -12.396280288696289, -10.927650451660156, -9.459019660949707, -7.990389823913574, -6.521759986877441, -5.053129196166992, -3.5844993591308594, -2.1158695220947266, -0.6472394466400146, 0.8213906288146973, 2.2900209426879883, 3.758650779724121, 5.227280616760254, 6.695911407470703, 8.164541244506836, 9.633174896240234, 11.101804733276367, 12.5704345703125, 14.03906536102295, 15.507695198059082, 16.97632598876953, 18.444955825805664, 19.913585662841797, 21.38221549987793, 22.850845336914062, 24.319475173950195, 25.788105010986328, 27.256736755371094, 28.725364685058594, 30.19399642944336, 31.662626266479492, 33.131256103515625, 34.59988784790039, 36.06851577758789, 37.537147521972656, 39.005775451660156, 40.47440719604492, 41.94303894042969, 43.41166687011719, 44.88029479980469, 46.34892654418945, 47.81755447387695, 49.28618621826172, 50.75481414794922, 52.223445892333984, 53.69207763671875, 55.16070556640625, 56.629337310791016]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 4.0, 1.0, 4.0, 12.0, 4.0, 8.0, 15.0, 10.0, 18.0, 16.0, 14.0, 22.0, 17.0, 26.0, 31.0, 29.0, 27.0, 36.0, 26.0, 39.0, 36.0, 37.0, 37.0, 45.0, 33.0, 43.0, 37.0, 34.0, 37.0, 36.0, 28.0, 34.0, 25.0, 31.0, 32.0, 24.0, 26.0, 15.0, 12.0, 7.0, 10.0, 5.0, 5.0, 5.0, 3.0, 5.0, 1.0, 1.0, 6.0, 1.0, 3.0], "bins": [-47.087921142578125, -45.79851150512695, -44.50910186767578, -43.219688415527344, -41.93027877807617, -40.640869140625, -39.35145950317383, -38.062049865722656, -36.77263641357422, -35.48322677612305, -34.193817138671875, -32.90440368652344, -31.614994049072266, -30.325584411621094, -29.036174774169922, -27.74676513671875, -26.457355499267578, -25.167945861816406, -23.8785343170166, -22.58912467956543, -21.299713134765625, -20.010303497314453, -18.72089385986328, -17.43148422241211, -16.142072677612305, -14.852662086486816, -13.563251495361328, -12.273841857910156, -10.984431266784668, -9.69502067565918, -8.405611038208008, -7.1162004470825195, -5.826786041259766, -4.537375450134277, -3.2479653358459473, -1.958554983139038, -0.6691446304321289, 0.6202659606933594, 1.9096760749816895, 3.1990861892700195, 4.488496780395508, 5.777907371520996, 7.067317485809326, 8.356727600097656, 9.646138191223145, 10.935548782348633, 12.224958419799805, 13.514369010925293, 14.803779602050781, 16.093189239501953, 17.382600784301758, 18.67201042175293, 19.961421966552734, 21.250831604003906, 22.540241241455078, 23.82965087890625, 25.119062423706055, 26.408472061157227, 27.69788360595703, 28.987293243408203, 30.276702880859375, 31.56611442565918, 32.855525970458984, 34.144935607910156, 35.43434524536133]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 12.0, 11.0, 20.0, 26.0, 50.0, 75.0, 113.0, 166.0, 259.0, 397.0, 597.0, 968.0, 1489.0, 2377.0, 3686.0, 5914.0, 9127.0, 14320.0, 22305.0, 35596.0, 55859.0, 87970.0, 137647.0, 214006.0, 320197.0, 451876.0, 562098.0, 591976.0, 521768.0, 394919.0, 270973.0, 177335.0, 113321.0, 72673.0, 45461.0, 29010.0, 18345.0, 11329.0, 7313.0, 4643.0, 2885.0, 1853.0, 1192.0, 780.0, 490.0, 314.0, 197.0, 134.0, 82.0, 65.0, 33.0, 16.0, 8.0, 10.0, 3.0, 1.0, 3.0], "bins": [-31.234375, -30.3232421875, -29.412109375, -28.5009765625, -27.58984375, -26.6787109375, -25.767578125, -24.8564453125, -23.9453125, -23.0341796875, -22.123046875, -21.2119140625, -20.30078125, -19.3896484375, -18.478515625, -17.5673828125, -16.65625, -15.7451171875, -14.833984375, -13.9228515625, -13.01171875, -12.1005859375, -11.189453125, -10.2783203125, -9.3671875, -8.4560546875, -7.544921875, -6.6337890625, -5.72265625, -4.8115234375, -3.900390625, -2.9892578125, -2.078125, -1.1669921875, -0.255859375, 0.6552734375, 1.56640625, 2.4775390625, 3.388671875, 4.2998046875, 5.2109375, 6.1220703125, 7.033203125, 7.9443359375, 8.85546875, 9.7666015625, 10.677734375, 11.5888671875, 12.5, 13.4111328125, 14.322265625, 15.2333984375, 16.14453125, 17.0556640625, 17.966796875, 18.8779296875, 19.7890625, 20.7001953125, 21.611328125, 22.5224609375, 23.43359375, 24.3447265625, 25.255859375, 26.1669921875, 27.078125]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 4.0, 6.0, 5.0, 12.0, 16.0, 19.0, 10.0, 12.0, 27.0, 18.0, 25.0, 34.0, 28.0, 30.0, 30.0, 28.0, 30.0, 42.0, 41.0, 47.0, 45.0, 38.0, 44.0, 38.0, 32.0, 27.0, 43.0, 29.0, 38.0, 34.0, 29.0, 34.0, 19.0, 18.0, 13.0, 6.0, 11.0, 7.0, 2.0, 4.0, 7.0, 8.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0], "bins": [-32.84375, -31.942138671875, -31.04052734375, -30.138916015625, -29.2373046875, -28.335693359375, -27.43408203125, -26.532470703125, -25.630859375, -24.729248046875, -23.82763671875, -22.926025390625, -22.0244140625, -21.122802734375, -20.22119140625, -19.319580078125, -18.41796875, -17.516357421875, -16.61474609375, -15.713134765625, -14.8115234375, -13.909912109375, -13.00830078125, -12.106689453125, -11.205078125, -10.303466796875, -9.40185546875, -8.500244140625, -7.5986328125, -6.697021484375, -5.79541015625, -4.893798828125, -3.9921875, -3.090576171875, -2.18896484375, -1.287353515625, -0.3857421875, 0.515869140625, 1.41748046875, 2.319091796875, 3.220703125, 4.122314453125, 5.02392578125, 5.925537109375, 6.8271484375, 7.728759765625, 8.63037109375, 9.531982421875, 10.43359375, 11.335205078125, 12.23681640625, 13.138427734375, 14.0400390625, 14.941650390625, 15.84326171875, 16.744873046875, 17.646484375, 18.548095703125, 19.44970703125, 20.351318359375, 21.2529296875, 22.154541015625, 23.05615234375, 23.957763671875, 24.859375]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 10.0, 24.0, 24.0, 33.0, 64.0, 96.0, 158.0, 278.0, 434.0, 750.0, 1243.0, 2108.0, 3534.0, 5844.0, 9964.0, 16807.0, 27848.0, 46526.0, 76122.0, 121388.0, 185891.0, 274957.0, 380561.0, 481305.0, 541954.0, 529412.0, 453440.0, 348278.0, 246499.0, 165672.0, 106216.0, 66234.0, 39918.0, 24221.0, 14603.0, 8956.0, 5145.0, 3130.0, 1820.0, 1085.0, 667.0, 388.0, 289.0, 154.0, 95.0, 58.0, 34.0, 23.0, 12.0, 3.0, 7.0, 3.0, 5.0, 0.0, 2.0], "bins": [-29.921875, -29.0380859375, -28.154296875, -27.2705078125, -26.38671875, -25.5029296875, -24.619140625, -23.7353515625, -22.8515625, -21.9677734375, -21.083984375, -20.2001953125, -19.31640625, -18.4326171875, -17.548828125, -16.6650390625, -15.78125, -14.8974609375, -14.013671875, -13.1298828125, -12.24609375, -11.3623046875, -10.478515625, -9.5947265625, -8.7109375, -7.8271484375, -6.943359375, -6.0595703125, -5.17578125, -4.2919921875, -3.408203125, -2.5244140625, -1.640625, -0.7568359375, 0.126953125, 1.0107421875, 1.89453125, 2.7783203125, 3.662109375, 4.5458984375, 5.4296875, 6.3134765625, 7.197265625, 8.0810546875, 8.96484375, 9.8486328125, 10.732421875, 11.6162109375, 12.5, 13.3837890625, 14.267578125, 15.1513671875, 16.03515625, 16.9189453125, 17.802734375, 18.6865234375, 19.5703125, 20.4541015625, 21.337890625, 22.2216796875, 23.10546875, 23.9892578125, 24.873046875, 25.7568359375, 26.640625]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 4.0, 9.0, 9.0, 17.0, 21.0, 28.0, 41.0, 36.0, 41.0, 48.0, 59.0, 77.0, 101.0, 129.0, 142.0, 147.0, 194.0, 198.0, 235.0, 232.0, 235.0, 238.0, 219.0, 218.0, 235.0, 195.0, 187.0, 160.0, 127.0, 112.0, 93.0, 57.0, 63.0, 40.0, 32.0, 15.0, 23.0, 18.0, 14.0, 11.0, 5.0, 1.0, 7.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.4453125, -14.976318359375, -14.50732421875, -14.038330078125, -13.5693359375, -13.100341796875, -12.63134765625, -12.162353515625, -11.693359375, -11.224365234375, -10.75537109375, -10.286376953125, -9.8173828125, -9.348388671875, -8.87939453125, -8.410400390625, -7.94140625, -7.472412109375, -7.00341796875, -6.534423828125, -6.0654296875, -5.596435546875, -5.12744140625, -4.658447265625, -4.189453125, -3.720458984375, -3.25146484375, -2.782470703125, -2.3134765625, -1.844482421875, -1.37548828125, -0.906494140625, -0.4375, 0.031494140625, 0.50048828125, 0.969482421875, 1.4384765625, 1.907470703125, 2.37646484375, 2.845458984375, 3.314453125, 3.783447265625, 4.25244140625, 4.721435546875, 5.1904296875, 5.659423828125, 6.12841796875, 6.597412109375, 7.06640625, 7.535400390625, 8.00439453125, 8.473388671875, 8.9423828125, 9.411376953125, 9.88037109375, 10.349365234375, 10.818359375, 11.287353515625, 11.75634765625, 12.225341796875, 12.6943359375, 13.163330078125, 13.63232421875, 14.101318359375, 14.5703125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 7.0, 4.0, 6.0, 6.0, 8.0, 17.0, 18.0, 22.0, 17.0, 20.0, 24.0, 26.0, 32.0, 32.0, 44.0, 45.0, 44.0, 39.0, 51.0, 41.0, 52.0, 43.0, 39.0, 48.0, 44.0, 32.0, 24.0, 37.0, 23.0, 22.0, 29.0, 20.0, 17.0, 11.0, 13.0, 9.0, 7.0, 5.0, 9.0, 5.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.593976974487305, -26.68051528930664, -25.76705551147461, -24.853593826293945, -23.94013214111328, -23.02667236328125, -22.113210678100586, -21.199748992919922, -20.28628921508789, -19.372827529907227, -18.459367752075195, -17.54590606689453, -16.6324462890625, -15.718984603881836, -14.805522918701172, -13.892062187194824, -12.978601455688477, -12.065140724182129, -11.151679992675781, -10.238218307495117, -9.32475757598877, -8.411296844482422, -7.497835636138916, -6.58437442779541, -5.6709136962890625, -4.757452964782715, -3.843991756439209, -2.9305307865142822, -2.0170698165893555, -1.1036090850830078, -0.19014787673950195, 0.7233133316040039, 1.6367759704589844, 2.550236940383911, 3.463697910308838, 4.377159118652344, 5.290619850158691, 6.204080581665039, 7.117541790008545, 8.03100299835205, 8.944463729858398, 9.857924461364746, 10.771385192871094, 11.684846878051758, 12.598307609558105, 13.511768341064453, 14.425230026245117, 15.338690757751465, 16.252151489257812, 17.165613174438477, 18.079072952270508, 18.992534637451172, 19.905994415283203, 20.819456100463867, 21.73291778564453, 22.646377563476562, 23.559839248657227, 24.47330093383789, 25.386760711669922, 26.300222396850586, 27.21368408203125, 28.12714385986328, 29.040605545043945, 29.95406723022461, 30.86752700805664]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 4.0, 1.0, 6.0, 3.0, 5.0, 4.0, 4.0, 4.0, 9.0, 12.0, 13.0, 7.0, 15.0, 14.0, 20.0, 22.0, 19.0, 28.0, 30.0, 28.0, 36.0, 33.0, 38.0, 36.0, 33.0, 40.0, 40.0, 30.0, 28.0, 35.0, 46.0, 38.0, 38.0, 34.0, 36.0, 25.0, 29.0, 24.0, 20.0, 22.0, 25.0, 17.0, 11.0, 10.0, 12.0, 4.0, 8.0, 6.0, 3.0, 3.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.56411361694336, -28.58710289001465, -27.610090255737305, -26.633079528808594, -25.656068801879883, -24.679058074951172, -23.702045440673828, -22.725034713745117, -21.748023986816406, -20.771013259887695, -19.79400062561035, -18.81698989868164, -17.83997917175293, -16.86296844482422, -15.885955810546875, -14.908945083618164, -13.93193244934082, -12.954920768737793, -11.977910041809082, -11.000898361206055, -10.023887634277344, -9.046875953674316, -8.069864273071289, -7.09285306930542, -6.115841865539551, -5.138830661773682, -4.1618194580078125, -3.184807777404785, -2.207796573638916, -1.2307853698730469, -0.25377368927001953, 0.7232375144958496, 1.7002487182617188, 2.677259922027588, 3.654271364212036, 4.631282806396484, 5.6082940101623535, 6.585305213928223, 7.56231689453125, 8.539327621459961, 9.516339302062988, 10.493350982666016, 11.470361709594727, 12.447373390197754, 13.424385070800781, 14.401395797729492, 15.37840747833252, 16.355419158935547, 17.332429885864258, 18.30944061279297, 19.286453247070312, 20.263463973999023, 21.240474700927734, 22.217487335205078, 23.19449806213379, 24.1715087890625, 25.148521423339844, 26.125532150268555, 27.1025447845459, 28.07955551147461, 29.05656623840332, 30.03357696533203, 31.010589599609375, 31.987600326538086, 32.9646110534668]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 7.0, 1.0, 2.0, 7.0, 22.0, 20.0, 18.0, 28.0, 54.0, 76.0, 107.0, 166.0, 286.0, 551.0, 1013.0, 1826.0, 3599.0, 7074.0, 14465.0, 29432.0, 61891.0, 133749.0, 278654.0, 269686.0, 129696.0, 59537.0, 28412.0, 13862.0, 6715.0, 3468.0, 1839.0, 933.0, 485.0, 332.0, 200.0, 107.0, 59.0, 60.0, 27.0, 24.0, 26.0, 12.0, 12.0, 7.0, 4.0, 3.0, 1.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.6796875, -12.295166015625, -11.91064453125, -11.526123046875, -11.1416015625, -10.757080078125, -10.37255859375, -9.988037109375, -9.603515625, -9.218994140625, -8.83447265625, -8.449951171875, -8.0654296875, -7.680908203125, -7.29638671875, -6.911865234375, -6.52734375, -6.142822265625, -5.75830078125, -5.373779296875, -4.9892578125, -4.604736328125, -4.22021484375, -3.835693359375, -3.451171875, -3.066650390625, -2.68212890625, -2.297607421875, -1.9130859375, -1.528564453125, -1.14404296875, -0.759521484375, -0.375, 0.009521484375, 0.39404296875, 0.778564453125, 1.1630859375, 1.547607421875, 1.93212890625, 2.316650390625, 2.701171875, 3.085693359375, 3.47021484375, 3.854736328125, 4.2392578125, 4.623779296875, 5.00830078125, 5.392822265625, 5.77734375, 6.161865234375, 6.54638671875, 6.930908203125, 7.3154296875, 7.699951171875, 8.08447265625, 8.468994140625, 8.853515625, 9.238037109375, 9.62255859375, 10.007080078125, 10.3916015625, 10.776123046875, 11.16064453125, 11.545166015625, 11.9296875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 1.0, 5.0, 5.0, 5.0, 3.0, 2.0, 4.0, 9.0, 6.0, 12.0, 8.0, 16.0, 13.0, 20.0, 22.0, 13.0, 22.0, 25.0, 27.0, 26.0, 26.0, 29.0, 31.0, 30.0, 39.0, 41.0, 35.0, 29.0, 26.0, 36.0, 44.0, 23.0, 37.0, 32.0, 24.0, 33.0, 36.0, 26.0, 30.0, 23.0, 19.0, 21.0, 17.0, 15.0, 14.0, 7.0, 11.0, 7.0, 6.0, 3.0, 4.0, 6.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 2.0], "bins": [-28.0, -27.09765625, -26.1953125, -25.29296875, -24.390625, -23.48828125, -22.5859375, -21.68359375, -20.78125, -19.87890625, -18.9765625, -18.07421875, -17.171875, -16.26953125, -15.3671875, -14.46484375, -13.5625, -12.66015625, -11.7578125, -10.85546875, -9.953125, -9.05078125, -8.1484375, -7.24609375, -6.34375, -5.44140625, -4.5390625, -3.63671875, -2.734375, -1.83203125, -0.9296875, -0.02734375, 0.875, 1.77734375, 2.6796875, 3.58203125, 4.484375, 5.38671875, 6.2890625, 7.19140625, 8.09375, 8.99609375, 9.8984375, 10.80078125, 11.703125, 12.60546875, 13.5078125, 14.41015625, 15.3125, 16.21484375, 17.1171875, 18.01953125, 18.921875, 19.82421875, 20.7265625, 21.62890625, 22.53125, 23.43359375, 24.3359375, 25.23828125, 26.140625, 27.04296875, 27.9453125, 28.84765625, 29.75]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 7.0, 7.0, 10.0, 16.0, 15.0, 23.0, 19.0, 38.0, 65.0, 114.0, 134.0, 233.0, 355.0, 536.0, 833.0, 1276.0, 2142.0, 3505.0, 6046.0, 10522.0, 19395.0, 35758.0, 69650.0, 140792.0, 268910.0, 239542.0, 118638.0, 59328.0, 30985.0, 16771.0, 9387.0, 5259.0, 3126.0, 1933.0, 1109.0, 714.0, 442.0, 286.0, 200.0, 143.0, 108.0, 53.0, 34.0, 23.0, 34.0, 15.0, 11.0, 8.0, 3.0, 5.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-6.82421875, -6.61669921875, -6.4091796875, -6.20166015625, -5.994140625, -5.78662109375, -5.5791015625, -5.37158203125, -5.1640625, -4.95654296875, -4.7490234375, -4.54150390625, -4.333984375, -4.12646484375, -3.9189453125, -3.71142578125, -3.50390625, -3.29638671875, -3.0888671875, -2.88134765625, -2.673828125, -2.46630859375, -2.2587890625, -2.05126953125, -1.84375, -1.63623046875, -1.4287109375, -1.22119140625, -1.013671875, -0.80615234375, -0.5986328125, -0.39111328125, -0.18359375, 0.02392578125, 0.2314453125, 0.43896484375, 0.646484375, 0.85400390625, 1.0615234375, 1.26904296875, 1.4765625, 1.68408203125, 1.8916015625, 2.09912109375, 2.306640625, 2.51416015625, 2.7216796875, 2.92919921875, 3.13671875, 3.34423828125, 3.5517578125, 3.75927734375, 3.966796875, 4.17431640625, 4.3818359375, 4.58935546875, 4.796875, 5.00439453125, 5.2119140625, 5.41943359375, 5.626953125, 5.83447265625, 6.0419921875, 6.24951171875, 6.45703125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 9.0, 5.0, 5.0, 8.0, 11.0, 7.0, 23.0, 19.0, 25.0, 27.0, 23.0, 28.0, 24.0, 30.0, 31.0, 42.0, 37.0, 31.0, 43.0, 39.0, 35.0, 40.0, 39.0, 34.0, 37.0, 48.0, 36.0, 41.0, 32.0, 29.0, 25.0, 22.0, 20.0, 14.0, 16.0, 15.0, 14.0, 9.0, 3.0, 6.0, 4.0, 5.0, 3.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.21875, -22.5, -21.78125, -21.0625, -20.34375, -19.625, -18.90625, -18.1875, -17.46875, -16.75, -16.03125, -15.3125, -14.59375, -13.875, -13.15625, -12.4375, -11.71875, -11.0, -10.28125, -9.5625, -8.84375, -8.125, -7.40625, -6.6875, -5.96875, -5.25, -4.53125, -3.8125, -3.09375, -2.375, -1.65625, -0.9375, -0.21875, 0.5, 1.21875, 1.9375, 2.65625, 3.375, 4.09375, 4.8125, 5.53125, 6.25, 6.96875, 7.6875, 8.40625, 9.125, 9.84375, 10.5625, 11.28125, 12.0, 12.71875, 13.4375, 14.15625, 14.875, 15.59375, 16.3125, 17.03125, 17.75, 18.46875, 19.1875, 19.90625, 20.625, 21.34375, 22.0625, 22.78125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 6.0, 10.0, 18.0, 18.0, 32.0, 46.0, 46.0, 72.0, 109.0, 133.0, 231.0, 332.0, 474.0, 628.0, 1018.0, 1522.0, 2225.0, 3332.0, 5182.0, 8014.0, 12608.0, 20778.0, 34866.0, 61106.0, 117162.0, 251753.0, 253020.0, 119066.0, 62004.0, 35120.0, 21069.0, 12760.0, 8147.0, 5194.0, 3472.0, 2201.0, 1513.0, 1004.0, 719.0, 483.0, 311.0, 207.0, 147.0, 121.0, 90.0, 71.0, 34.0, 31.0, 15.0, 11.0, 11.0, 9.0, 2.0, 5.0, 4.0, 0.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.462890625, -0.4474639892578125, -0.432037353515625, -0.4166107177734375, -0.40118408203125, -0.3857574462890625, -0.370330810546875, -0.3549041748046875, -0.3394775390625, -0.3240509033203125, -0.308624267578125, -0.2931976318359375, -0.27777099609375, -0.2623443603515625, -0.246917724609375, -0.2314910888671875, -0.216064453125, -0.2006378173828125, -0.185211181640625, -0.1697845458984375, -0.15435791015625, -0.1389312744140625, -0.123504638671875, -0.1080780029296875, -0.0926513671875, -0.0772247314453125, -0.061798095703125, -0.0463714599609375, -0.03094482421875, -0.0155181884765625, -9.1552734375e-05, 0.0153350830078125, 0.03076171875, 0.0461883544921875, 0.061614990234375, 0.0770416259765625, 0.09246826171875, 0.1078948974609375, 0.123321533203125, 0.1387481689453125, 0.1541748046875, 0.1696014404296875, 0.185028076171875, 0.2004547119140625, 0.21588134765625, 0.2313079833984375, 0.246734619140625, 0.2621612548828125, 0.277587890625, 0.2930145263671875, 0.308441162109375, 0.3238677978515625, 0.33929443359375, 0.3547210693359375, 0.370147705078125, 0.3855743408203125, 0.4010009765625, 0.4164276123046875, 0.431854248046875, 0.4472808837890625, 0.46270751953125, 0.4781341552734375, 0.493560791015625, 0.5089874267578125, 0.5244140625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 4.0, 2.0, 9.0, 9.0, 16.0, 16.0, 19.0, 25.0, 44.0, 36.0, 45.0, 58.0, 71.0, 73.0, 69.0, 76.0, 81.0, 73.0, 45.0, 49.0, 32.0, 28.0, 23.0, 26.0, 12.0, 10.0, 12.0, 12.0, 3.0, 4.0, 6.0, 5.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00014197826385498047, -0.00013800431042909622, -0.00013403035700321198, -0.00013005640357732773, -0.00012608245015144348, -0.00012210849672555923, -0.00011813454329967499, -0.00011416058987379074, -0.0001101866364479065, -0.00010621268302202225, -0.000102238729596138, -9.826477617025375e-05, -9.429082274436951e-05, -9.031686931848526e-05, -8.634291589260101e-05, -8.236896246671677e-05, -7.839500904083252e-05, -7.442105561494827e-05, -7.044710218906403e-05, -6.647314876317978e-05, -6.249919533729553e-05, -5.8525241911411285e-05, -5.455128848552704e-05, -5.057733505964279e-05, -4.6603381633758545e-05, -4.26294282078743e-05, -3.865547478199005e-05, -3.4681521356105804e-05, -3.070756793022156e-05, -2.673361450433731e-05, -2.2759661078453064e-05, -1.8785707652568817e-05, -1.481175422668457e-05, -1.0837800800800323e-05, -6.863847374916077e-06, -2.88989394903183e-06, 1.084059476852417e-06, 5.058012902736664e-06, 9.03196632862091e-06, 1.3005919754505157e-05, 1.6979873180389404e-05, 2.095382660627365e-05, 2.4927780032157898e-05, 2.8901733458042145e-05, 3.287568688392639e-05, 3.684964030981064e-05, 4.0823593735694885e-05, 4.479754716157913e-05, 4.877150058746338e-05, 5.2745454013347626e-05, 5.671940743923187e-05, 6.069336086511612e-05, 6.466731429100037e-05, 6.864126771688461e-05, 7.261522114276886e-05, 7.65891745686531e-05, 8.056312799453735e-05, 8.45370814204216e-05, 8.851103484630585e-05, 9.24849882721901e-05, 9.645894169807434e-05, 0.00010043289512395859, 0.00010440684854984283, 0.00010838080197572708, 0.00011235475540161133]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 3.0, 1.0, 8.0, 9.0, 15.0, 17.0, 35.0, 58.0, 85.0, 114.0, 160.0, 204.0, 348.0, 513.0, 734.0, 1101.0, 1676.0, 2330.0, 3482.0, 5136.0, 7458.0, 11168.0, 16083.0, 24244.0, 35621.0, 55817.0, 91758.0, 171107.0, 263408.0, 135319.0, 76700.0, 47596.0, 31024.0, 20859.0, 14157.0, 9512.0, 6572.0, 4414.0, 2994.0, 2167.0, 1429.0, 998.0, 740.0, 457.0, 297.0, 216.0, 136.0, 101.0, 67.0, 38.0, 32.0, 19.0, 11.0, 6.0, 7.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.2724609375, -1.231842041015625, -1.19122314453125, -1.150604248046875, -1.1099853515625, -1.069366455078125, -1.02874755859375, -0.988128662109375, -0.947509765625, -0.906890869140625, -0.86627197265625, -0.825653076171875, -0.7850341796875, -0.744415283203125, -0.70379638671875, -0.663177490234375, -0.62255859375, -0.581939697265625, -0.54132080078125, -0.500701904296875, -0.4600830078125, -0.419464111328125, -0.37884521484375, -0.338226318359375, -0.297607421875, -0.256988525390625, -0.21636962890625, -0.175750732421875, -0.1351318359375, -0.094512939453125, -0.05389404296875, -0.013275146484375, 0.02734375, 0.067962646484375, 0.10858154296875, 0.149200439453125, 0.1898193359375, 0.230438232421875, 0.27105712890625, 0.311676025390625, 0.352294921875, 0.392913818359375, 0.43353271484375, 0.474151611328125, 0.5147705078125, 0.555389404296875, 0.59600830078125, 0.636627197265625, 0.67724609375, 0.717864990234375, 0.75848388671875, 0.799102783203125, 0.8397216796875, 0.880340576171875, 0.92095947265625, 0.961578369140625, 1.002197265625, 1.042816162109375, 1.08343505859375, 1.124053955078125, 1.1646728515625, 1.205291748046875, 1.24591064453125, 1.286529541015625, 1.3271484375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 6.0, 5.0, 9.0, 7.0, 13.0, 15.0, 11.0, 13.0, 15.0, 21.0, 23.0, 16.0, 27.0, 25.0, 28.0, 30.0, 36.0, 54.0, 57.0, 53.0, 70.0, 65.0, 47.0, 52.0, 47.0, 26.0, 22.0, 26.0, 26.0, 31.0, 17.0, 26.0, 18.0, 14.0, 13.0, 8.0, 9.0, 6.0, 5.0, 1.0, 2.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.51611328125, -0.5005073547363281, -0.48490142822265625, -0.4692955017089844, -0.4536895751953125, -0.4380836486816406, -0.42247772216796875, -0.4068717956542969, -0.391265869140625, -0.3756599426269531, -0.36005401611328125, -0.3444480895996094, -0.3288421630859375, -0.3132362365722656, -0.29763031005859375, -0.2820243835449219, -0.26641845703125, -0.2508125305175781, -0.23520660400390625, -0.21960067749023438, -0.2039947509765625, -0.18838882446289062, -0.17278289794921875, -0.15717697143554688, -0.141571044921875, -0.12596511840820312, -0.11035919189453125, -0.09475326538085938, -0.0791473388671875, -0.06354141235351562, -0.04793548583984375, -0.032329559326171875, -0.0167236328125, -0.001117706298828125, 0.01448822021484375, 0.030094146728515625, 0.0457000732421875, 0.061305999755859375, 0.07691192626953125, 0.09251785278320312, 0.108123779296875, 0.12372970581054688, 0.13933563232421875, 0.15494155883789062, 0.1705474853515625, 0.18615341186523438, 0.20175933837890625, 0.21736526489257812, 0.23297119140625, 0.24857711791992188, 0.26418304443359375, 0.2797889709472656, 0.2953948974609375, 0.3110008239746094, 0.32660675048828125, 0.3422126770019531, 0.357818603515625, 0.3734245300292969, 0.38903045654296875, 0.4046363830566406, 0.4202423095703125, 0.4358482360839844, 0.45145416259765625, 0.4670600891113281, 0.482666015625]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 4.0, 5.0, 7.0, 4.0, 9.0, 10.0, 17.0, 12.0, 26.0, 22.0, 23.0, 18.0, 36.0, 23.0, 33.0, 47.0, 42.0, 35.0, 43.0, 51.0, 46.0, 49.0, 43.0, 37.0, 43.0, 40.0, 37.0, 26.0, 30.0, 28.0, 20.0, 27.0, 22.0, 23.0, 11.0, 5.0, 7.0, 10.0, 4.0, 9.0, 5.0, 7.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-25.90628433227539, -25.035118103027344, -24.16395378112793, -23.292787551879883, -22.421621322631836, -21.550457000732422, -20.679290771484375, -19.808124542236328, -18.93695831298828, -18.065792083740234, -17.19462776184082, -16.323461532592773, -15.452295303344727, -14.581130027770996, -13.709964752197266, -12.838798522949219, -11.967634201049805, -11.096468925476074, -10.225302696228027, -9.354137420654297, -8.48297119140625, -7.6118059158325195, -6.740640640258789, -5.8694748878479, -4.998309135437012, -4.127143383026123, -3.2559778690338135, -2.384812355041504, -1.5136466026306152, -0.6424808502197266, 0.2286844253540039, 1.0998501777648926, 1.971017837524414, 2.8421835899353027, 3.7133491039276123, 4.584514617919922, 5.4556803703308105, 6.326846122741699, 7.19801139831543, 8.069177627563477, 8.940342903137207, 9.811508178710938, 10.682674407958984, 11.553839683532715, 12.425004959106445, 13.296171188354492, 14.167336463928223, 15.038501739501953, 15.90966796875, 16.780834197998047, 17.65199851989746, 18.523164749145508, 19.394330978393555, 20.26549530029297, 21.136661529541016, 22.007827758789062, 22.87899398803711, 23.750160217285156, 24.62132453918457, 25.492490768432617, 26.363656997680664, 27.234821319580078, 28.105987548828125, 28.977153778076172, 29.848318099975586]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 4.0, 2.0, 4.0, 3.0, 7.0, 3.0, 5.0, 6.0, 6.0, 14.0, 13.0, 9.0, 10.0, 21.0, 18.0, 21.0, 24.0, 26.0, 29.0, 25.0, 37.0, 34.0, 40.0, 35.0, 36.0, 39.0, 38.0, 30.0, 27.0, 35.0, 41.0, 45.0, 36.0, 35.0, 35.0, 27.0, 26.0, 24.0, 25.0, 20.0, 24.0, 12.0, 14.0, 8.0, 12.0, 4.0, 8.0, 5.0, 3.0, 3.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.470666885375977, -27.520793914794922, -26.570919036865234, -25.621044158935547, -24.671171188354492, -23.721298217773438, -22.77142333984375, -21.821548461914062, -20.871675491333008, -19.921802520751953, -18.971927642822266, -18.022052764892578, -17.072179794311523, -16.12230682373047, -15.172431945800781, -14.22255802154541, -13.272684097290039, -12.322810173034668, -11.372936248779297, -10.423062324523926, -9.473188400268555, -8.523314476013184, -7.5734405517578125, -6.623566627502441, -5.67369270324707, -4.723818778991699, -3.773944854736328, -2.824070930480957, -1.874197006225586, -0.9243230819702148, 0.02555084228515625, 0.9754247665405273, 1.9252967834472656, 2.8751707077026367, 3.825044631958008, 4.774918556213379, 5.72479248046875, 6.674666404724121, 7.624540328979492, 8.574414253234863, 9.524288177490234, 10.474162101745605, 11.424036026000977, 12.373909950256348, 13.323783874511719, 14.27365779876709, 15.223531723022461, 16.173404693603516, 17.123279571533203, 18.07315444946289, 19.023027420043945, 19.972900390625, 20.922775268554688, 21.872650146484375, 22.82252311706543, 23.772396087646484, 24.722270965576172, 25.67214584350586, 26.622018814086914, 27.57189178466797, 28.521766662597656, 29.471641540527344, 30.4215145111084, 31.371387481689453, 32.32126235961914]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 5.0, 6.0, 6.0, 12.0, 20.0, 38.0, 42.0, 63.0, 96.0, 146.0, 259.0, 381.0, 555.0, 795.0, 1237.0, 1782.0, 2662.0, 3974.0, 6019.0, 8945.0, 13053.0, 19244.0, 27619.0, 38187.0, 52174.0, 67736.0, 83866.0, 96931.0, 104767.0, 104382.0, 95323.0, 81337.0, 66056.0, 50535.0, 37175.0, 26384.0, 18458.0, 12505.0, 8697.0, 5655.0, 3793.0, 2482.0, 1670.0, 1101.0, 775.0, 554.0, 320.0, 265.0, 174.0, 117.0, 62.0, 35.0, 35.0, 22.0, 17.0, 9.0, 4.0, 3.0, 3.0, 2.0, 3.0], "bins": [-21.46875, -20.796630859375, -20.12451171875, -19.452392578125, -18.7802734375, -18.108154296875, -17.43603515625, -16.763916015625, -16.091796875, -15.419677734375, -14.74755859375, -14.075439453125, -13.4033203125, -12.731201171875, -12.05908203125, -11.386962890625, -10.71484375, -10.042724609375, -9.37060546875, -8.698486328125, -8.0263671875, -7.354248046875, -6.68212890625, -6.010009765625, -5.337890625, -4.665771484375, -3.99365234375, -3.321533203125, -2.6494140625, -1.977294921875, -1.30517578125, -0.633056640625, 0.0390625, 0.711181640625, 1.38330078125, 2.055419921875, 2.7275390625, 3.399658203125, 4.07177734375, 4.743896484375, 5.416015625, 6.088134765625, 6.76025390625, 7.432373046875, 8.1044921875, 8.776611328125, 9.44873046875, 10.120849609375, 10.79296875, 11.465087890625, 12.13720703125, 12.809326171875, 13.4814453125, 14.153564453125, 14.82568359375, 15.497802734375, 16.169921875, 16.842041015625, 17.51416015625, 18.186279296875, 18.8583984375, 19.530517578125, 20.20263671875, 20.874755859375, 21.546875]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 8.0, 9.0, 9.0, 8.0, 11.0, 11.0, 12.0, 16.0, 20.0, 21.0, 22.0, 17.0, 22.0, 29.0, 29.0, 44.0, 28.0, 50.0, 31.0, 37.0, 43.0, 28.0, 45.0, 39.0, 43.0, 39.0, 37.0, 41.0, 40.0, 26.0, 15.0, 30.0, 24.0, 20.0, 21.0, 14.0, 8.0, 8.0, 11.0, 8.0, 6.0, 5.0, 7.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-29.15625, -28.2197265625, -27.283203125, -26.3466796875, -25.41015625, -24.4736328125, -23.537109375, -22.6005859375, -21.6640625, -20.7275390625, -19.791015625, -18.8544921875, -17.91796875, -16.9814453125, -16.044921875, -15.1083984375, -14.171875, -13.2353515625, -12.298828125, -11.3623046875, -10.42578125, -9.4892578125, -8.552734375, -7.6162109375, -6.6796875, -5.7431640625, -4.806640625, -3.8701171875, -2.93359375, -1.9970703125, -1.060546875, -0.1240234375, 0.8125, 1.7490234375, 2.685546875, 3.6220703125, 4.55859375, 5.4951171875, 6.431640625, 7.3681640625, 8.3046875, 9.2412109375, 10.177734375, 11.1142578125, 12.05078125, 12.9873046875, 13.923828125, 14.8603515625, 15.796875, 16.7333984375, 17.669921875, 18.6064453125, 19.54296875, 20.4794921875, 21.416015625, 22.3525390625, 23.2890625, 24.2255859375, 25.162109375, 26.0986328125, 27.03515625, 27.9716796875, 28.908203125, 29.8447265625, 30.78125]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 5.0, 3.0, 5.0, 16.0, 29.0, 25.0, 56.0, 66.0, 102.0, 181.0, 244.0, 378.0, 519.0, 793.0, 1103.0, 1692.0, 2434.0, 3611.0, 5145.0, 7866.0, 11854.0, 17179.0, 24898.0, 34919.0, 48458.0, 64006.0, 81250.0, 96224.0, 105333.0, 106554.0, 99182.0, 85711.0, 69676.0, 52603.0, 39066.0, 27525.0, 19068.0, 12983.0, 8819.0, 6209.0, 4083.0, 2829.0, 1890.0, 1320.0, 824.0, 576.0, 401.0, 305.0, 171.0, 140.0, 83.0, 52.0, 40.0, 31.0, 9.0, 8.0, 10.0, 7.0, 1.0, 2.0, 0.0, 1.0], "bins": [-21.796875, -21.09716796875, -20.3974609375, -19.69775390625, -18.998046875, -18.29833984375, -17.5986328125, -16.89892578125, -16.19921875, -15.49951171875, -14.7998046875, -14.10009765625, -13.400390625, -12.70068359375, -12.0009765625, -11.30126953125, -10.6015625, -9.90185546875, -9.2021484375, -8.50244140625, -7.802734375, -7.10302734375, -6.4033203125, -5.70361328125, -5.00390625, -4.30419921875, -3.6044921875, -2.90478515625, -2.205078125, -1.50537109375, -0.8056640625, -0.10595703125, 0.59375, 1.29345703125, 1.9931640625, 2.69287109375, 3.392578125, 4.09228515625, 4.7919921875, 5.49169921875, 6.19140625, 6.89111328125, 7.5908203125, 8.29052734375, 8.990234375, 9.68994140625, 10.3896484375, 11.08935546875, 11.7890625, 12.48876953125, 13.1884765625, 13.88818359375, 14.587890625, 15.28759765625, 15.9873046875, 16.68701171875, 17.38671875, 18.08642578125, 18.7861328125, 19.48583984375, 20.185546875, 20.88525390625, 21.5849609375, 22.28466796875, 22.984375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 0.0, 5.0, 6.0, 9.0, 5.0, 10.0, 16.0, 13.0, 13.0, 4.0, 17.0, 32.0, 31.0, 24.0, 30.0, 36.0, 39.0, 44.0, 45.0, 46.0, 30.0, 52.0, 47.0, 45.0, 51.0, 29.0, 42.0, 28.0, 33.0, 29.0, 29.0, 27.0, 16.0, 23.0, 17.0, 21.0, 16.0, 9.0, 4.0, 5.0, 7.0, 4.0, 3.0, 5.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.546875, -20.898193359375, -20.24951171875, -19.600830078125, -18.9521484375, -18.303466796875, -17.65478515625, -17.006103515625, -16.357421875, -15.708740234375, -15.06005859375, -14.411376953125, -13.7626953125, -13.114013671875, -12.46533203125, -11.816650390625, -11.16796875, -10.519287109375, -9.87060546875, -9.221923828125, -8.5732421875, -7.924560546875, -7.27587890625, -6.627197265625, -5.978515625, -5.329833984375, -4.68115234375, -4.032470703125, -3.3837890625, -2.735107421875, -2.08642578125, -1.437744140625, -0.7890625, -0.140380859375, 0.50830078125, 1.156982421875, 1.8056640625, 2.454345703125, 3.10302734375, 3.751708984375, 4.400390625, 5.049072265625, 5.69775390625, 6.346435546875, 6.9951171875, 7.643798828125, 8.29248046875, 8.941162109375, 9.58984375, 10.238525390625, 10.88720703125, 11.535888671875, 12.1845703125, 12.833251953125, 13.48193359375, 14.130615234375, 14.779296875, 15.427978515625, 16.07666015625, 16.725341796875, 17.3740234375, 18.022705078125, 18.67138671875, 19.320068359375, 19.96875]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 3.0, 7.0, 2.0, 6.0, 12.0, 24.0, 21.0, 42.0, 53.0, 90.0, 137.0, 203.0, 345.0, 554.0, 939.0, 1557.0, 2606.0, 4454.0, 7528.0, 12881.0, 22176.0, 37748.0, 60214.0, 92277.0, 127205.0, 151798.0, 151716.0, 128526.0, 92858.0, 60950.0, 37469.0, 22349.0, 13016.0, 7539.0, 4506.0, 2620.0, 1624.0, 944.0, 604.0, 307.0, 234.0, 143.0, 87.0, 74.0, 32.0, 22.0, 17.0, 13.0, 12.0, 6.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 3.0], "bins": [-8.25, -8.00006103515625, -7.7501220703125, -7.50018310546875, -7.250244140625, -7.00030517578125, -6.7503662109375, -6.50042724609375, -6.25048828125, -6.00054931640625, -5.7506103515625, -5.50067138671875, -5.250732421875, -5.00079345703125, -4.7508544921875, -4.50091552734375, -4.2509765625, -4.00103759765625, -3.7510986328125, -3.50115966796875, -3.251220703125, -3.00128173828125, -2.7513427734375, -2.50140380859375, -2.25146484375, -2.00152587890625, -1.7515869140625, -1.50164794921875, -1.251708984375, -1.00177001953125, -0.7518310546875, -0.50189208984375, -0.251953125, -0.00201416015625, 0.2479248046875, 0.49786376953125, 0.747802734375, 0.99774169921875, 1.2476806640625, 1.49761962890625, 1.74755859375, 1.99749755859375, 2.2474365234375, 2.49737548828125, 2.747314453125, 2.99725341796875, 3.2471923828125, 3.49713134765625, 3.7470703125, 3.99700927734375, 4.2469482421875, 4.49688720703125, 4.746826171875, 4.99676513671875, 5.2467041015625, 5.49664306640625, 5.74658203125, 5.99652099609375, 6.2464599609375, 6.49639892578125, 6.746337890625, 6.99627685546875, 7.2462158203125, 7.49615478515625, 7.74609375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 4.0, 6.0, 3.0, 5.0, 5.0, 11.0, 4.0, 9.0, 13.0, 11.0, 21.0, 24.0, 36.0, 27.0, 27.0, 53.0, 51.0, 43.0, 55.0, 53.0, 51.0, 70.0, 56.0, 54.0, 41.0, 33.0, 46.0, 31.0, 39.0, 25.0, 24.0, 14.0, 23.0, 14.0, 4.0, 3.0, 3.0, 3.0, 3.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005884170532226562, -0.0005662664771080017, -0.0005441159009933472, -0.0005219653248786926, -0.0004998147487640381, -0.00047766417264938354, -0.000455513596534729, -0.00043336302042007446, -0.0004112124443054199, -0.0003890618681907654, -0.00036691129207611084, -0.0003447607159614563, -0.00032261013984680176, -0.0003004595637321472, -0.0002783089876174927, -0.00025615841150283813, -0.0002340078353881836, -0.00021185725927352905, -0.0001897066831588745, -0.00016755610704421997, -0.00014540553092956543, -0.0001232549548149109, -0.00010110437870025635, -7.89538025856018e-05, -5.6803226470947266e-05, -3.4652650356292725e-05, -1.2502074241638184e-05, 9.648501873016357e-06, 3.17990779876709e-05, 5.394965410232544e-05, 7.610023021697998e-05, 9.825080633163452e-05, 0.00012040138244628906, 0.0001425519585609436, 0.00016470253467559814, 0.00018685311079025269, 0.00020900368690490723, 0.00023115426301956177, 0.0002533048391342163, 0.00027545541524887085, 0.0002976059913635254, 0.00031975656747817993, 0.00034190714359283447, 0.000364057719707489, 0.00038620829582214355, 0.0004083588719367981, 0.00043050944805145264, 0.0004526600241661072, 0.0004748106002807617, 0.0004969611763954163, 0.0005191117525100708, 0.0005412623286247253, 0.0005634129047393799, 0.0005855634808540344, 0.000607714056968689, 0.0006298646330833435, 0.000652015209197998, 0.0006741657853126526, 0.0006963163614273071, 0.0007184669375419617, 0.0007406175136566162, 0.0007627680897712708, 0.0007849186658859253, 0.0008070692420005798, 0.0008292198181152344]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 7.0, 5.0, 10.0, 10.0, 15.0, 27.0, 42.0, 67.0, 103.0, 168.0, 241.0, 325.0, 560.0, 808.0, 1154.0, 1875.0, 3002.0, 4603.0, 7311.0, 11407.0, 18161.0, 28649.0, 43960.0, 64883.0, 90803.0, 116568.0, 132763.0, 133412.0, 115574.0, 89016.0, 63186.0, 42836.0, 27831.0, 17953.0, 11320.0, 7100.0, 4563.0, 2990.0, 1840.0, 1226.0, 742.0, 488.0, 341.0, 223.0, 122.0, 86.0, 70.0, 47.0, 25.0, 14.0, 14.0, 9.0, 5.0, 4.0, 4.0, 0.0, 3.0], "bins": [-7.6328125, -7.40814208984375, -7.1834716796875, -6.95880126953125, -6.734130859375, -6.50946044921875, -6.2847900390625, -6.06011962890625, -5.83544921875, -5.61077880859375, -5.3861083984375, -5.16143798828125, -4.936767578125, -4.71209716796875, -4.4874267578125, -4.26275634765625, -4.0380859375, -3.81341552734375, -3.5887451171875, -3.36407470703125, -3.139404296875, -2.91473388671875, -2.6900634765625, -2.46539306640625, -2.24072265625, -2.01605224609375, -1.7913818359375, -1.56671142578125, -1.342041015625, -1.11737060546875, -0.8927001953125, -0.66802978515625, -0.443359375, -0.21868896484375, 0.0059814453125, 0.23065185546875, 0.455322265625, 0.67999267578125, 0.9046630859375, 1.12933349609375, 1.35400390625, 1.57867431640625, 1.8033447265625, 2.02801513671875, 2.252685546875, 2.47735595703125, 2.7020263671875, 2.92669677734375, 3.1513671875, 3.37603759765625, 3.6007080078125, 3.82537841796875, 4.050048828125, 4.27471923828125, 4.4993896484375, 4.72406005859375, 4.94873046875, 5.17340087890625, 5.3980712890625, 5.62274169921875, 5.847412109375, 6.07208251953125, 6.2967529296875, 6.52142333984375, 6.74609375]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 6.0, 4.0, 4.0, 7.0, 11.0, 4.0, 12.0, 6.0, 20.0, 14.0, 15.0, 38.0, 38.0, 39.0, 47.0, 60.0, 55.0, 56.0, 51.0, 64.0, 59.0, 52.0, 49.0, 47.0, 52.0, 37.0, 29.0, 19.0, 19.0, 23.0, 17.0, 11.0, 11.0, 7.0, 3.0, 5.0, 4.0, 5.0, 6.0, 0.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.96484375, -2.84429931640625, -2.7237548828125, -2.60321044921875, -2.482666015625, -2.36212158203125, -2.2415771484375, -2.12103271484375, -2.00048828125, -1.87994384765625, -1.7593994140625, -1.63885498046875, -1.518310546875, -1.39776611328125, -1.2772216796875, -1.15667724609375, -1.0361328125, -0.91558837890625, -0.7950439453125, -0.67449951171875, -0.553955078125, -0.43341064453125, -0.3128662109375, -0.19232177734375, -0.07177734375, 0.04876708984375, 0.1693115234375, 0.28985595703125, 0.410400390625, 0.53094482421875, 0.6514892578125, 0.77203369140625, 0.892578125, 1.01312255859375, 1.1336669921875, 1.25421142578125, 1.374755859375, 1.49530029296875, 1.6158447265625, 1.73638916015625, 1.85693359375, 1.97747802734375, 2.0980224609375, 2.21856689453125, 2.339111328125, 2.45965576171875, 2.5802001953125, 2.70074462890625, 2.8212890625, 2.94183349609375, 3.0623779296875, 3.18292236328125, 3.303466796875, 3.42401123046875, 3.5445556640625, 3.66510009765625, 3.78564453125, 3.90618896484375, 4.0267333984375, 4.14727783203125, 4.267822265625, 4.38836669921875, 4.5089111328125, 4.62945556640625, 4.75]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 3.0, 7.0, 3.0, 9.0, 11.0, 18.0, 11.0, 8.0, 20.0, 19.0, 29.0, 37.0, 29.0, 40.0, 30.0, 46.0, 46.0, 45.0, 66.0, 49.0, 49.0, 49.0, 52.0, 58.0, 22.0, 42.0, 31.0, 36.0, 20.0, 28.0, 14.0, 19.0, 15.0, 10.0, 12.0, 7.0, 6.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.106853485107422, -26.15304183959961, -25.199230194091797, -24.245418548583984, -23.291606903076172, -22.33779525756836, -21.38398551940918, -20.430173873901367, -19.476362228393555, -18.522550582885742, -17.56873893737793, -16.614927291870117, -15.661116600036621, -14.707304954528809, -13.753494262695312, -12.7996826171875, -11.845870971679688, -10.892059326171875, -9.938247680664062, -8.984436988830566, -8.030625343322754, -7.076813697814941, -6.123002529144287, -5.169191360473633, -4.21537971496582, -3.261568307876587, -2.3077569007873535, -1.3539454936981201, -0.4001340866088867, 0.5536775588989258, 1.50748872756958, 2.4612998962402344, 3.415111541748047, 4.368923187255859, 5.322734355926514, 6.276545524597168, 7.2303571701049805, 8.184168815612793, 9.137979507446289, 10.091791152954102, 11.045602798461914, 11.999414443969727, 12.953226089477539, 13.907036781311035, 14.860848426818848, 15.81466007232666, 16.768470764160156, 17.72228240966797, 18.67609405517578, 19.629905700683594, 20.583717346191406, 21.53752899169922, 22.49134063720703, 23.445152282714844, 24.398962020874023, 25.352773666381836, 26.30658531188965, 27.26039695739746, 28.214208602905273, 29.168020248413086, 30.121829986572266, 31.075641632080078, 32.02945327758789, 32.9832649230957, 33.937076568603516]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 7.0, 7.0, 16.0, 6.0, 11.0, 9.0, 17.0, 22.0, 18.0, 23.0, 16.0, 32.0, 23.0, 46.0, 36.0, 37.0, 32.0, 36.0, 40.0, 31.0, 42.0, 53.0, 49.0, 53.0, 32.0, 27.0, 32.0, 35.0, 34.0, 27.0, 24.0, 14.0, 29.0, 9.0, 13.0, 16.0, 12.0, 9.0, 6.0, 6.0, 1.0, 3.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-33.512569427490234, -32.47273254394531, -31.43289566040039, -30.39305877685547, -29.353221893310547, -28.313385009765625, -27.273550033569336, -26.233713150024414, -25.193876266479492, -24.15403938293457, -23.11420249938965, -22.074365615844727, -21.034530639648438, -19.994693756103516, -18.954856872558594, -17.915019989013672, -16.87518310546875, -15.835346221923828, -14.795509338378906, -13.7556734085083, -12.715836524963379, -11.675999641418457, -10.636163711547852, -9.59632682800293, -8.556489944458008, -7.516653060913086, -6.476816654205322, -5.436980247497559, -4.397143363952637, -3.357306480407715, -2.317470073699951, -1.2776336669921875, -0.23780059814453125, 0.8020360469818115, 1.8418726921081543, 2.881709337234497, 3.92154598236084, 4.961382865905762, 6.001219272613525, 7.041055679321289, 8.080892562866211, 9.120729446411133, 10.160566329956055, 11.20040225982666, 12.240239143371582, 13.280076026916504, 14.31991195678711, 15.359748840332031, 16.399585723876953, 17.439422607421875, 18.479259490966797, 19.51909637451172, 20.55893325805664, 21.598770141601562, 22.63860511779785, 23.678442001342773, 24.718278884887695, 25.758115768432617, 26.79795265197754, 27.83778953552246, 28.87762451171875, 29.917461395263672, 30.957298278808594, 31.997135162353516, 33.03697204589844]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 10.0, 7.0, 21.0, 28.0, 50.0, 101.0, 153.0, 270.0, 484.0, 778.0, 1378.0, 2351.0, 3922.0, 6518.0, 11088.0, 18566.0, 30284.0, 50692.0, 83157.0, 134644.0, 212355.0, 318622.0, 444717.0, 550084.0, 586011.0, 531357.0, 414176.0, 292011.0, 191906.0, 120844.0, 74128.0, 45528.0, 27206.0, 16552.0, 9649.0, 5829.0, 3531.0, 2074.0, 1240.0, 796.0, 487.0, 239.0, 159.0, 109.0, 75.0, 44.0, 20.0, 12.0, 13.0, 4.0, 8.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.3125, -21.552978515625, -20.79345703125, -20.033935546875, -19.2744140625, -18.514892578125, -17.75537109375, -16.995849609375, -16.236328125, -15.476806640625, -14.71728515625, -13.957763671875, -13.1982421875, -12.438720703125, -11.67919921875, -10.919677734375, -10.16015625, -9.400634765625, -8.64111328125, -7.881591796875, -7.1220703125, -6.362548828125, -5.60302734375, -4.843505859375, -4.083984375, -3.324462890625, -2.56494140625, -1.805419921875, -1.0458984375, -0.286376953125, 0.47314453125, 1.232666015625, 1.9921875, 2.751708984375, 3.51123046875, 4.270751953125, 5.0302734375, 5.789794921875, 6.54931640625, 7.308837890625, 8.068359375, 8.827880859375, 9.58740234375, 10.346923828125, 11.1064453125, 11.865966796875, 12.62548828125, 13.385009765625, 14.14453125, 14.904052734375, 15.66357421875, 16.423095703125, 17.1826171875, 17.942138671875, 18.70166015625, 19.461181640625, 20.220703125, 20.980224609375, 21.73974609375, 22.499267578125, 23.2587890625, 24.018310546875, 24.77783203125, 25.537353515625, 26.296875]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 4.0, 6.0, 5.0, 16.0, 9.0, 7.0, 11.0, 11.0, 12.0, 17.0, 19.0, 27.0, 24.0, 31.0, 25.0, 24.0, 30.0, 33.0, 35.0, 44.0, 49.0, 37.0, 40.0, 46.0, 40.0, 39.0, 35.0, 34.0, 39.0, 29.0, 32.0, 25.0, 22.0, 22.0, 25.0, 20.0, 24.0, 13.0, 5.0, 14.0, 5.0, 1.0, 6.0, 1.0, 2.0, 6.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.3125, -20.6083984375, -19.904296875, -19.2001953125, -18.49609375, -17.7919921875, -17.087890625, -16.3837890625, -15.6796875, -14.9755859375, -14.271484375, -13.5673828125, -12.86328125, -12.1591796875, -11.455078125, -10.7509765625, -10.046875, -9.3427734375, -8.638671875, -7.9345703125, -7.23046875, -6.5263671875, -5.822265625, -5.1181640625, -4.4140625, -3.7099609375, -3.005859375, -2.3017578125, -1.59765625, -0.8935546875, -0.189453125, 0.5146484375, 1.21875, 1.9228515625, 2.626953125, 3.3310546875, 4.03515625, 4.7392578125, 5.443359375, 6.1474609375, 6.8515625, 7.5556640625, 8.259765625, 8.9638671875, 9.66796875, 10.3720703125, 11.076171875, 11.7802734375, 12.484375, 13.1884765625, 13.892578125, 14.5966796875, 15.30078125, 16.0048828125, 16.708984375, 17.4130859375, 18.1171875, 18.8212890625, 19.525390625, 20.2294921875, 20.93359375, 21.6376953125, 22.341796875, 23.0458984375, 23.75]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [4.0, 6.0, 8.0, 16.0, 16.0, 34.0, 72.0, 103.0, 142.0, 280.0, 380.0, 675.0, 1022.0, 1613.0, 2763.0, 4236.0, 6949.0, 11128.0, 17898.0, 27988.0, 43356.0, 65901.0, 98278.0, 141862.0, 197600.0, 263431.0, 330904.0, 388613.0, 428629.0, 432294.0, 402726.0, 349929.0, 281892.0, 215711.0, 157678.0, 109779.0, 74177.0, 49482.0, 32000.0, 20501.0, 12849.0, 8003.0, 5087.0, 3095.0, 1930.0, 1195.0, 728.0, 522.0, 284.0, 193.0, 135.0, 84.0, 41.0, 27.0, 22.0, 7.0, 15.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.765625, -16.1904296875, -15.615234375, -15.0400390625, -14.46484375, -13.8896484375, -13.314453125, -12.7392578125, -12.1640625, -11.5888671875, -11.013671875, -10.4384765625, -9.86328125, -9.2880859375, -8.712890625, -8.1376953125, -7.5625, -6.9873046875, -6.412109375, -5.8369140625, -5.26171875, -4.6865234375, -4.111328125, -3.5361328125, -2.9609375, -2.3857421875, -1.810546875, -1.2353515625, -0.66015625, -0.0849609375, 0.490234375, 1.0654296875, 1.640625, 2.2158203125, 2.791015625, 3.3662109375, 3.94140625, 4.5166015625, 5.091796875, 5.6669921875, 6.2421875, 6.8173828125, 7.392578125, 7.9677734375, 8.54296875, 9.1181640625, 9.693359375, 10.2685546875, 10.84375, 11.4189453125, 11.994140625, 12.5693359375, 13.14453125, 13.7197265625, 14.294921875, 14.8701171875, 15.4453125, 16.0205078125, 16.595703125, 17.1708984375, 17.74609375, 18.3212890625, 18.896484375, 19.4716796875, 20.046875]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 6.0, 4.0, 6.0, 6.0, 6.0, 14.0, 13.0, 15.0, 16.0, 15.0, 37.0, 31.0, 36.0, 55.0, 64.0, 71.0, 68.0, 87.0, 120.0, 113.0, 128.0, 135.0, 138.0, 168.0, 166.0, 182.0, 193.0, 184.0, 155.0, 177.0, 169.0, 149.0, 180.0, 162.0, 155.0, 112.0, 127.0, 108.0, 77.0, 79.0, 65.0, 59.0, 51.0, 31.0, 31.0, 26.0, 22.0, 18.0, 17.0, 6.0, 7.0, 5.0, 10.0, 5.0, 3.0, 1.0, 3.0, 2.0], "bins": [-10.2421875, -9.946044921875, -9.64990234375, -9.353759765625, -9.0576171875, -8.761474609375, -8.46533203125, -8.169189453125, -7.873046875, -7.576904296875, -7.28076171875, -6.984619140625, -6.6884765625, -6.392333984375, -6.09619140625, -5.800048828125, -5.50390625, -5.207763671875, -4.91162109375, -4.615478515625, -4.3193359375, -4.023193359375, -3.72705078125, -3.430908203125, -3.134765625, -2.838623046875, -2.54248046875, -2.246337890625, -1.9501953125, -1.654052734375, -1.35791015625, -1.061767578125, -0.765625, -0.469482421875, -0.17333984375, 0.122802734375, 0.4189453125, 0.715087890625, 1.01123046875, 1.307373046875, 1.603515625, 1.899658203125, 2.19580078125, 2.491943359375, 2.7880859375, 3.084228515625, 3.38037109375, 3.676513671875, 3.97265625, 4.268798828125, 4.56494140625, 4.861083984375, 5.1572265625, 5.453369140625, 5.74951171875, 6.045654296875, 6.341796875, 6.637939453125, 6.93408203125, 7.230224609375, 7.5263671875, 7.822509765625, 8.11865234375, 8.414794921875, 8.7109375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 8.0, 5.0, 11.0, 12.0, 12.0, 11.0, 20.0, 12.0, 26.0, 26.0, 20.0, 34.0, 42.0, 39.0, 35.0, 63.0, 50.0, 48.0, 53.0, 53.0, 59.0, 38.0, 48.0, 37.0, 32.0, 37.0, 24.0, 18.0, 20.0, 17.0, 18.0, 15.0, 9.0, 11.0, 7.0, 5.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-26.09819984436035, -25.360565185546875, -24.6229305267334, -23.885295867919922, -23.147663116455078, -22.4100284576416, -21.672393798828125, -20.93475914001465, -20.197124481201172, -19.459489822387695, -18.72185516357422, -17.984222412109375, -17.2465877532959, -16.508953094482422, -15.771318435668945, -15.033683776855469, -14.296051025390625, -13.558416366577148, -12.820782661437988, -12.083148002624512, -11.345514297485352, -10.607879638671875, -9.870244979858398, -9.132610321044922, -8.394976615905762, -7.657342433929443, -6.919708251953125, -6.182073593139648, -5.44443941116333, -4.706805229187012, -3.969170570373535, -3.231536388397217, -2.4939022064208984, -1.7562679052352905, -1.0186336040496826, -0.28099918365478516, 0.4566349983215332, 1.1942691802978516, 1.9319038391113281, 2.6695380210876465, 3.407172203063965, 4.144806385040283, 4.882440567016602, 5.620075225830078, 6.3577094078063965, 7.095343589782715, 7.832978248596191, 8.570611953735352, 9.308246612548828, 10.045881271362305, 10.783514976501465, 11.521149635314941, 12.258783340454102, 12.996417999267578, 13.734052658081055, 14.471687316894531, 15.209321022033691, 15.946955680847168, 16.684589385986328, 17.422224044799805, 18.15985870361328, 18.897491455078125, 19.635128021240234, 20.372760772705078, 21.110395431518555]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 7.0, 5.0, 4.0, 4.0, 2.0, 9.0, 8.0, 13.0, 6.0, 13.0, 23.0, 25.0, 34.0, 33.0, 26.0, 21.0, 26.0, 34.0, 34.0, 45.0, 47.0, 47.0, 55.0, 38.0, 37.0, 39.0, 42.0, 49.0, 40.0, 30.0, 21.0, 21.0, 34.0, 28.0, 26.0, 20.0, 7.0, 13.0, 8.0, 9.0, 4.0, 5.0, 3.0, 4.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-27.70098304748535, -26.826419830322266, -25.951858520507812, -25.077295303344727, -24.20273208618164, -23.328170776367188, -22.4536075592041, -21.579044342041016, -20.704483032226562, -19.829919815063477, -18.955358505249023, -18.080795288085938, -17.20623207092285, -16.331668853759766, -15.457107543945312, -14.582544326782227, -13.70798110961914, -12.833418846130371, -11.958855628967285, -11.084293365478516, -10.20973014831543, -9.33516788482666, -8.46060562133789, -7.586042881011963, -6.711480140686035, -5.836917400360107, -4.96235466003418, -4.08779239654541, -3.2132296562194824, -2.3386669158935547, -1.4641046524047852, -0.5895419120788574, 0.2850189208984375, 1.1595815420150757, 2.034144163131714, 2.9087066650390625, 3.7832694053649902, 4.657832145690918, 5.5323944091796875, 6.406957149505615, 7.281519889831543, 8.156082153320312, 9.030645370483398, 9.905207633972168, 10.779769897460938, 11.654333114624023, 12.528895378112793, 13.403457641601562, 14.278020858764648, 15.152583122253418, 16.027145385742188, 16.901708602905273, 17.77627182006836, 18.650833129882812, 19.5253963470459, 20.399959564208984, 21.274520874023438, 22.149084091186523, 23.023645401000977, 23.898208618164062, 24.77277183532715, 25.647335052490234, 26.521896362304688, 27.396459579467773, 28.27102279663086]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 9.0, 15.0, 13.0, 24.0, 62.0, 80.0, 114.0, 192.0, 284.0, 403.0, 680.0, 1020.0, 1568.0, 2577.0, 3929.0, 6250.0, 9890.0, 15985.0, 26367.0, 42962.0, 71426.0, 115557.0, 174242.0, 195997.0, 143694.0, 91285.0, 55469.0, 33683.0, 20520.0, 12803.0, 7758.0, 4938.0, 3221.0, 1987.0, 1275.0, 751.0, 574.0, 375.0, 218.0, 142.0, 81.0, 53.0, 31.0, 23.0, 11.0, 10.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1640625, -4.99334716796875, -4.8226318359375, -4.65191650390625, -4.481201171875, -4.31048583984375, -4.1397705078125, -3.96905517578125, -3.79833984375, -3.62762451171875, -3.4569091796875, -3.28619384765625, -3.115478515625, -2.94476318359375, -2.7740478515625, -2.60333251953125, -2.4326171875, -2.26190185546875, -2.0911865234375, -1.92047119140625, -1.749755859375, -1.57904052734375, -1.4083251953125, -1.23760986328125, -1.06689453125, -0.89617919921875, -0.7254638671875, -0.55474853515625, -0.384033203125, -0.21331787109375, -0.0426025390625, 0.12811279296875, 0.298828125, 0.46954345703125, 0.6402587890625, 0.81097412109375, 0.981689453125, 1.15240478515625, 1.3231201171875, 1.49383544921875, 1.66455078125, 1.83526611328125, 2.0059814453125, 2.17669677734375, 2.347412109375, 2.51812744140625, 2.6888427734375, 2.85955810546875, 3.0302734375, 3.20098876953125, 3.3717041015625, 3.54241943359375, 3.713134765625, 3.88385009765625, 4.0545654296875, 4.22528076171875, 4.39599609375, 4.56671142578125, 4.7374267578125, 4.90814208984375, 5.078857421875, 5.24957275390625, 5.4202880859375, 5.59100341796875, 5.76171875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 2.0, 4.0, 1.0, 4.0, 9.0, 5.0, 10.0, 11.0, 10.0, 11.0, 12.0, 18.0, 22.0, 26.0, 27.0, 26.0, 29.0, 26.0, 38.0, 37.0, 39.0, 43.0, 42.0, 53.0, 40.0, 49.0, 26.0, 40.0, 43.0, 32.0, 32.0, 34.0, 21.0, 29.0, 29.0, 27.0, 16.0, 18.0, 8.0, 14.0, 7.0, 5.0, 6.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0], "bins": [-26.21875, -25.3720703125, -24.525390625, -23.6787109375, -22.83203125, -21.9853515625, -21.138671875, -20.2919921875, -19.4453125, -18.5986328125, -17.751953125, -16.9052734375, -16.05859375, -15.2119140625, -14.365234375, -13.5185546875, -12.671875, -11.8251953125, -10.978515625, -10.1318359375, -9.28515625, -8.4384765625, -7.591796875, -6.7451171875, -5.8984375, -5.0517578125, -4.205078125, -3.3583984375, -2.51171875, -1.6650390625, -0.818359375, 0.0283203125, 0.875, 1.7216796875, 2.568359375, 3.4150390625, 4.26171875, 5.1083984375, 5.955078125, 6.8017578125, 7.6484375, 8.4951171875, 9.341796875, 10.1884765625, 11.03515625, 11.8818359375, 12.728515625, 13.5751953125, 14.421875, 15.2685546875, 16.115234375, 16.9619140625, 17.80859375, 18.6552734375, 19.501953125, 20.3486328125, 21.1953125, 22.0419921875, 22.888671875, 23.7353515625, 24.58203125, 25.4287109375, 26.275390625, 27.1220703125, 27.96875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 9.0, 6.0, 10.0, 18.0, 29.0, 43.0, 45.0, 96.0, 102.0, 229.0, 360.0, 508.0, 753.0, 1277.0, 2061.0, 3214.0, 5376.0, 8795.0, 15301.0, 25990.0, 46255.0, 83913.0, 161235.0, 262803.0, 196582.0, 102611.0, 55031.0, 31327.0, 17827.0, 10414.0, 6277.0, 3770.0, 2304.0, 1428.0, 879.0, 610.0, 372.0, 245.0, 145.0, 98.0, 68.0, 52.0, 29.0, 21.0, 19.0, 6.0, 7.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.85546875, -4.706787109375, -4.55810546875, -4.409423828125, -4.2607421875, -4.112060546875, -3.96337890625, -3.814697265625, -3.666015625, -3.517333984375, -3.36865234375, -3.219970703125, -3.0712890625, -2.922607421875, -2.77392578125, -2.625244140625, -2.4765625, -2.327880859375, -2.17919921875, -2.030517578125, -1.8818359375, -1.733154296875, -1.58447265625, -1.435791015625, -1.287109375, -1.138427734375, -0.98974609375, -0.841064453125, -0.6923828125, -0.543701171875, -0.39501953125, -0.246337890625, -0.09765625, 0.051025390625, 0.19970703125, 0.348388671875, 0.4970703125, 0.645751953125, 0.79443359375, 0.943115234375, 1.091796875, 1.240478515625, 1.38916015625, 1.537841796875, 1.6865234375, 1.835205078125, 1.98388671875, 2.132568359375, 2.28125, 2.429931640625, 2.57861328125, 2.727294921875, 2.8759765625, 3.024658203125, 3.17333984375, 3.322021484375, 3.470703125, 3.619384765625, 3.76806640625, 3.916748046875, 4.0654296875, 4.214111328125, 4.36279296875, 4.511474609375, 4.66015625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 7.0, 3.0, 4.0, 4.0, 9.0, 8.0, 11.0, 19.0, 20.0, 20.0, 21.0, 18.0, 24.0, 30.0, 24.0, 19.0, 35.0, 32.0, 27.0, 54.0, 43.0, 46.0, 44.0, 47.0, 43.0, 41.0, 42.0, 42.0, 24.0, 28.0, 31.0, 29.0, 15.0, 24.0, 16.0, 19.0, 16.0, 10.0, 16.0, 9.0, 10.0, 12.0, 2.0, 6.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-18.09375, -17.52978515625, -16.9658203125, -16.40185546875, -15.837890625, -15.27392578125, -14.7099609375, -14.14599609375, -13.58203125, -13.01806640625, -12.4541015625, -11.89013671875, -11.326171875, -10.76220703125, -10.1982421875, -9.63427734375, -9.0703125, -8.50634765625, -7.9423828125, -7.37841796875, -6.814453125, -6.25048828125, -5.6865234375, -5.12255859375, -4.55859375, -3.99462890625, -3.4306640625, -2.86669921875, -2.302734375, -1.73876953125, -1.1748046875, -0.61083984375, -0.046875, 0.51708984375, 1.0810546875, 1.64501953125, 2.208984375, 2.77294921875, 3.3369140625, 3.90087890625, 4.46484375, 5.02880859375, 5.5927734375, 6.15673828125, 6.720703125, 7.28466796875, 7.8486328125, 8.41259765625, 8.9765625, 9.54052734375, 10.1044921875, 10.66845703125, 11.232421875, 11.79638671875, 12.3603515625, 12.92431640625, 13.48828125, 14.05224609375, 14.6162109375, 15.18017578125, 15.744140625, 16.30810546875, 16.8720703125, 17.43603515625, 18.0]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 7.0, 11.0, 21.0, 15.0, 24.0, 45.0, 57.0, 85.0, 134.0, 155.0, 305.0, 446.0, 747.0, 1290.0, 2062.0, 3610.0, 6585.0, 12398.0, 24081.0, 49740.0, 116895.0, 356308.0, 287252.0, 97503.0, 42877.0, 20964.0, 10864.0, 5941.0, 3289.0, 1817.0, 1128.0, 674.0, 434.0, 286.0, 152.0, 95.0, 77.0, 52.0, 41.0, 22.0, 23.0, 14.0, 10.0, 3.0, 5.0, 1.0, 1.0, 4.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.4873046875, -0.47153472900390625, -0.4557647705078125, -0.43999481201171875, -0.424224853515625, -0.40845489501953125, -0.3926849365234375, -0.37691497802734375, -0.36114501953125, -0.34537506103515625, -0.3296051025390625, -0.31383514404296875, -0.298065185546875, -0.28229522705078125, -0.2665252685546875, -0.25075531005859375, -0.2349853515625, -0.21921539306640625, -0.2034454345703125, -0.18767547607421875, -0.171905517578125, -0.15613555908203125, -0.1403656005859375, -0.12459564208984375, -0.10882568359375, -0.09305572509765625, -0.0772857666015625, -0.06151580810546875, -0.045745849609375, -0.02997589111328125, -0.0142059326171875, 0.00156402587890625, 0.017333984375, 0.03310394287109375, 0.0488739013671875, 0.06464385986328125, 0.080413818359375, 0.09618377685546875, 0.1119537353515625, 0.12772369384765625, 0.14349365234375, 0.15926361083984375, 0.1750335693359375, 0.19080352783203125, 0.206573486328125, 0.22234344482421875, 0.2381134033203125, 0.25388336181640625, 0.2696533203125, 0.28542327880859375, 0.3011932373046875, 0.31696319580078125, 0.332733154296875, 0.34850311279296875, 0.3642730712890625, 0.38004302978515625, 0.39581298828125, 0.41158294677734375, 0.4273529052734375, 0.44312286376953125, 0.458892822265625, 0.47466278076171875, 0.4904327392578125, 0.5062026977539062, 0.52197265625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 9.0, 10.0, 8.0, 19.0, 16.0, 12.0, 36.0, 36.0, 44.0, 48.0, 77.0, 85.0, 103.0, 89.0, 88.0, 69.0, 56.0, 54.0, 28.0, 24.0, 20.0, 13.0, 9.0, 11.0, 9.0, 7.0, 5.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.00012046098709106445, -0.00011718831956386566, -0.00011391565203666687, -0.00011064298450946808, -0.00010737031698226929, -0.0001040976494550705, -0.0001008249819278717, -9.755231440067291e-05, -9.427964687347412e-05, -9.100697934627533e-05, -8.773431181907654e-05, -8.446164429187775e-05, -8.118897676467896e-05, -7.791630923748016e-05, -7.464364171028137e-05, -7.137097418308258e-05, -6.809830665588379e-05, -6.4825639128685e-05, -6.15529716014862e-05, -5.8280304074287415e-05, -5.500763654708862e-05, -5.173496901988983e-05, -4.846230149269104e-05, -4.518963396549225e-05, -4.191696643829346e-05, -3.8644298911094666e-05, -3.5371631383895874e-05, -3.209896385669708e-05, -2.882629632949829e-05, -2.55536288022995e-05, -2.2280961275100708e-05, -1.9008293747901917e-05, -1.5735626220703125e-05, -1.2462958693504333e-05, -9.190291166305542e-06, -5.9176236391067505e-06, -2.644956111907959e-06, 6.277114152908325e-07, 3.900378942489624e-06, 7.1730464696884155e-06, 1.0445713996887207e-05, 1.3718381524085999e-05, 1.699104905128479e-05, 2.026371657848358e-05, 2.3536384105682373e-05, 2.6809051632881165e-05, 3.0081719160079956e-05, 3.335438668727875e-05, 3.662705421447754e-05, 3.989972174167633e-05, 4.317238926887512e-05, 4.6445056796073914e-05, 4.9717724323272705e-05, 5.2990391850471497e-05, 5.626305937767029e-05, 5.953572690486908e-05, 6.280839443206787e-05, 6.608106195926666e-05, 6.935372948646545e-05, 7.262639701366425e-05, 7.589906454086304e-05, 7.917173206806183e-05, 8.244439959526062e-05, 8.571706712245941e-05, 8.89897346496582e-05]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 6.0, 8.0, 5.0, 15.0, 26.0, 33.0, 43.0, 67.0, 73.0, 108.0, 163.0, 228.0, 302.0, 413.0, 623.0, 768.0, 1178.0, 1622.0, 2340.0, 3215.0, 4571.0, 6506.0, 9665.0, 14082.0, 21252.0, 33415.0, 53549.0, 91714.0, 178501.0, 280216.0, 136658.0, 75294.0, 45051.0, 28448.0, 18178.0, 12152.0, 8271.0, 5805.0, 4044.0, 2804.0, 2081.0, 1420.0, 1010.0, 702.0, 588.0, 369.0, 308.0, 174.0, 161.0, 111.0, 78.0, 53.0, 34.0, 24.0, 21.0, 9.0, 7.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.91259765625, -0.8824996948242188, -0.8524017333984375, -0.8223037719726562, -0.792205810546875, -0.7621078491210938, -0.7320098876953125, -0.7019119262695312, -0.67181396484375, -0.6417160034179688, -0.6116180419921875, -0.5815200805664062, -0.551422119140625, -0.5213241577148438, -0.4912261962890625, -0.46112823486328125, -0.4310302734375, -0.40093231201171875, -0.3708343505859375, -0.34073638916015625, -0.310638427734375, -0.28054046630859375, -0.2504425048828125, -0.22034454345703125, -0.19024658203125, -0.16014862060546875, -0.1300506591796875, -0.09995269775390625, -0.069854736328125, -0.03975677490234375, -0.0096588134765625, 0.02043914794921875, 0.050537109375, 0.08063507080078125, 0.1107330322265625, 0.14083099365234375, 0.170928955078125, 0.20102691650390625, 0.2311248779296875, 0.26122283935546875, 0.29132080078125, 0.32141876220703125, 0.3515167236328125, 0.38161468505859375, 0.411712646484375, 0.44181060791015625, 0.4719085693359375, 0.5020065307617188, 0.5321044921875, 0.5622024536132812, 0.5923004150390625, 0.6223983764648438, 0.652496337890625, 0.6825942993164062, 0.7126922607421875, 0.7427902221679688, 0.77288818359375, 0.8029861450195312, 0.8330841064453125, 0.8631820678710938, 0.893280029296875, 0.9233779907226562, 0.9534759521484375, 0.9835739135742188, 1.013671875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 4.0, 5.0, 9.0, 2.0, 5.0, 12.0, 9.0, 11.0, 18.0, 22.0, 25.0, 23.0, 32.0, 36.0, 18.0, 38.0, 27.0, 43.0, 59.0, 60.0, 90.0, 63.0, 55.0, 42.0, 41.0, 31.0, 24.0, 33.0, 26.0, 27.0, 18.0, 20.0, 13.0, 5.0, 11.0, 8.0, 7.0, 4.0, 7.0, 5.0, 4.0, 4.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.33251953125, -0.32281494140625, -0.3131103515625, -0.30340576171875, -0.293701171875, -0.28399658203125, -0.2742919921875, -0.26458740234375, -0.2548828125, -0.24517822265625, -0.2354736328125, -0.22576904296875, -0.216064453125, -0.20635986328125, -0.1966552734375, -0.18695068359375, -0.17724609375, -0.16754150390625, -0.1578369140625, -0.14813232421875, -0.138427734375, -0.12872314453125, -0.1190185546875, -0.10931396484375, -0.099609375, -0.08990478515625, -0.0802001953125, -0.07049560546875, -0.060791015625, -0.05108642578125, -0.0413818359375, -0.03167724609375, -0.02197265625, -0.01226806640625, -0.0025634765625, 0.00714111328125, 0.016845703125, 0.02655029296875, 0.0362548828125, 0.04595947265625, 0.0556640625, 0.06536865234375, 0.0750732421875, 0.08477783203125, 0.094482421875, 0.10418701171875, 0.1138916015625, 0.12359619140625, 0.13330078125, 0.14300537109375, 0.1527099609375, 0.16241455078125, 0.172119140625, 0.18182373046875, 0.1915283203125, 0.20123291015625, 0.2109375, 0.22064208984375, 0.2303466796875, 0.24005126953125, 0.249755859375, 0.25946044921875, 0.2691650390625, 0.27886962890625, 0.28857421875]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 6.0, 6.0, 8.0, 7.0, 6.0, 16.0, 12.0, 7.0, 22.0, 12.0, 23.0, 26.0, 17.0, 28.0, 42.0, 31.0, 45.0, 54.0, 56.0, 43.0, 50.0, 55.0, 47.0, 51.0, 36.0, 46.0, 38.0, 24.0, 33.0, 27.0, 19.0, 16.0, 16.0, 16.0, 16.0, 12.0, 8.0, 4.0, 8.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-24.600421905517578, -23.88871955871582, -23.177017211914062, -22.465316772460938, -21.75361442565918, -21.041912078857422, -20.330211639404297, -19.61850929260254, -18.90680694580078, -18.195104598999023, -17.483402252197266, -16.77170181274414, -16.059999465942383, -15.348297119140625, -14.636595726013184, -13.924894332885742, -13.213191986083984, -12.501489639282227, -11.789788246154785, -11.078086853027344, -10.366384506225586, -9.654682159423828, -8.942980766296387, -8.231279373168945, -7.5195770263671875, -6.807875156402588, -6.096173286437988, -5.384471416473389, -4.672769546508789, -3.9610676765441895, -3.24936580657959, -2.5376639366149902, -1.8259639739990234, -1.1142621040344238, -0.4025602340698242, 0.3091416358947754, 1.020843505859375, 1.7325453758239746, 2.444247245788574, 3.155949115753174, 3.8676509857177734, 4.579352855682373, 5.291054725646973, 6.002756595611572, 6.714458465576172, 7.4261603355407715, 8.137862205505371, 8.849563598632812, 9.56126594543457, 10.272968292236328, 10.98466968536377, 11.696371078491211, 12.408073425292969, 13.119775772094727, 13.831477165222168, 14.54317855834961, 15.254880905151367, 15.966583251953125, 16.67828369140625, 17.389986038208008, 18.101688385009766, 18.813390731811523, 19.52509307861328, 20.236793518066406, 20.948495864868164]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 7.0, 4.0, 5.0, 4.0, 3.0, 9.0, 8.0, 10.0, 7.0, 14.0, 23.0, 28.0, 33.0, 31.0, 27.0, 23.0, 27.0, 38.0, 31.0, 44.0, 47.0, 45.0, 56.0, 40.0, 39.0, 35.0, 42.0, 49.0, 37.0, 29.0, 20.0, 28.0, 26.0, 34.0, 23.0, 17.0, 11.0, 12.0, 8.0, 9.0, 4.0, 6.0, 1.0, 3.0, 4.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-27.148395538330078, -26.28829574584961, -25.428197860717773, -24.568099975585938, -23.70800018310547, -22.847900390625, -21.987802505493164, -21.127704620361328, -20.26760482788086, -19.40750503540039, -18.547407150268555, -17.68730926513672, -16.82720947265625, -15.967110633850098, -15.107011795043945, -14.246912956237793, -13.38681411743164, -12.526715278625488, -11.666616439819336, -10.806517601013184, -9.946418762207031, -9.086319923400879, -8.226221084594727, -7.366122245788574, -6.506023406982422, -5.6459245681762695, -4.785825729370117, -3.925726890563965, -3.0656280517578125, -2.20552921295166, -1.3454303741455078, -0.48533153533935547, 0.37476539611816406, 1.2348642349243164, 2.0949630737304688, 2.955061912536621, 3.8151607513427734, 4.675259590148926, 5.535358428955078, 6.3954572677612305, 7.255556106567383, 8.115654945373535, 8.975753784179688, 9.83585262298584, 10.695951461791992, 11.556050300598145, 12.416149139404297, 13.27624797821045, 14.136346817016602, 14.996445655822754, 15.856544494628906, 16.716644287109375, 17.57674217224121, 18.436840057373047, 19.296939849853516, 20.157039642333984, 21.01713752746582, 21.877235412597656, 22.737335205078125, 23.597434997558594, 24.45753288269043, 25.317630767822266, 26.177730560302734, 27.037830352783203, 27.89792823791504]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 7.0, 6.0, 10.0, 13.0, 24.0, 24.0, 43.0, 57.0, 100.0, 151.0, 207.0, 391.0, 539.0, 847.0, 1243.0, 1933.0, 3000.0, 4519.0, 6981.0, 10594.0, 15733.0, 22808.0, 32622.0, 44912.0, 59931.0, 76300.0, 91066.0, 100981.0, 105049.0, 100933.0, 90119.0, 75021.0, 59095.0, 44429.0, 31576.0, 22381.0, 14940.0, 10210.0, 6782.0, 4410.0, 2997.0, 1904.0, 1246.0, 871.0, 581.0, 328.0, 238.0, 136.0, 89.0, 69.0, 43.0, 29.0, 25.0, 8.0, 3.0, 4.0, 6.0, 2.0, 3.0, 1.0, 2.0], "bins": [-17.078125, -16.535400390625, -15.99267578125, -15.449951171875, -14.9072265625, -14.364501953125, -13.82177734375, -13.279052734375, -12.736328125, -12.193603515625, -11.65087890625, -11.108154296875, -10.5654296875, -10.022705078125, -9.47998046875, -8.937255859375, -8.39453125, -7.851806640625, -7.30908203125, -6.766357421875, -6.2236328125, -5.680908203125, -5.13818359375, -4.595458984375, -4.052734375, -3.510009765625, -2.96728515625, -2.424560546875, -1.8818359375, -1.339111328125, -0.79638671875, -0.253662109375, 0.2890625, 0.831787109375, 1.37451171875, 1.917236328125, 2.4599609375, 3.002685546875, 3.54541015625, 4.088134765625, 4.630859375, 5.173583984375, 5.71630859375, 6.259033203125, 6.8017578125, 7.344482421875, 7.88720703125, 8.429931640625, 8.97265625, 9.515380859375, 10.05810546875, 10.600830078125, 11.1435546875, 11.686279296875, 12.22900390625, 12.771728515625, 13.314453125, 13.857177734375, 14.39990234375, 14.942626953125, 15.4853515625, 16.028076171875, 16.57080078125, 17.113525390625, 17.65625]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 4.0, 0.0, 5.0, 3.0, 6.0, 5.0, 6.0, 4.0, 8.0, 11.0, 12.0, 15.0, 26.0, 16.0, 19.0, 31.0, 39.0, 25.0, 26.0, 40.0, 34.0, 42.0, 37.0, 39.0, 44.0, 46.0, 45.0, 39.0, 45.0, 41.0, 32.0, 42.0, 28.0, 31.0, 28.0, 22.0, 15.0, 20.0, 18.0, 8.0, 13.0, 7.0, 12.0, 7.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-26.5, -25.67041015625, -24.8408203125, -24.01123046875, -23.181640625, -22.35205078125, -21.5224609375, -20.69287109375, -19.86328125, -19.03369140625, -18.2041015625, -17.37451171875, -16.544921875, -15.71533203125, -14.8857421875, -14.05615234375, -13.2265625, -12.39697265625, -11.5673828125, -10.73779296875, -9.908203125, -9.07861328125, -8.2490234375, -7.41943359375, -6.58984375, -5.76025390625, -4.9306640625, -4.10107421875, -3.271484375, -2.44189453125, -1.6123046875, -0.78271484375, 0.046875, 0.87646484375, 1.7060546875, 2.53564453125, 3.365234375, 4.19482421875, 5.0244140625, 5.85400390625, 6.68359375, 7.51318359375, 8.3427734375, 9.17236328125, 10.001953125, 10.83154296875, 11.6611328125, 12.49072265625, 13.3203125, 14.14990234375, 14.9794921875, 15.80908203125, 16.638671875, 17.46826171875, 18.2978515625, 19.12744140625, 19.95703125, 20.78662109375, 21.6162109375, 22.44580078125, 23.275390625, 24.10498046875, 24.9345703125, 25.76416015625, 26.59375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 9.0, 6.0, 10.0, 19.0, 24.0, 42.0, 64.0, 90.0, 158.0, 241.0, 319.0, 496.0, 700.0, 1093.0, 1612.0, 2313.0, 3556.0, 5385.0, 7919.0, 11314.0, 16307.0, 23865.0, 33267.0, 44829.0, 58701.0, 73421.0, 86906.0, 96453.0, 100428.0, 97257.0, 88248.0, 75057.0, 59491.0, 46026.0, 34199.0, 24620.0, 17245.0, 11883.0, 8044.0, 5710.0, 3667.0, 2517.0, 1694.0, 1092.0, 759.0, 480.0, 315.0, 252.0, 160.0, 112.0, 63.0, 47.0, 22.0, 29.0, 9.0, 10.0, 5.0, 2.0, 1.0, 0.0, 4.0], "bins": [-16.4375, -15.91650390625, -15.3955078125, -14.87451171875, -14.353515625, -13.83251953125, -13.3115234375, -12.79052734375, -12.26953125, -11.74853515625, -11.2275390625, -10.70654296875, -10.185546875, -9.66455078125, -9.1435546875, -8.62255859375, -8.1015625, -7.58056640625, -7.0595703125, -6.53857421875, -6.017578125, -5.49658203125, -4.9755859375, -4.45458984375, -3.93359375, -3.41259765625, -2.8916015625, -2.37060546875, -1.849609375, -1.32861328125, -0.8076171875, -0.28662109375, 0.234375, 0.75537109375, 1.2763671875, 1.79736328125, 2.318359375, 2.83935546875, 3.3603515625, 3.88134765625, 4.40234375, 4.92333984375, 5.4443359375, 5.96533203125, 6.486328125, 7.00732421875, 7.5283203125, 8.04931640625, 8.5703125, 9.09130859375, 9.6123046875, 10.13330078125, 10.654296875, 11.17529296875, 11.6962890625, 12.21728515625, 12.73828125, 13.25927734375, 13.7802734375, 14.30126953125, 14.822265625, 15.34326171875, 15.8642578125, 16.38525390625, 16.90625]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 4.0, 8.0, 8.0, 5.0, 11.0, 17.0, 20.0, 18.0, 16.0, 19.0, 27.0, 20.0, 25.0, 19.0, 29.0, 33.0, 30.0, 33.0, 30.0, 29.0, 28.0, 43.0, 42.0, 50.0, 40.0, 40.0, 36.0, 34.0, 39.0, 27.0, 24.0, 21.0, 27.0, 15.0, 19.0, 11.0, 13.0, 13.0, 18.0, 8.0, 11.0, 11.0, 7.0, 5.0, 4.0, 3.0, 0.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-15.15625, -14.6834716796875, -14.210693359375, -13.7379150390625, -13.26513671875, -12.7923583984375, -12.319580078125, -11.8468017578125, -11.3740234375, -10.9012451171875, -10.428466796875, -9.9556884765625, -9.48291015625, -9.0101318359375, -8.537353515625, -8.0645751953125, -7.591796875, -7.1190185546875, -6.646240234375, -6.1734619140625, -5.70068359375, -5.2279052734375, -4.755126953125, -4.2823486328125, -3.8095703125, -3.3367919921875, -2.864013671875, -2.3912353515625, -1.91845703125, -1.4456787109375, -0.972900390625, -0.5001220703125, -0.02734375, 0.4454345703125, 0.918212890625, 1.3909912109375, 1.86376953125, 2.3365478515625, 2.809326171875, 3.2821044921875, 3.7548828125, 4.2276611328125, 4.700439453125, 5.1732177734375, 5.64599609375, 6.1187744140625, 6.591552734375, 7.0643310546875, 7.537109375, 8.0098876953125, 8.482666015625, 8.9554443359375, 9.42822265625, 9.9010009765625, 10.373779296875, 10.8465576171875, 11.3193359375, 11.7921142578125, 12.264892578125, 12.7376708984375, 13.21044921875, 13.6832275390625, 14.156005859375, 14.6287841796875, 15.1015625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 6.0, 10.0, 12.0, 26.0, 38.0, 53.0, 74.0, 122.0, 206.0, 337.0, 586.0, 1043.0, 1813.0, 3346.0, 6431.0, 11610.0, 21871.0, 38398.0, 66547.0, 105494.0, 146613.0, 169008.0, 159129.0, 122755.0, 82001.0, 49814.0, 27960.0, 15145.0, 8215.0, 4346.0, 2353.0, 1341.0, 778.0, 414.0, 253.0, 152.0, 89.0, 60.0, 32.0, 25.0, 15.0, 16.0, 11.0, 6.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.57421875, -7.33538818359375, -7.0965576171875, -6.85772705078125, -6.618896484375, -6.38006591796875, -6.1412353515625, -5.90240478515625, -5.66357421875, -5.42474365234375, -5.1859130859375, -4.94708251953125, -4.708251953125, -4.46942138671875, -4.2305908203125, -3.99176025390625, -3.7529296875, -3.51409912109375, -3.2752685546875, -3.03643798828125, -2.797607421875, -2.55877685546875, -2.3199462890625, -2.08111572265625, -1.84228515625, -1.60345458984375, -1.3646240234375, -1.12579345703125, -0.886962890625, -0.64813232421875, -0.4093017578125, -0.17047119140625, 0.068359375, 0.30718994140625, 0.5460205078125, 0.78485107421875, 1.023681640625, 1.26251220703125, 1.5013427734375, 1.74017333984375, 1.97900390625, 2.21783447265625, 2.4566650390625, 2.69549560546875, 2.934326171875, 3.17315673828125, 3.4119873046875, 3.65081787109375, 3.8896484375, 4.12847900390625, 4.3673095703125, 4.60614013671875, 4.844970703125, 5.08380126953125, 5.3226318359375, 5.56146240234375, 5.80029296875, 6.03912353515625, 6.2779541015625, 6.51678466796875, 6.755615234375, 6.99444580078125, 7.2332763671875, 7.47210693359375, 7.7109375]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 3.0, 4.0, 4.0, 4.0, 9.0, 8.0, 11.0, 13.0, 15.0, 22.0, 16.0, 15.0, 33.0, 32.0, 39.0, 40.0, 47.0, 47.0, 42.0, 41.0, 62.0, 49.0, 50.0, 38.0, 49.0, 38.0, 36.0, 29.0, 33.0, 41.0, 24.0, 20.0, 14.0, 12.0, 14.0, 11.0, 6.0, 8.0, 8.0, 3.0, 3.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0005679130554199219, -0.0005493834614753723, -0.0005308538675308228, -0.0005123242735862732, -0.0004937946796417236, -0.00047526508569717407, -0.0004567354917526245, -0.00043820589780807495, -0.0004196763038635254, -0.00040114670991897583, -0.00038261711597442627, -0.0003640875220298767, -0.00034555792808532715, -0.0003270283341407776, -0.00030849874019622803, -0.00028996914625167847, -0.0002714395523071289, -0.00025290995836257935, -0.00023438036441802979, -0.00021585077047348022, -0.00019732117652893066, -0.0001787915825843811, -0.00016026198863983154, -0.00014173239469528198, -0.00012320280075073242, -0.00010467320680618286, -8.61436128616333e-05, -6.761401891708374e-05, -4.908442497253418e-05, -3.055483102798462e-05, -1.2025237083435059e-05, 6.504356861114502e-06, 2.5033950805664062e-05, 4.356354475021362e-05, 6.209313869476318e-05, 8.062273263931274e-05, 9.91523265838623e-05, 0.00011768192052841187, 0.00013621151447296143, 0.00015474110841751099, 0.00017327070236206055, 0.0001918002963066101, 0.00021032989025115967, 0.00022885948419570923, 0.0002473890781402588, 0.00026591867208480835, 0.0002844482660293579, 0.00030297785997390747, 0.00032150745391845703, 0.0003400370478630066, 0.00035856664180755615, 0.0003770962357521057, 0.0003956258296966553, 0.00041415542364120483, 0.0004326850175857544, 0.00045121461153030396, 0.0004697442054748535, 0.0004882737994194031, 0.0005068033933639526, 0.0005253329873085022, 0.0005438625812530518, 0.0005623921751976013, 0.0005809217691421509, 0.0005994513630867004, 0.00061798095703125]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 4.0, 3.0, 7.0, 8.0, 12.0, 15.0, 32.0, 44.0, 81.0, 104.0, 193.0, 279.0, 494.0, 713.0, 1185.0, 1994.0, 3210.0, 5537.0, 9181.0, 15398.0, 25255.0, 39870.0, 60866.0, 86920.0, 114126.0, 134115.0, 136600.0, 122845.0, 97486.0, 69950.0, 46606.0, 29691.0, 18350.0, 10868.0, 6575.0, 3879.0, 2306.0, 1398.0, 887.0, 526.0, 344.0, 204.0, 141.0, 92.0, 60.0, 46.0, 24.0, 17.0, 8.0, 10.0, 5.0, 3.0, 2.0, 1.0], "bins": [-7.51171875, -7.3040771484375, -7.096435546875, -6.8887939453125, -6.68115234375, -6.4735107421875, -6.265869140625, -6.0582275390625, -5.8505859375, -5.6429443359375, -5.435302734375, -5.2276611328125, -5.02001953125, -4.8123779296875, -4.604736328125, -4.3970947265625, -4.189453125, -3.9818115234375, -3.774169921875, -3.5665283203125, -3.35888671875, -3.1512451171875, -2.943603515625, -2.7359619140625, -2.5283203125, -2.3206787109375, -2.113037109375, -1.9053955078125, -1.69775390625, -1.4901123046875, -1.282470703125, -1.0748291015625, -0.8671875, -0.6595458984375, -0.451904296875, -0.2442626953125, -0.03662109375, 0.1710205078125, 0.378662109375, 0.5863037109375, 0.7939453125, 1.0015869140625, 1.209228515625, 1.4168701171875, 1.62451171875, 1.8321533203125, 2.039794921875, 2.2474365234375, 2.455078125, 2.6627197265625, 2.870361328125, 3.0780029296875, 3.28564453125, 3.4932861328125, 3.700927734375, 3.9085693359375, 4.1162109375, 4.3238525390625, 4.531494140625, 4.7391357421875, 4.94677734375, 5.1544189453125, 5.362060546875, 5.5697021484375, 5.77734375]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 4.0, 4.0, 5.0, 10.0, 7.0, 12.0, 16.0, 21.0, 19.0, 13.0, 27.0, 29.0, 43.0, 42.0, 31.0, 43.0, 48.0, 48.0, 55.0, 47.0, 54.0, 53.0, 66.0, 39.0, 43.0, 33.0, 31.0, 27.0, 15.0, 18.0, 18.0, 18.0, 17.0, 10.0, 7.0, 6.0, 5.0, 4.0, 5.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.84375, -2.75030517578125, -2.6568603515625, -2.56341552734375, -2.469970703125, -2.37652587890625, -2.2830810546875, -2.18963623046875, -2.09619140625, -2.00274658203125, -1.9093017578125, -1.81585693359375, -1.722412109375, -1.62896728515625, -1.5355224609375, -1.44207763671875, -1.3486328125, -1.25518798828125, -1.1617431640625, -1.06829833984375, -0.974853515625, -0.88140869140625, -0.7879638671875, -0.69451904296875, -0.60107421875, -0.50762939453125, -0.4141845703125, -0.32073974609375, -0.227294921875, -0.13385009765625, -0.0404052734375, 0.05303955078125, 0.146484375, 0.23992919921875, 0.3333740234375, 0.42681884765625, 0.520263671875, 0.61370849609375, 0.7071533203125, 0.80059814453125, 0.89404296875, 0.98748779296875, 1.0809326171875, 1.17437744140625, 1.267822265625, 1.36126708984375, 1.4547119140625, 1.54815673828125, 1.6416015625, 1.73504638671875, 1.8284912109375, 1.92193603515625, 2.015380859375, 2.10882568359375, 2.2022705078125, 2.29571533203125, 2.38916015625, 2.48260498046875, 2.5760498046875, 2.66949462890625, 2.762939453125, 2.85638427734375, 2.9498291015625, 3.04327392578125, 3.13671875]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 3.0, 2.0, 7.0, 4.0, 6.0, 10.0, 8.0, 6.0, 16.0, 17.0, 25.0, 29.0, 18.0, 29.0, 38.0, 30.0, 47.0, 51.0, 46.0, 50.0, 44.0, 56.0, 67.0, 35.0, 43.0, 42.0, 31.0, 45.0, 27.0, 21.0, 25.0, 21.0, 19.0, 16.0, 17.0, 10.0, 7.0, 9.0, 8.0, 4.0, 5.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-23.900941848754883, -23.196670532226562, -22.492401123046875, -21.788129806518555, -21.083858489990234, -20.379589080810547, -19.675317764282227, -18.971046447753906, -18.26677703857422, -17.5625057220459, -16.85823631286621, -16.15396499633789, -15.449694633483887, -14.745424270629883, -14.041152954101562, -13.336882591247559, -12.632612228393555, -11.92834186553955, -11.224071502685547, -10.519800186157227, -9.815529823303223, -9.111259460449219, -8.406988143920898, -7.7027177810668945, -6.998447418212891, -6.294177055358887, -5.589906215667725, -4.8856353759765625, -4.181365013122559, -3.4770944118499756, -2.7728238105773926, -2.0685529708862305, -1.3642845153808594, -0.6600139141082764, 0.04425668716430664, 0.7485272884368896, 1.4527978897094727, 2.1570684909820557, 2.8613390922546387, 3.565609931945801, 4.269880294799805, 4.974150657653809, 5.678421497344971, 6.382692337036133, 7.086962699890137, 7.791233062744141, 8.495504379272461, 9.199774742126465, 9.904045104980469, 10.608315467834473, 11.312585830688477, 12.016857147216797, 12.7211275100708, 13.425397872924805, 14.129669189453125, 14.833939552307129, 15.538209915161133, 16.242481231689453, 16.94675064086914, 17.65102195739746, 18.35529327392578, 19.05956268310547, 19.76383399963379, 20.46810531616211, 21.172374725341797]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 5.0, 6.0, 6.0, 6.0, 7.0, 12.0, 8.0, 17.0, 16.0, 19.0, 19.0, 20.0, 24.0, 32.0, 27.0, 28.0, 33.0, 45.0, 38.0, 28.0, 55.0, 40.0, 44.0, 34.0, 40.0, 36.0, 29.0, 39.0, 32.0, 30.0, 32.0, 28.0, 24.0, 23.0, 20.0, 18.0, 17.0, 12.0, 7.0, 7.0, 9.0, 10.0, 4.0, 2.0, 2.0, 4.0, 3.0, 3.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-24.045042037963867, -23.230960845947266, -22.416881561279297, -21.602800369262695, -20.788719177246094, -19.974639892578125, -19.160558700561523, -18.346477508544922, -17.532398223876953, -16.71831703186035, -15.904236793518066, -15.090156555175781, -14.27607536315918, -13.461995124816895, -12.64791488647461, -11.833833694458008, -11.019752502441406, -10.205672264099121, -9.39159107208252, -8.577510833740234, -7.763430118560791, -6.949349403381348, -6.1352691650390625, -5.321188449859619, -4.507107734680176, -3.6930270195007324, -2.878946542739868, -2.064866065979004, -1.2507853507995605, -0.4367046356201172, 0.37737560272216797, 1.1914563179016113, 2.0055389404296875, 2.819619655609131, 3.633700132369995, 4.447780609130859, 5.261861324310303, 6.075942039489746, 6.890022277832031, 7.704102993011475, 8.518183708190918, 9.332263946533203, 10.146345138549805, 10.96042537689209, 11.774505615234375, 12.588586807250977, 13.402667045593262, 14.216747283935547, 15.030828475952148, 15.844908714294434, 16.65898895263672, 17.47307014465332, 18.287151336669922, 19.10123062133789, 19.915311813354492, 20.729393005371094, 21.543472290039062, 22.357553482055664, 23.171632766723633, 23.985713958740234, 24.799795150756836, 25.613876342773438, 26.427955627441406, 27.242036819458008, 28.05611801147461]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [5.0, 3.0, 8.0, 15.0, 29.0, 33.0, 50.0, 64.0, 121.0, 210.0, 334.0, 517.0, 860.0, 1385.0, 2080.0, 3484.0, 5595.0, 8930.0, 14401.0, 22351.0, 35620.0, 55633.0, 86604.0, 131257.0, 194133.0, 275969.0, 370630.0, 453945.0, 502938.0, 493926.0, 432693.0, 340834.0, 252761.0, 174634.0, 117972.0, 77383.0, 49597.0, 32110.0, 20155.0, 12954.0, 7953.0, 5112.0, 3313.0, 1989.0, 1361.0, 878.0, 523.0, 328.0, 230.0, 143.0, 104.0, 58.0, 41.0, 15.0, 13.0, 8.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-16.171875, -15.611572265625, -15.05126953125, -14.490966796875, -13.9306640625, -13.370361328125, -12.81005859375, -12.249755859375, -11.689453125, -11.129150390625, -10.56884765625, -10.008544921875, -9.4482421875, -8.887939453125, -8.32763671875, -7.767333984375, -7.20703125, -6.646728515625, -6.08642578125, -5.526123046875, -4.9658203125, -4.405517578125, -3.84521484375, -3.284912109375, -2.724609375, -2.164306640625, -1.60400390625, -1.043701171875, -0.4833984375, 0.076904296875, 0.63720703125, 1.197509765625, 1.7578125, 2.318115234375, 2.87841796875, 3.438720703125, 3.9990234375, 4.559326171875, 5.11962890625, 5.679931640625, 6.240234375, 6.800537109375, 7.36083984375, 7.921142578125, 8.4814453125, 9.041748046875, 9.60205078125, 10.162353515625, 10.72265625, 11.282958984375, 11.84326171875, 12.403564453125, 12.9638671875, 13.524169921875, 14.08447265625, 14.644775390625, 15.205078125, 15.765380859375, 16.32568359375, 16.885986328125, 17.4462890625, 18.006591796875, 18.56689453125, 19.127197265625, 19.6875]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 7.0, 7.0, 8.0, 7.0, 9.0, 10.0, 14.0, 17.0, 14.0, 19.0, 31.0, 37.0, 35.0, 38.0, 30.0, 36.0, 36.0, 36.0, 42.0, 43.0, 55.0, 46.0, 42.0, 44.0, 29.0, 47.0, 37.0, 24.0, 31.0, 34.0, 23.0, 16.0, 19.0, 14.0, 10.0, 12.0, 7.0, 6.0, 7.0, 6.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.0, -18.349853515625, -17.69970703125, -17.049560546875, -16.3994140625, -15.749267578125, -15.09912109375, -14.448974609375, -13.798828125, -13.148681640625, -12.49853515625, -11.848388671875, -11.1982421875, -10.548095703125, -9.89794921875, -9.247802734375, -8.59765625, -7.947509765625, -7.29736328125, -6.647216796875, -5.9970703125, -5.346923828125, -4.69677734375, -4.046630859375, -3.396484375, -2.746337890625, -2.09619140625, -1.446044921875, -0.7958984375, -0.145751953125, 0.50439453125, 1.154541015625, 1.8046875, 2.454833984375, 3.10498046875, 3.755126953125, 4.4052734375, 5.055419921875, 5.70556640625, 6.355712890625, 7.005859375, 7.656005859375, 8.30615234375, 8.956298828125, 9.6064453125, 10.256591796875, 10.90673828125, 11.556884765625, 12.20703125, 12.857177734375, 13.50732421875, 14.157470703125, 14.8076171875, 15.457763671875, 16.10791015625, 16.758056640625, 17.408203125, 18.058349609375, 18.70849609375, 19.358642578125, 20.0087890625, 20.658935546875, 21.30908203125, 21.959228515625, 22.609375]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 9.0, 13.0, 20.0, 43.0, 59.0, 96.0, 164.0, 257.0, 436.0, 731.0, 1313.0, 2193.0, 3665.0, 6121.0, 10192.0, 16761.0, 27300.0, 43981.0, 69806.0, 106494.0, 157553.0, 223436.0, 299336.0, 374806.0, 436955.0, 463122.0, 450467.0, 400731.0, 327970.0, 249918.0, 179856.0, 123473.0, 81611.0, 52500.0, 32909.0, 19956.0, 12151.0, 7204.0, 4286.0, 2559.0, 1537.0, 899.0, 576.0, 340.0, 209.0, 116.0, 67.0, 42.0, 18.0, 11.0, 10.0, 11.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.5546875, -15.0306396484375, -14.506591796875, -13.9825439453125, -13.45849609375, -12.9344482421875, -12.410400390625, -11.8863525390625, -11.3623046875, -10.8382568359375, -10.314208984375, -9.7901611328125, -9.26611328125, -8.7420654296875, -8.218017578125, -7.6939697265625, -7.169921875, -6.6458740234375, -6.121826171875, -5.5977783203125, -5.07373046875, -4.5496826171875, -4.025634765625, -3.5015869140625, -2.9775390625, -2.4534912109375, -1.929443359375, -1.4053955078125, -0.88134765625, -0.3572998046875, 0.166748046875, 0.6907958984375, 1.21484375, 1.7388916015625, 2.262939453125, 2.7869873046875, 3.31103515625, 3.8350830078125, 4.359130859375, 4.8831787109375, 5.4072265625, 5.9312744140625, 6.455322265625, 6.9793701171875, 7.50341796875, 8.0274658203125, 8.551513671875, 9.0755615234375, 9.599609375, 10.1236572265625, 10.647705078125, 11.1717529296875, 11.69580078125, 12.2198486328125, 12.743896484375, 13.2679443359375, 13.7919921875, 14.3160400390625, 14.840087890625, 15.3641357421875, 15.88818359375, 16.4122314453125, 16.936279296875, 17.4603271484375, 17.984375]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 6.0, 5.0, 6.0, 15.0, 18.0, 20.0, 16.0, 20.0, 32.0, 39.0, 39.0, 79.0, 60.0, 51.0, 83.0, 107.0, 141.0, 127.0, 154.0, 169.0, 175.0, 177.0, 202.0, 215.0, 203.0, 207.0, 186.0, 188.0, 174.0, 156.0, 157.0, 134.0, 120.0, 113.0, 101.0, 73.0, 54.0, 57.0, 43.0, 27.0, 22.0, 22.0, 16.0, 18.0, 12.0, 10.0, 5.0, 13.0, 2.0, 3.0, 2.0, 3.0, 3.0], "bins": [-10.1171875, -9.832763671875, -9.54833984375, -9.263916015625, -8.9794921875, -8.695068359375, -8.41064453125, -8.126220703125, -7.841796875, -7.557373046875, -7.27294921875, -6.988525390625, -6.7041015625, -6.419677734375, -6.13525390625, -5.850830078125, -5.56640625, -5.281982421875, -4.99755859375, -4.713134765625, -4.4287109375, -4.144287109375, -3.85986328125, -3.575439453125, -3.291015625, -3.006591796875, -2.72216796875, -2.437744140625, -2.1533203125, -1.868896484375, -1.58447265625, -1.300048828125, -1.015625, -0.731201171875, -0.44677734375, -0.162353515625, 0.1220703125, 0.406494140625, 0.69091796875, 0.975341796875, 1.259765625, 1.544189453125, 1.82861328125, 2.113037109375, 2.3974609375, 2.681884765625, 2.96630859375, 3.250732421875, 3.53515625, 3.819580078125, 4.10400390625, 4.388427734375, 4.6728515625, 4.957275390625, 5.24169921875, 5.526123046875, 5.810546875, 6.094970703125, 6.37939453125, 6.663818359375, 6.9482421875, 7.232666015625, 7.51708984375, 7.801513671875, 8.0859375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 2.0, 4.0, 5.0, 2.0, 4.0, 4.0, 5.0, 6.0, 10.0, 14.0, 5.0, 16.0, 12.0, 19.0, 19.0, 37.0, 25.0, 35.0, 27.0, 49.0, 59.0, 40.0, 43.0, 43.0, 50.0, 60.0, 39.0, 45.0, 30.0, 36.0, 45.0, 32.0, 23.0, 19.0, 16.0, 24.0, 15.0, 21.0, 10.0, 11.0, 12.0, 7.0, 10.0, 3.0, 6.0, 2.0, 1.0, 1.0, 5.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.732458114624023, -17.11579704284668, -16.499135971069336, -15.882474899291992, -15.265813827514648, -14.649152755737305, -14.032491683959961, -13.415830612182617, -12.799169540405273, -12.18250846862793, -11.565847396850586, -10.949186325073242, -10.332525253295898, -9.715864181518555, -9.099203109741211, -8.482542037963867, -7.865880966186523, -7.24921989440918, -6.632558822631836, -6.015897750854492, -5.399236679077148, -4.782575607299805, -4.165914535522461, -3.549253463745117, -2.9325923919677734, -2.3159313201904297, -1.699270248413086, -1.0826091766357422, -0.46594810485839844, 0.1507129669189453, 0.7673740386962891, 1.3840351104736328, 2.0006942749023438, 2.6173553466796875, 3.2340164184570312, 3.850677490234375, 4.467338562011719, 5.0839996337890625, 5.700660705566406, 6.31732177734375, 6.933982849121094, 7.5506439208984375, 8.167304992675781, 8.783966064453125, 9.400627136230469, 10.017288208007812, 10.633949279785156, 11.2506103515625, 11.867271423339844, 12.483932495117188, 13.100593566894531, 13.717254638671875, 14.333915710449219, 14.950576782226562, 15.567237854003906, 16.18389892578125, 16.800559997558594, 17.417221069335938, 18.03388214111328, 18.650543212890625, 19.26720428466797, 19.883865356445312, 20.500526428222656, 21.1171875, 21.733848571777344]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 2.0, 4.0, 7.0, 3.0, 8.0, 10.0, 13.0, 15.0, 15.0, 14.0, 17.0, 19.0, 26.0, 26.0, 27.0, 23.0, 35.0, 35.0, 49.0, 36.0, 38.0, 41.0, 47.0, 35.0, 43.0, 39.0, 52.0, 25.0, 35.0, 29.0, 39.0, 32.0, 27.0, 30.0, 17.0, 21.0, 9.0, 11.0, 11.0, 8.0, 8.0, 8.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.07156753540039, -21.348522186279297, -20.625476837158203, -19.90243148803711, -19.17938804626465, -18.456342697143555, -17.73329734802246, -17.010251998901367, -16.287208557128906, -15.564163208007812, -14.841118812561035, -14.118073463439941, -13.395029067993164, -12.67198371887207, -11.948938369750977, -11.225893020629883, -10.502847671508789, -9.779802322387695, -9.056757926940918, -8.333712577819824, -7.610667705535889, -6.887622833251953, -6.164577484130859, -5.441532611846924, -4.718487739562988, -3.9954428672790527, -3.272397756576538, -2.5493526458740234, -1.826307773590088, -1.1032629013061523, -0.3802175521850586, 0.34282732009887695, 1.0658721923828125, 1.7889171838760376, 2.5119621753692627, 3.2350072860717773, 3.958052158355713, 4.681097030639648, 5.404142379760742, 6.127187252044678, 6.850232124328613, 7.573276996612549, 8.296321868896484, 9.019367218017578, 9.742412567138672, 10.46545696258545, 11.188502311706543, 11.91154670715332, 12.634592056274414, 13.357637405395508, 14.080681800842285, 14.803727149963379, 15.526771545410156, 16.24981689453125, 16.972862243652344, 17.695907592773438, 18.41895294189453, 19.141998291015625, 19.86504364013672, 20.588088989257812, 21.311132431030273, 22.034177780151367, 22.75722312927246, 23.480268478393555, 24.203311920166016]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 6.0, 7.0, 8.0, 18.0, 18.0, 32.0, 48.0, 66.0, 93.0, 130.0, 184.0, 277.0, 400.0, 629.0, 873.0, 1316.0, 1892.0, 2821.0, 4235.0, 6402.0, 9904.0, 14936.0, 23448.0, 37786.0, 60498.0, 95904.0, 147841.0, 195939.0, 158484.0, 104042.0, 65837.0, 41041.0, 25863.0, 16328.0, 10320.0, 6960.0, 4601.0, 2978.0, 2008.0, 1391.0, 900.0, 649.0, 450.0, 301.0, 199.0, 178.0, 88.0, 68.0, 63.0, 25.0, 19.0, 24.0, 20.0, 7.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0], "bins": [-3.8359375, -3.714508056640625, -3.59307861328125, -3.471649169921875, -3.3502197265625, -3.228790283203125, -3.10736083984375, -2.985931396484375, -2.864501953125, -2.743072509765625, -2.62164306640625, -2.500213623046875, -2.3787841796875, -2.257354736328125, -2.13592529296875, -2.014495849609375, -1.89306640625, -1.771636962890625, -1.65020751953125, -1.528778076171875, -1.4073486328125, -1.285919189453125, -1.16448974609375, -1.043060302734375, -0.921630859375, -0.800201416015625, -0.67877197265625, -0.557342529296875, -0.4359130859375, -0.314483642578125, -0.19305419921875, -0.071624755859375, 0.0498046875, 0.171234130859375, 0.29266357421875, 0.414093017578125, 0.5355224609375, 0.656951904296875, 0.77838134765625, 0.899810791015625, 1.021240234375, 1.142669677734375, 1.26409912109375, 1.385528564453125, 1.5069580078125, 1.628387451171875, 1.74981689453125, 1.871246337890625, 1.99267578125, 2.114105224609375, 2.23553466796875, 2.356964111328125, 2.4783935546875, 2.599822998046875, 2.72125244140625, 2.842681884765625, 2.964111328125, 3.085540771484375, 3.20697021484375, 3.328399658203125, 3.4498291015625, 3.571258544921875, 3.69268798828125, 3.814117431640625, 3.935546875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 6.0, 10.0, 9.0, 11.0, 15.0, 15.0, 20.0, 14.0, 18.0, 15.0, 20.0, 24.0, 21.0, 23.0, 34.0, 36.0, 40.0, 37.0, 42.0, 39.0, 39.0, 45.0, 38.0, 52.0, 36.0, 35.0, 30.0, 27.0, 30.0, 36.0, 24.0, 36.0, 21.0, 17.0, 13.0, 11.0, 11.0, 15.0, 9.0, 6.0, 4.0, 5.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.21875, -19.49658203125, -18.7744140625, -18.05224609375, -17.330078125, -16.60791015625, -15.8857421875, -15.16357421875, -14.44140625, -13.71923828125, -12.9970703125, -12.27490234375, -11.552734375, -10.83056640625, -10.1083984375, -9.38623046875, -8.6640625, -7.94189453125, -7.2197265625, -6.49755859375, -5.775390625, -5.05322265625, -4.3310546875, -3.60888671875, -2.88671875, -2.16455078125, -1.4423828125, -0.72021484375, 0.001953125, 0.72412109375, 1.4462890625, 2.16845703125, 2.890625, 3.61279296875, 4.3349609375, 5.05712890625, 5.779296875, 6.50146484375, 7.2236328125, 7.94580078125, 8.66796875, 9.39013671875, 10.1123046875, 10.83447265625, 11.556640625, 12.27880859375, 13.0009765625, 13.72314453125, 14.4453125, 15.16748046875, 15.8896484375, 16.61181640625, 17.333984375, 18.05615234375, 18.7783203125, 19.50048828125, 20.22265625, 20.94482421875, 21.6669921875, 22.38916015625, 23.111328125, 23.83349609375, 24.5556640625, 25.27783203125, 26.0]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 12.0, 18.0, 29.0, 29.0, 55.0, 94.0, 131.0, 230.0, 332.0, 582.0, 877.0, 1339.0, 2114.0, 3514.0, 5887.0, 9978.0, 16806.0, 29348.0, 52397.0, 97171.0, 187935.0, 271645.0, 168547.0, 87558.0, 47323.0, 26628.0, 15205.0, 8922.0, 5359.0, 3292.0, 1896.0, 1225.0, 725.0, 491.0, 322.0, 213.0, 115.0, 76.0, 59.0, 25.0, 11.0, 21.0, 11.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-4.33203125, -4.202392578125, -4.07275390625, -3.943115234375, -3.8134765625, -3.683837890625, -3.55419921875, -3.424560546875, -3.294921875, -3.165283203125, -3.03564453125, -2.906005859375, -2.7763671875, -2.646728515625, -2.51708984375, -2.387451171875, -2.2578125, -2.128173828125, -1.99853515625, -1.868896484375, -1.7392578125, -1.609619140625, -1.47998046875, -1.350341796875, -1.220703125, -1.091064453125, -0.96142578125, -0.831787109375, -0.7021484375, -0.572509765625, -0.44287109375, -0.313232421875, -0.18359375, -0.053955078125, 0.07568359375, 0.205322265625, 0.3349609375, 0.464599609375, 0.59423828125, 0.723876953125, 0.853515625, 0.983154296875, 1.11279296875, 1.242431640625, 1.3720703125, 1.501708984375, 1.63134765625, 1.760986328125, 1.890625, 2.020263671875, 2.14990234375, 2.279541015625, 2.4091796875, 2.538818359375, 2.66845703125, 2.798095703125, 2.927734375, 3.057373046875, 3.18701171875, 3.316650390625, 3.4462890625, 3.575927734375, 3.70556640625, 3.835205078125, 3.96484375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 2.0, 0.0, 2.0, 7.0, 8.0, 6.0, 3.0, 3.0, 7.0, 5.0, 14.0, 13.0, 19.0, 21.0, 29.0, 31.0, 25.0, 16.0, 27.0, 33.0, 45.0, 38.0, 39.0, 38.0, 41.0, 45.0, 38.0, 46.0, 40.0, 53.0, 29.0, 45.0, 33.0, 22.0, 20.0, 28.0, 21.0, 19.0, 23.0, 17.0, 18.0, 9.0, 7.0, 4.0, 4.0, 5.0, 5.0, 3.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.9375, -13.45751953125, -12.9775390625, -12.49755859375, -12.017578125, -11.53759765625, -11.0576171875, -10.57763671875, -10.09765625, -9.61767578125, -9.1376953125, -8.65771484375, -8.177734375, -7.69775390625, -7.2177734375, -6.73779296875, -6.2578125, -5.77783203125, -5.2978515625, -4.81787109375, -4.337890625, -3.85791015625, -3.3779296875, -2.89794921875, -2.41796875, -1.93798828125, -1.4580078125, -0.97802734375, -0.498046875, -0.01806640625, 0.4619140625, 0.94189453125, 1.421875, 1.90185546875, 2.3818359375, 2.86181640625, 3.341796875, 3.82177734375, 4.3017578125, 4.78173828125, 5.26171875, 5.74169921875, 6.2216796875, 6.70166015625, 7.181640625, 7.66162109375, 8.1416015625, 8.62158203125, 9.1015625, 9.58154296875, 10.0615234375, 10.54150390625, 11.021484375, 11.50146484375, 11.9814453125, 12.46142578125, 12.94140625, 13.42138671875, 13.9013671875, 14.38134765625, 14.861328125, 15.34130859375, 15.8212890625, 16.30126953125, 16.78125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 7.0, 2.0, 3.0, 8.0, 6.0, 8.0, 19.0, 21.0, 35.0, 51.0, 78.0, 93.0, 134.0, 164.0, 247.0, 339.0, 529.0, 765.0, 1060.0, 1505.0, 2376.0, 3424.0, 5241.0, 8154.0, 12614.0, 20724.0, 34925.0, 63336.0, 128071.0, 292836.0, 236625.0, 101664.0, 52605.0, 30236.0, 18167.0, 11098.0, 7112.0, 4561.0, 2999.0, 2065.0, 1443.0, 957.0, 660.0, 472.0, 316.0, 224.0, 161.0, 120.0, 81.0, 60.0, 40.0, 40.0, 25.0, 18.0, 16.0, 11.0, 9.0, 2.0, 5.0, 4.0, 3.0], "bins": [-0.276611328125, -0.2681922912597656, -0.25977325439453125, -0.2513542175292969, -0.2429351806640625, -0.23451614379882812, -0.22609710693359375, -0.21767807006835938, -0.209259033203125, -0.20083999633789062, -0.19242095947265625, -0.18400192260742188, -0.1755828857421875, -0.16716384887695312, -0.15874481201171875, -0.15032577514648438, -0.14190673828125, -0.13348770141601562, -0.12506866455078125, -0.11664962768554688, -0.1082305908203125, -0.09981155395507812, -0.09139251708984375, -0.08297348022460938, -0.074554443359375, -0.06613540649414062, -0.05771636962890625, -0.049297332763671875, -0.0408782958984375, -0.032459259033203125, -0.02404022216796875, -0.015621185302734375, -0.0072021484375, 0.001216888427734375, 0.00963592529296875, 0.018054962158203125, 0.0264739990234375, 0.034893035888671875, 0.04331207275390625, 0.051731109619140625, 0.060150146484375, 0.06856918334960938, 0.07698822021484375, 0.08540725708007812, 0.0938262939453125, 0.10224533081054688, 0.11066436767578125, 0.11908340454101562, 0.12750244140625, 0.13592147827148438, 0.14434051513671875, 0.15275955200195312, 0.1611785888671875, 0.16959762573242188, 0.17801666259765625, 0.18643569946289062, 0.194854736328125, 0.20327377319335938, 0.21169281005859375, 0.22011184692382812, 0.2285308837890625, 0.23694992065429688, 0.24536895751953125, 0.2537879943847656, 0.26220703125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 4.0, 1.0, 3.0, 3.0, 6.0, 6.0, 4.0, 8.0, 15.0, 19.0, 21.0, 28.0, 25.0, 39.0, 37.0, 38.0, 59.0, 46.0, 55.0, 50.0, 65.0, 60.0, 60.0, 59.0, 43.0, 45.0, 54.0, 22.0, 30.0, 18.0, 23.0, 10.0, 6.0, 14.0, 8.0, 8.0, 5.0, 5.0, 1.0, 3.0, 1.0, 0.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8041343688964844e-05, -4.660803824663162e-05, -4.51747328042984e-05, -4.374142736196518e-05, -4.230812191963196e-05, -4.0874816477298737e-05, -3.9441511034965515e-05, -3.8008205592632294e-05, -3.657490015029907e-05, -3.514159470796585e-05, -3.370828926563263e-05, -3.227498382329941e-05, -3.0841678380966187e-05, -2.9408372938632965e-05, -2.7975067496299744e-05, -2.6541762053966522e-05, -2.51084566116333e-05, -2.367515116930008e-05, -2.2241845726966858e-05, -2.0808540284633636e-05, -1.9375234842300415e-05, -1.7941929399967194e-05, -1.6508623957633972e-05, -1.507531851530075e-05, -1.364201307296753e-05, -1.2208707630634308e-05, -1.0775402188301086e-05, -9.342096745967865e-06, -7.908791303634644e-06, -6.475485861301422e-06, -5.042180418968201e-06, -3.6088749766349792e-06, -2.175569534301758e-06, -7.422640919685364e-07, 6.910413503646851e-07, 2.1243467926979065e-06, 3.557652235031128e-06, 4.990957677364349e-06, 6.424263119697571e-06, 7.857568562030792e-06, 9.290874004364014e-06, 1.0724179446697235e-05, 1.2157484889030457e-05, 1.3590790331363678e-05, 1.50240957736969e-05, 1.645740121603012e-05, 1.7890706658363342e-05, 1.9324012100696564e-05, 2.0757317543029785e-05, 2.2190622985363007e-05, 2.3623928427696228e-05, 2.505723387002945e-05, 2.649053931236267e-05, 2.7923844754695892e-05, 2.9357150197029114e-05, 3.0790455639362335e-05, 3.222376108169556e-05, 3.365706652402878e-05, 3.5090371966362e-05, 3.652367740869522e-05, 3.795698285102844e-05, 3.9390288293361664e-05, 4.0823593735694885e-05, 4.225689917802811e-05, 4.369020462036133e-05]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 9.0, 5.0, 15.0, 25.0, 41.0, 68.0, 88.0, 140.0, 188.0, 325.0, 411.0, 709.0, 1024.0, 1503.0, 2260.0, 3430.0, 5388.0, 8301.0, 13218.0, 21459.0, 36230.0, 61623.0, 115788.0, 275348.0, 247030.0, 106490.0, 58012.0, 33740.0, 20278.0, 12479.0, 8049.0, 5011.0, 3283.0, 2274.0, 1513.0, 905.0, 628.0, 424.0, 272.0, 210.0, 123.0, 82.0, 69.0, 30.0, 25.0, 14.0, 10.0, 7.0, 5.0, 6.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.77685546875, -0.7532730102539062, -0.7296905517578125, -0.7061080932617188, -0.682525634765625, -0.6589431762695312, -0.6353607177734375, -0.6117782592773438, -0.58819580078125, -0.5646133422851562, -0.5410308837890625, -0.5174484252929688, -0.493865966796875, -0.47028350830078125, -0.4467010498046875, -0.42311859130859375, -0.3995361328125, -0.37595367431640625, -0.3523712158203125, -0.32878875732421875, -0.305206298828125, -0.28162384033203125, -0.2580413818359375, -0.23445892333984375, -0.21087646484375, -0.18729400634765625, -0.1637115478515625, -0.14012908935546875, -0.116546630859375, -0.09296417236328125, -0.0693817138671875, -0.04579925537109375, -0.022216796875, 0.00136566162109375, 0.0249481201171875, 0.04853057861328125, 0.072113037109375, 0.09569549560546875, 0.1192779541015625, 0.14286041259765625, 0.16644287109375, 0.19002532958984375, 0.2136077880859375, 0.23719024658203125, 0.260772705078125, 0.28435516357421875, 0.3079376220703125, 0.33152008056640625, 0.3551025390625, 0.37868499755859375, 0.4022674560546875, 0.42584991455078125, 0.449432373046875, 0.47301483154296875, 0.4965972900390625, 0.5201797485351562, 0.54376220703125, 0.5673446655273438, 0.5909271240234375, 0.6145095825195312, 0.638092041015625, 0.6616744995117188, 0.6852569580078125, 0.7088394165039062, 0.732421875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 4.0, 2.0, 5.0, 11.0, 8.0, 5.0, 10.0, 15.0, 12.0, 33.0, 27.0, 30.0, 31.0, 37.0, 35.0, 56.0, 82.0, 106.0, 105.0, 75.0, 65.0, 39.0, 31.0, 29.0, 27.0, 24.0, 16.0, 11.0, 14.0, 16.0, 10.0, 12.0, 2.0, 3.0, 3.0, 6.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.44775390625, -0.4352684020996094, -0.42278289794921875, -0.4102973937988281, -0.3978118896484375, -0.3853263854980469, -0.37284088134765625, -0.3603553771972656, -0.347869873046875, -0.3353843688964844, -0.32289886474609375, -0.3104133605957031, -0.2979278564453125, -0.2854423522949219, -0.27295684814453125, -0.2604713439941406, -0.24798583984375, -0.23550033569335938, -0.22301483154296875, -0.21052932739257812, -0.1980438232421875, -0.18555831909179688, -0.17307281494140625, -0.16058731079101562, -0.148101806640625, -0.13561630249023438, -0.12313079833984375, -0.11064529418945312, -0.0981597900390625, -0.08567428588867188, -0.07318878173828125, -0.060703277587890625, -0.0482177734375, -0.035732269287109375, -0.02324676513671875, -0.010761260986328125, 0.0017242431640625, 0.014209747314453125, 0.02669525146484375, 0.039180755615234375, 0.051666259765625, 0.06415176391601562, 0.07663726806640625, 0.08912277221679688, 0.1016082763671875, 0.11409378051757812, 0.12657928466796875, 0.13906478881835938, 0.15155029296875, 0.16403579711914062, 0.17652130126953125, 0.18900680541992188, 0.2014923095703125, 0.21397781372070312, 0.22646331787109375, 0.23894882202148438, 0.251434326171875, 0.2639198303222656, 0.27640533447265625, 0.2888908386230469, 0.3013763427734375, 0.3138618469238281, 0.32634735107421875, 0.3388328552246094, 0.351318359375]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [5.0, 1.0, 2.0, 0.0, 6.0, 2.0, 2.0, 5.0, 4.0, 5.0, 3.0, 10.0, 13.0, 10.0, 4.0, 18.0, 16.0, 17.0, 23.0, 25.0, 30.0, 39.0, 33.0, 43.0, 51.0, 42.0, 45.0, 37.0, 61.0, 44.0, 41.0, 38.0, 36.0, 37.0, 37.0, 32.0, 28.0, 24.0, 13.0, 19.0, 18.0, 19.0, 14.0, 12.0, 11.0, 8.0, 10.0, 3.0, 5.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.975675582885742, -16.385644912719727, -15.795613288879395, -15.205582618713379, -14.615550994873047, -14.025520324707031, -13.435489654541016, -12.845458984375, -12.255427360534668, -11.665396690368652, -11.07536506652832, -10.485334396362305, -9.895303726196289, -9.305272102355957, -8.715241432189941, -8.12520980834961, -7.535179138183594, -6.94514799118042, -6.355116844177246, -5.7650861740112305, -5.175055027008057, -4.585023880004883, -3.994992971420288, -3.4049620628356934, -2.8149309158325195, -2.2248997688293457, -1.634868860244751, -1.0448378324508667, -0.4548068046569824, 0.1352243423461914, 0.7252552509307861, 1.3152861595153809, 1.9053192138671875, 2.4953503608703613, 3.085381269454956, 3.675412178039551, 4.265443325042725, 4.855474472045898, 5.445505142211914, 6.035536289215088, 6.625567436218262, 7.2155985832214355, 7.805629730224609, 8.395660400390625, 8.98569107055664, 9.575722694396973, 10.165753364562988, 10.75578498840332, 11.345815658569336, 11.935846328735352, 12.525877952575684, 13.1159086227417, 13.705940246582031, 14.295970916748047, 14.886001586914062, 15.476032257080078, 16.066062927246094, 16.65609359741211, 17.246124267578125, 17.836156845092773, 18.42618751525879, 19.016218185424805, 19.60624885559082, 20.196279525756836, 20.786312103271484]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 2.0, 5.0, 6.0, 2.0, 11.0, 6.0, 14.0, 13.0, 13.0, 20.0, 14.0, 18.0, 26.0, 25.0, 27.0, 22.0, 29.0, 40.0, 38.0, 43.0, 36.0, 46.0, 34.0, 42.0, 40.0, 42.0, 50.0, 36.0, 26.0, 35.0, 32.0, 37.0, 27.0, 26.0, 27.0, 12.0, 18.0, 12.0, 8.0, 9.0, 11.0, 5.0, 6.0, 5.0, 4.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.029541015625, -21.3182315826416, -20.606924057006836, -19.895614624023438, -19.18430519104004, -18.47299575805664, -17.761688232421875, -17.050378799438477, -16.339069366455078, -15.627760887145996, -14.916451454162598, -14.205142974853516, -13.493833541870117, -12.782525062561035, -12.071216583251953, -11.359907150268555, -10.648599624633789, -9.937291145324707, -9.225981712341309, -8.514673233032227, -7.803364276885986, -7.092055320739746, -6.380746841430664, -5.669437885284424, -4.958128929138184, -4.246819972991943, -3.5355112552642822, -2.824202537536621, -2.112893581390381, -1.4015846252441406, -0.6902761459350586, 0.02103281021118164, 0.7323398590087891, 1.4436486959457397, 2.1549575328826904, 2.8662662506103516, 3.577575206756592, 4.288884162902832, 5.000192642211914, 5.711501598358154, 6.4228105545043945, 7.134119510650635, 7.845428466796875, 8.556736946105957, 9.268045425415039, 9.979354858398438, 10.69066333770752, 11.401971817016602, 12.11328125, 12.824589729309082, 13.53589916229248, 14.247207641601562, 14.958517074584961, 15.669825553894043, 16.381134033203125, 17.092443466186523, 17.803752899169922, 18.51506233215332, 19.226369857788086, 19.937679290771484, 20.648988723754883, 21.36029815673828, 22.071605682373047, 22.782915115356445, 23.49422264099121]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 3.0, 4.0, 11.0, 25.0, 20.0, 24.0, 50.0, 68.0, 97.0, 148.0, 242.0, 348.0, 527.0, 812.0, 1268.0, 1903.0, 2998.0, 4504.0, 6926.0, 10882.0, 15985.0, 23698.0, 33894.0, 46093.0, 61897.0, 78232.0, 93243.0, 103147.0, 106082.0, 100920.0, 89005.0, 73115.0, 57091.0, 42675.0, 30405.0, 20891.0, 14291.0, 9323.0, 6093.0, 4063.0, 2640.0, 1683.0, 1153.0, 725.0, 486.0, 301.0, 188.0, 128.0, 83.0, 69.0, 35.0, 30.0, 16.0, 12.0, 5.0, 5.0, 2.0, 5.0, 1.0, 1.0], "bins": [-14.5625, -14.1123046875, -13.662109375, -13.2119140625, -12.76171875, -12.3115234375, -11.861328125, -11.4111328125, -10.9609375, -10.5107421875, -10.060546875, -9.6103515625, -9.16015625, -8.7099609375, -8.259765625, -7.8095703125, -7.359375, -6.9091796875, -6.458984375, -6.0087890625, -5.55859375, -5.1083984375, -4.658203125, -4.2080078125, -3.7578125, -3.3076171875, -2.857421875, -2.4072265625, -1.95703125, -1.5068359375, -1.056640625, -0.6064453125, -0.15625, 0.2939453125, 0.744140625, 1.1943359375, 1.64453125, 2.0947265625, 2.544921875, 2.9951171875, 3.4453125, 3.8955078125, 4.345703125, 4.7958984375, 5.24609375, 5.6962890625, 6.146484375, 6.5966796875, 7.046875, 7.4970703125, 7.947265625, 8.3974609375, 8.84765625, 9.2978515625, 9.748046875, 10.1982421875, 10.6484375, 11.0986328125, 11.548828125, 11.9990234375, 12.44921875, 12.8994140625, 13.349609375, 13.7998046875, 14.25]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 4.0, 7.0, 5.0, 7.0, 15.0, 8.0, 11.0, 17.0, 19.0, 31.0, 28.0, 16.0, 30.0, 30.0, 34.0, 31.0, 37.0, 46.0, 42.0, 45.0, 34.0, 55.0, 46.0, 35.0, 40.0, 46.0, 42.0, 45.0, 27.0, 34.0, 19.0, 21.0, 21.0, 16.0, 14.0, 9.0, 13.0, 7.0, 5.0, 5.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.3125, -22.54833984375, -21.7841796875, -21.02001953125, -20.255859375, -19.49169921875, -18.7275390625, -17.96337890625, -17.19921875, -16.43505859375, -15.6708984375, -14.90673828125, -14.142578125, -13.37841796875, -12.6142578125, -11.85009765625, -11.0859375, -10.32177734375, -9.5576171875, -8.79345703125, -8.029296875, -7.26513671875, -6.5009765625, -5.73681640625, -4.97265625, -4.20849609375, -3.4443359375, -2.68017578125, -1.916015625, -1.15185546875, -0.3876953125, 0.37646484375, 1.140625, 1.90478515625, 2.6689453125, 3.43310546875, 4.197265625, 4.96142578125, 5.7255859375, 6.48974609375, 7.25390625, 8.01806640625, 8.7822265625, 9.54638671875, 10.310546875, 11.07470703125, 11.8388671875, 12.60302734375, 13.3671875, 14.13134765625, 14.8955078125, 15.65966796875, 16.423828125, 17.18798828125, 17.9521484375, 18.71630859375, 19.48046875, 20.24462890625, 21.0087890625, 21.77294921875, 22.537109375, 23.30126953125, 24.0654296875, 24.82958984375, 25.59375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 8.0, 6.0, 7.0, 9.0, 18.0, 28.0, 47.0, 67.0, 104.0, 155.0, 281.0, 402.0, 630.0, 1103.0, 1737.0, 3001.0, 4823.0, 7719.0, 12526.0, 19708.0, 30481.0, 45227.0, 64571.0, 86510.0, 105724.0, 120711.0, 121862.0, 111201.0, 93039.0, 71247.0, 50701.0, 34672.0, 22626.0, 14280.0, 8924.0, 5591.0, 3371.0, 2133.0, 1347.0, 742.0, 455.0, 314.0, 186.0, 95.0, 65.0, 36.0, 32.0, 17.0, 12.0, 6.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0], "bins": [-17.1875, -16.6690673828125, -16.150634765625, -15.6322021484375, -15.11376953125, -14.5953369140625, -14.076904296875, -13.5584716796875, -13.0400390625, -12.5216064453125, -12.003173828125, -11.4847412109375, -10.96630859375, -10.4478759765625, -9.929443359375, -9.4110107421875, -8.892578125, -8.3741455078125, -7.855712890625, -7.3372802734375, -6.81884765625, -6.3004150390625, -5.781982421875, -5.2635498046875, -4.7451171875, -4.2266845703125, -3.708251953125, -3.1898193359375, -2.67138671875, -2.1529541015625, -1.634521484375, -1.1160888671875, -0.59765625, -0.0792236328125, 0.439208984375, 0.9576416015625, 1.47607421875, 1.9945068359375, 2.512939453125, 3.0313720703125, 3.5498046875, 4.0682373046875, 4.586669921875, 5.1051025390625, 5.62353515625, 6.1419677734375, 6.660400390625, 7.1788330078125, 7.697265625, 8.2156982421875, 8.734130859375, 9.2525634765625, 9.77099609375, 10.2894287109375, 10.807861328125, 11.3262939453125, 11.8447265625, 12.3631591796875, 12.881591796875, 13.4000244140625, 13.91845703125, 14.4368896484375, 14.955322265625, 15.4737548828125, 15.9921875]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 7.0, 5.0, 5.0, 10.0, 6.0, 4.0, 13.0, 18.0, 13.0, 32.0, 29.0, 16.0, 22.0, 24.0, 31.0, 40.0, 22.0, 41.0, 39.0, 36.0, 38.0, 48.0, 46.0, 44.0, 33.0, 35.0, 43.0, 30.0, 29.0, 25.0, 34.0, 24.0, 25.0, 33.0, 16.0, 11.0, 16.0, 11.0, 12.0, 7.0, 8.0, 4.0, 9.0, 4.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.53125, -13.092529296875, -12.65380859375, -12.215087890625, -11.7763671875, -11.337646484375, -10.89892578125, -10.460205078125, -10.021484375, -9.582763671875, -9.14404296875, -8.705322265625, -8.2666015625, -7.827880859375, -7.38916015625, -6.950439453125, -6.51171875, -6.072998046875, -5.63427734375, -5.195556640625, -4.7568359375, -4.318115234375, -3.87939453125, -3.440673828125, -3.001953125, -2.563232421875, -2.12451171875, -1.685791015625, -1.2470703125, -0.808349609375, -0.36962890625, 0.069091796875, 0.5078125, 0.946533203125, 1.38525390625, 1.823974609375, 2.2626953125, 2.701416015625, 3.14013671875, 3.578857421875, 4.017578125, 4.456298828125, 4.89501953125, 5.333740234375, 5.7724609375, 6.211181640625, 6.64990234375, 7.088623046875, 7.52734375, 7.966064453125, 8.40478515625, 8.843505859375, 9.2822265625, 9.720947265625, 10.15966796875, 10.598388671875, 11.037109375, 11.475830078125, 11.91455078125, 12.353271484375, 12.7919921875, 13.230712890625, 13.66943359375, 14.108154296875, 14.546875]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 4.0, 3.0, 6.0, 9.0, 13.0, 18.0, 33.0, 44.0, 82.0, 153.0, 182.0, 262.0, 462.0, 715.0, 1098.0, 1705.0, 2948.0, 4596.0, 7470.0, 11714.0, 18991.0, 29066.0, 43897.0, 62389.0, 84717.0, 105703.0, 119541.0, 123002.0, 113273.0, 94886.0, 72497.0, 51984.0, 35046.0, 22844.0, 14477.0, 9243.0, 5781.0, 3587.0, 2235.0, 1402.0, 937.0, 557.0, 349.0, 242.0, 167.0, 74.0, 58.0, 32.0, 21.0, 17.0, 11.0, 13.0, 8.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.421875, -4.2802734375, -4.138671875, -3.9970703125, -3.85546875, -3.7138671875, -3.572265625, -3.4306640625, -3.2890625, -3.1474609375, -3.005859375, -2.8642578125, -2.72265625, -2.5810546875, -2.439453125, -2.2978515625, -2.15625, -2.0146484375, -1.873046875, -1.7314453125, -1.58984375, -1.4482421875, -1.306640625, -1.1650390625, -1.0234375, -0.8818359375, -0.740234375, -0.5986328125, -0.45703125, -0.3154296875, -0.173828125, -0.0322265625, 0.109375, 0.2509765625, 0.392578125, 0.5341796875, 0.67578125, 0.8173828125, 0.958984375, 1.1005859375, 1.2421875, 1.3837890625, 1.525390625, 1.6669921875, 1.80859375, 1.9501953125, 2.091796875, 2.2333984375, 2.375, 2.5166015625, 2.658203125, 2.7998046875, 2.94140625, 3.0830078125, 3.224609375, 3.3662109375, 3.5078125, 3.6494140625, 3.791015625, 3.9326171875, 4.07421875, 4.2158203125, 4.357421875, 4.4990234375, 4.640625]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 4.0, 0.0, 4.0, 4.0, 5.0, 12.0, 7.0, 12.0, 13.0, 17.0, 26.0, 24.0, 37.0, 36.0, 38.0, 45.0, 41.0, 54.0, 47.0, 54.0, 38.0, 40.0, 42.0, 34.0, 41.0, 40.0, 32.0, 22.0, 40.0, 30.0, 29.0, 20.0, 25.0, 17.0, 15.0, 15.0, 5.0, 13.0, 4.0, 2.0, 9.0, 5.0, 4.0, 5.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00040340423583984375, -0.0003894492983818054, -0.0003754943609237671, -0.00036153942346572876, -0.00034758448600769043, -0.0003336295485496521, -0.00031967461109161377, -0.00030571967363357544, -0.0002917647361755371, -0.0002778097987174988, -0.00026385486125946045, -0.0002498999238014221, -0.0002359449863433838, -0.00022199004888534546, -0.00020803511142730713, -0.0001940801739692688, -0.00018012523651123047, -0.00016617029905319214, -0.0001522153615951538, -0.00013826042413711548, -0.00012430548667907715, -0.00011035054922103882, -9.639561176300049e-05, -8.244067430496216e-05, -6.848573684692383e-05, -5.45307993888855e-05, -4.057586193084717e-05, -2.6620924472808838e-05, -1.2665987014770508e-05, 1.2889504432678223e-06, 1.5243887901306152e-05, 2.9198825359344482e-05, 4.315376281738281e-05, 5.710870027542114e-05, 7.106363773345947e-05, 8.50185751914978e-05, 9.897351264953613e-05, 0.00011292845010757446, 0.0001268833875656128, 0.00014083832502365112, 0.00015479326248168945, 0.00016874819993972778, 0.0001827031373977661, 0.00019665807485580444, 0.00021061301231384277, 0.0002245679497718811, 0.00023852288722991943, 0.00025247782468795776, 0.0002664327621459961, 0.0002803876996040344, 0.00029434263706207275, 0.0003082975745201111, 0.0003222525119781494, 0.00033620744943618774, 0.0003501623868942261, 0.0003641173243522644, 0.00037807226181030273, 0.00039202719926834106, 0.0004059821367263794, 0.0004199370741844177, 0.00043389201164245605, 0.0004478469491004944, 0.0004618018865585327, 0.00047575682401657104, 0.0004897117614746094]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 9.0, 10.0, 12.0, 17.0, 24.0, 38.0, 45.0, 60.0, 102.0, 160.0, 242.0, 363.0, 598.0, 913.0, 1378.0, 2106.0, 3398.0, 5576.0, 8796.0, 14558.0, 22824.0, 36460.0, 54787.0, 78026.0, 104328.0, 124743.0, 133656.0, 124484.0, 103535.0, 77329.0, 54232.0, 35626.0, 22484.0, 14206.0, 8575.0, 5412.0, 3440.0, 2096.0, 1344.0, 851.0, 585.0, 382.0, 236.0, 177.0, 97.0, 75.0, 56.0, 46.0, 20.0, 18.0, 10.0, 7.0, 3.0, 4.0, 1.0, 2.0, 2.0], "bins": [-5.47265625, -5.3092041015625, -5.145751953125, -4.9822998046875, -4.81884765625, -4.6553955078125, -4.491943359375, -4.3284912109375, -4.1650390625, -4.0015869140625, -3.838134765625, -3.6746826171875, -3.51123046875, -3.3477783203125, -3.184326171875, -3.0208740234375, -2.857421875, -2.6939697265625, -2.530517578125, -2.3670654296875, -2.20361328125, -2.0401611328125, -1.876708984375, -1.7132568359375, -1.5498046875, -1.3863525390625, -1.222900390625, -1.0594482421875, -0.89599609375, -0.7325439453125, -0.569091796875, -0.4056396484375, -0.2421875, -0.0787353515625, 0.084716796875, 0.2481689453125, 0.41162109375, 0.5750732421875, 0.738525390625, 0.9019775390625, 1.0654296875, 1.2288818359375, 1.392333984375, 1.5557861328125, 1.71923828125, 1.8826904296875, 2.046142578125, 2.2095947265625, 2.373046875, 2.5364990234375, 2.699951171875, 2.8634033203125, 3.02685546875, 3.1903076171875, 3.353759765625, 3.5172119140625, 3.6806640625, 3.8441162109375, 4.007568359375, 4.1710205078125, 4.33447265625, 4.4979248046875, 4.661376953125, 4.8248291015625, 4.98828125]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 3.0, 2.0, 9.0, 7.0, 5.0, 14.0, 13.0, 19.0, 22.0, 24.0, 33.0, 34.0, 35.0, 46.0, 40.0, 46.0, 51.0, 58.0, 51.0, 55.0, 37.0, 57.0, 47.0, 41.0, 39.0, 40.0, 26.0, 35.0, 22.0, 15.0, 18.0, 12.0, 7.0, 10.0, 6.0, 5.0, 5.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.94921875, -2.866851806640625, -2.78448486328125, -2.702117919921875, -2.6197509765625, -2.537384033203125, -2.45501708984375, -2.372650146484375, -2.290283203125, -2.207916259765625, -2.12554931640625, -2.043182373046875, -1.9608154296875, -1.878448486328125, -1.79608154296875, -1.713714599609375, -1.63134765625, -1.548980712890625, -1.46661376953125, -1.384246826171875, -1.3018798828125, -1.219512939453125, -1.13714599609375, -1.054779052734375, -0.972412109375, -0.890045166015625, -0.80767822265625, -0.725311279296875, -0.6429443359375, -0.560577392578125, -0.47821044921875, -0.395843505859375, -0.3134765625, -0.231109619140625, -0.14874267578125, -0.066375732421875, 0.0159912109375, 0.098358154296875, 0.18072509765625, 0.263092041015625, 0.345458984375, 0.427825927734375, 0.51019287109375, 0.592559814453125, 0.6749267578125, 0.757293701171875, 0.83966064453125, 0.922027587890625, 1.00439453125, 1.086761474609375, 1.16912841796875, 1.251495361328125, 1.3338623046875, 1.416229248046875, 1.49859619140625, 1.580963134765625, 1.663330078125, 1.745697021484375, 1.82806396484375, 1.910430908203125, 1.9927978515625, 2.075164794921875, 2.15753173828125, 2.239898681640625, 2.322265625]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 6.0, 5.0, 7.0, 2.0, 8.0, 11.0, 14.0, 13.0, 8.0, 14.0, 28.0, 20.0, 34.0, 34.0, 35.0, 44.0, 52.0, 50.0, 60.0, 52.0, 60.0, 36.0, 39.0, 45.0, 50.0, 35.0, 43.0, 30.0, 29.0, 22.0, 18.0, 13.0, 13.0, 14.0, 14.0, 12.0, 7.0, 6.0, 7.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-20.028152465820312, -19.368614196777344, -18.709077835083008, -18.049541473388672, -17.390003204345703, -16.730464935302734, -16.0709285736084, -15.411391258239746, -14.751853942871094, -14.092316627502441, -13.432779312133789, -12.773241996765137, -12.113704681396484, -11.454167366027832, -10.79463005065918, -10.135092735290527, -9.475555419921875, -8.816018104553223, -8.15648078918457, -7.496943473815918, -6.837406158447266, -6.177868843078613, -5.518331527709961, -4.858794212341309, -4.199256896972656, -3.539719581604004, -2.8801822662353516, -2.220644950866699, -1.5611076354980469, -0.9015703201293945, -0.2420330047607422, 0.41750431060791016, 1.0770397186279297, 1.736577033996582, 2.3961143493652344, 3.0556516647338867, 3.715188980102539, 4.374726295471191, 5.034263610839844, 5.693800926208496, 6.353338241577148, 7.012875556945801, 7.672412872314453, 8.331950187683105, 8.991487503051758, 9.65102481842041, 10.310562133789062, 10.970099449157715, 11.629636764526367, 12.28917407989502, 12.948711395263672, 13.608248710632324, 14.267786026000977, 14.927323341369629, 15.586860656738281, 16.24639892578125, 16.905935287475586, 17.565471649169922, 18.22500991821289, 18.88454818725586, 19.544084548950195, 20.20362091064453, 20.8631591796875, 21.52269744873047, 22.182233810424805]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 6.0, 3.0, 4.0, 7.0, 12.0, 7.0, 10.0, 17.0, 8.0, 7.0, 22.0, 25.0, 24.0, 22.0, 31.0, 21.0, 46.0, 33.0, 43.0, 36.0, 40.0, 33.0, 28.0, 47.0, 27.0, 45.0, 43.0, 43.0, 36.0, 42.0, 35.0, 29.0, 28.0, 16.0, 21.0, 18.0, 18.0, 10.0, 13.0, 8.0, 9.0, 6.0, 6.0, 7.0, 4.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.120607376098633, -22.418781280517578, -21.716955184936523, -21.01512908935547, -20.31330108642578, -19.611474990844727, -18.909648895263672, -18.207822799682617, -17.505996704101562, -16.804170608520508, -16.102344512939453, -15.400517463684082, -14.698690414428711, -13.996864318847656, -13.295038223266602, -12.593212127685547, -11.89138412475586, -11.189558029174805, -10.487730979919434, -9.785904884338379, -9.084077835083008, -8.382251739501953, -7.680425643920898, -6.9785990715026855, -6.276772499084473, -5.57494592666626, -4.873119354248047, -4.171293258666992, -3.4694666862487793, -2.7676401138305664, -2.0658140182495117, -1.3639874458312988, -0.6621589660644531, 0.039667487144470215, 0.7414939403533936, 1.4433202743530273, 2.1451468467712402, 2.846973419189453, 3.548799514770508, 4.250626087188721, 4.952452659606934, 5.6542792320251465, 6.356105804443359, 7.057931900024414, 7.759758472442627, 8.46158504486084, 9.163411140441895, 9.865238189697266, 10.56706428527832, 11.268890380859375, 11.970717430114746, 12.6725435256958, 13.374370574951172, 14.076196670532227, 14.778022766113281, 15.479848861694336, 16.18167495727539, 16.883501052856445, 17.5853271484375, 18.287155151367188, 18.988981246948242, 19.690807342529297, 20.39263343811035, 21.094459533691406, 21.796287536621094]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 7.0, 19.0, 33.0, 43.0, 68.0, 106.0, 173.0, 264.0, 438.0, 742.0, 1073.0, 1877.0, 2853.0, 4711.0, 7600.0, 12137.0, 19266.0, 30981.0, 48276.0, 75909.0, 116064.0, 171454.0, 246278.0, 333164.0, 420729.0, 482471.0, 495343.0, 454626.0, 377461.0, 288027.0, 206313.0, 140629.0, 93252.0, 60172.0, 38633.0, 23920.0, 14831.0, 9348.0, 5860.0, 3499.0, 2137.0, 1362.0, 768.0, 523.0, 328.0, 193.0, 146.0, 80.0, 53.0, 28.0, 11.0, 9.0, 1.0, 2.0, 2.0, 2.0], "bins": [-16.734375, -16.2457275390625, -15.757080078125, -15.2684326171875, -14.77978515625, -14.2911376953125, -13.802490234375, -13.3138427734375, -12.8251953125, -12.3365478515625, -11.847900390625, -11.3592529296875, -10.87060546875, -10.3819580078125, -9.893310546875, -9.4046630859375, -8.916015625, -8.4273681640625, -7.938720703125, -7.4500732421875, -6.96142578125, -6.4727783203125, -5.984130859375, -5.4954833984375, -5.0068359375, -4.5181884765625, -4.029541015625, -3.5408935546875, -3.05224609375, -2.5635986328125, -2.074951171875, -1.5863037109375, -1.09765625, -0.6090087890625, -0.120361328125, 0.3682861328125, 0.85693359375, 1.3455810546875, 1.834228515625, 2.3228759765625, 2.8115234375, 3.3001708984375, 3.788818359375, 4.2774658203125, 4.76611328125, 5.2547607421875, 5.743408203125, 6.2320556640625, 6.720703125, 7.2093505859375, 7.697998046875, 8.1866455078125, 8.67529296875, 9.1639404296875, 9.652587890625, 10.1412353515625, 10.6298828125, 11.1185302734375, 11.607177734375, 12.0958251953125, 12.58447265625, 13.0731201171875, 13.561767578125, 14.0504150390625, 14.5390625]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 4.0, 4.0, 5.0, 6.0, 6.0, 5.0, 5.0, 9.0, 7.0, 8.0, 14.0, 12.0, 17.0, 21.0, 31.0, 24.0, 22.0, 43.0, 28.0, 31.0, 27.0, 40.0, 43.0, 27.0, 28.0, 41.0, 32.0, 40.0, 39.0, 29.0, 39.0, 30.0, 33.0, 40.0, 29.0, 27.0, 33.0, 17.0, 14.0, 16.0, 10.0, 11.0, 12.0, 11.0, 11.0, 8.0, 5.0, 3.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-16.25, -15.75390625, -15.2578125, -14.76171875, -14.265625, -13.76953125, -13.2734375, -12.77734375, -12.28125, -11.78515625, -11.2890625, -10.79296875, -10.296875, -9.80078125, -9.3046875, -8.80859375, -8.3125, -7.81640625, -7.3203125, -6.82421875, -6.328125, -5.83203125, -5.3359375, -4.83984375, -4.34375, -3.84765625, -3.3515625, -2.85546875, -2.359375, -1.86328125, -1.3671875, -0.87109375, -0.375, 0.12109375, 0.6171875, 1.11328125, 1.609375, 2.10546875, 2.6015625, 3.09765625, 3.59375, 4.08984375, 4.5859375, 5.08203125, 5.578125, 6.07421875, 6.5703125, 7.06640625, 7.5625, 8.05859375, 8.5546875, 9.05078125, 9.546875, 10.04296875, 10.5390625, 11.03515625, 11.53125, 12.02734375, 12.5234375, 13.01953125, 13.515625, 14.01171875, 14.5078125, 15.00390625, 15.5]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 7.0, 1.0, 15.0, 30.0, 58.0, 81.0, 133.0, 211.0, 351.0, 561.0, 945.0, 1503.0, 2425.0, 4054.0, 6538.0, 10522.0, 16345.0, 26076.0, 39629.0, 59569.0, 87844.0, 124988.0, 172410.0, 227684.0, 287788.0, 344226.0, 385396.0, 406391.0, 397522.0, 364757.0, 314969.0, 255882.0, 197915.0, 146756.0, 104056.0, 72157.0, 48206.0, 31521.0, 20369.0, 13205.0, 8152.0, 5120.0, 3128.0, 1852.0, 1199.0, 708.0, 391.0, 269.0, 158.0, 85.0, 61.0, 27.0, 18.0, 11.0, 8.0, 8.0, 2.0, 1.0, 2.0, 2.0], "bins": [-13.125, -12.71142578125, -12.2978515625, -11.88427734375, -11.470703125, -11.05712890625, -10.6435546875, -10.22998046875, -9.81640625, -9.40283203125, -8.9892578125, -8.57568359375, -8.162109375, -7.74853515625, -7.3349609375, -6.92138671875, -6.5078125, -6.09423828125, -5.6806640625, -5.26708984375, -4.853515625, -4.43994140625, -4.0263671875, -3.61279296875, -3.19921875, -2.78564453125, -2.3720703125, -1.95849609375, -1.544921875, -1.13134765625, -0.7177734375, -0.30419921875, 0.109375, 0.52294921875, 0.9365234375, 1.35009765625, 1.763671875, 2.17724609375, 2.5908203125, 3.00439453125, 3.41796875, 3.83154296875, 4.2451171875, 4.65869140625, 5.072265625, 5.48583984375, 5.8994140625, 6.31298828125, 6.7265625, 7.14013671875, 7.5537109375, 7.96728515625, 8.380859375, 8.79443359375, 9.2080078125, 9.62158203125, 10.03515625, 10.44873046875, 10.8623046875, 11.27587890625, 11.689453125, 12.10302734375, 12.5166015625, 12.93017578125, 13.34375]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 5.0, 7.0, 11.0, 0.0, 6.0, 11.0, 17.0, 28.0, 22.0, 35.0, 28.0, 42.0, 55.0, 73.0, 71.0, 88.0, 70.0, 102.0, 116.0, 136.0, 147.0, 132.0, 181.0, 159.0, 158.0, 186.0, 197.0, 191.0, 164.0, 176.0, 165.0, 156.0, 136.0, 165.0, 130.0, 87.0, 95.0, 84.0, 83.0, 67.0, 53.0, 57.0, 38.0, 26.0, 22.0, 20.0, 19.0, 22.0, 15.0, 4.0, 6.0, 5.0, 4.0, 8.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0], "bins": [-6.71875, -6.5015869140625, -6.284423828125, -6.0672607421875, -5.85009765625, -5.6329345703125, -5.415771484375, -5.1986083984375, -4.9814453125, -4.7642822265625, -4.547119140625, -4.3299560546875, -4.11279296875, -3.8956298828125, -3.678466796875, -3.4613037109375, -3.244140625, -3.0269775390625, -2.809814453125, -2.5926513671875, -2.37548828125, -2.1583251953125, -1.941162109375, -1.7239990234375, -1.5068359375, -1.2896728515625, -1.072509765625, -0.8553466796875, -0.63818359375, -0.4210205078125, -0.203857421875, 0.0133056640625, 0.23046875, 0.4476318359375, 0.664794921875, 0.8819580078125, 1.09912109375, 1.3162841796875, 1.533447265625, 1.7506103515625, 1.9677734375, 2.1849365234375, 2.402099609375, 2.6192626953125, 2.83642578125, 3.0535888671875, 3.270751953125, 3.4879150390625, 3.705078125, 3.9222412109375, 4.139404296875, 4.3565673828125, 4.57373046875, 4.7908935546875, 5.008056640625, 5.2252197265625, 5.4423828125, 5.6595458984375, 5.876708984375, 6.0938720703125, 6.31103515625, 6.5281982421875, 6.745361328125, 6.9625244140625, 7.1796875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 4.0, 5.0, 3.0, 4.0, 4.0, 3.0, 8.0, 14.0, 14.0, 12.0, 10.0, 27.0, 19.0, 24.0, 31.0, 28.0, 31.0, 45.0, 59.0, 48.0, 39.0, 39.0, 50.0, 36.0, 39.0, 50.0, 40.0, 39.0, 39.0, 34.0, 18.0, 37.0, 18.0, 22.0, 17.0, 17.0, 13.0, 16.0, 10.0, 10.0, 6.0, 6.0, 3.0, 6.0, 3.0, 1.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-17.5313777923584, -16.966203689575195, -16.401029586791992, -15.835855484008789, -15.270681381225586, -14.705507278442383, -14.14033317565918, -13.575159072875977, -13.009984970092773, -12.44481086730957, -11.879636764526367, -11.314462661743164, -10.749288558959961, -10.184114456176758, -9.618940353393555, -9.053766250610352, -8.488592147827148, -7.923418045043945, -7.358243942260742, -6.793069839477539, -6.227895736694336, -5.662721633911133, -5.09754753112793, -4.532373428344727, -3.9671993255615234, -3.4020252227783203, -2.836851119995117, -2.271677017211914, -1.706502914428711, -1.1413288116455078, -0.5761547088623047, -0.010980606079101562, 0.5541915893554688, 1.1193656921386719, 1.684539794921875, 2.249713897705078, 2.8148880004882812, 3.3800621032714844, 3.9452362060546875, 4.510410308837891, 5.075584411621094, 5.640758514404297, 6.2059326171875, 6.771106719970703, 7.336280822753906, 7.901454925537109, 8.466629028320312, 9.031803131103516, 9.596977233886719, 10.162151336669922, 10.727325439453125, 11.292499542236328, 11.857673645019531, 12.422847747802734, 12.988021850585938, 13.55319595336914, 14.118370056152344, 14.683544158935547, 15.24871826171875, 15.813892364501953, 16.379066467285156, 16.94424057006836, 17.509414672851562, 18.074588775634766, 18.63976287841797]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 7.0, 8.0, 5.0, 12.0, 11.0, 8.0, 15.0, 15.0, 18.0, 20.0, 13.0, 20.0, 17.0, 31.0, 35.0, 27.0, 32.0, 23.0, 36.0, 37.0, 33.0, 26.0, 36.0, 43.0, 40.0, 37.0, 38.0, 26.0, 39.0, 39.0, 28.0, 29.0, 33.0, 34.0, 20.0, 21.0, 15.0, 15.0, 9.0, 9.0, 8.0, 10.0, 6.0, 4.0, 3.0, 2.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0], "bins": [-19.478485107421875, -18.89680290222168, -18.31511878967285, -17.733436584472656, -17.151752471923828, -16.570070266723633, -15.988387107849121, -15.40670394897461, -14.825020790100098, -14.243337631225586, -13.661654472351074, -13.079971313476562, -12.498289108276367, -11.916604995727539, -11.334922790527344, -10.753239631652832, -10.17155647277832, -9.589873313903809, -9.008190155029297, -8.426506996154785, -7.844824314117432, -7.26314115524292, -6.681458473205566, -6.099775314331055, -5.518092155456543, -4.936408996582031, -4.3547258377075195, -3.773043155670166, -3.1913599967956543, -2.6096768379211426, -2.02799391746521, -1.4463109970092773, -0.8646297454833984, -0.28294670581817627, 0.2987363338470459, 0.8804193735122681, 1.4621024131774902, 2.043785572052002, 2.6254684925079346, 3.207151412963867, 3.788834571838379, 4.370517730712891, 4.952200889587402, 5.533883571624756, 6.115566730499268, 6.697249889373779, 7.278932571411133, 7.8606157302856445, 8.442298889160156, 9.023982048034668, 9.60566520690918, 10.187348365783691, 10.769031524658203, 11.350713729858398, 11.93239688873291, 12.514080047607422, 13.095763206481934, 13.677446365356445, 14.259129524230957, 14.840812683105469, 15.422494888305664, 16.004179000854492, 16.585861206054688, 17.167545318603516, 17.74922752380371]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 6.0, 5.0, 8.0, 22.0, 16.0, 25.0, 54.0, 53.0, 77.0, 131.0, 196.0, 274.0, 383.0, 603.0, 860.0, 1172.0, 1814.0, 2663.0, 3881.0, 5788.0, 8356.0, 12711.0, 18857.0, 28815.0, 43810.0, 68217.0, 105414.0, 155890.0, 184158.0, 138520.0, 91590.0, 59219.0, 38489.0, 25648.0, 16461.0, 11185.0, 7370.0, 5025.0, 3406.0, 2338.0, 1568.0, 1110.0, 735.0, 530.0, 349.0, 233.0, 166.0, 126.0, 88.0, 57.0, 33.0, 22.0, 14.0, 7.0, 9.0, 4.0, 1.0, 2.0, 2.0, 2.0], "bins": [-3.05078125, -2.956451416015625, -2.86212158203125, -2.767791748046875, -2.6734619140625, -2.579132080078125, -2.48480224609375, -2.390472412109375, -2.296142578125, -2.201812744140625, -2.10748291015625, -2.013153076171875, -1.9188232421875, -1.824493408203125, -1.73016357421875, -1.635833740234375, -1.54150390625, -1.447174072265625, -1.35284423828125, -1.258514404296875, -1.1641845703125, -1.069854736328125, -0.97552490234375, -0.881195068359375, -0.786865234375, -0.692535400390625, -0.59820556640625, -0.503875732421875, -0.4095458984375, -0.315216064453125, -0.22088623046875, -0.126556396484375, -0.0322265625, 0.062103271484375, 0.15643310546875, 0.250762939453125, 0.3450927734375, 0.439422607421875, 0.53375244140625, 0.628082275390625, 0.722412109375, 0.816741943359375, 0.91107177734375, 1.005401611328125, 1.0997314453125, 1.194061279296875, 1.28839111328125, 1.382720947265625, 1.47705078125, 1.571380615234375, 1.66571044921875, 1.760040283203125, 1.8543701171875, 1.948699951171875, 2.04302978515625, 2.137359619140625, 2.231689453125, 2.326019287109375, 2.42034912109375, 2.514678955078125, 2.6090087890625, 2.703338623046875, 2.79766845703125, 2.891998291015625, 2.986328125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 12.0, 4.0, 11.0, 9.0, 8.0, 11.0, 13.0, 17.0, 20.0, 24.0, 25.0, 22.0, 26.0, 32.0, 35.0, 36.0, 28.0, 30.0, 34.0, 40.0, 55.0, 35.0, 47.0, 38.0, 42.0, 35.0, 38.0, 38.0, 37.0, 27.0, 31.0, 29.0, 22.0, 17.0, 10.0, 17.0, 9.0, 6.0, 14.0, 6.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-22.34375, -21.682373046875, -21.02099609375, -20.359619140625, -19.6982421875, -19.036865234375, -18.37548828125, -17.714111328125, -17.052734375, -16.391357421875, -15.72998046875, -15.068603515625, -14.4072265625, -13.745849609375, -13.08447265625, -12.423095703125, -11.76171875, -11.100341796875, -10.43896484375, -9.777587890625, -9.1162109375, -8.454833984375, -7.79345703125, -7.132080078125, -6.470703125, -5.809326171875, -5.14794921875, -4.486572265625, -3.8251953125, -3.163818359375, -2.50244140625, -1.841064453125, -1.1796875, -0.518310546875, 0.14306640625, 0.804443359375, 1.4658203125, 2.127197265625, 2.78857421875, 3.449951171875, 4.111328125, 4.772705078125, 5.43408203125, 6.095458984375, 6.7568359375, 7.418212890625, 8.07958984375, 8.740966796875, 9.40234375, 10.063720703125, 10.72509765625, 11.386474609375, 12.0478515625, 12.709228515625, 13.37060546875, 14.031982421875, 14.693359375, 15.354736328125, 16.01611328125, 16.677490234375, 17.3388671875, 18.000244140625, 18.66162109375, 19.322998046875, 19.984375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 11.0, 19.0, 18.0, 33.0, 50.0, 59.0, 96.0, 144.0, 230.0, 286.0, 457.0, 689.0, 1046.0, 1619.0, 2486.0, 3979.0, 5928.0, 9476.0, 15351.0, 24734.0, 40250.0, 67158.0, 116038.0, 196990.0, 219778.0, 137184.0, 79599.0, 47171.0, 28876.0, 17762.0, 11080.0, 7030.0, 4470.0, 2937.0, 1856.0, 1215.0, 796.0, 567.0, 335.0, 267.0, 160.0, 105.0, 65.0, 43.0, 41.0, 28.0, 18.0, 12.0, 8.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0], "bins": [-2.904296875, -2.81396484375, -2.7236328125, -2.63330078125, -2.54296875, -2.45263671875, -2.3623046875, -2.27197265625, -2.181640625, -2.09130859375, -2.0009765625, -1.91064453125, -1.8203125, -1.72998046875, -1.6396484375, -1.54931640625, -1.458984375, -1.36865234375, -1.2783203125, -1.18798828125, -1.09765625, -1.00732421875, -0.9169921875, -0.82666015625, -0.736328125, -0.64599609375, -0.5556640625, -0.46533203125, -0.375, -0.28466796875, -0.1943359375, -0.10400390625, -0.013671875, 0.07666015625, 0.1669921875, 0.25732421875, 0.34765625, 0.43798828125, 0.5283203125, 0.61865234375, 0.708984375, 0.79931640625, 0.8896484375, 0.97998046875, 1.0703125, 1.16064453125, 1.2509765625, 1.34130859375, 1.431640625, 1.52197265625, 1.6123046875, 1.70263671875, 1.79296875, 1.88330078125, 1.9736328125, 2.06396484375, 2.154296875, 2.24462890625, 2.3349609375, 2.42529296875, 2.515625, 2.60595703125, 2.6962890625, 2.78662109375, 2.876953125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 5.0, 1.0, 3.0, 12.0, 5.0, 10.0, 16.0, 8.0, 9.0, 29.0, 17.0, 20.0, 28.0, 29.0, 27.0, 30.0, 42.0, 42.0, 45.0, 34.0, 49.0, 40.0, 41.0, 44.0, 42.0, 38.0, 35.0, 38.0, 36.0, 33.0, 24.0, 25.0, 17.0, 21.0, 12.0, 20.0, 13.0, 13.0, 11.0, 8.0, 9.0, 7.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-15.2734375, -14.8433837890625, -14.413330078125, -13.9832763671875, -13.55322265625, -13.1231689453125, -12.693115234375, -12.2630615234375, -11.8330078125, -11.4029541015625, -10.972900390625, -10.5428466796875, -10.11279296875, -9.6827392578125, -9.252685546875, -8.8226318359375, -8.392578125, -7.9625244140625, -7.532470703125, -7.1024169921875, -6.67236328125, -6.2423095703125, -5.812255859375, -5.3822021484375, -4.9521484375, -4.5220947265625, -4.092041015625, -3.6619873046875, -3.23193359375, -2.8018798828125, -2.371826171875, -1.9417724609375, -1.51171875, -1.0816650390625, -0.651611328125, -0.2215576171875, 0.20849609375, 0.6385498046875, 1.068603515625, 1.4986572265625, 1.9287109375, 2.3587646484375, 2.788818359375, 3.2188720703125, 3.64892578125, 4.0789794921875, 4.509033203125, 4.9390869140625, 5.369140625, 5.7991943359375, 6.229248046875, 6.6593017578125, 7.08935546875, 7.5194091796875, 7.949462890625, 8.3795166015625, 8.8095703125, 9.2396240234375, 9.669677734375, 10.0997314453125, 10.52978515625, 10.9598388671875, 11.389892578125, 11.8199462890625, 12.25]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 2.0, 10.0, 15.0, 22.0, 30.0, 42.0, 53.0, 110.0, 202.0, 259.0, 438.0, 692.0, 1073.0, 1727.0, 2904.0, 4911.0, 8505.0, 14605.0, 27582.0, 54945.0, 124445.0, 327763.0, 270909.0, 103594.0, 47648.0, 24133.0, 13107.0, 7533.0, 4351.0, 2630.0, 1561.0, 1026.0, 647.0, 385.0, 246.0, 153.0, 94.0, 77.0, 35.0, 37.0, 12.0, 19.0, 12.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.2568359375, -0.24902725219726562, -0.24121856689453125, -0.23340988159179688, -0.2256011962890625, -0.21779251098632812, -0.20998382568359375, -0.20217514038085938, -0.194366455078125, -0.18655776977539062, -0.17874908447265625, -0.17094039916992188, -0.1631317138671875, -0.15532302856445312, -0.14751434326171875, -0.13970565795898438, -0.13189697265625, -0.12408828735351562, -0.11627960205078125, -0.10847091674804688, -0.1006622314453125, -0.09285354614257812, -0.08504486083984375, -0.07723617553710938, -0.069427490234375, -0.061618804931640625, -0.05381011962890625, -0.046001434326171875, -0.0381927490234375, -0.030384063720703125, -0.02257537841796875, -0.014766693115234375, -0.0069580078125, 0.000850677490234375, 0.00865936279296875, 0.016468048095703125, 0.0242767333984375, 0.032085418701171875, 0.03989410400390625, 0.047702789306640625, 0.055511474609375, 0.06332015991210938, 0.07112884521484375, 0.07893753051757812, 0.0867462158203125, 0.09455490112304688, 0.10236358642578125, 0.11017227172851562, 0.11798095703125, 0.12578964233398438, 0.13359832763671875, 0.14140701293945312, 0.1492156982421875, 0.15702438354492188, 0.16483306884765625, 0.17264175415039062, 0.180450439453125, 0.18825912475585938, 0.19606781005859375, 0.20387649536132812, 0.2116851806640625, 0.21949386596679688, 0.22730255126953125, 0.23511123657226562, 0.242919921875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 2.0, 6.0, 9.0, 4.0, 9.0, 10.0, 11.0, 10.0, 18.0, 12.0, 27.0, 18.0, 26.0, 25.0, 28.0, 34.0, 40.0, 46.0, 42.0, 39.0, 41.0, 45.0, 64.0, 52.0, 38.0, 52.0, 38.0, 33.0, 35.0, 30.0, 30.0, 24.0, 13.0, 14.0, 17.0, 5.0, 9.0, 8.0, 6.0, 6.0, 4.0, 1.0, 2.0, 4.0, 0.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 4.0], "bins": [-2.849102020263672e-05, -2.7602538466453552e-05, -2.6714056730270386e-05, -2.582557499408722e-05, -2.4937093257904053e-05, -2.4048611521720886e-05, -2.316012978553772e-05, -2.2271648049354553e-05, -2.1383166313171387e-05, -2.049468457698822e-05, -1.9606202840805054e-05, -1.8717721104621887e-05, -1.782923936843872e-05, -1.6940757632255554e-05, -1.6052275896072388e-05, -1.5163794159889221e-05, -1.4275312423706055e-05, -1.3386830687522888e-05, -1.2498348951339722e-05, -1.1609867215156555e-05, -1.0721385478973389e-05, -9.832903742790222e-06, -8.944422006607056e-06, -8.05594027042389e-06, -7.167458534240723e-06, -6.278976798057556e-06, -5.39049506187439e-06, -4.502013325691223e-06, -3.6135315895080566e-06, -2.72504985332489e-06, -1.8365681171417236e-06, -9.480863809585571e-07, -5.960464477539063e-08, 8.288770914077759e-07, 1.7173588275909424e-06, 2.605840563774109e-06, 3.4943222999572754e-06, 4.382804036140442e-06, 5.271285772323608e-06, 6.159767508506775e-06, 7.048249244689941e-06, 7.936730980873108e-06, 8.825212717056274e-06, 9.713694453239441e-06, 1.0602176189422607e-05, 1.1490657925605774e-05, 1.237913966178894e-05, 1.3267621397972107e-05, 1.4156103134155273e-05, 1.504458487033844e-05, 1.5933066606521606e-05, 1.6821548342704773e-05, 1.771003007888794e-05, 1.8598511815071106e-05, 1.9486993551254272e-05, 2.037547528743744e-05, 2.1263957023620605e-05, 2.2152438759803772e-05, 2.304092049598694e-05, 2.3929402232170105e-05, 2.481788396835327e-05, 2.5706365704536438e-05, 2.6594847440719604e-05, 2.748332917690277e-05, 2.8371810913085938e-05]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 3.0, 4.0, 4.0, 13.0, 19.0, 28.0, 50.0, 57.0, 75.0, 130.0, 199.0, 249.0, 336.0, 475.0, 626.0, 848.0, 1225.0, 1740.0, 2460.0, 3480.0, 4760.0, 7182.0, 10421.0, 15423.0, 23120.0, 35407.0, 56206.0, 92618.0, 174822.0, 264256.0, 134963.0, 76603.0, 47376.0, 30133.0, 19739.0, 13475.0, 8864.0, 6180.0, 4296.0, 3136.0, 2166.0, 1544.0, 1071.0, 805.0, 534.0, 430.0, 292.0, 212.0, 147.0, 108.0, 78.0, 74.0, 29.0, 25.0, 23.0, 10.0, 7.0, 4.0, 0.0, 3.0, 6.0], "bins": [-0.459228515625, -0.4450187683105469, -0.43080902099609375, -0.4165992736816406, -0.4023895263671875, -0.3881797790527344, -0.37397003173828125, -0.3597602844238281, -0.345550537109375, -0.3313407897949219, -0.31713104248046875, -0.3029212951660156, -0.2887115478515625, -0.2745018005371094, -0.26029205322265625, -0.24608230590820312, -0.23187255859375, -0.21766281127929688, -0.20345306396484375, -0.18924331665039062, -0.1750335693359375, -0.16082382202148438, -0.14661407470703125, -0.13240432739257812, -0.118194580078125, -0.10398483276367188, -0.08977508544921875, -0.07556533813476562, -0.0613555908203125, -0.047145843505859375, -0.03293609619140625, -0.018726348876953125, -0.0045166015625, 0.009693145751953125, 0.02390289306640625, 0.038112640380859375, 0.0523223876953125, 0.06653213500976562, 0.08074188232421875, 0.09495162963867188, 0.109161376953125, 0.12337112426757812, 0.13758087158203125, 0.15179061889648438, 0.1660003662109375, 0.18021011352539062, 0.19441986083984375, 0.20862960815429688, 0.22283935546875, 0.23704910278320312, 0.25125885009765625, 0.2654685974121094, 0.2796783447265625, 0.2938880920410156, 0.30809783935546875, 0.3223075866699219, 0.336517333984375, 0.3507270812988281, 0.36493682861328125, 0.3791465759277344, 0.3933563232421875, 0.4075660705566406, 0.42177581787109375, 0.4359855651855469, 0.4501953125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 7.0, 5.0, 3.0, 2.0, 6.0, 4.0, 9.0, 11.0, 10.0, 13.0, 12.0, 16.0, 18.0, 23.0, 26.0, 35.0, 41.0, 35.0, 52.0, 70.0, 84.0, 85.0, 68.0, 60.0, 57.0, 49.0, 35.0, 15.0, 20.0, 22.0, 22.0, 19.0, 16.0, 6.0, 14.0, 9.0, 3.0, 10.0, 3.0, 4.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.163330078125, -0.15808486938476562, -0.15283966064453125, -0.14759445190429688, -0.1423492431640625, -0.13710403442382812, -0.13185882568359375, -0.12661361694335938, -0.121368408203125, -0.11612319946289062, -0.11087799072265625, -0.10563278198242188, -0.1003875732421875, -0.09514236450195312, -0.08989715576171875, -0.08465194702148438, -0.07940673828125, -0.07416152954101562, -0.06891632080078125, -0.06367111206054688, -0.0584259033203125, -0.053180694580078125, -0.04793548583984375, -0.042690277099609375, -0.037445068359375, -0.032199859619140625, -0.02695465087890625, -0.021709442138671875, -0.0164642333984375, -0.011219024658203125, -0.00597381591796875, -0.000728607177734375, 0.0045166015625, 0.009761810302734375, 0.01500701904296875, 0.020252227783203125, 0.0254974365234375, 0.030742645263671875, 0.03598785400390625, 0.041233062744140625, 0.046478271484375, 0.051723480224609375, 0.05696868896484375, 0.062213897705078125, 0.0674591064453125, 0.07270431518554688, 0.07794952392578125, 0.08319473266601562, 0.08843994140625, 0.09368515014648438, 0.09893035888671875, 0.10417556762695312, 0.1094207763671875, 0.11466598510742188, 0.11991119384765625, 0.12515640258789062, 0.130401611328125, 0.13564682006835938, 0.14089202880859375, 0.14613723754882812, 0.1513824462890625, 0.15662765502929688, 0.16187286376953125, 0.16711807250976562, 0.17236328125]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 5.0, 2.0, 3.0, 5.0, 6.0, 7.0, 12.0, 15.0, 10.0, 12.0, 26.0, 21.0, 21.0, 22.0, 36.0, 34.0, 44.0, 59.0, 42.0, 34.0, 47.0, 50.0, 39.0, 48.0, 45.0, 41.0, 41.0, 30.0, 30.0, 33.0, 33.0, 16.0, 19.0, 19.0, 15.0, 12.0, 20.0, 10.0, 10.0, 5.0, 6.0, 3.0, 6.0, 1.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-17.553495407104492, -16.988121032714844, -16.422746658325195, -15.857373237609863, -15.291998863220215, -14.726625442504883, -14.161251068115234, -13.595876693725586, -13.030502319335938, -12.465127944946289, -11.899754524230957, -11.334380149841309, -10.76900577545166, -10.203632354736328, -9.63825798034668, -9.072883605957031, -8.5075101852417, -7.942136287689209, -7.3767619132995605, -6.81138801574707, -6.246013641357422, -5.680639743804932, -5.115265846252441, -4.549891471862793, -3.9845175743103027, -3.4191434383392334, -2.853769302368164, -2.288395404815674, -1.7230212688446045, -1.1576471328735352, -0.5922732353210449, -0.026899099349975586, 0.5384750366210938, 1.103849172592163, 1.6692231893539429, 2.2345972061157227, 2.799971342086792, 3.3653454780578613, 3.9307193756103516, 4.49609375, 5.06146764755249, 5.6268415451049805, 6.192215919494629, 6.757589817047119, 7.322963714599609, 7.888338088989258, 8.453712463378906, 9.019085884094238, 9.584460258483887, 10.149834632873535, 10.715208053588867, 11.280582427978516, 11.845956802368164, 12.411331176757812, 12.976704597473145, 13.542078971862793, 14.107452392578125, 14.672826766967773, 15.238200187683105, 15.803574562072754, 16.368947982788086, 16.934322357177734, 17.499696731567383, 18.06507110595703, 18.63044548034668]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 4.0, 1.0, 5.0, 10.0, 5.0, 6.0, 14.0, 9.0, 7.0, 16.0, 15.0, 18.0, 18.0, 15.0, 21.0, 20.0, 29.0, 33.0, 29.0, 28.0, 29.0, 40.0, 28.0, 32.0, 29.0, 36.0, 43.0, 43.0, 35.0, 34.0, 30.0, 36.0, 37.0, 28.0, 31.0, 34.0, 30.0, 22.0, 19.0, 18.0, 14.0, 9.0, 9.0, 8.0, 10.0, 7.0, 3.0, 3.0, 2.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0], "bins": [-19.341848373413086, -18.765254974365234, -18.188661575317383, -17.612070083618164, -17.035476684570312, -16.45888328552246, -15.88228988647461, -15.305697441101074, -14.729104995727539, -14.152511596679688, -13.575919151306152, -12.9993257522583, -12.422733306884766, -11.846139907836914, -11.269546508789062, -10.692954063415527, -10.116360664367676, -9.539767265319824, -8.963174819946289, -8.386581420898438, -7.809988975524902, -7.233395576477051, -6.656802654266357, -6.080209732055664, -5.503616809844971, -4.927023887634277, -4.350430965423584, -3.7738378047943115, -3.197244882583618, -2.620651960372925, -2.0440587997436523, -1.467465877532959, -0.8908729553222656, -0.3142799735069275, 0.26231300830841064, 0.8389060497283936, 1.415498971939087, 1.9920918941497803, 2.5686850547790527, 3.145277976989746, 3.7218708992004395, 4.298463821411133, 4.875056743621826, 5.4516496658325195, 6.028243064880371, 6.604835510253906, 7.181428909301758, 7.758021831512451, 8.334614753723145, 8.911208152770996, 9.487800598144531, 10.064393997192383, 10.640986442565918, 11.21757984161377, 11.794172286987305, 12.370765686035156, 12.947359085083008, 13.52395248413086, 14.100544929504395, 14.677138328552246, 15.253730773925781, 15.830324172973633, 16.406917572021484, 16.983509063720703, 17.560102462768555]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 7.0, 7.0, 11.0, 20.0, 31.0, 45.0, 89.0, 173.0, 237.0, 368.0, 682.0, 1016.0, 1807.0, 2702.0, 4405.0, 6933.0, 11076.0, 16966.0, 25637.0, 38944.0, 54369.0, 72927.0, 92464.0, 108184.0, 115224.0, 112591.0, 100597.0, 82609.0, 63299.0, 45540.0, 31652.0, 20975.0, 13534.0, 8805.0, 5550.0, 3578.0, 2117.0, 1313.0, 794.0, 496.0, 308.0, 188.0, 116.0, 72.0, 47.0, 31.0, 13.0, 7.0, 4.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-13.984375, -13.5438232421875, -13.103271484375, -12.6627197265625, -12.22216796875, -11.7816162109375, -11.341064453125, -10.9005126953125, -10.4599609375, -10.0194091796875, -9.578857421875, -9.1383056640625, -8.69775390625, -8.2572021484375, -7.816650390625, -7.3760986328125, -6.935546875, -6.4949951171875, -6.054443359375, -5.6138916015625, -5.17333984375, -4.7327880859375, -4.292236328125, -3.8516845703125, -3.4111328125, -2.9705810546875, -2.530029296875, -2.0894775390625, -1.64892578125, -1.2083740234375, -0.767822265625, -0.3272705078125, 0.11328125, 0.5538330078125, 0.994384765625, 1.4349365234375, 1.87548828125, 2.3160400390625, 2.756591796875, 3.1971435546875, 3.6376953125, 4.0782470703125, 4.518798828125, 4.9593505859375, 5.39990234375, 5.8404541015625, 6.281005859375, 6.7215576171875, 7.162109375, 7.6026611328125, 8.043212890625, 8.4837646484375, 8.92431640625, 9.3648681640625, 9.805419921875, 10.2459716796875, 10.6865234375, 11.1270751953125, 11.567626953125, 12.0081787109375, 12.44873046875, 12.8892822265625, 13.329833984375, 13.7703857421875, 14.2109375]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 6.0, 4.0, 5.0, 7.0, 7.0, 12.0, 8.0, 4.0, 9.0, 13.0, 24.0, 23.0, 16.0, 13.0, 19.0, 22.0, 30.0, 33.0, 26.0, 26.0, 33.0, 39.0, 33.0, 34.0, 35.0, 32.0, 47.0, 34.0, 52.0, 38.0, 32.0, 23.0, 38.0, 33.0, 32.0, 24.0, 21.0, 19.0, 21.0, 18.0, 8.0, 11.0, 12.0, 7.0, 7.0, 9.0, 3.0, 2.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-19.59375, -19.000732421875, -18.40771484375, -17.814697265625, -17.2216796875, -16.628662109375, -16.03564453125, -15.442626953125, -14.849609375, -14.256591796875, -13.66357421875, -13.070556640625, -12.4775390625, -11.884521484375, -11.29150390625, -10.698486328125, -10.10546875, -9.512451171875, -8.91943359375, -8.326416015625, -7.7333984375, -7.140380859375, -6.54736328125, -5.954345703125, -5.361328125, -4.768310546875, -4.17529296875, -3.582275390625, -2.9892578125, -2.396240234375, -1.80322265625, -1.210205078125, -0.6171875, -0.024169921875, 0.56884765625, 1.161865234375, 1.7548828125, 2.347900390625, 2.94091796875, 3.533935546875, 4.126953125, 4.719970703125, 5.31298828125, 5.906005859375, 6.4990234375, 7.092041015625, 7.68505859375, 8.278076171875, 8.87109375, 9.464111328125, 10.05712890625, 10.650146484375, 11.2431640625, 11.836181640625, 12.42919921875, 13.022216796875, 13.615234375, 14.208251953125, 14.80126953125, 15.394287109375, 15.9873046875, 16.580322265625, 17.17333984375, 17.766357421875, 18.359375]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 1.0, 5.0, 6.0, 13.0, 21.0, 27.0, 46.0, 60.0, 73.0, 130.0, 189.0, 279.0, 482.0, 693.0, 1100.0, 1616.0, 2619.0, 3979.0, 5992.0, 8999.0, 13513.0, 19720.0, 28265.0, 39910.0, 53233.0, 69415.0, 84836.0, 97528.0, 103891.0, 102771.0, 94723.0, 81702.0, 65468.0, 50194.0, 37056.0, 25970.0, 18020.0, 12049.0, 8235.0, 5420.0, 3574.0, 2326.0, 1549.0, 995.0, 671.0, 389.0, 282.0, 182.0, 116.0, 82.0, 55.0, 42.0, 13.0, 15.0, 11.0, 7.0, 4.0, 4.0, 0.0, 0.0, 2.0], "bins": [-12.7578125, -12.357666015625, -11.95751953125, -11.557373046875, -11.1572265625, -10.757080078125, -10.35693359375, -9.956787109375, -9.556640625, -9.156494140625, -8.75634765625, -8.356201171875, -7.9560546875, -7.555908203125, -7.15576171875, -6.755615234375, -6.35546875, -5.955322265625, -5.55517578125, -5.155029296875, -4.7548828125, -4.354736328125, -3.95458984375, -3.554443359375, -3.154296875, -2.754150390625, -2.35400390625, -1.953857421875, -1.5537109375, -1.153564453125, -0.75341796875, -0.353271484375, 0.046875, 0.447021484375, 0.84716796875, 1.247314453125, 1.6474609375, 2.047607421875, 2.44775390625, 2.847900390625, 3.248046875, 3.648193359375, 4.04833984375, 4.448486328125, 4.8486328125, 5.248779296875, 5.64892578125, 6.049072265625, 6.44921875, 6.849365234375, 7.24951171875, 7.649658203125, 8.0498046875, 8.449951171875, 8.85009765625, 9.250244140625, 9.650390625, 10.050537109375, 10.45068359375, 10.850830078125, 11.2509765625, 11.651123046875, 12.05126953125, 12.451416015625, 12.8515625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 10.0, 8.0, 4.0, 11.0, 17.0, 4.0, 15.0, 16.0, 24.0, 21.0, 22.0, 26.0, 29.0, 21.0, 30.0, 37.0, 47.0, 40.0, 30.0, 41.0, 35.0, 45.0, 52.0, 38.0, 37.0, 43.0, 28.0, 34.0, 34.0, 29.0, 29.0, 14.0, 17.0, 15.0, 25.0, 14.0, 10.0, 14.0, 6.0, 7.0, 6.0, 7.0, 2.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.4140625, -12.0147705078125, -11.615478515625, -11.2161865234375, -10.81689453125, -10.4176025390625, -10.018310546875, -9.6190185546875, -9.2197265625, -8.8204345703125, -8.421142578125, -8.0218505859375, -7.62255859375, -7.2232666015625, -6.823974609375, -6.4246826171875, -6.025390625, -5.6260986328125, -5.226806640625, -4.8275146484375, -4.42822265625, -4.0289306640625, -3.629638671875, -3.2303466796875, -2.8310546875, -2.4317626953125, -2.032470703125, -1.6331787109375, -1.23388671875, -0.8345947265625, -0.435302734375, -0.0360107421875, 0.36328125, 0.7625732421875, 1.161865234375, 1.5611572265625, 1.96044921875, 2.3597412109375, 2.759033203125, 3.1583251953125, 3.5576171875, 3.9569091796875, 4.356201171875, 4.7554931640625, 5.15478515625, 5.5540771484375, 5.953369140625, 6.3526611328125, 6.751953125, 7.1512451171875, 7.550537109375, 7.9498291015625, 8.34912109375, 8.7484130859375, 9.147705078125, 9.5469970703125, 9.9462890625, 10.3455810546875, 10.744873046875, 11.1441650390625, 11.54345703125, 11.9427490234375, 12.342041015625, 12.7413330078125, 13.140625]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 7.0, 8.0, 18.0, 21.0, 25.0, 47.0, 82.0, 90.0, 144.0, 258.0, 428.0, 660.0, 1091.0, 1885.0, 3342.0, 5846.0, 10244.0, 18290.0, 31165.0, 53244.0, 83252.0, 118347.0, 146438.0, 155852.0, 138329.0, 105258.0, 70340.0, 43558.0, 25571.0, 14855.0, 8386.0, 4748.0, 2699.0, 1611.0, 931.0, 562.0, 339.0, 198.0, 131.0, 94.0, 54.0, 39.0, 22.0, 19.0, 11.0, 7.0, 8.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.4375, -5.25811767578125, -5.0787353515625, -4.89935302734375, -4.719970703125, -4.54058837890625, -4.3612060546875, -4.18182373046875, -4.00244140625, -3.82305908203125, -3.6436767578125, -3.46429443359375, -3.284912109375, -3.10552978515625, -2.9261474609375, -2.74676513671875, -2.5673828125, -2.38800048828125, -2.2086181640625, -2.02923583984375, -1.849853515625, -1.67047119140625, -1.4910888671875, -1.31170654296875, -1.13232421875, -0.95294189453125, -0.7735595703125, -0.59417724609375, -0.414794921875, -0.23541259765625, -0.0560302734375, 0.12335205078125, 0.302734375, 0.48211669921875, 0.6614990234375, 0.84088134765625, 1.020263671875, 1.19964599609375, 1.3790283203125, 1.55841064453125, 1.73779296875, 1.91717529296875, 2.0965576171875, 2.27593994140625, 2.455322265625, 2.63470458984375, 2.8140869140625, 2.99346923828125, 3.1728515625, 3.35223388671875, 3.5316162109375, 3.71099853515625, 3.890380859375, 4.06976318359375, 4.2491455078125, 4.42852783203125, 4.60791015625, 4.78729248046875, 4.9666748046875, 5.14605712890625, 5.325439453125, 5.50482177734375, 5.6842041015625, 5.86358642578125, 6.04296875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 7.0, 6.0, 4.0, 6.0, 15.0, 12.0, 18.0, 20.0, 15.0, 39.0, 26.0, 23.0, 31.0, 27.0, 57.0, 41.0, 62.0, 49.0, 57.0, 55.0, 41.0, 64.0, 45.0, 37.0, 42.0, 26.0, 35.0, 22.0, 24.0, 21.0, 13.0, 14.0, 10.0, 10.0, 6.0, 2.0, 5.0, 5.0, 5.0, 1.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0005044937133789062, -0.00048752129077911377, -0.0004705488681793213, -0.0004535764455795288, -0.00043660402297973633, -0.00041963160037994385, -0.00040265917778015137, -0.0003856867551803589, -0.0003687143325805664, -0.0003517419099807739, -0.00033476948738098145, -0.00031779706478118896, -0.0003008246421813965, -0.000283852219581604, -0.0002668797969818115, -0.00024990737438201904, -0.00023293495178222656, -0.00021596252918243408, -0.0001989901065826416, -0.00018201768398284912, -0.00016504526138305664, -0.00014807283878326416, -0.00013110041618347168, -0.0001141279935836792, -9.715557098388672e-05, -8.018314838409424e-05, -6.321072578430176e-05, -4.623830318450928e-05, -2.9265880584716797e-05, -1.2293457984924316e-05, 4.678964614868164e-06, 2.1651387214660645e-05, 3.8623809814453125e-05, 5.5596232414245605e-05, 7.256865501403809e-05, 8.954107761383057e-05, 0.00010651350021362305, 0.00012348592281341553, 0.000140458345413208, 0.0001574307680130005, 0.00017440319061279297, 0.00019137561321258545, 0.00020834803581237793, 0.0002253204584121704, 0.0002422928810119629, 0.00025926530361175537, 0.00027623772621154785, 0.00029321014881134033, 0.0003101825714111328, 0.0003271549940109253, 0.0003441274166107178, 0.00036109983921051025, 0.00037807226181030273, 0.0003950446844100952, 0.0004120171070098877, 0.0004289895296096802, 0.00044596195220947266, 0.00046293437480926514, 0.0004799067974090576, 0.0004968792200088501, 0.0005138516426086426, 0.0005308240652084351, 0.0005477964878082275, 0.00056476891040802, 0.0005817413330078125]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 7.0, 1.0, 14.0, 24.0, 34.0, 41.0, 57.0, 109.0, 143.0, 195.0, 276.0, 484.0, 699.0, 1082.0, 1743.0, 2847.0, 4634.0, 7904.0, 13229.0, 22082.0, 36458.0, 58002.0, 86945.0, 118104.0, 141369.0, 146121.0, 129068.0, 98438.0, 67830.0, 43607.0, 26601.0, 16091.0, 9391.0, 5663.0, 3516.0, 2035.0, 1324.0, 838.0, 558.0, 327.0, 247.0, 136.0, 104.0, 61.0, 43.0, 32.0, 19.0, 13.0, 14.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.79296875, -5.61297607421875, -5.4329833984375, -5.25299072265625, -5.072998046875, -4.89300537109375, -4.7130126953125, -4.53302001953125, -4.35302734375, -4.17303466796875, -3.9930419921875, -3.81304931640625, -3.633056640625, -3.45306396484375, -3.2730712890625, -3.09307861328125, -2.9130859375, -2.73309326171875, -2.5531005859375, -2.37310791015625, -2.193115234375, -2.01312255859375, -1.8331298828125, -1.65313720703125, -1.47314453125, -1.29315185546875, -1.1131591796875, -0.93316650390625, -0.753173828125, -0.57318115234375, -0.3931884765625, -0.21319580078125, -0.033203125, 0.14678955078125, 0.3267822265625, 0.50677490234375, 0.686767578125, 0.86676025390625, 1.0467529296875, 1.22674560546875, 1.40673828125, 1.58673095703125, 1.7667236328125, 1.94671630859375, 2.126708984375, 2.30670166015625, 2.4866943359375, 2.66668701171875, 2.8466796875, 3.02667236328125, 3.2066650390625, 3.38665771484375, 3.566650390625, 3.74664306640625, 3.9266357421875, 4.10662841796875, 4.28662109375, 4.46661376953125, 4.6466064453125, 4.82659912109375, 5.006591796875, 5.18658447265625, 5.3665771484375, 5.54656982421875, 5.7265625]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 0.0, 5.0, 7.0, 13.0, 13.0, 11.0, 13.0, 13.0, 25.0, 30.0, 42.0, 42.0, 41.0, 61.0, 70.0, 73.0, 58.0, 72.0, 48.0, 73.0, 45.0, 44.0, 35.0, 34.0, 21.0, 26.0, 25.0, 16.0, 11.0, 5.0, 11.0, 4.0, 6.0, 7.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 1.0], "bins": [-3.95703125, -3.858062744140625, -3.75909423828125, -3.660125732421875, -3.5611572265625, -3.462188720703125, -3.36322021484375, -3.264251708984375, -3.165283203125, -3.066314697265625, -2.96734619140625, -2.868377685546875, -2.7694091796875, -2.670440673828125, -2.57147216796875, -2.472503662109375, -2.37353515625, -2.274566650390625, -2.17559814453125, -2.076629638671875, -1.9776611328125, -1.878692626953125, -1.77972412109375, -1.680755615234375, -1.581787109375, -1.482818603515625, -1.38385009765625, -1.284881591796875, -1.1859130859375, -1.086944580078125, -0.98797607421875, -0.889007568359375, -0.7900390625, -0.691070556640625, -0.59210205078125, -0.493133544921875, -0.3941650390625, -0.295196533203125, -0.19622802734375, -0.097259521484375, 0.001708984375, 0.100677490234375, 0.19964599609375, 0.298614501953125, 0.3975830078125, 0.496551513671875, 0.59552001953125, 0.694488525390625, 0.79345703125, 0.892425537109375, 0.99139404296875, 1.090362548828125, 1.1893310546875, 1.288299560546875, 1.38726806640625, 1.486236572265625, 1.585205078125, 1.684173583984375, 1.78314208984375, 1.882110595703125, 1.9810791015625, 2.080047607421875, 2.17901611328125, 2.277984619140625, 2.376953125]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 7.0, 3.0, 4.0, 7.0, 7.0, 10.0, 11.0, 8.0, 9.0, 10.0, 15.0, 24.0, 21.0, 32.0, 38.0, 35.0, 40.0, 42.0, 52.0, 39.0, 46.0, 52.0, 48.0, 42.0, 43.0, 36.0, 50.0, 37.0, 37.0, 28.0, 27.0, 22.0, 18.0, 21.0, 20.0, 12.0, 5.0, 8.0, 9.0, 10.0, 4.0, 2.0, 6.0, 4.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-18.937471389770508, -18.364242553710938, -17.791011810302734, -17.21778106689453, -16.64455223083496, -16.07132339477539, -15.498092651367188, -14.9248628616333, -14.351633071899414, -13.778403282165527, -13.20517349243164, -12.631943702697754, -12.058713912963867, -11.48548412322998, -10.912254333496094, -10.339024543762207, -9.76579475402832, -9.192564964294434, -8.619335174560547, -8.04610538482666, -7.472875595092773, -6.899645805358887, -6.326416015625, -5.753186225891113, -5.179956436157227, -4.60672664642334, -4.033496856689453, -3.4602670669555664, -2.8870372772216797, -2.313807487487793, -1.7405776977539062, -1.1673479080200195, -0.5941200256347656, -0.020890235900878906, 0.5523395538330078, 1.1255693435668945, 1.6987991333007812, 2.272028923034668, 2.8452587127685547, 3.4184885025024414, 3.991718292236328, 4.564948081970215, 5.138177871704102, 5.711407661437988, 6.284637451171875, 6.857867240905762, 7.431097030639648, 8.004326820373535, 8.577556610107422, 9.150786399841309, 9.724016189575195, 10.297245979309082, 10.870475769042969, 11.443705558776855, 12.016935348510742, 12.590165138244629, 13.163394927978516, 13.736624717712402, 14.309854507446289, 14.883084297180176, 15.456314086914062, 16.029544830322266, 16.602773666381836, 17.176002502441406, 17.74923324584961]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 6.0, 4.0, 4.0, 4.0, 4.0, 6.0, 17.0, 6.0, 8.0, 14.0, 16.0, 18.0, 22.0, 24.0, 24.0, 18.0, 29.0, 33.0, 28.0, 33.0, 36.0, 30.0, 36.0, 31.0, 44.0, 39.0, 42.0, 49.0, 36.0, 37.0, 37.0, 33.0, 24.0, 30.0, 31.0, 24.0, 22.0, 21.0, 18.0, 8.0, 16.0, 10.0, 7.0, 8.0, 2.0, 6.0, 5.0, 1.0, 2.0, 2.0, 4.0, 3.0, 0.0, 3.0], "bins": [-21.505176544189453, -20.888151168823242, -20.27112579345703, -19.654102325439453, -19.037076950073242, -18.42005157470703, -17.803028106689453, -17.186002731323242, -16.56897735595703, -15.95195198059082, -15.334927558898926, -14.717903137207031, -14.10087776184082, -13.48385238647461, -12.866827964782715, -12.24980354309082, -11.63277816772461, -11.015752792358398, -10.398728370666504, -9.78170394897461, -9.164678573608398, -8.547653198242188, -7.930628776550293, -7.31360387802124, -6.6965789794921875, -6.079554080963135, -5.462529182434082, -4.845504283905029, -4.228479385375977, -3.611454486846924, -2.994429588317871, -2.3774046897888184, -1.7603778839111328, -1.14335298538208, -0.5263280868530273, 0.09069681167602539, 0.7077217102050781, 1.3247466087341309, 1.9417715072631836, 2.5587964057922363, 3.175821304321289, 3.792846202850342, 4.4098711013793945, 5.026895999908447, 5.6439208984375, 6.260945796966553, 6.8779706954956055, 7.494995594024658, 8.112020492553711, 8.729045867919922, 9.346070289611816, 9.963094711303711, 10.580120086669922, 11.197145462036133, 11.814169883728027, 12.431194305419922, 13.048219680786133, 13.665245056152344, 14.282269477844238, 14.899293899536133, 15.516319274902344, 16.133344650268555, 16.750370025634766, 17.367393493652344, 17.984418869018555]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 2.0, 6.0, 8.0, 8.0, 19.0, 40.0, 66.0, 96.0, 142.0, 241.0, 389.0, 651.0, 1031.0, 1674.0, 2717.0, 4508.0, 6879.0, 11073.0, 17145.0, 27290.0, 42491.0, 64995.0, 97653.0, 144083.0, 205704.0, 280755.0, 359132.0, 427700.0, 465213.0, 458787.0, 410538.0, 338673.0, 259786.0, 187597.0, 130275.0, 87671.0, 57636.0, 37533.0, 24131.0, 15153.0, 9439.0, 5976.0, 3579.0, 2302.0, 1407.0, 803.0, 496.0, 328.0, 218.0, 103.0, 61.0, 45.0, 18.0, 12.0, 5.0, 4.0, 4.0, 3.0, 3.0, 0.0, 1.0], "bins": [-13.65625, -13.2275390625, -12.798828125, -12.3701171875, -11.94140625, -11.5126953125, -11.083984375, -10.6552734375, -10.2265625, -9.7978515625, -9.369140625, -8.9404296875, -8.51171875, -8.0830078125, -7.654296875, -7.2255859375, -6.796875, -6.3681640625, -5.939453125, -5.5107421875, -5.08203125, -4.6533203125, -4.224609375, -3.7958984375, -3.3671875, -2.9384765625, -2.509765625, -2.0810546875, -1.65234375, -1.2236328125, -0.794921875, -0.3662109375, 0.0625, 0.4912109375, 0.919921875, 1.3486328125, 1.77734375, 2.2060546875, 2.634765625, 3.0634765625, 3.4921875, 3.9208984375, 4.349609375, 4.7783203125, 5.20703125, 5.6357421875, 6.064453125, 6.4931640625, 6.921875, 7.3505859375, 7.779296875, 8.2080078125, 8.63671875, 9.0654296875, 9.494140625, 9.9228515625, 10.3515625, 10.7802734375, 11.208984375, 11.6376953125, 12.06640625, 12.4951171875, 12.923828125, 13.3525390625, 13.78125]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 4.0, 3.0, 2.0, 5.0, 3.0, 4.0, 5.0, 6.0, 10.0, 10.0, 11.0, 11.0, 20.0, 19.0, 24.0, 14.0, 23.0, 32.0, 30.0, 39.0, 36.0, 36.0, 29.0, 37.0, 36.0, 44.0, 49.0, 39.0, 45.0, 32.0, 36.0, 36.0, 36.0, 31.0, 23.0, 36.0, 22.0, 25.0, 21.0, 9.0, 19.0, 11.0, 9.0, 8.0, 7.0, 9.0, 6.0, 1.0, 1.0, 7.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.15625, -15.665771484375, -15.17529296875, -14.684814453125, -14.1943359375, -13.703857421875, -13.21337890625, -12.722900390625, -12.232421875, -11.741943359375, -11.25146484375, -10.760986328125, -10.2705078125, -9.780029296875, -9.28955078125, -8.799072265625, -8.30859375, -7.818115234375, -7.32763671875, -6.837158203125, -6.3466796875, -5.856201171875, -5.36572265625, -4.875244140625, -4.384765625, -3.894287109375, -3.40380859375, -2.913330078125, -2.4228515625, -1.932373046875, -1.44189453125, -0.951416015625, -0.4609375, 0.029541015625, 0.52001953125, 1.010498046875, 1.5009765625, 1.991455078125, 2.48193359375, 2.972412109375, 3.462890625, 3.953369140625, 4.44384765625, 4.934326171875, 5.4248046875, 5.915283203125, 6.40576171875, 6.896240234375, 7.38671875, 7.877197265625, 8.36767578125, 8.858154296875, 9.3486328125, 9.839111328125, 10.32958984375, 10.820068359375, 11.310546875, 11.801025390625, 12.29150390625, 12.781982421875, 13.2724609375, 13.762939453125, 14.25341796875, 14.743896484375, 15.234375]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 10.0, 7.0, 15.0, 29.0, 47.0, 103.0, 170.0, 290.0, 556.0, 905.0, 1533.0, 2806.0, 4833.0, 8412.0, 14313.0, 23750.0, 38852.0, 62052.0, 95152.0, 142542.0, 203074.0, 273146.0, 345539.0, 408333.0, 444954.0, 448352.0, 413384.0, 353292.0, 281967.0, 210228.0, 148638.0, 100349.0, 65110.0, 40765.0, 24802.0, 15086.0, 8840.0, 5249.0, 2974.0, 1637.0, 921.0, 550.0, 301.0, 196.0, 101.0, 59.0, 25.0, 20.0, 11.0, 3.0, 10.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-14.3203125, -13.8870849609375, -13.453857421875, -13.0206298828125, -12.58740234375, -12.1541748046875, -11.720947265625, -11.2877197265625, -10.8544921875, -10.4212646484375, -9.988037109375, -9.5548095703125, -9.12158203125, -8.6883544921875, -8.255126953125, -7.8218994140625, -7.388671875, -6.9554443359375, -6.522216796875, -6.0889892578125, -5.65576171875, -5.2225341796875, -4.789306640625, -4.3560791015625, -3.9228515625, -3.4896240234375, -3.056396484375, -2.6231689453125, -2.18994140625, -1.7567138671875, -1.323486328125, -0.8902587890625, -0.45703125, -0.0238037109375, 0.409423828125, 0.8426513671875, 1.27587890625, 1.7091064453125, 2.142333984375, 2.5755615234375, 3.0087890625, 3.4420166015625, 3.875244140625, 4.3084716796875, 4.74169921875, 5.1749267578125, 5.608154296875, 6.0413818359375, 6.474609375, 6.9078369140625, 7.341064453125, 7.7742919921875, 8.20751953125, 8.6407470703125, 9.073974609375, 9.5072021484375, 9.9404296875, 10.3736572265625, 10.806884765625, 11.2401123046875, 11.67333984375, 12.1065673828125, 12.539794921875, 12.9730224609375, 13.40625]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 7.0, 6.0, 12.0, 9.0, 16.0, 20.0, 28.0, 28.0, 45.0, 45.0, 51.0, 69.0, 94.0, 89.0, 105.0, 127.0, 156.0, 187.0, 194.0, 176.0, 206.0, 204.0, 215.0, 218.0, 193.0, 214.0, 197.0, 167.0, 146.0, 130.0, 120.0, 117.0, 98.0, 73.0, 56.0, 54.0, 52.0, 35.0, 24.0, 20.0, 18.0, 10.0, 15.0, 8.0, 6.0, 7.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-8.1875, -7.9456787109375, -7.703857421875, -7.4620361328125, -7.22021484375, -6.9783935546875, -6.736572265625, -6.4947509765625, -6.2529296875, -6.0111083984375, -5.769287109375, -5.5274658203125, -5.28564453125, -5.0438232421875, -4.802001953125, -4.5601806640625, -4.318359375, -4.0765380859375, -3.834716796875, -3.5928955078125, -3.35107421875, -3.1092529296875, -2.867431640625, -2.6256103515625, -2.3837890625, -2.1419677734375, -1.900146484375, -1.6583251953125, -1.41650390625, -1.1746826171875, -0.932861328125, -0.6910400390625, -0.44921875, -0.2073974609375, 0.034423828125, 0.2762451171875, 0.51806640625, 0.7598876953125, 1.001708984375, 1.2435302734375, 1.4853515625, 1.7271728515625, 1.968994140625, 2.2108154296875, 2.45263671875, 2.6944580078125, 2.936279296875, 3.1781005859375, 3.419921875, 3.6617431640625, 3.903564453125, 4.1453857421875, 4.38720703125, 4.6290283203125, 4.870849609375, 5.1126708984375, 5.3544921875, 5.5963134765625, 5.838134765625, 6.0799560546875, 6.32177734375, 6.5635986328125, 6.805419921875, 7.0472412109375, 7.2890625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 5.0, 5.0, 11.0, 6.0, 14.0, 7.0, 17.0, 30.0, 27.0, 29.0, 25.0, 45.0, 30.0, 47.0, 51.0, 68.0, 48.0, 61.0, 61.0, 45.0, 56.0, 45.0, 41.0, 46.0, 35.0, 26.0, 30.0, 27.0, 8.0, 11.0, 5.0, 9.0, 13.0, 3.0, 5.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.800466537475586, -19.15241241455078, -18.504356384277344, -17.85630226135254, -17.2082462310791, -16.560192108154297, -15.912137031555176, -15.264081954956055, -14.616026878356934, -13.967971801757812, -13.319916725158691, -12.67186164855957, -12.023807525634766, -11.375751495361328, -10.727697372436523, -10.079642295837402, -9.431587219238281, -8.78353214263916, -8.135477066040039, -7.487422466278076, -6.839367389678955, -6.191312313079834, -5.543257713317871, -4.89520263671875, -4.247147560119629, -3.599092483520508, -2.951037645339966, -2.302982807159424, -1.6549277305603027, -1.0068726539611816, -0.35881781578063965, 0.28923702239990234, 0.9372940063476562, 1.5853489637374878, 2.2334039211273193, 2.8814587593078613, 3.5295138359069824, 4.1775689125061035, 4.825623512268066, 5.4736785888671875, 6.121733665466309, 6.76978874206543, 7.417843818664551, 8.065898895263672, 8.713953018188477, 9.362009048461914, 10.010063171386719, 10.65811824798584, 11.306173324584961, 11.954228401184082, 12.602283477783203, 13.250338554382324, 13.898393630981445, 14.54644775390625, 15.194502830505371, 15.842557907104492, 16.490612030029297, 17.1386661529541, 17.78672218322754, 18.434776306152344, 19.08283233642578, 19.730886459350586, 20.378942489624023, 21.026996612548828, 21.675052642822266]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 8.0, 2.0, 2.0, 5.0, 10.0, 12.0, 5.0, 11.0, 16.0, 16.0, 15.0, 16.0, 23.0, 23.0, 28.0, 34.0, 33.0, 48.0, 32.0, 43.0, 49.0, 42.0, 36.0, 33.0, 39.0, 42.0, 41.0, 37.0, 30.0, 36.0, 38.0, 38.0, 20.0, 33.0, 17.0, 20.0, 18.0, 16.0, 10.0, 10.0, 9.0, 7.0, 2.0, 3.0, 0.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.51458740234375, -19.896921157836914, -19.279253005981445, -18.66158676147461, -18.04391860961914, -17.426252365112305, -16.808584213256836, -16.19091796875, -15.573250770568848, -14.955583572387695, -14.337916374206543, -13.72024917602539, -13.102582931518555, -12.484914779663086, -11.86724853515625, -11.249581336975098, -10.631914138793945, -10.014246940612793, -9.39657974243164, -8.778912544250488, -8.161245346069336, -7.543578624725342, -6.925911903381348, -6.308244705200195, -5.690577507019043, -5.072910308837891, -4.455243110656738, -3.837576389312744, -3.219909191131592, -2.6022419929504395, -1.9845750331878662, -1.366908073425293, -0.7492408752441406, -0.13157379627227783, 0.48609328269958496, 1.1037603616714478, 1.7214274406433105, 2.339094638824463, 2.956761598587036, 3.5744285583496094, 4.192095756530762, 4.809762954711914, 5.427430152893066, 6.0450968742370605, 6.662764072418213, 7.280431270599365, 7.898097991943359, 8.515765190124512, 9.133432388305664, 9.751099586486816, 10.368766784667969, 10.986433982849121, 11.604101181030273, 12.22176742553711, 12.839434623718262, 13.457101821899414, 14.074769020080566, 14.692436218261719, 15.310103416442871, 15.927770614624023, 16.54543685913086, 17.163105010986328, 17.780771255493164, 18.3984375, 19.01610565185547]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 4.0, 3.0, 7.0, 7.0, 12.0, 15.0, 45.0, 45.0, 67.0, 94.0, 129.0, 199.0, 311.0, 380.0, 602.0, 857.0, 1168.0, 1694.0, 2515.0, 3724.0, 5178.0, 7746.0, 11387.0, 17138.0, 25948.0, 39814.0, 63043.0, 100954.0, 158685.0, 197439.0, 147692.0, 91621.0, 58352.0, 37259.0, 24537.0, 15954.0, 10707.0, 7368.0, 4916.0, 3372.0, 2345.0, 1565.0, 1113.0, 824.0, 556.0, 398.0, 249.0, 162.0, 125.0, 81.0, 56.0, 33.0, 26.0, 11.0, 12.0, 12.0, 6.0, 3.0, 3.0, 1.0, 1.0], "bins": [-2.904296875, -2.814697265625, -2.72509765625, -2.635498046875, -2.5458984375, -2.456298828125, -2.36669921875, -2.277099609375, -2.1875, -2.097900390625, -2.00830078125, -1.918701171875, -1.8291015625, -1.739501953125, -1.64990234375, -1.560302734375, -1.470703125, -1.381103515625, -1.29150390625, -1.201904296875, -1.1123046875, -1.022705078125, -0.93310546875, -0.843505859375, -0.75390625, -0.664306640625, -0.57470703125, -0.485107421875, -0.3955078125, -0.305908203125, -0.21630859375, -0.126708984375, -0.037109375, 0.052490234375, 0.14208984375, 0.231689453125, 0.3212890625, 0.410888671875, 0.50048828125, 0.590087890625, 0.6796875, 0.769287109375, 0.85888671875, 0.948486328125, 1.0380859375, 1.127685546875, 1.21728515625, 1.306884765625, 1.396484375, 1.486083984375, 1.57568359375, 1.665283203125, 1.7548828125, 1.844482421875, 1.93408203125, 2.023681640625, 2.11328125, 2.202880859375, 2.29248046875, 2.382080078125, 2.4716796875, 2.561279296875, 2.65087890625, 2.740478515625, 2.830078125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 9.0, 6.0, 6.0, 3.0, 8.0, 10.0, 15.0, 12.0, 12.0, 6.0, 20.0, 24.0, 24.0, 28.0, 31.0, 26.0, 36.0, 41.0, 35.0, 30.0, 33.0, 40.0, 32.0, 39.0, 38.0, 41.0, 29.0, 43.0, 31.0, 29.0, 37.0, 29.0, 27.0, 37.0, 23.0, 21.0, 13.0, 13.0, 19.0, 13.0, 7.0, 5.0, 5.0, 4.0, 3.0, 6.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0], "bins": [-19.796875, -19.217529296875, -18.63818359375, -18.058837890625, -17.4794921875, -16.900146484375, -16.32080078125, -15.741455078125, -15.162109375, -14.582763671875, -14.00341796875, -13.424072265625, -12.8447265625, -12.265380859375, -11.68603515625, -11.106689453125, -10.52734375, -9.947998046875, -9.36865234375, -8.789306640625, -8.2099609375, -7.630615234375, -7.05126953125, -6.471923828125, -5.892578125, -5.313232421875, -4.73388671875, -4.154541015625, -3.5751953125, -2.995849609375, -2.41650390625, -1.837158203125, -1.2578125, -0.678466796875, -0.09912109375, 0.480224609375, 1.0595703125, 1.638916015625, 2.21826171875, 2.797607421875, 3.376953125, 3.956298828125, 4.53564453125, 5.114990234375, 5.6943359375, 6.273681640625, 6.85302734375, 7.432373046875, 8.01171875, 8.591064453125, 9.17041015625, 9.749755859375, 10.3291015625, 10.908447265625, 11.48779296875, 12.067138671875, 12.646484375, 13.225830078125, 13.80517578125, 14.384521484375, 14.9638671875, 15.543212890625, 16.12255859375, 16.701904296875, 17.28125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 3.0, 7.0, 8.0, 7.0, 10.0, 17.0, 21.0, 42.0, 63.0, 62.0, 101.0, 147.0, 261.0, 352.0, 556.0, 781.0, 1220.0, 1827.0, 2811.0, 4199.0, 6427.0, 9930.0, 15313.0, 24128.0, 37988.0, 62263.0, 103194.0, 173169.0, 216582.0, 149848.0, 89236.0, 54052.0, 33516.0, 21006.0, 13578.0, 8685.0, 5834.0, 3780.0, 2485.0, 1678.0, 1094.0, 677.0, 511.0, 359.0, 245.0, 169.0, 107.0, 71.0, 51.0, 36.0, 24.0, 12.0, 9.0, 4.0, 4.0, 1.0, 3.0, 0.0, 4.0, 1.0, 1.0], "bins": [-2.61328125, -2.529937744140625, -2.44659423828125, -2.363250732421875, -2.2799072265625, -2.196563720703125, -2.11322021484375, -2.029876708984375, -1.946533203125, -1.863189697265625, -1.77984619140625, -1.696502685546875, -1.6131591796875, -1.529815673828125, -1.44647216796875, -1.363128662109375, -1.27978515625, -1.196441650390625, -1.11309814453125, -1.029754638671875, -0.9464111328125, -0.863067626953125, -0.77972412109375, -0.696380615234375, -0.613037109375, -0.529693603515625, -0.44635009765625, -0.363006591796875, -0.2796630859375, -0.196319580078125, -0.11297607421875, -0.029632568359375, 0.0537109375, 0.137054443359375, 0.22039794921875, 0.303741455078125, 0.3870849609375, 0.470428466796875, 0.55377197265625, 0.637115478515625, 0.720458984375, 0.803802490234375, 0.88714599609375, 0.970489501953125, 1.0538330078125, 1.137176513671875, 1.22052001953125, 1.303863525390625, 1.38720703125, 1.470550537109375, 1.55389404296875, 1.637237548828125, 1.7205810546875, 1.803924560546875, 1.88726806640625, 1.970611572265625, 2.053955078125, 2.137298583984375, 2.22064208984375, 2.303985595703125, 2.3873291015625, 2.470672607421875, 2.55401611328125, 2.637359619140625, 2.720703125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 4.0, 5.0, 5.0, 15.0, 9.0, 12.0, 12.0, 18.0, 14.0, 12.0, 15.0, 19.0, 28.0, 37.0, 31.0, 35.0, 36.0, 46.0, 40.0, 38.0, 31.0, 32.0, 40.0, 49.0, 39.0, 51.0, 32.0, 33.0, 31.0, 28.0, 29.0, 28.0, 14.0, 28.0, 19.0, 15.0, 13.0, 17.0, 12.0, 5.0, 8.0, 5.0, 7.0, 0.0, 6.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-12.1171875, -11.7501220703125, -11.383056640625, -11.0159912109375, -10.64892578125, -10.2818603515625, -9.914794921875, -9.5477294921875, -9.1806640625, -8.8135986328125, -8.446533203125, -8.0794677734375, -7.71240234375, -7.3453369140625, -6.978271484375, -6.6112060546875, -6.244140625, -5.8770751953125, -5.510009765625, -5.1429443359375, -4.77587890625, -4.4088134765625, -4.041748046875, -3.6746826171875, -3.3076171875, -2.9405517578125, -2.573486328125, -2.2064208984375, -1.83935546875, -1.4722900390625, -1.105224609375, -0.7381591796875, -0.37109375, -0.0040283203125, 0.363037109375, 0.7301025390625, 1.09716796875, 1.4642333984375, 1.831298828125, 2.1983642578125, 2.5654296875, 2.9324951171875, 3.299560546875, 3.6666259765625, 4.03369140625, 4.4007568359375, 4.767822265625, 5.1348876953125, 5.501953125, 5.8690185546875, 6.236083984375, 6.6031494140625, 6.97021484375, 7.3372802734375, 7.704345703125, 8.0714111328125, 8.4384765625, 8.8055419921875, 9.172607421875, 9.5396728515625, 9.90673828125, 10.2738037109375, 10.640869140625, 11.0079345703125, 11.375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 4.0, 2.0, 4.0, 4.0, 10.0, 10.0, 12.0, 22.0, 42.0, 32.0, 75.0, 89.0, 129.0, 198.0, 253.0, 352.0, 567.0, 800.0, 1159.0, 1830.0, 2825.0, 4425.0, 6961.0, 11390.0, 19355.0, 34119.0, 63647.0, 134668.0, 318263.0, 233029.0, 97268.0, 48522.0, 26813.0, 15813.0, 9304.0, 5812.0, 3707.0, 2304.0, 1486.0, 1045.0, 688.0, 450.0, 317.0, 211.0, 155.0, 119.0, 85.0, 50.0, 37.0, 33.0, 19.0, 11.0, 10.0, 12.0, 5.0, 6.0, 7.0, 2.0, 1.0, 2.0], "bins": [-0.171630859375, -0.1663970947265625, -0.161163330078125, -0.1559295654296875, -0.15069580078125, -0.1454620361328125, -0.140228271484375, -0.1349945068359375, -0.1297607421875, -0.1245269775390625, -0.119293212890625, -0.1140594482421875, -0.10882568359375, -0.1035919189453125, -0.098358154296875, -0.0931243896484375, -0.087890625, -0.0826568603515625, -0.077423095703125, -0.0721893310546875, -0.06695556640625, -0.0617218017578125, -0.056488037109375, -0.0512542724609375, -0.0460205078125, -0.0407867431640625, -0.035552978515625, -0.0303192138671875, -0.02508544921875, -0.0198516845703125, -0.014617919921875, -0.0093841552734375, -0.004150390625, 0.0010833740234375, 0.006317138671875, 0.0115509033203125, 0.01678466796875, 0.0220184326171875, 0.027252197265625, 0.0324859619140625, 0.0377197265625, 0.0429534912109375, 0.048187255859375, 0.0534210205078125, 0.05865478515625, 0.0638885498046875, 0.069122314453125, 0.0743560791015625, 0.07958984375, 0.0848236083984375, 0.090057373046875, 0.0952911376953125, 0.10052490234375, 0.1057586669921875, 0.110992431640625, 0.1162261962890625, 0.1214599609375, 0.1266937255859375, 0.131927490234375, 0.1371612548828125, 0.14239501953125, 0.1476287841796875, 0.152862548828125, 0.1580963134765625, 0.163330078125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 8.0, 3.0, 7.0, 8.0, 7.0, 12.0, 16.0, 18.0, 26.0, 25.0, 41.0, 40.0, 59.0, 51.0, 76.0, 58.0, 69.0, 72.0, 67.0, 64.0, 38.0, 51.0, 49.0, 28.0, 22.0, 27.0, 16.0, 22.0, 13.0, 8.0, 2.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4928321838378906e-05, -3.3882446587085724e-05, -3.283657133579254e-05, -3.179069608449936e-05, -3.074482083320618e-05, -2.9698945581912994e-05, -2.8653070330619812e-05, -2.760719507932663e-05, -2.6561319828033447e-05, -2.5515444576740265e-05, -2.4469569325447083e-05, -2.34236940741539e-05, -2.2377818822860718e-05, -2.1331943571567535e-05, -2.0286068320274353e-05, -1.924019306898117e-05, -1.8194317817687988e-05, -1.7148442566394806e-05, -1.6102567315101624e-05, -1.5056692063808441e-05, -1.4010816812515259e-05, -1.2964941561222076e-05, -1.1919066309928894e-05, -1.0873191058635712e-05, -9.82731580734253e-06, -8.781440556049347e-06, -7.735565304756165e-06, -6.689690053462982e-06, -5.6438148021698e-06, -4.5979395508766174e-06, -3.552064299583435e-06, -2.5061890482902527e-06, -1.4603137969970703e-06, -4.1443854570388794e-07, 6.314367055892944e-07, 1.6773119568824768e-06, 2.723187208175659e-06, 3.7690624594688416e-06, 4.814937710762024e-06, 5.860812962055206e-06, 6.906688213348389e-06, 7.952563464641571e-06, 8.998438715934753e-06, 1.0044313967227936e-05, 1.1090189218521118e-05, 1.21360644698143e-05, 1.3181939721107483e-05, 1.4227814972400665e-05, 1.5273690223693848e-05, 1.631956547498703e-05, 1.7365440726280212e-05, 1.8411315977573395e-05, 1.9457191228866577e-05, 2.050306648015976e-05, 2.1548941731452942e-05, 2.2594816982746124e-05, 2.3640692234039307e-05, 2.468656748533249e-05, 2.573244273662567e-05, 2.6778317987918854e-05, 2.7824193239212036e-05, 2.887006849050522e-05, 2.99159437417984e-05, 3.096181899309158e-05, 3.2007694244384766e-05]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 4.0, 5.0, 4.0, 6.0, 8.0, 11.0, 8.0, 18.0, 17.0, 29.0, 29.0, 62.0, 75.0, 91.0, 134.0, 167.0, 259.0, 369.0, 461.0, 718.0, 959.0, 1456.0, 2216.0, 3410.0, 5446.0, 8903.0, 14855.0, 26149.0, 47141.0, 91489.0, 207895.0, 338681.0, 139744.0, 68229.0, 36652.0, 20621.0, 11820.0, 7131.0, 4469.0, 2819.0, 1809.0, 1241.0, 828.0, 597.0, 411.0, 311.0, 242.0, 151.0, 116.0, 77.0, 52.0, 54.0, 32.0, 23.0, 19.0, 11.0, 10.0, 9.0, 4.0, 3.0, 4.0, 6.0, 3.0], "bins": [-0.415771484375, -0.40289306640625, -0.3900146484375, -0.37713623046875, -0.3642578125, -0.35137939453125, -0.3385009765625, -0.32562255859375, -0.312744140625, -0.29986572265625, -0.2869873046875, -0.27410888671875, -0.26123046875, -0.24835205078125, -0.2354736328125, -0.22259521484375, -0.209716796875, -0.19683837890625, -0.1839599609375, -0.17108154296875, -0.158203125, -0.14532470703125, -0.1324462890625, -0.11956787109375, -0.106689453125, -0.09381103515625, -0.0809326171875, -0.06805419921875, -0.05517578125, -0.04229736328125, -0.0294189453125, -0.01654052734375, -0.003662109375, 0.00921630859375, 0.0220947265625, 0.03497314453125, 0.0478515625, 0.06072998046875, 0.0736083984375, 0.08648681640625, 0.099365234375, 0.11224365234375, 0.1251220703125, 0.13800048828125, 0.15087890625, 0.16375732421875, 0.1766357421875, 0.18951416015625, 0.202392578125, 0.21527099609375, 0.2281494140625, 0.24102783203125, 0.25390625, 0.26678466796875, 0.2796630859375, 0.29254150390625, 0.305419921875, 0.31829833984375, 0.3311767578125, 0.34405517578125, 0.35693359375, 0.36981201171875, 0.3826904296875, 0.39556884765625, 0.408447265625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 6.0, 1.0, 1.0, 4.0, 1.0, 4.0, 4.0, 8.0, 9.0, 8.0, 14.0, 20.0, 16.0, 27.0, 23.0, 41.0, 51.0, 71.0, 81.0, 94.0, 92.0, 85.0, 62.0, 53.0, 40.0, 46.0, 34.0, 31.0, 15.0, 14.0, 13.0, 11.0, 11.0, 4.0, 8.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.130859375, -0.1268157958984375, -0.122772216796875, -0.1187286376953125, -0.11468505859375, -0.1106414794921875, -0.106597900390625, -0.1025543212890625, -0.0985107421875, -0.0944671630859375, -0.090423583984375, -0.0863800048828125, -0.08233642578125, -0.0782928466796875, -0.074249267578125, -0.0702056884765625, -0.066162109375, -0.0621185302734375, -0.058074951171875, -0.0540313720703125, -0.04998779296875, -0.0459442138671875, -0.041900634765625, -0.0378570556640625, -0.0338134765625, -0.0297698974609375, -0.025726318359375, -0.0216827392578125, -0.01763916015625, -0.0135955810546875, -0.009552001953125, -0.0055084228515625, -0.00146484375, 0.0025787353515625, 0.006622314453125, 0.0106658935546875, 0.01470947265625, 0.0187530517578125, 0.022796630859375, 0.0268402099609375, 0.0308837890625, 0.0349273681640625, 0.038970947265625, 0.0430145263671875, 0.04705810546875, 0.0511016845703125, 0.055145263671875, 0.0591888427734375, 0.063232421875, 0.0672760009765625, 0.071319580078125, 0.0753631591796875, 0.07940673828125, 0.0834503173828125, 0.087493896484375, 0.0915374755859375, 0.0955810546875, 0.0996246337890625, 0.103668212890625, 0.1077117919921875, 0.11175537109375, 0.1157989501953125, 0.119842529296875, 0.1238861083984375, 0.1279296875]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 6.0, 6.0, 9.0, 6.0, 15.0, 10.0, 17.0, 27.0, 31.0, 22.0, 30.0, 39.0, 35.0, 52.0, 52.0, 63.0, 47.0, 61.0, 61.0, 46.0, 59.0, 46.0, 44.0, 37.0, 32.0, 28.0, 33.0, 22.0, 10.0, 11.0, 9.0, 8.0, 11.0, 4.0, 6.0, 2.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.753684997558594, -19.107946395874023, -18.462209701538086, -17.816471099853516, -17.170734405517578, -16.524995803833008, -15.879258155822754, -15.2335205078125, -14.587782859802246, -13.942045211791992, -13.296307563781738, -12.650569915771484, -12.004831314086914, -11.359094619750977, -10.713356018066406, -10.067618370056152, -9.421880722045898, -8.776143074035645, -8.13040542602539, -7.4846673011779785, -6.838929653167725, -6.193192005157471, -5.547453880310059, -4.901716232299805, -4.255978584289551, -3.610240936279297, -2.964503049850464, -2.318765163421631, -1.673027515411377, -1.027289867401123, -0.38155198097229004, 0.26418590545654297, 0.9099235534667969, 1.5556613206863403, 2.201399087905884, 2.847136974334717, 3.4928746223449707, 4.138612270355225, 4.784350395202637, 5.430088043212891, 6.0758256912231445, 6.721563339233398, 7.367300987243652, 8.013038635253906, 8.658777236938477, 9.304513931274414, 9.950252532958984, 10.595990180969238, 11.241727828979492, 11.887465476989746, 12.533203125, 13.178940773010254, 13.824678421020508, 14.470417022705078, 15.116154670715332, 15.761892318725586, 16.407630920410156, 17.053369522094727, 17.699106216430664, 18.344844818115234, 18.990581512451172, 19.636320114135742, 20.28205680847168, 20.92779541015625, 21.573532104492188]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 8.0, 2.0, 2.0, 5.0, 11.0, 10.0, 6.0, 11.0, 14.0, 18.0, 15.0, 15.0, 25.0, 23.0, 26.0, 34.0, 34.0, 46.0, 34.0, 43.0, 51.0, 38.0, 38.0, 33.0, 39.0, 46.0, 38.0, 37.0, 29.0, 37.0, 35.0, 38.0, 24.0, 31.0, 17.0, 20.0, 16.0, 19.0, 9.0, 10.0, 9.0, 7.0, 2.0, 3.0, 0.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.323606491088867, -19.70870018005371, -19.093795776367188, -18.47888946533203, -17.863983154296875, -17.24907684326172, -16.634172439575195, -16.01926612854004, -15.404359817504883, -14.789454460144043, -14.174548149108887, -13.559642791748047, -12.94473648071289, -12.32983112335205, -11.714925765991211, -11.100019454956055, -10.485114097595215, -9.870208740234375, -9.255302429199219, -8.640397071838379, -8.025490760803223, -7.410585403442383, -6.795679569244385, -6.180773735046387, -5.565867900848389, -4.950962066650391, -4.336056232452393, -3.7211506366729736, -3.1062448024749756, -2.4913389682769775, -1.8764333724975586, -1.2615275382995605, -0.6466217041015625, -0.03171592950820923, 0.583189845085144, 1.1980955600738525, 1.8130013942718506, 2.4279072284698486, 3.0428128242492676, 3.6577186584472656, 4.272624492645264, 4.887530326843262, 5.50243616104126, 6.117341995239258, 6.732247352600098, 7.347153663635254, 7.962059020996094, 8.57696533203125, 9.19187068939209, 9.80677604675293, 10.421682357788086, 11.036587715148926, 11.651494026184082, 12.266399383544922, 12.881305694580078, 13.496211051940918, 14.111116409301758, 14.726021766662598, 15.340928077697754, 15.955833435058594, 16.57073974609375, 17.185646057128906, 17.80055046081543, 18.415456771850586, 19.030363082885742]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 7.0, 6.0, 8.0, 15.0, 23.0, 39.0, 66.0, 118.0, 148.0, 271.0, 380.0, 625.0, 980.0, 1503.0, 2258.0, 3723.0, 5560.0, 8663.0, 12581.0, 18700.0, 26827.0, 37164.0, 49549.0, 64844.0, 78285.0, 90931.0, 98786.0, 100507.0, 95751.0, 84444.0, 70423.0, 56255.0, 42556.0, 30906.0, 21690.0, 15041.0, 9879.0, 6672.0, 4342.0, 2917.0, 1759.0, 1232.0, 765.0, 506.0, 309.0, 195.0, 129.0, 88.0, 46.0, 35.0, 24.0, 18.0, 8.0, 6.0, 1.0, 1.0, 2.0], "bins": [-12.1328125, -11.7781982421875, -11.423583984375, -11.0689697265625, -10.71435546875, -10.3597412109375, -10.005126953125, -9.6505126953125, -9.2958984375, -8.9412841796875, -8.586669921875, -8.2320556640625, -7.87744140625, -7.5228271484375, -7.168212890625, -6.8135986328125, -6.458984375, -6.1043701171875, -5.749755859375, -5.3951416015625, -5.04052734375, -4.6859130859375, -4.331298828125, -3.9766845703125, -3.6220703125, -3.2674560546875, -2.912841796875, -2.5582275390625, -2.20361328125, -1.8489990234375, -1.494384765625, -1.1397705078125, -0.78515625, -0.4305419921875, -0.075927734375, 0.2786865234375, 0.63330078125, 0.9879150390625, 1.342529296875, 1.6971435546875, 2.0517578125, 2.4063720703125, 2.760986328125, 3.1156005859375, 3.47021484375, 3.8248291015625, 4.179443359375, 4.5340576171875, 4.888671875, 5.2432861328125, 5.597900390625, 5.9525146484375, 6.30712890625, 6.6617431640625, 7.016357421875, 7.3709716796875, 7.7255859375, 8.0802001953125, 8.434814453125, 8.7894287109375, 9.14404296875, 9.4986572265625, 9.853271484375, 10.2078857421875, 10.5625]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 7.0, 2.0, 5.0, 10.0, 7.0, 9.0, 11.0, 7.0, 19.0, 16.0, 25.0, 20.0, 17.0, 24.0, 28.0, 39.0, 44.0, 30.0, 27.0, 34.0, 38.0, 49.0, 33.0, 38.0, 37.0, 39.0, 40.0, 27.0, 31.0, 34.0, 33.0, 33.0, 15.0, 35.0, 19.0, 26.0, 16.0, 11.0, 16.0, 11.0, 9.0, 7.0, 6.0, 3.0, 2.0, 6.0, 4.0, 1.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-18.625, -18.061767578125, -17.49853515625, -16.935302734375, -16.3720703125, -15.808837890625, -15.24560546875, -14.682373046875, -14.119140625, -13.555908203125, -12.99267578125, -12.429443359375, -11.8662109375, -11.302978515625, -10.73974609375, -10.176513671875, -9.61328125, -9.050048828125, -8.48681640625, -7.923583984375, -7.3603515625, -6.797119140625, -6.23388671875, -5.670654296875, -5.107421875, -4.544189453125, -3.98095703125, -3.417724609375, -2.8544921875, -2.291259765625, -1.72802734375, -1.164794921875, -0.6015625, -0.038330078125, 0.52490234375, 1.088134765625, 1.6513671875, 2.214599609375, 2.77783203125, 3.341064453125, 3.904296875, 4.467529296875, 5.03076171875, 5.593994140625, 6.1572265625, 6.720458984375, 7.28369140625, 7.846923828125, 8.41015625, 8.973388671875, 9.53662109375, 10.099853515625, 10.6630859375, 11.226318359375, 11.78955078125, 12.352783203125, 12.916015625, 13.479248046875, 14.04248046875, 14.605712890625, 15.1689453125, 15.732177734375, 16.29541015625, 16.858642578125, 17.421875]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [7.0, 5.0, 12.0, 13.0, 22.0, 49.0, 60.0, 88.0, 165.0, 223.0, 368.0, 506.0, 825.0, 1165.0, 1796.0, 2708.0, 3829.0, 5513.0, 8082.0, 11628.0, 16451.0, 22680.0, 30432.0, 40625.0, 51924.0, 63340.0, 74730.0, 83746.0, 89442.0, 90193.0, 86256.0, 77617.0, 66850.0, 55210.0, 44078.0, 33519.0, 25085.0, 17794.0, 12909.0, 9074.0, 6413.0, 4397.0, 2925.0, 1997.0, 1267.0, 851.0, 604.0, 395.0, 240.0, 155.0, 91.0, 69.0, 50.0, 44.0, 17.0, 16.0, 12.0, 6.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-9.3515625, -9.03076171875, -8.7099609375, -8.38916015625, -8.068359375, -7.74755859375, -7.4267578125, -7.10595703125, -6.78515625, -6.46435546875, -6.1435546875, -5.82275390625, -5.501953125, -5.18115234375, -4.8603515625, -4.53955078125, -4.21875, -3.89794921875, -3.5771484375, -3.25634765625, -2.935546875, -2.61474609375, -2.2939453125, -1.97314453125, -1.65234375, -1.33154296875, -1.0107421875, -0.68994140625, -0.369140625, -0.04833984375, 0.2724609375, 0.59326171875, 0.9140625, 1.23486328125, 1.5556640625, 1.87646484375, 2.197265625, 2.51806640625, 2.8388671875, 3.15966796875, 3.48046875, 3.80126953125, 4.1220703125, 4.44287109375, 4.763671875, 5.08447265625, 5.4052734375, 5.72607421875, 6.046875, 6.36767578125, 6.6884765625, 7.00927734375, 7.330078125, 7.65087890625, 7.9716796875, 8.29248046875, 8.61328125, 8.93408203125, 9.2548828125, 9.57568359375, 9.896484375, 10.21728515625, 10.5380859375, 10.85888671875, 11.1796875]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 1.0, 6.0, 10.0, 3.0, 9.0, 10.0, 10.0, 6.0, 9.0, 14.0, 20.0, 16.0, 20.0, 23.0, 21.0, 20.0, 37.0, 22.0, 35.0, 29.0, 28.0, 40.0, 24.0, 29.0, 33.0, 31.0, 33.0, 34.0, 35.0, 36.0, 29.0, 33.0, 29.0, 23.0, 21.0, 28.0, 24.0, 19.0, 17.0, 20.0, 16.0, 13.0, 8.0, 16.0, 7.0, 12.0, 6.0, 8.0, 5.0, 7.0, 4.0, 7.0, 6.0, 4.0, 2.0, 3.0, 2.0], "bins": [-10.328125, -10.0126953125, -9.697265625, -9.3818359375, -9.06640625, -8.7509765625, -8.435546875, -8.1201171875, -7.8046875, -7.4892578125, -7.173828125, -6.8583984375, -6.54296875, -6.2275390625, -5.912109375, -5.5966796875, -5.28125, -4.9658203125, -4.650390625, -4.3349609375, -4.01953125, -3.7041015625, -3.388671875, -3.0732421875, -2.7578125, -2.4423828125, -2.126953125, -1.8115234375, -1.49609375, -1.1806640625, -0.865234375, -0.5498046875, -0.234375, 0.0810546875, 0.396484375, 0.7119140625, 1.02734375, 1.3427734375, 1.658203125, 1.9736328125, 2.2890625, 2.6044921875, 2.919921875, 3.2353515625, 3.55078125, 3.8662109375, 4.181640625, 4.4970703125, 4.8125, 5.1279296875, 5.443359375, 5.7587890625, 6.07421875, 6.3896484375, 6.705078125, 7.0205078125, 7.3359375, 7.6513671875, 7.966796875, 8.2822265625, 8.59765625, 8.9130859375, 9.228515625, 9.5439453125, 9.859375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 5.0, 8.0, 12.0, 15.0, 36.0, 48.0, 82.0, 125.0, 186.0, 267.0, 424.0, 605.0, 944.0, 1521.0, 2424.0, 3984.0, 6123.0, 9508.0, 15156.0, 22577.0, 33953.0, 49389.0, 67398.0, 87527.0, 104621.0, 115470.0, 115398.0, 105852.0, 88348.0, 67941.0, 49748.0, 34042.0, 22977.0, 15107.0, 9737.0, 6090.0, 4019.0, 2413.0, 1555.0, 1062.0, 661.0, 445.0, 267.0, 186.0, 121.0, 63.0, 59.0, 24.0, 18.0, 10.0, 3.0, 3.0, 4.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 4.0], "bins": [-3.66015625, -3.5382080078125, -3.416259765625, -3.2943115234375, -3.17236328125, -3.0504150390625, -2.928466796875, -2.8065185546875, -2.6845703125, -2.5626220703125, -2.440673828125, -2.3187255859375, -2.19677734375, -2.0748291015625, -1.952880859375, -1.8309326171875, -1.708984375, -1.5870361328125, -1.465087890625, -1.3431396484375, -1.22119140625, -1.0992431640625, -0.977294921875, -0.8553466796875, -0.7333984375, -0.6114501953125, -0.489501953125, -0.3675537109375, -0.24560546875, -0.1236572265625, -0.001708984375, 0.1202392578125, 0.2421875, 0.3641357421875, 0.486083984375, 0.6080322265625, 0.72998046875, 0.8519287109375, 0.973876953125, 1.0958251953125, 1.2177734375, 1.3397216796875, 1.461669921875, 1.5836181640625, 1.70556640625, 1.8275146484375, 1.949462890625, 2.0714111328125, 2.193359375, 2.3153076171875, 2.437255859375, 2.5592041015625, 2.68115234375, 2.8031005859375, 2.925048828125, 3.0469970703125, 3.1689453125, 3.2908935546875, 3.412841796875, 3.5347900390625, 3.65673828125, 3.7786865234375, 3.900634765625, 4.0225830078125, 4.14453125]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 10.0, 8.0, 10.0, 14.0, 10.0, 17.0, 26.0, 24.0, 24.0, 30.0, 32.0, 33.0, 34.0, 36.0, 53.0, 50.0, 51.0, 44.0, 50.0, 50.0, 43.0, 43.0, 40.0, 31.0, 37.0, 30.0, 27.0, 34.0, 22.0, 21.0, 17.0, 5.0, 6.0, 8.0, 4.0, 4.0, 7.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0004680156707763672, -0.00045404955744743347, -0.00044008344411849976, -0.00042611733078956604, -0.0004121512174606323, -0.0003981851041316986, -0.0003842189908027649, -0.0003702528774738312, -0.00035628676414489746, -0.00034232065081596375, -0.00032835453748703003, -0.0003143884241580963, -0.0003004223108291626, -0.0002864561975002289, -0.00027249008417129517, -0.00025852397084236145, -0.00024455785751342773, -0.00023059174418449402, -0.0002166256308555603, -0.0002026595175266266, -0.00018869340419769287, -0.00017472729086875916, -0.00016076117753982544, -0.00014679506421089172, -0.000132828950881958, -0.00011886283755302429, -0.00010489672422409058, -9.093061089515686e-05, -7.696449756622314e-05, -6.299838423728943e-05, -4.903227090835571e-05, -3.5066157579422e-05, -2.110004425048828e-05, -7.1339309215545654e-06, 6.83218240737915e-06, 2.0798295736312866e-05, 3.476440906524658e-05, 4.87305223941803e-05, 6.269663572311401e-05, 7.666274905204773e-05, 9.062886238098145e-05, 0.00010459497570991516, 0.00011856108903884888, 0.0001325272023677826, 0.0001464933156967163, 0.00016045942902565002, 0.00017442554235458374, 0.00018839165568351746, 0.00020235776901245117, 0.0002163238823413849, 0.0002302899956703186, 0.0002442561089992523, 0.00025822222232818604, 0.00027218833565711975, 0.00028615444898605347, 0.0003001205623149872, 0.0003140866756439209, 0.0003280527889728546, 0.00034201890230178833, 0.00035598501563072205, 0.00036995112895965576, 0.0003839172422885895, 0.0003978833556175232, 0.0004118494689464569, 0.0004258155822753906]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 9.0, 4.0, 13.0, 25.0, 45.0, 69.0, 97.0, 147.0, 223.0, 401.0, 582.0, 921.0, 1501.0, 2435.0, 4031.0, 6626.0, 10669.0, 17254.0, 27499.0, 42566.0, 62790.0, 87169.0, 110564.0, 126278.0, 129335.0, 117116.0, 96053.0, 70929.0, 48892.0, 31905.0, 20082.0, 12517.0, 7608.0, 4706.0, 2800.0, 1760.0, 1079.0, 691.0, 423.0, 283.0, 161.0, 123.0, 62.0, 43.0, 18.0, 32.0, 6.0, 10.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.2734375, -4.13177490234375, -3.9901123046875, -3.84844970703125, -3.706787109375, -3.56512451171875, -3.4234619140625, -3.28179931640625, -3.14013671875, -2.99847412109375, -2.8568115234375, -2.71514892578125, -2.573486328125, -2.43182373046875, -2.2901611328125, -2.14849853515625, -2.0068359375, -1.86517333984375, -1.7235107421875, -1.58184814453125, -1.440185546875, -1.29852294921875, -1.1568603515625, -1.01519775390625, -0.87353515625, -0.73187255859375, -0.5902099609375, -0.44854736328125, -0.306884765625, -0.16522216796875, -0.0235595703125, 0.11810302734375, 0.259765625, 0.40142822265625, 0.5430908203125, 0.68475341796875, 0.826416015625, 0.96807861328125, 1.1097412109375, 1.25140380859375, 1.39306640625, 1.53472900390625, 1.6763916015625, 1.81805419921875, 1.959716796875, 2.10137939453125, 2.2430419921875, 2.38470458984375, 2.5263671875, 2.66802978515625, 2.8096923828125, 2.95135498046875, 3.093017578125, 3.23468017578125, 3.3763427734375, 3.51800537109375, 3.65966796875, 3.80133056640625, 3.9429931640625, 4.08465576171875, 4.226318359375, 4.36798095703125, 4.5096435546875, 4.65130615234375, 4.79296875]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 6.0, 8.0, 9.0, 7.0, 13.0, 11.0, 12.0, 16.0, 24.0, 13.0, 25.0, 26.0, 34.0, 32.0, 33.0, 34.0, 48.0, 40.0, 49.0, 45.0, 48.0, 50.0, 56.0, 53.0, 43.0, 37.0, 26.0, 40.0, 23.0, 28.0, 17.0, 19.0, 14.0, 13.0, 8.0, 6.0, 7.0, 6.0, 6.0, 2.0, 2.0, 3.0, 4.0, 5.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9931640625, -1.9305267333984375, -1.867889404296875, -1.8052520751953125, -1.74261474609375, -1.6799774169921875, -1.617340087890625, -1.5547027587890625, -1.4920654296875, -1.4294281005859375, -1.366790771484375, -1.3041534423828125, -1.24151611328125, -1.1788787841796875, -1.116241455078125, -1.0536041259765625, -0.990966796875, -0.9283294677734375, -0.865692138671875, -0.8030548095703125, -0.74041748046875, -0.6777801513671875, -0.615142822265625, -0.5525054931640625, -0.4898681640625, -0.4272308349609375, -0.364593505859375, -0.3019561767578125, -0.23931884765625, -0.1766815185546875, -0.114044189453125, -0.0514068603515625, 0.01123046875, 0.0738677978515625, 0.136505126953125, 0.1991424560546875, 0.26177978515625, 0.3244171142578125, 0.387054443359375, 0.4496917724609375, 0.5123291015625, 0.5749664306640625, 0.637603759765625, 0.7002410888671875, 0.76287841796875, 0.8255157470703125, 0.888153076171875, 0.9507904052734375, 1.013427734375, 1.0760650634765625, 1.138702392578125, 1.2013397216796875, 1.26397705078125, 1.3266143798828125, 1.389251708984375, 1.4518890380859375, 1.5145263671875, 1.5771636962890625, 1.639801025390625, 1.7024383544921875, 1.76507568359375, 1.8277130126953125, 1.890350341796875, 1.9529876708984375, 2.015625]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 7.0, 8.0, 6.0, 9.0, 12.0, 14.0, 17.0, 11.0, 19.0, 18.0, 28.0, 29.0, 41.0, 46.0, 43.0, 40.0, 44.0, 42.0, 55.0, 52.0, 53.0, 56.0, 51.0, 49.0, 31.0, 29.0, 26.0, 27.0, 20.0, 19.0, 23.0, 18.0, 11.0, 12.0, 8.0, 8.0, 4.0, 1.0, 4.0, 1.0, 4.0, 5.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.630645751953125, -18.050676345825195, -17.470706939697266, -16.890737533569336, -16.310768127441406, -15.730798721313477, -15.150829315185547, -14.570859909057617, -13.990890502929688, -13.410921096801758, -12.830951690673828, -12.250982284545898, -11.671012878417969, -11.091043472290039, -10.51107406616211, -9.93110466003418, -9.351134300231934, -8.771164894104004, -8.191195487976074, -7.6112260818481445, -7.031256675720215, -6.451287269592285, -5.871317386627197, -5.291347980499268, -4.711378574371338, -4.131409168243408, -3.5514397621154785, -2.9714701175689697, -2.39150071144104, -1.8115313053131104, -1.2315616607666016, -0.6515922546386719, -0.07162284851074219, 0.5083466172218323, 1.0883160829544067, 1.668285608291626, 2.2482550144195557, 2.8282244205474854, 3.408194065093994, 3.988163471221924, 4.5681328773498535, 5.148102283477783, 5.728071689605713, 6.308041572570801, 6.8880109786987305, 7.46798038482666, 8.04794979095459, 8.62791919708252, 9.20788860321045, 9.787858009338379, 10.367827415466309, 10.947796821594238, 11.527766227722168, 12.107735633850098, 12.687705993652344, 13.267675399780273, 13.847644805908203, 14.427614212036133, 15.007583618164062, 15.587553024291992, 16.167522430419922, 16.74749183654785, 17.32746124267578, 17.90743064880371, 18.48740005493164]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 5.0, 3.0, 3.0, 6.0, 8.0, 9.0, 10.0, 18.0, 25.0, 10.0, 18.0, 20.0, 25.0, 19.0, 27.0, 33.0, 33.0, 39.0, 39.0, 37.0, 42.0, 36.0, 33.0, 39.0, 32.0, 38.0, 44.0, 41.0, 34.0, 29.0, 37.0, 32.0, 22.0, 23.0, 27.0, 23.0, 15.0, 26.0, 9.0, 9.0, 5.0, 7.0, 7.0, 2.0, 1.0, 0.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.912578582763672, -18.298572540283203, -17.6845645904541, -17.070558547973633, -16.45655059814453, -15.842544555664062, -15.228537559509277, -14.614530563354492, -14.000523567199707, -13.386516571044922, -12.772509574890137, -12.158502578735352, -11.544496536254883, -10.930488586425781, -10.316482543945312, -9.702475547790527, -9.088468551635742, -8.474461555480957, -7.860454559326172, -7.246448040008545, -6.63244104385376, -6.018434047698975, -5.404427528381348, -4.7904205322265625, -4.176413536071777, -3.562406539916992, -2.948399782180786, -2.33439302444458, -1.720386028289795, -1.1063790321350098, -0.4923722743988037, 0.12163448333740234, 0.7356395721435547, 1.3496464490890503, 1.963653326034546, 2.577660083770752, 3.191667079925537, 3.8056740760803223, 4.419680595397949, 5.033687591552734, 5.6476945877075195, 6.261701583862305, 6.87570858001709, 7.489715099334717, 8.103721618652344, 8.717729568481445, 9.331735610961914, 9.9457426071167, 10.559749603271484, 11.17375659942627, 11.787763595581055, 12.40177059173584, 13.015777587890625, 13.629783630371094, 14.243790626525879, 14.857797622680664, 15.47180461883545, 16.085811614990234, 16.699817657470703, 17.313825607299805, 17.927831649780273, 18.541839599609375, 19.155845642089844, 19.769851684570312, 20.383859634399414]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 7.0, 6.0, 6.0, 11.0, 34.0, 39.0, 100.0, 156.0, 257.0, 452.0, 747.0, 1198.0, 2097.0, 3556.0, 5996.0, 10343.0, 16886.0, 27958.0, 44940.0, 72153.0, 111810.0, 166500.0, 239409.0, 322277.0, 407163.0, 467205.0, 487982.0, 458313.0, 389800.0, 305592.0, 223747.0, 155079.0, 102291.0, 66150.0, 41300.0, 25569.0, 15396.0, 8960.0, 5391.0, 3198.0, 1740.0, 1008.0, 655.0, 347.0, 185.0, 112.0, 58.0, 53.0, 30.0, 10.0, 11.0, 7.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-14.234375, -13.7950439453125, -13.355712890625, -12.9163818359375, -12.47705078125, -12.0377197265625, -11.598388671875, -11.1590576171875, -10.7197265625, -10.2803955078125, -9.841064453125, -9.4017333984375, -8.96240234375, -8.5230712890625, -8.083740234375, -7.6444091796875, -7.205078125, -6.7657470703125, -6.326416015625, -5.8870849609375, -5.44775390625, -5.0084228515625, -4.569091796875, -4.1297607421875, -3.6904296875, -3.2510986328125, -2.811767578125, -2.3724365234375, -1.93310546875, -1.4937744140625, -1.054443359375, -0.6151123046875, -0.17578125, 0.2635498046875, 0.702880859375, 1.1422119140625, 1.58154296875, 2.0208740234375, 2.460205078125, 2.8995361328125, 3.3388671875, 3.7781982421875, 4.217529296875, 4.6568603515625, 5.09619140625, 5.5355224609375, 5.974853515625, 6.4141845703125, 6.853515625, 7.2928466796875, 7.732177734375, 8.1715087890625, 8.61083984375, 9.0501708984375, 9.489501953125, 9.9288330078125, 10.3681640625, 10.8074951171875, 11.246826171875, 11.6861572265625, 12.12548828125, 12.5648193359375, 13.004150390625, 13.4434814453125, 13.8828125]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 0.0, 6.0, 5.0, 4.0, 3.0, 3.0, 6.0, 7.0, 11.0, 8.0, 9.0, 15.0, 14.0, 17.0, 14.0, 18.0, 13.0, 30.0, 23.0, 27.0, 33.0, 28.0, 27.0, 32.0, 46.0, 29.0, 30.0, 34.0, 28.0, 30.0, 36.0, 35.0, 29.0, 35.0, 30.0, 30.0, 31.0, 30.0, 26.0, 14.0, 28.0, 17.0, 22.0, 22.0, 17.0, 12.0, 14.0, 6.0, 8.0, 4.0, 3.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0], "bins": [-13.75, -13.3253173828125, -12.900634765625, -12.4759521484375, -12.05126953125, -11.6265869140625, -11.201904296875, -10.7772216796875, -10.3525390625, -9.9278564453125, -9.503173828125, -9.0784912109375, -8.65380859375, -8.2291259765625, -7.804443359375, -7.3797607421875, -6.955078125, -6.5303955078125, -6.105712890625, -5.6810302734375, -5.25634765625, -4.8316650390625, -4.406982421875, -3.9822998046875, -3.5576171875, -3.1329345703125, -2.708251953125, -2.2835693359375, -1.85888671875, -1.4342041015625, -1.009521484375, -0.5848388671875, -0.16015625, 0.2645263671875, 0.689208984375, 1.1138916015625, 1.53857421875, 1.9632568359375, 2.387939453125, 2.8126220703125, 3.2373046875, 3.6619873046875, 4.086669921875, 4.5113525390625, 4.93603515625, 5.3607177734375, 5.785400390625, 6.2100830078125, 6.634765625, 7.0594482421875, 7.484130859375, 7.9088134765625, 8.33349609375, 8.7581787109375, 9.182861328125, 9.6075439453125, 10.0322265625, 10.4569091796875, 10.881591796875, 11.3062744140625, 11.73095703125, 12.1556396484375, 12.580322265625, 13.0050048828125, 13.4296875]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 3.0, 4.0, 2.0, 13.0, 11.0, 32.0, 50.0, 78.0, 147.0, 211.0, 355.0, 581.0, 935.0, 1641.0, 2647.0, 4269.0, 6910.0, 10991.0, 17106.0, 25953.0, 39649.0, 59018.0, 85163.0, 118643.0, 161566.0, 210533.0, 262318.0, 313501.0, 352629.0, 376627.0, 378524.0, 359979.0, 324347.0, 274830.0, 224013.0, 172349.0, 128091.0, 92645.0, 64616.0, 43489.0, 28909.0, 18890.0, 12042.0, 7740.0, 4628.0, 2944.0, 1844.0, 1084.0, 698.0, 427.0, 242.0, 152.0, 77.0, 56.0, 37.0, 27.0, 16.0, 4.0, 4.0, 6.0, 2.0], "bins": [-11.90625, -11.5467529296875, -11.187255859375, -10.8277587890625, -10.46826171875, -10.1087646484375, -9.749267578125, -9.3897705078125, -9.0302734375, -8.6707763671875, -8.311279296875, -7.9517822265625, -7.59228515625, -7.2327880859375, -6.873291015625, -6.5137939453125, -6.154296875, -5.7947998046875, -5.435302734375, -5.0758056640625, -4.71630859375, -4.3568115234375, -3.997314453125, -3.6378173828125, -3.2783203125, -2.9188232421875, -2.559326171875, -2.1998291015625, -1.84033203125, -1.4808349609375, -1.121337890625, -0.7618408203125, -0.40234375, -0.0428466796875, 0.316650390625, 0.6761474609375, 1.03564453125, 1.3951416015625, 1.754638671875, 2.1141357421875, 2.4736328125, 2.8331298828125, 3.192626953125, 3.5521240234375, 3.91162109375, 4.2711181640625, 4.630615234375, 4.9901123046875, 5.349609375, 5.7091064453125, 6.068603515625, 6.4281005859375, 6.78759765625, 7.1470947265625, 7.506591796875, 7.8660888671875, 8.2255859375, 8.5850830078125, 8.944580078125, 9.3040771484375, 9.66357421875, 10.0230712890625, 10.382568359375, 10.7420654296875, 11.1015625]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 2.0, 4.0, 8.0, 6.0, 9.0, 10.0, 11.0, 25.0, 23.0, 32.0, 30.0, 31.0, 39.0, 58.0, 68.0, 82.0, 96.0, 98.0, 132.0, 142.0, 175.0, 170.0, 166.0, 189.0, 188.0, 221.0, 206.0, 193.0, 187.0, 168.0, 177.0, 146.0, 161.0, 127.0, 114.0, 107.0, 94.0, 74.0, 63.0, 58.0, 36.0, 29.0, 29.0, 23.0, 17.0, 17.0, 13.0, 6.0, 4.0, 11.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.4453125, -6.222900390625, -6.00048828125, -5.778076171875, -5.5556640625, -5.333251953125, -5.11083984375, -4.888427734375, -4.666015625, -4.443603515625, -4.22119140625, -3.998779296875, -3.7763671875, -3.553955078125, -3.33154296875, -3.109130859375, -2.88671875, -2.664306640625, -2.44189453125, -2.219482421875, -1.9970703125, -1.774658203125, -1.55224609375, -1.329833984375, -1.107421875, -0.885009765625, -0.66259765625, -0.440185546875, -0.2177734375, 0.004638671875, 0.22705078125, 0.449462890625, 0.671875, 0.894287109375, 1.11669921875, 1.339111328125, 1.5615234375, 1.783935546875, 2.00634765625, 2.228759765625, 2.451171875, 2.673583984375, 2.89599609375, 3.118408203125, 3.3408203125, 3.563232421875, 3.78564453125, 4.008056640625, 4.23046875, 4.452880859375, 4.67529296875, 4.897705078125, 5.1201171875, 5.342529296875, 5.56494140625, 5.787353515625, 6.009765625, 6.232177734375, 6.45458984375, 6.677001953125, 6.8994140625, 7.121826171875, 7.34423828125, 7.566650390625, 7.7890625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 4.0, 7.0, 2.0, 8.0, 7.0, 7.0, 7.0, 6.0, 18.0, 6.0, 19.0, 19.0, 18.0, 29.0, 26.0, 34.0, 23.0, 31.0, 30.0, 34.0, 38.0, 47.0, 69.0, 43.0, 61.0, 37.0, 35.0, 35.0, 41.0, 27.0, 35.0, 35.0, 16.0, 29.0, 13.0, 20.0, 19.0, 16.0, 12.0, 7.0, 10.0, 3.0, 6.0, 6.0, 3.0, 4.0, 2.0, 4.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.981654167175293, -13.473119735717773, -12.96458625793457, -12.456052780151367, -11.947518348693848, -11.438983917236328, -10.930450439453125, -10.421916961669922, -9.913382530212402, -9.404848098754883, -8.89631462097168, -8.387781143188477, -7.879246711730957, -7.370712757110596, -6.862178802490234, -6.353644847869873, -5.845110893249512, -5.33657693862915, -4.828042984008789, -4.319509029388428, -3.8109750747680664, -3.302441120147705, -2.7939071655273438, -2.2853732109069824, -1.776839256286621, -1.2683053016662598, -0.7597713470458984, -0.2512373924255371, 0.2572965621948242, 0.7658305168151855, 1.2743644714355469, 1.7828984260559082, 2.291433334350586, 2.7999672889709473, 3.3085012435913086, 3.81703519821167, 4.325569152832031, 4.834103107452393, 5.342637062072754, 5.851171016693115, 6.359704971313477, 6.868238925933838, 7.376772880554199, 7.8853068351745605, 8.393840789794922, 8.902374267578125, 9.410908699035645, 9.919443130493164, 10.427976608276367, 10.93651008605957, 11.44504451751709, 11.95357894897461, 12.462112426757812, 12.970645904541016, 13.479180335998535, 13.987714767456055, 14.496248245239258, 15.004781723022461, 15.51331615447998, 16.0218505859375, 16.530384063720703, 17.038917541503906, 17.54745101928711, 18.055986404418945, 18.56451988220215]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 3.0, 2.0, 8.0, 14.0, 7.0, 9.0, 14.0, 9.0, 16.0, 21.0, 26.0, 24.0, 20.0, 30.0, 36.0, 31.0, 35.0, 47.0, 35.0, 33.0, 51.0, 40.0, 32.0, 51.0, 42.0, 43.0, 45.0, 36.0, 40.0, 32.0, 35.0, 21.0, 22.0, 13.0, 20.0, 9.0, 9.0, 16.0, 8.0, 7.0, 6.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.922182083129883, -20.296356201171875, -19.670530319213867, -19.044702529907227, -18.41887664794922, -17.79305076599121, -17.167224884033203, -16.541399002075195, -15.915572166442871, -15.289746284484863, -14.663919448852539, -14.038093566894531, -13.412267684936523, -12.7864408493042, -12.160614967346191, -11.534788131713867, -10.90896224975586, -10.283136367797852, -9.657309532165527, -9.03148365020752, -8.405656814575195, -7.7798309326171875, -7.15400505065918, -6.528178691864014, -5.902352333068848, -5.276525974273682, -4.650699615478516, -4.024873733520508, -3.399047374725342, -2.773221015930176, -2.147394895553589, -1.521568775177002, -0.8957405090332031, -0.26991426944732666, 0.3559119701385498, 0.9817382097244263, 1.6075644493103027, 2.2333908081054688, 2.8592169284820557, 3.4850430488586426, 4.110869407653809, 4.736695766448975, 5.362522125244141, 5.988348007202148, 6.6141743659973145, 7.2400007247924805, 7.865826606750488, 8.491653442382812, 9.11747932434082, 9.743305206298828, 10.369132041931152, 10.99495792388916, 11.620784759521484, 12.246610641479492, 12.8724365234375, 13.498262405395508, 14.124089241027832, 14.74991512298584, 15.375741958618164, 16.001567840576172, 16.62739372253418, 17.253219604492188, 17.879047393798828, 18.504873275756836, 19.130699157714844]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 13.0, 20.0, 16.0, 28.0, 48.0, 64.0, 111.0, 142.0, 213.0, 318.0, 472.0, 637.0, 1064.0, 1562.0, 2432.0, 3669.0, 5655.0, 8762.0, 13784.0, 22172.0, 35106.0, 55707.0, 89847.0, 143732.0, 204154.0, 169817.0, 107901.0, 66783.0, 41543.0, 26294.0, 16558.0, 10570.0, 6778.0, 4248.0, 2836.0, 1868.0, 1175.0, 825.0, 507.0, 352.0, 231.0, 176.0, 107.0, 84.0, 59.0, 44.0, 26.0, 14.0, 10.0, 11.0, 9.0, 1.0, 1.0, 2.0, 2.0], "bins": [-2.998046875, -2.9090576171875, -2.820068359375, -2.7310791015625, -2.64208984375, -2.5531005859375, -2.464111328125, -2.3751220703125, -2.2861328125, -2.1971435546875, -2.108154296875, -2.0191650390625, -1.93017578125, -1.8411865234375, -1.752197265625, -1.6632080078125, -1.57421875, -1.4852294921875, -1.396240234375, -1.3072509765625, -1.21826171875, -1.1292724609375, -1.040283203125, -0.9512939453125, -0.8623046875, -0.7733154296875, -0.684326171875, -0.5953369140625, -0.50634765625, -0.4173583984375, -0.328369140625, -0.2393798828125, -0.150390625, -0.0614013671875, 0.027587890625, 0.1165771484375, 0.20556640625, 0.2945556640625, 0.383544921875, 0.4725341796875, 0.5615234375, 0.6505126953125, 0.739501953125, 0.8284912109375, 0.91748046875, 1.0064697265625, 1.095458984375, 1.1844482421875, 1.2734375, 1.3624267578125, 1.451416015625, 1.5404052734375, 1.62939453125, 1.7183837890625, 1.807373046875, 1.8963623046875, 1.9853515625, 2.0743408203125, 2.163330078125, 2.2523193359375, 2.34130859375, 2.4302978515625, 2.519287109375, 2.6082763671875, 2.697265625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 8.0, 7.0, 7.0, 9.0, 9.0, 13.0, 21.0, 14.0, 20.0, 27.0, 21.0, 26.0, 25.0, 34.0, 28.0, 35.0, 29.0, 33.0, 43.0, 54.0, 35.0, 35.0, 47.0, 51.0, 51.0, 46.0, 29.0, 39.0, 24.0, 38.0, 26.0, 23.0, 15.0, 12.0, 12.0, 11.0, 13.0, 5.0, 7.0, 6.0, 5.0, 3.0, 5.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.90625, -20.263916015625, -19.62158203125, -18.979248046875, -18.3369140625, -17.694580078125, -17.05224609375, -16.409912109375, -15.767578125, -15.125244140625, -14.48291015625, -13.840576171875, -13.1982421875, -12.555908203125, -11.91357421875, -11.271240234375, -10.62890625, -9.986572265625, -9.34423828125, -8.701904296875, -8.0595703125, -7.417236328125, -6.77490234375, -6.132568359375, -5.490234375, -4.847900390625, -4.20556640625, -3.563232421875, -2.9208984375, -2.278564453125, -1.63623046875, -0.993896484375, -0.3515625, 0.290771484375, 0.93310546875, 1.575439453125, 2.2177734375, 2.860107421875, 3.50244140625, 4.144775390625, 4.787109375, 5.429443359375, 6.07177734375, 6.714111328125, 7.3564453125, 7.998779296875, 8.64111328125, 9.283447265625, 9.92578125, 10.568115234375, 11.21044921875, 11.852783203125, 12.4951171875, 13.137451171875, 13.77978515625, 14.422119140625, 15.064453125, 15.706787109375, 16.34912109375, 16.991455078125, 17.6337890625, 18.276123046875, 18.91845703125, 19.560791015625, 20.203125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 7.0, 13.0, 12.0, 38.0, 29.0, 37.0, 72.0, 102.0, 125.0, 156.0, 246.0, 421.0, 641.0, 878.0, 1246.0, 1907.0, 2889.0, 4458.0, 6826.0, 10670.0, 16713.0, 26808.0, 43820.0, 73331.0, 125581.0, 204707.0, 206188.0, 126874.0, 73994.0, 44476.0, 27413.0, 16672.0, 10721.0, 6946.0, 4465.0, 2988.0, 1999.0, 1232.0, 875.0, 629.0, 458.0, 285.0, 163.0, 132.0, 103.0, 56.0, 56.0, 38.0, 25.0, 17.0, 10.0, 8.0, 2.0, 2.0, 3.0, 3.0, 2.0], "bins": [-3.00390625, -2.91290283203125, -2.8218994140625, -2.73089599609375, -2.639892578125, -2.54888916015625, -2.4578857421875, -2.36688232421875, -2.27587890625, -2.18487548828125, -2.0938720703125, -2.00286865234375, -1.911865234375, -1.82086181640625, -1.7298583984375, -1.63885498046875, -1.5478515625, -1.45684814453125, -1.3658447265625, -1.27484130859375, -1.183837890625, -1.09283447265625, -1.0018310546875, -0.91082763671875, -0.81982421875, -0.72882080078125, -0.6378173828125, -0.54681396484375, -0.455810546875, -0.36480712890625, -0.2738037109375, -0.18280029296875, -0.091796875, -0.00079345703125, 0.0902099609375, 0.18121337890625, 0.272216796875, 0.36322021484375, 0.4542236328125, 0.54522705078125, 0.63623046875, 0.72723388671875, 0.8182373046875, 0.90924072265625, 1.000244140625, 1.09124755859375, 1.1822509765625, 1.27325439453125, 1.3642578125, 1.45526123046875, 1.5462646484375, 1.63726806640625, 1.728271484375, 1.81927490234375, 1.9102783203125, 2.00128173828125, 2.09228515625, 2.18328857421875, 2.2742919921875, 2.36529541015625, 2.456298828125, 2.54730224609375, 2.6383056640625, 2.72930908203125, 2.8203125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 3.0, 6.0, 4.0, 7.0, 8.0, 8.0, 10.0, 10.0, 16.0, 21.0, 7.0, 17.0, 13.0, 22.0, 26.0, 27.0, 39.0, 38.0, 38.0, 47.0, 23.0, 51.0, 48.0, 40.0, 38.0, 39.0, 37.0, 38.0, 35.0, 33.0, 31.0, 26.0, 32.0, 26.0, 29.0, 19.0, 27.0, 12.0, 11.0, 14.0, 8.0, 6.0, 4.0, 8.0, 2.0, 5.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.0703125, -10.66650390625, -10.2626953125, -9.85888671875, -9.455078125, -9.05126953125, -8.6474609375, -8.24365234375, -7.83984375, -7.43603515625, -7.0322265625, -6.62841796875, -6.224609375, -5.82080078125, -5.4169921875, -5.01318359375, -4.609375, -4.20556640625, -3.8017578125, -3.39794921875, -2.994140625, -2.59033203125, -2.1865234375, -1.78271484375, -1.37890625, -0.97509765625, -0.5712890625, -0.16748046875, 0.236328125, 0.64013671875, 1.0439453125, 1.44775390625, 1.8515625, 2.25537109375, 2.6591796875, 3.06298828125, 3.466796875, 3.87060546875, 4.2744140625, 4.67822265625, 5.08203125, 5.48583984375, 5.8896484375, 6.29345703125, 6.697265625, 7.10107421875, 7.5048828125, 7.90869140625, 8.3125, 8.71630859375, 9.1201171875, 9.52392578125, 9.927734375, 10.33154296875, 10.7353515625, 11.13916015625, 11.54296875, 11.94677734375, 12.3505859375, 12.75439453125, 13.158203125, 13.56201171875, 13.9658203125, 14.36962890625, 14.7734375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 6.0, 8.0, 10.0, 12.0, 17.0, 29.0, 33.0, 59.0, 88.0, 156.0, 245.0, 399.0, 631.0, 960.0, 1636.0, 2834.0, 4906.0, 8524.0, 15150.0, 29048.0, 60086.0, 152340.0, 388844.0, 222256.0, 79980.0, 36557.0, 19002.0, 10384.0, 5862.0, 3398.0, 1960.0, 1195.0, 758.0, 423.0, 251.0, 165.0, 114.0, 74.0, 67.0, 24.0, 28.0, 8.0, 11.0, 8.0, 10.0, 8.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1669921875, -0.1618804931640625, -0.156768798828125, -0.1516571044921875, -0.14654541015625, -0.1414337158203125, -0.136322021484375, -0.1312103271484375, -0.1260986328125, -0.1209869384765625, -0.115875244140625, -0.1107635498046875, -0.10565185546875, -0.1005401611328125, -0.095428466796875, -0.0903167724609375, -0.085205078125, -0.0800933837890625, -0.074981689453125, -0.0698699951171875, -0.06475830078125, -0.0596466064453125, -0.054534912109375, -0.0494232177734375, -0.0443115234375, -0.0391998291015625, -0.034088134765625, -0.0289764404296875, -0.02386474609375, -0.0187530517578125, -0.013641357421875, -0.0085296630859375, -0.00341796875, 0.0016937255859375, 0.006805419921875, 0.0119171142578125, 0.01702880859375, 0.0221405029296875, 0.027252197265625, 0.0323638916015625, 0.0374755859375, 0.0425872802734375, 0.047698974609375, 0.0528106689453125, 0.05792236328125, 0.0630340576171875, 0.068145751953125, 0.0732574462890625, 0.078369140625, 0.0834808349609375, 0.088592529296875, 0.0937042236328125, 0.09881591796875, 0.1039276123046875, 0.109039306640625, 0.1141510009765625, 0.1192626953125, 0.1243743896484375, 0.129486083984375, 0.1345977783203125, 0.13970947265625, 0.1448211669921875, 0.149932861328125, 0.1550445556640625, 0.16015625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 8.0, 15.0, 9.0, 14.0, 15.0, 23.0, 17.0, 23.0, 25.0, 54.0, 37.0, 49.0, 35.0, 47.0, 48.0, 54.0, 54.0, 52.0, 52.0, 50.0, 46.0, 39.0, 36.0, 37.0, 22.0, 29.0, 18.0, 19.0, 15.0, 12.0, 10.0, 7.0, 3.0, 7.0, 6.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.2530555725097656e-05, -2.186838537454605e-05, -2.1206215023994446e-05, -2.054404467344284e-05, -1.9881874322891235e-05, -1.921970397233963e-05, -1.8557533621788025e-05, -1.789536327123642e-05, -1.7233192920684814e-05, -1.657102257013321e-05, -1.5908852219581604e-05, -1.5246681869029999e-05, -1.4584511518478394e-05, -1.3922341167926788e-05, -1.3260170817375183e-05, -1.2598000466823578e-05, -1.1935830116271973e-05, -1.1273659765720367e-05, -1.0611489415168762e-05, -9.949319064617157e-06, -9.287148714065552e-06, -8.624978363513947e-06, -7.962808012962341e-06, -7.300637662410736e-06, -6.638467311859131e-06, -5.976296961307526e-06, -5.31412661075592e-06, -4.651956260204315e-06, -3.98978590965271e-06, -3.3276155591011047e-06, -2.6654452085494995e-06, -2.0032748579978943e-06, -1.341104507446289e-06, -6.789341568946838e-07, -1.6763806343078613e-08, 6.454065442085266e-07, 1.3075768947601318e-06, 1.969747245311737e-06, 2.6319175958633423e-06, 3.2940879464149475e-06, 3.956258296966553e-06, 4.618428647518158e-06, 5.280598998069763e-06, 5.942769348621368e-06, 6.604939699172974e-06, 7.267110049724579e-06, 7.929280400276184e-06, 8.59145075082779e-06, 9.253621101379395e-06, 9.915791451931e-06, 1.0577961802482605e-05, 1.124013215303421e-05, 1.1902302503585815e-05, 1.256447285413742e-05, 1.3226643204689026e-05, 1.3888813555240631e-05, 1.4550983905792236e-05, 1.5213154256343842e-05, 1.5875324606895447e-05, 1.6537494957447052e-05, 1.7199665307998657e-05, 1.7861835658550262e-05, 1.8524006009101868e-05, 1.9186176359653473e-05, 1.9848346710205078e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 10.0, 18.0, 16.0, 27.0, 64.0, 64.0, 118.0, 186.0, 246.0, 373.0, 560.0, 779.0, 1090.0, 1653.0, 2396.0, 3603.0, 5310.0, 7945.0, 12304.0, 18741.0, 30108.0, 49710.0, 89696.0, 185924.0, 303306.0, 143751.0, 73428.0, 42469.0, 25916.0, 16658.0, 10599.0, 7117.0, 4658.0, 3016.0, 2155.0, 1490.0, 938.0, 660.0, 474.0, 301.0, 235.0, 140.0, 102.0, 71.0, 38.0, 42.0, 14.0, 13.0, 11.0, 6.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.25244140625, -0.24412155151367188, -0.23580169677734375, -0.22748184204101562, -0.2191619873046875, -0.21084213256835938, -0.20252227783203125, -0.19420242309570312, -0.185882568359375, -0.17756271362304688, -0.16924285888671875, -0.16092300415039062, -0.1526031494140625, -0.14428329467773438, -0.13596343994140625, -0.12764358520507812, -0.11932373046875, -0.11100387573242188, -0.10268402099609375, -0.09436416625976562, -0.0860443115234375, -0.07772445678710938, -0.06940460205078125, -0.061084747314453125, -0.052764892578125, -0.044445037841796875, -0.03612518310546875, -0.027805328369140625, -0.0194854736328125, -0.011165618896484375, -0.00284576416015625, 0.005474090576171875, 0.0137939453125, 0.022113800048828125, 0.03043365478515625, 0.038753509521484375, 0.0470733642578125, 0.055393218994140625, 0.06371307373046875, 0.07203292846679688, 0.080352783203125, 0.08867263793945312, 0.09699249267578125, 0.10531234741210938, 0.1136322021484375, 0.12195205688476562, 0.13027191162109375, 0.13859176635742188, 0.14691162109375, 0.15523147583007812, 0.16355133056640625, 0.17187118530273438, 0.1801910400390625, 0.18851089477539062, 0.19683074951171875, 0.20515060424804688, 0.213470458984375, 0.22179031372070312, 0.23011016845703125, 0.23843002319335938, 0.2467498779296875, 0.2550697326660156, 0.26338958740234375, 0.2717094421386719, 0.280029296875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 3.0, 2.0, 3.0, 6.0, 4.0, 4.0, 1.0, 6.0, 8.0, 12.0, 9.0, 13.0, 20.0, 33.0, 41.0, 49.0, 81.0, 103.0, 106.0, 97.0, 112.0, 49.0, 50.0, 40.0, 34.0, 22.0, 21.0, 15.0, 13.0, 6.0, 7.0, 9.0, 6.0, 3.0, 3.0, 5.0, 3.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.082275390625, -0.07898902893066406, -0.07570266723632812, -0.07241630554199219, -0.06912994384765625, -0.06584358215332031, -0.06255722045898438, -0.05927085876464844, -0.0559844970703125, -0.05269813537597656, -0.049411773681640625, -0.04612541198730469, -0.04283905029296875, -0.03955268859863281, -0.036266326904296875, -0.03297996520996094, -0.029693603515625, -0.026407241821289062, -0.023120880126953125, -0.019834518432617188, -0.01654815673828125, -0.013261795043945312, -0.009975433349609375, -0.0066890716552734375, -0.0034027099609375, -0.0001163482666015625, 0.003170013427734375, 0.0064563751220703125, 0.00974273681640625, 0.013029098510742188, 0.016315460205078125, 0.019601821899414062, 0.02288818359375, 0.026174545288085938, 0.029460906982421875, 0.03274726867675781, 0.03603363037109375, 0.03931999206542969, 0.042606353759765625, 0.04589271545410156, 0.0491790771484375, 0.05246543884277344, 0.055751800537109375, 0.05903816223144531, 0.06232452392578125, 0.06561088562011719, 0.06889724731445312, 0.07218360900878906, 0.075469970703125, 0.07875633239746094, 0.08204269409179688, 0.08532905578613281, 0.08861541748046875, 0.09190177917480469, 0.09518814086914062, 0.09847450256347656, 0.1017608642578125, 0.10504722595214844, 0.10833358764648438, 0.11161994934082031, 0.11490631103515625, 0.11819267272949219, 0.12147903442382812, 0.12476539611816406, 0.1280517578125]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 6.0, 4.0, 3.0, 7.0, 9.0, 6.0, 6.0, 11.0, 11.0, 9.0, 19.0, 17.0, 21.0, 27.0, 27.0, 34.0, 22.0, 35.0, 26.0, 35.0, 40.0, 43.0, 63.0, 48.0, 53.0, 44.0, 33.0, 36.0, 42.0, 32.0, 37.0, 26.0, 16.0, 29.0, 17.0, 22.0, 13.0, 18.0, 13.0, 7.0, 9.0, 9.0, 5.0, 2.0, 7.0, 0.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.900808334350586, -13.398384094238281, -12.895960807800293, -12.393537521362305, -11.89111328125, -11.388689041137695, -10.886265754699707, -10.383842468261719, -9.881418228149414, -9.37899398803711, -8.876570701599121, -8.374147415161133, -7.871723175048828, -7.369299411773682, -6.866875648498535, -6.364451885223389, -5.862028121948242, -5.359604358673096, -4.857180595397949, -4.354756832122803, -3.8523330688476562, -3.3499093055725098, -2.8474855422973633, -2.345061779022217, -1.8426380157470703, -1.3402142524719238, -0.8377904891967773, -0.33536672592163086, 0.16705703735351562, 0.6694808006286621, 1.1719045639038086, 1.674328327178955, 2.1767520904541016, 2.679175853729248, 3.1815996170043945, 3.684023380279541, 4.1864471435546875, 4.688870906829834, 5.1912946701049805, 5.693718433380127, 6.196142196655273, 6.69856595993042, 7.200989723205566, 7.703413486480713, 8.20583724975586, 8.708261489868164, 9.210684776306152, 9.71310806274414, 10.215532302856445, 10.71795654296875, 11.220379829406738, 11.722803115844727, 12.225227355957031, 12.727651596069336, 13.230074882507324, 13.732498168945312, 14.234922409057617, 14.737346649169922, 15.23976993560791, 15.742193222045898, 16.244617462158203, 16.747041702270508, 17.249465942382812, 17.751888275146484, 18.25431251525879]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 3.0, 2.0, 8.0, 14.0, 7.0, 8.0, 15.0, 7.0, 17.0, 21.0, 26.0, 25.0, 17.0, 32.0, 37.0, 30.0, 32.0, 47.0, 37.0, 30.0, 49.0, 47.0, 27.0, 53.0, 42.0, 44.0, 44.0, 31.0, 46.0, 30.0, 36.0, 21.0, 23.0, 14.0, 16.0, 14.0, 7.0, 16.0, 8.0, 8.0, 6.0, 4.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.8687801361084, -20.247539520263672, -19.626298904418945, -19.00505828857422, -18.383819580078125, -17.7625789642334, -17.141338348388672, -16.520097732543945, -15.898857116699219, -15.277616500854492, -14.656375885009766, -14.035136222839355, -13.413895606994629, -12.792654991149902, -12.171415328979492, -11.550174713134766, -10.928934097290039, -10.307693481445312, -9.686452865600586, -9.065213203430176, -8.44397258758545, -7.822731971740723, -7.201491832733154, -6.580251693725586, -5.959011077880859, -5.337770462036133, -4.7165303230285645, -4.095290184020996, -3.4740495681762695, -2.852809190750122, -2.2315688133239746, -1.6103286743164062, -0.9890861511230469, -0.3678457736968994, 0.25339460372924805, 0.8746349811553955, 1.495875358581543, 2.1171157360076904, 2.738356113433838, 3.3595962524414062, 3.980836868286133, 4.602077484130859, 5.223317623138428, 5.844557762145996, 6.465798377990723, 7.087038993835449, 7.708279132843018, 8.329519271850586, 8.950759887695312, 9.572000503540039, 10.193241119384766, 10.814480781555176, 11.435721397399902, 12.056962013244629, 12.678201675415039, 13.299442291259766, 13.920682907104492, 14.541923522949219, 15.163164138793945, 15.784403800964355, 16.405643463134766, 17.026884078979492, 17.64812469482422, 18.269365310668945, 18.890605926513672]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 5.0, 7.0, 15.0, 23.0, 38.0, 69.0, 96.0, 173.0, 269.0, 405.0, 711.0, 1203.0, 1865.0, 3153.0, 4744.0, 7500.0, 11803.0, 17744.0, 26522.0, 38288.0, 52886.0, 69976.0, 86697.0, 100435.0, 107988.0, 106860.0, 98640.0, 84842.0, 66979.0, 50253.0, 36622.0, 25147.0, 16688.0, 11183.0, 7118.0, 4423.0, 2723.0, 1635.0, 1065.0, 655.0, 439.0, 274.0, 166.0, 85.0, 61.0, 33.0, 13.0, 11.0, 13.0, 8.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-11.390625, -11.0338134765625, -10.677001953125, -10.3201904296875, -9.96337890625, -9.6065673828125, -9.249755859375, -8.8929443359375, -8.5361328125, -8.1793212890625, -7.822509765625, -7.4656982421875, -7.10888671875, -6.7520751953125, -6.395263671875, -6.0384521484375, -5.681640625, -5.3248291015625, -4.968017578125, -4.6112060546875, -4.25439453125, -3.8975830078125, -3.540771484375, -3.1839599609375, -2.8271484375, -2.4703369140625, -2.113525390625, -1.7567138671875, -1.39990234375, -1.0430908203125, -0.686279296875, -0.3294677734375, 0.02734375, 0.3841552734375, 0.740966796875, 1.0977783203125, 1.45458984375, 1.8114013671875, 2.168212890625, 2.5250244140625, 2.8818359375, 3.2386474609375, 3.595458984375, 3.9522705078125, 4.30908203125, 4.6658935546875, 5.022705078125, 5.3795166015625, 5.736328125, 6.0931396484375, 6.449951171875, 6.8067626953125, 7.16357421875, 7.5203857421875, 7.877197265625, 8.2340087890625, 8.5908203125, 8.9476318359375, 9.304443359375, 9.6612548828125, 10.01806640625, 10.3748779296875, 10.731689453125, 11.0885009765625, 11.4453125]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 6.0, 3.0, 12.0, 11.0, 7.0, 11.0, 20.0, 8.0, 19.0, 28.0, 19.0, 29.0, 32.0, 36.0, 32.0, 35.0, 39.0, 45.0, 49.0, 47.0, 59.0, 34.0, 40.0, 57.0, 41.0, 37.0, 35.0, 36.0, 33.0, 25.0, 22.0, 22.0, 20.0, 18.0, 13.0, 7.0, 3.0, 6.0, 3.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.0625, -21.39404296875, -20.7255859375, -20.05712890625, -19.388671875, -18.72021484375, -18.0517578125, -17.38330078125, -16.71484375, -16.04638671875, -15.3779296875, -14.70947265625, -14.041015625, -13.37255859375, -12.7041015625, -12.03564453125, -11.3671875, -10.69873046875, -10.0302734375, -9.36181640625, -8.693359375, -8.02490234375, -7.3564453125, -6.68798828125, -6.01953125, -5.35107421875, -4.6826171875, -4.01416015625, -3.345703125, -2.67724609375, -2.0087890625, -1.34033203125, -0.671875, -0.00341796875, 0.6650390625, 1.33349609375, 2.001953125, 2.67041015625, 3.3388671875, 4.00732421875, 4.67578125, 5.34423828125, 6.0126953125, 6.68115234375, 7.349609375, 8.01806640625, 8.6865234375, 9.35498046875, 10.0234375, 10.69189453125, 11.3603515625, 12.02880859375, 12.697265625, 13.36572265625, 14.0341796875, 14.70263671875, 15.37109375, 16.03955078125, 16.7080078125, 17.37646484375, 18.044921875, 18.71337890625, 19.3818359375, 20.05029296875, 20.71875]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 6.0, 8.0, 10.0, 10.0, 17.0, 31.0, 43.0, 61.0, 105.0, 166.0, 249.0, 417.0, 742.0, 1108.0, 1809.0, 2913.0, 4598.0, 7077.0, 11311.0, 17152.0, 25526.0, 37228.0, 51391.0, 67667.0, 83806.0, 97278.0, 105902.0, 106375.0, 98703.0, 85899.0, 69760.0, 53623.0, 39036.0, 27387.0, 18214.0, 11890.0, 7732.0, 4931.0, 3133.0, 1952.0, 1208.0, 801.0, 498.0, 318.0, 177.0, 119.0, 61.0, 50.0, 24.0, 15.0, 9.0, 7.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.890625, -10.5401611328125, -10.189697265625, -9.8392333984375, -9.48876953125, -9.1383056640625, -8.787841796875, -8.4373779296875, -8.0869140625, -7.7364501953125, -7.385986328125, -7.0355224609375, -6.68505859375, -6.3345947265625, -5.984130859375, -5.6336669921875, -5.283203125, -4.9327392578125, -4.582275390625, -4.2318115234375, -3.88134765625, -3.5308837890625, -3.180419921875, -2.8299560546875, -2.4794921875, -2.1290283203125, -1.778564453125, -1.4281005859375, -1.07763671875, -0.7271728515625, -0.376708984375, -0.0262451171875, 0.32421875, 0.6746826171875, 1.025146484375, 1.3756103515625, 1.72607421875, 2.0765380859375, 2.427001953125, 2.7774658203125, 3.1279296875, 3.4783935546875, 3.828857421875, 4.1793212890625, 4.52978515625, 4.8802490234375, 5.230712890625, 5.5811767578125, 5.931640625, 6.2821044921875, 6.632568359375, 6.9830322265625, 7.33349609375, 7.6839599609375, 8.034423828125, 8.3848876953125, 8.7353515625, 9.0858154296875, 9.436279296875, 9.7867431640625, 10.13720703125, 10.4876708984375, 10.838134765625, 11.1885986328125, 11.5390625]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 6.0, 5.0, 3.0, 2.0, 9.0, 10.0, 14.0, 19.0, 16.0, 18.0, 22.0, 14.0, 26.0, 21.0, 37.0, 41.0, 44.0, 35.0, 45.0, 45.0, 39.0, 54.0, 53.0, 38.0, 39.0, 47.0, 37.0, 42.0, 28.0, 25.0, 19.0, 30.0, 20.0, 22.0, 17.0, 7.0, 10.0, 15.0, 10.0, 4.0, 7.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.6796875, -13.281005859375, -12.88232421875, -12.483642578125, -12.0849609375, -11.686279296875, -11.28759765625, -10.888916015625, -10.490234375, -10.091552734375, -9.69287109375, -9.294189453125, -8.8955078125, -8.496826171875, -8.09814453125, -7.699462890625, -7.30078125, -6.902099609375, -6.50341796875, -6.104736328125, -5.7060546875, -5.307373046875, -4.90869140625, -4.510009765625, -4.111328125, -3.712646484375, -3.31396484375, -2.915283203125, -2.5166015625, -2.117919921875, -1.71923828125, -1.320556640625, -0.921875, -0.523193359375, -0.12451171875, 0.274169921875, 0.6728515625, 1.071533203125, 1.47021484375, 1.868896484375, 2.267578125, 2.666259765625, 3.06494140625, 3.463623046875, 3.8623046875, 4.260986328125, 4.65966796875, 5.058349609375, 5.45703125, 5.855712890625, 6.25439453125, 6.653076171875, 7.0517578125, 7.450439453125, 7.84912109375, 8.247802734375, 8.646484375, 9.045166015625, 9.44384765625, 9.842529296875, 10.2412109375, 10.639892578125, 11.03857421875, 11.437255859375, 11.8359375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 5.0, 18.0, 15.0, 23.0, 52.0, 44.0, 104.0, 136.0, 244.0, 338.0, 618.0, 833.0, 1367.0, 2199.0, 3440.0, 5735.0, 9116.0, 14049.0, 22041.0, 33555.0, 48482.0, 67041.0, 86951.0, 105636.0, 115984.0, 116154.0, 106819.0, 89759.0, 69219.0, 50522.0, 34577.0, 23068.0, 14910.0, 9398.0, 6006.0, 3675.0, 2363.0, 1431.0, 957.0, 609.0, 389.0, 226.0, 156.0, 99.0, 76.0, 48.0, 25.0, 21.0, 11.0, 7.0, 6.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.654296875, -3.53662109375, -3.4189453125, -3.30126953125, -3.18359375, -3.06591796875, -2.9482421875, -2.83056640625, -2.712890625, -2.59521484375, -2.4775390625, -2.35986328125, -2.2421875, -2.12451171875, -2.0068359375, -1.88916015625, -1.771484375, -1.65380859375, -1.5361328125, -1.41845703125, -1.30078125, -1.18310546875, -1.0654296875, -0.94775390625, -0.830078125, -0.71240234375, -0.5947265625, -0.47705078125, -0.359375, -0.24169921875, -0.1240234375, -0.00634765625, 0.111328125, 0.22900390625, 0.3466796875, 0.46435546875, 0.58203125, 0.69970703125, 0.8173828125, 0.93505859375, 1.052734375, 1.17041015625, 1.2880859375, 1.40576171875, 1.5234375, 1.64111328125, 1.7587890625, 1.87646484375, 1.994140625, 2.11181640625, 2.2294921875, 2.34716796875, 2.46484375, 2.58251953125, 2.7001953125, 2.81787109375, 2.935546875, 3.05322265625, 3.1708984375, 3.28857421875, 3.40625, 3.52392578125, 3.6416015625, 3.75927734375, 3.876953125]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 5.0, 6.0, 4.0, 4.0, 11.0, 8.0, 12.0, 14.0, 19.0, 22.0, 13.0, 23.0, 30.0, 31.0, 46.0, 43.0, 43.0, 38.0, 46.0, 36.0, 51.0, 54.0, 45.0, 40.0, 43.0, 44.0, 28.0, 40.0, 32.0, 21.0, 16.0, 22.0, 19.0, 19.0, 10.0, 11.0, 18.0, 10.0, 5.0, 7.0, 5.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.00039696693420410156, -0.00038512423634529114, -0.0003732815384864807, -0.0003614388406276703, -0.00034959614276885986, -0.00033775344491004944, -0.000325910747051239, -0.0003140680491924286, -0.00030222535133361816, -0.00029038265347480774, -0.0002785399556159973, -0.0002666972577571869, -0.00025485455989837646, -0.00024301186203956604, -0.00023116916418075562, -0.0002193264663219452, -0.00020748376846313477, -0.00019564107060432434, -0.00018379837274551392, -0.0001719556748867035, -0.00016011297702789307, -0.00014827027916908264, -0.00013642758131027222, -0.0001245848834514618, -0.00011274218559265137, -0.00010089948773384094, -8.905678987503052e-05, -7.721409201622009e-05, -6.537139415740967e-05, -5.352869629859924e-05, -4.168599843978882e-05, -2.9843300580978394e-05, -1.800060272216797e-05, -6.157904863357544e-06, 5.684792995452881e-06, 1.7527490854263306e-05, 2.937018871307373e-05, 4.1212886571884155e-05, 5.305558443069458e-05, 6.4898282289505e-05, 7.674098014831543e-05, 8.858367800712585e-05, 0.00010042637586593628, 0.0001122690737247467, 0.00012411177158355713, 0.00013595446944236755, 0.00014779716730117798, 0.0001596398651599884, 0.00017148256301879883, 0.00018332526087760925, 0.00019516795873641968, 0.0002070106565952301, 0.00021885335445404053, 0.00023069605231285095, 0.00024253875017166138, 0.0002543814480304718, 0.0002662241458892822, 0.00027806684374809265, 0.0002899095416069031, 0.0003017522394657135, 0.0003135949373245239, 0.00032543763518333435, 0.0003372803330421448, 0.0003491230309009552, 0.0003609657287597656]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 1.0, 4.0, 9.0, 5.0, 16.0, 14.0, 25.0, 34.0, 39.0, 73.0, 106.0, 167.0, 288.0, 416.0, 644.0, 1002.0, 1558.0, 2432.0, 3955.0, 6185.0, 10067.0, 15953.0, 24990.0, 38612.0, 56680.0, 78908.0, 101523.0, 120318.0, 126441.0, 119438.0, 100976.0, 77707.0, 55967.0, 37396.0, 24392.0, 15616.0, 9923.0, 6211.0, 3850.0, 2404.0, 1507.0, 944.0, 609.0, 407.0, 253.0, 167.0, 117.0, 74.0, 53.0, 29.0, 22.0, 16.0, 8.0, 5.0, 2.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0], "bins": [-4.3359375, -4.19818115234375, -4.0604248046875, -3.92266845703125, -3.784912109375, -3.64715576171875, -3.5093994140625, -3.37164306640625, -3.23388671875, -3.09613037109375, -2.9583740234375, -2.82061767578125, -2.682861328125, -2.54510498046875, -2.4073486328125, -2.26959228515625, -2.1318359375, -1.99407958984375, -1.8563232421875, -1.71856689453125, -1.580810546875, -1.44305419921875, -1.3052978515625, -1.16754150390625, -1.02978515625, -0.89202880859375, -0.7542724609375, -0.61651611328125, -0.478759765625, -0.34100341796875, -0.2032470703125, -0.06549072265625, 0.072265625, 0.21002197265625, 0.3477783203125, 0.48553466796875, 0.623291015625, 0.76104736328125, 0.8988037109375, 1.03656005859375, 1.17431640625, 1.31207275390625, 1.4498291015625, 1.58758544921875, 1.725341796875, 1.86309814453125, 2.0008544921875, 2.13861083984375, 2.2763671875, 2.41412353515625, 2.5518798828125, 2.68963623046875, 2.827392578125, 2.96514892578125, 3.1029052734375, 3.24066162109375, 3.37841796875, 3.51617431640625, 3.6539306640625, 3.79168701171875, 3.929443359375, 4.06719970703125, 4.2049560546875, 4.34271240234375, 4.48046875]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 7.0, 4.0, 10.0, 4.0, 8.0, 9.0, 9.0, 25.0, 22.0, 28.0, 33.0, 22.0, 47.0, 37.0, 42.0, 60.0, 62.0, 61.0, 48.0, 55.0, 49.0, 60.0, 45.0, 44.0, 38.0, 32.0, 34.0, 23.0, 18.0, 14.0, 12.0, 12.0, 11.0, 5.0, 7.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.37890625, -2.310211181640625, -2.24151611328125, -2.172821044921875, -2.1041259765625, -2.035430908203125, -1.96673583984375, -1.898040771484375, -1.829345703125, -1.760650634765625, -1.69195556640625, -1.623260498046875, -1.5545654296875, -1.485870361328125, -1.41717529296875, -1.348480224609375, -1.27978515625, -1.211090087890625, -1.14239501953125, -1.073699951171875, -1.0050048828125, -0.936309814453125, -0.86761474609375, -0.798919677734375, -0.730224609375, -0.661529541015625, -0.59283447265625, -0.524139404296875, -0.4554443359375, -0.386749267578125, -0.31805419921875, -0.249359130859375, -0.1806640625, -0.111968994140625, -0.04327392578125, 0.025421142578125, 0.0941162109375, 0.162811279296875, 0.23150634765625, 0.300201416015625, 0.368896484375, 0.437591552734375, 0.50628662109375, 0.574981689453125, 0.6436767578125, 0.712371826171875, 0.78106689453125, 0.849761962890625, 0.91845703125, 0.987152099609375, 1.05584716796875, 1.124542236328125, 1.1932373046875, 1.261932373046875, 1.33062744140625, 1.399322509765625, 1.468017578125, 1.536712646484375, 1.60540771484375, 1.674102783203125, 1.7427978515625, 1.811492919921875, 1.88018798828125, 1.948883056640625, 2.017578125]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 7.0, 4.0, 3.0, 11.0, 6.0, 10.0, 12.0, 9.0, 14.0, 22.0, 19.0, 27.0, 21.0, 31.0, 29.0, 48.0, 39.0, 38.0, 45.0, 36.0, 53.0, 48.0, 42.0, 41.0, 49.0, 41.0, 33.0, 42.0, 32.0, 31.0, 25.0, 29.0, 13.0, 20.0, 17.0, 10.0, 11.0, 7.0, 9.0, 7.0, 5.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.244462966918945, -14.705984115600586, -14.167505264282227, -13.62902545928955, -13.090546607971191, -12.552067756652832, -12.013587951660156, -11.475109100341797, -10.936630249023438, -10.398151397705078, -9.859672546386719, -9.321192741394043, -8.782713890075684, -8.244235038757324, -7.705755710601807, -7.167276382446289, -6.62879753112793, -6.09031867980957, -5.551839351654053, -5.013360023498535, -4.474881172180176, -3.9364020824432373, -3.397922992706299, -2.8594439029693604, -2.320964813232422, -1.7824857234954834, -1.244006633758545, -0.7055275440216064, -0.16704845428466797, 0.3714306354522705, 0.909909725189209, 1.4483888149261475, 1.986867904663086, 2.5253469944000244, 3.063826084136963, 3.6023051738739014, 4.14078426361084, 4.679263114929199, 5.217742443084717, 5.756221771240234, 6.294700622558594, 6.833179473876953, 7.371658802032471, 7.910138130187988, 8.448616981506348, 8.987095832824707, 9.525575637817383, 10.064054489135742, 10.602533340454102, 11.141012191772461, 11.67949104309082, 12.217970848083496, 12.756449699401855, 13.294928550720215, 13.83340835571289, 14.37188720703125, 14.91036605834961, 15.448844909667969, 15.987323760986328, 16.525802612304688, 17.064281463623047, 17.60276222229004, 18.1412410736084, 18.679719924926758, 19.218198776245117]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 6.0, 6.0, 7.0, 5.0, 11.0, 7.0, 13.0, 14.0, 23.0, 21.0, 25.0, 28.0, 15.0, 29.0, 27.0, 38.0, 41.0, 46.0, 46.0, 40.0, 42.0, 41.0, 37.0, 41.0, 54.0, 37.0, 36.0, 39.0, 36.0, 31.0, 28.0, 22.0, 21.0, 20.0, 17.0, 22.0, 7.0, 5.0, 10.0, 7.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.634889602661133, -21.970996856689453, -21.30710220336914, -20.643207550048828, -19.97931480407715, -19.31542205810547, -18.651527404785156, -17.987632751464844, -17.323740005493164, -16.659847259521484, -15.995952606201172, -15.332058906555176, -14.66816520690918, -14.004271507263184, -13.340377807617188, -12.676484107971191, -12.012590408325195, -11.3486967086792, -10.684803009033203, -10.020909309387207, -9.357015609741211, -8.693121910095215, -8.029228210449219, -7.365334510803223, -6.701440811157227, -6.0375471115112305, -5.373653411865234, -4.709759712219238, -4.045866012573242, -3.381972312927246, -2.71807861328125, -2.054184913635254, -1.390289306640625, -0.7263956069946289, -0.06250190734863281, 0.6013917922973633, 1.2652854919433594, 1.9291791915893555, 2.5930728912353516, 3.2569665908813477, 3.9208602905273438, 4.58475399017334, 5.248647689819336, 5.912541389465332, 6.576435089111328, 7.240328788757324, 7.90422248840332, 8.568116188049316, 9.232009887695312, 9.895903587341309, 10.559797286987305, 11.2236909866333, 11.887584686279297, 12.551478385925293, 13.215372085571289, 13.879265785217285, 14.543159484863281, 15.207053184509277, 15.870946884155273, 16.534839630126953, 17.198734283447266, 17.862628936767578, 18.526521682739258, 19.190414428710938, 19.85430908203125]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 6.0, 13.0, 40.0, 47.0, 75.0, 134.0, 206.0, 386.0, 576.0, 868.0, 1528.0, 2435.0, 3759.0, 6041.0, 9615.0, 15290.0, 23750.0, 36583.0, 55290.0, 81602.0, 117833.0, 165207.0, 223705.0, 285516.0, 349491.0, 397795.0, 421182.0, 414169.0, 377503.0, 321978.0, 257659.0, 195204.0, 141761.0, 98806.0, 66757.0, 44333.0, 28713.0, 18281.0, 11604.0, 7250.0, 4475.0, 2713.0, 1663.0, 944.0, 617.0, 361.0, 218.0, 145.0, 71.0, 41.0, 29.0, 11.0, 5.0, 2.0, 4.0, 1.0, 1.0], "bins": [-13.0546875, -12.66796875, -12.28125, -11.89453125, -11.5078125, -11.12109375, -10.734375, -10.34765625, -9.9609375, -9.57421875, -9.1875, -8.80078125, -8.4140625, -8.02734375, -7.640625, -7.25390625, -6.8671875, -6.48046875, -6.09375, -5.70703125, -5.3203125, -4.93359375, -4.546875, -4.16015625, -3.7734375, -3.38671875, -3.0, -2.61328125, -2.2265625, -1.83984375, -1.453125, -1.06640625, -0.6796875, -0.29296875, 0.09375, 0.48046875, 0.8671875, 1.25390625, 1.640625, 2.02734375, 2.4140625, 2.80078125, 3.1875, 3.57421875, 3.9609375, 4.34765625, 4.734375, 5.12109375, 5.5078125, 5.89453125, 6.28125, 6.66796875, 7.0546875, 7.44140625, 7.828125, 8.21484375, 8.6015625, 8.98828125, 9.375, 9.76171875, 10.1484375, 10.53515625, 10.921875, 11.30859375, 11.6953125]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0, 3.0, 5.0, 2.0, 8.0, 5.0, 8.0, 13.0, 16.0, 9.0, 16.0, 24.0, 19.0, 12.0, 18.0, 33.0, 23.0, 31.0, 35.0, 23.0, 37.0, 45.0, 32.0, 38.0, 43.0, 29.0, 28.0, 39.0, 47.0, 38.0, 35.0, 36.0, 25.0, 35.0, 35.0, 24.0, 30.0, 19.0, 13.0, 16.0, 13.0, 9.0, 8.0, 6.0, 5.0, 5.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-14.9609375, -14.4927978515625, -14.024658203125, -13.5565185546875, -13.08837890625, -12.6202392578125, -12.152099609375, -11.6839599609375, -11.2158203125, -10.7476806640625, -10.279541015625, -9.8114013671875, -9.34326171875, -8.8751220703125, -8.406982421875, -7.9388427734375, -7.470703125, -7.0025634765625, -6.534423828125, -6.0662841796875, -5.59814453125, -5.1300048828125, -4.661865234375, -4.1937255859375, -3.7255859375, -3.2574462890625, -2.789306640625, -2.3211669921875, -1.85302734375, -1.3848876953125, -0.916748046875, -0.4486083984375, 0.01953125, 0.4876708984375, 0.955810546875, 1.4239501953125, 1.89208984375, 2.3602294921875, 2.828369140625, 3.2965087890625, 3.7646484375, 4.2327880859375, 4.700927734375, 5.1690673828125, 5.63720703125, 6.1053466796875, 6.573486328125, 7.0416259765625, 7.509765625, 7.9779052734375, 8.446044921875, 8.9141845703125, 9.38232421875, 9.8504638671875, 10.318603515625, 10.7867431640625, 11.2548828125, 11.7230224609375, 12.191162109375, 12.6593017578125, 13.12744140625, 13.5955810546875, 14.063720703125, 14.5318603515625, 15.0]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 9.0, 17.0, 41.0, 43.0, 102.0, 160.0, 247.0, 485.0, 868.0, 1538.0, 2555.0, 4383.0, 7003.0, 11993.0, 19081.0, 30158.0, 46320.0, 69790.0, 101207.0, 143130.0, 193001.0, 247751.0, 303707.0, 349493.0, 382319.0, 393751.0, 380742.0, 348079.0, 298285.0, 243771.0, 188703.0, 138647.0, 99157.0, 67552.0, 44577.0, 29094.0, 18356.0, 11289.0, 6843.0, 4172.0, 2422.0, 1463.0, 882.0, 485.0, 246.0, 164.0, 88.0, 53.0, 35.0, 17.0, 8.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-12.40625, -12.0240478515625, -11.641845703125, -11.2596435546875, -10.87744140625, -10.4952392578125, -10.113037109375, -9.7308349609375, -9.3486328125, -8.9664306640625, -8.584228515625, -8.2020263671875, -7.81982421875, -7.4376220703125, -7.055419921875, -6.6732177734375, -6.291015625, -5.9088134765625, -5.526611328125, -5.1444091796875, -4.76220703125, -4.3800048828125, -3.997802734375, -3.6156005859375, -3.2333984375, -2.8511962890625, -2.468994140625, -2.0867919921875, -1.70458984375, -1.3223876953125, -0.940185546875, -0.5579833984375, -0.17578125, 0.2064208984375, 0.588623046875, 0.9708251953125, 1.35302734375, 1.7352294921875, 2.117431640625, 2.4996337890625, 2.8818359375, 3.2640380859375, 3.646240234375, 4.0284423828125, 4.41064453125, 4.7928466796875, 5.175048828125, 5.5572509765625, 5.939453125, 6.3216552734375, 6.703857421875, 7.0860595703125, 7.46826171875, 7.8504638671875, 8.232666015625, 8.6148681640625, 8.9970703125, 9.3792724609375, 9.761474609375, 10.1436767578125, 10.52587890625, 10.9080810546875, 11.290283203125, 11.6724853515625, 12.0546875]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 5.0, 8.0, 2.0, 10.0, 10.0, 3.0, 13.0, 18.0, 19.0, 35.0, 37.0, 57.0, 72.0, 82.0, 107.0, 131.0, 124.0, 155.0, 169.0, 187.0, 179.0, 218.0, 226.0, 218.0, 207.0, 215.0, 202.0, 194.0, 175.0, 146.0, 131.0, 110.0, 109.0, 96.0, 81.0, 62.0, 72.0, 46.0, 36.0, 36.0, 23.0, 14.0, 12.0, 6.0, 10.0, 3.0, 3.0, 6.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.59375, -7.3466796875, -7.099609375, -6.8525390625, -6.60546875, -6.3583984375, -6.111328125, -5.8642578125, -5.6171875, -5.3701171875, -5.123046875, -4.8759765625, -4.62890625, -4.3818359375, -4.134765625, -3.8876953125, -3.640625, -3.3935546875, -3.146484375, -2.8994140625, -2.65234375, -2.4052734375, -2.158203125, -1.9111328125, -1.6640625, -1.4169921875, -1.169921875, -0.9228515625, -0.67578125, -0.4287109375, -0.181640625, 0.0654296875, 0.3125, 0.5595703125, 0.806640625, 1.0537109375, 1.30078125, 1.5478515625, 1.794921875, 2.0419921875, 2.2890625, 2.5361328125, 2.783203125, 3.0302734375, 3.27734375, 3.5244140625, 3.771484375, 4.0185546875, 4.265625, 4.5126953125, 4.759765625, 5.0068359375, 5.25390625, 5.5009765625, 5.748046875, 5.9951171875, 6.2421875, 6.4892578125, 6.736328125, 6.9833984375, 7.23046875, 7.4775390625, 7.724609375, 7.9716796875, 8.21875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 5.0, 4.0, 9.0, 9.0, 6.0, 5.0, 6.0, 17.0, 16.0, 24.0, 27.0, 18.0, 32.0, 42.0, 41.0, 47.0, 48.0, 54.0, 52.0, 41.0, 59.0, 37.0, 48.0, 37.0, 38.0, 49.0, 40.0, 26.0, 32.0, 22.0, 23.0, 20.0, 13.0, 10.0, 9.0, 8.0, 7.0, 6.0, 4.0, 4.0, 9.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.639983177185059, -14.0423002243042, -13.444618225097656, -12.846935272216797, -12.249252319335938, -11.651569366455078, -11.053886413574219, -10.456204414367676, -9.858521461486816, -9.260838508605957, -8.663156509399414, -8.065473556518555, -7.467790603637695, -6.870107650756836, -6.272425174713135, -5.674742698669434, -5.077059745788574, -4.479376792907715, -3.8816943168640137, -3.2840116024017334, -2.686328887939453, -2.088646173477173, -1.4909634590148926, -0.8932809829711914, -0.29559803009033203, 0.30208468437194824, 0.8997673988342285, 1.4974501132965088, 2.095132827758789, 2.6928155422210693, 3.2904982566833496, 3.888180732727051, 4.485864639282227, 5.083547592163086, 5.681230068206787, 6.278912544250488, 6.876595497131348, 7.474278450012207, 8.07196044921875, 8.66964340209961, 9.267326354980469, 9.865009307861328, 10.462692260742188, 11.06037425994873, 11.65805721282959, 12.25574016571045, 12.853422164916992, 13.451105117797852, 14.048788070678711, 14.64647102355957, 15.24415397644043, 15.841835975646973, 16.439517974853516, 17.037200927734375, 17.634883880615234, 18.232566833496094, 18.830249786376953, 19.427932739257812, 20.025615692138672, 20.62329864501953, 21.22098159790039, 21.818662643432617, 22.416345596313477, 23.014028549194336, 23.611711502075195]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 0.0, 2.0, 6.0, 4.0, 13.0, 5.0, 5.0, 8.0, 7.0, 15.0, 8.0, 20.0, 17.0, 24.0, 28.0, 18.0, 22.0, 33.0, 38.0, 31.0, 29.0, 37.0, 45.0, 38.0, 38.0, 39.0, 36.0, 39.0, 44.0, 39.0, 36.0, 28.0, 32.0, 27.0, 26.0, 17.0, 17.0, 17.0, 17.0, 17.0, 13.0, 15.0, 13.0, 9.0, 10.0, 12.0, 1.0, 4.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-18.830968856811523, -18.26372528076172, -17.696483612060547, -17.129240036010742, -16.561996459960938, -15.994754791259766, -15.427511215209961, -14.860268592834473, -14.293025970458984, -13.725783348083496, -13.158540725708008, -12.591297149658203, -12.024054527282715, -11.456811904907227, -10.889568328857422, -10.322325706481934, -9.755083084106445, -9.187840461730957, -8.620597839355469, -8.053354263305664, -7.486111640930176, -6.9188690185546875, -6.351625919342041, -5.7843828201293945, -5.217140197753906, -4.649897575378418, -4.0826544761657715, -3.515411615371704, -2.9481687545776367, -2.3809258937835693, -1.813683032989502, -1.2464401721954346, -0.67919921875, -0.11195635795593262, 0.45528650283813477, 1.0225293636322021, 1.5897722244262695, 2.157015085220337, 2.7242579460144043, 3.2915008068084717, 3.858743667602539, 4.425986289978027, 4.993229389190674, 5.56047248840332, 6.127715110778809, 6.694957733154297, 7.262200832366943, 7.82944393157959, 8.396686553955078, 8.963929176330566, 9.531171798706055, 10.09841537475586, 10.665657997131348, 11.232900619506836, 11.80014419555664, 12.367386817932129, 12.934629440307617, 13.501872062683105, 14.069114685058594, 14.636358261108398, 15.203600883483887, 15.770843505859375, 16.33808708190918, 16.90532875061035, 17.472572326660156]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 2.0, 2.0, 9.0, 13.0, 19.0, 18.0, 38.0, 50.0, 115.0, 142.0, 181.0, 275.0, 432.0, 553.0, 826.0, 1231.0, 1843.0, 2679.0, 3838.0, 5760.0, 8342.0, 12625.0, 19039.0, 29194.0, 44586.0, 68218.0, 105220.0, 157498.0, 183381.0, 138893.0, 90996.0, 59324.0, 38161.0, 24632.0, 16477.0, 10743.0, 7351.0, 4982.0, 3485.0, 2310.0, 1588.0, 1122.0, 745.0, 522.0, 351.0, 252.0, 171.0, 103.0, 94.0, 48.0, 27.0, 20.0, 17.0, 10.0, 9.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.3125, -2.238677978515625, -2.16485595703125, -2.091033935546875, -2.0172119140625, -1.943389892578125, -1.86956787109375, -1.795745849609375, -1.721923828125, -1.648101806640625, -1.57427978515625, -1.500457763671875, -1.4266357421875, -1.352813720703125, -1.27899169921875, -1.205169677734375, -1.13134765625, -1.057525634765625, -0.98370361328125, -0.909881591796875, -0.8360595703125, -0.762237548828125, -0.68841552734375, -0.614593505859375, -0.540771484375, -0.466949462890625, -0.39312744140625, -0.319305419921875, -0.2454833984375, -0.171661376953125, -0.09783935546875, -0.024017333984375, 0.0498046875, 0.123626708984375, 0.19744873046875, 0.271270751953125, 0.3450927734375, 0.418914794921875, 0.49273681640625, 0.566558837890625, 0.640380859375, 0.714202880859375, 0.78802490234375, 0.861846923828125, 0.9356689453125, 1.009490966796875, 1.08331298828125, 1.157135009765625, 1.23095703125, 1.304779052734375, 1.37860107421875, 1.452423095703125, 1.5262451171875, 1.600067138671875, 1.67388916015625, 1.747711181640625, 1.821533203125, 1.895355224609375, 1.96917724609375, 2.042999267578125, 2.1168212890625, 2.190643310546875, 2.26446533203125, 2.338287353515625, 2.412109375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 7.0, 5.0, 4.0, 12.0, 8.0, 16.0, 17.0, 16.0, 21.0, 18.0, 21.0, 20.0, 20.0, 33.0, 37.0, 30.0, 39.0, 26.0, 37.0, 44.0, 56.0, 39.0, 44.0, 41.0, 38.0, 32.0, 37.0, 37.0, 23.0, 38.0, 14.0, 16.0, 22.0, 22.0, 20.0, 22.0, 13.0, 10.0, 9.0, 13.0, 5.0, 6.0, 6.0, 1.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.046875, -20.431396484375, -19.81591796875, -19.200439453125, -18.5849609375, -17.969482421875, -17.35400390625, -16.738525390625, -16.123046875, -15.507568359375, -14.89208984375, -14.276611328125, -13.6611328125, -13.045654296875, -12.43017578125, -11.814697265625, -11.19921875, -10.583740234375, -9.96826171875, -9.352783203125, -8.7373046875, -8.121826171875, -7.50634765625, -6.890869140625, -6.275390625, -5.659912109375, -5.04443359375, -4.428955078125, -3.8134765625, -3.197998046875, -2.58251953125, -1.967041015625, -1.3515625, -0.736083984375, -0.12060546875, 0.494873046875, 1.1103515625, 1.725830078125, 2.34130859375, 2.956787109375, 3.572265625, 4.187744140625, 4.80322265625, 5.418701171875, 6.0341796875, 6.649658203125, 7.26513671875, 7.880615234375, 8.49609375, 9.111572265625, 9.72705078125, 10.342529296875, 10.9580078125, 11.573486328125, 12.18896484375, 12.804443359375, 13.419921875, 14.035400390625, 14.65087890625, 15.266357421875, 15.8818359375, 16.497314453125, 17.11279296875, 17.728271484375, 18.34375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 1.0, 9.0, 13.0, 28.0, 42.0, 51.0, 63.0, 113.0, 164.0, 225.0, 352.0, 607.0, 920.0, 1338.0, 2110.0, 3433.0, 5519.0, 9040.0, 14921.0, 25574.0, 43618.0, 76024.0, 137393.0, 232075.0, 212982.0, 120347.0, 66572.0, 38359.0, 22126.0, 13249.0, 8160.0, 4809.0, 3019.0, 1899.0, 1142.0, 750.0, 543.0, 333.0, 206.0, 128.0, 94.0, 67.0, 40.0, 28.0, 22.0, 21.0, 6.0, 8.0, 5.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0], "bins": [-3.181640625, -3.08489990234375, -2.9881591796875, -2.89141845703125, -2.794677734375, -2.69793701171875, -2.6011962890625, -2.50445556640625, -2.40771484375, -2.31097412109375, -2.2142333984375, -2.11749267578125, -2.020751953125, -1.92401123046875, -1.8272705078125, -1.73052978515625, -1.6337890625, -1.53704833984375, -1.4403076171875, -1.34356689453125, -1.246826171875, -1.15008544921875, -1.0533447265625, -0.95660400390625, -0.85986328125, -0.76312255859375, -0.6663818359375, -0.56964111328125, -0.472900390625, -0.37615966796875, -0.2794189453125, -0.18267822265625, -0.0859375, 0.01080322265625, 0.1075439453125, 0.20428466796875, 0.301025390625, 0.39776611328125, 0.4945068359375, 0.59124755859375, 0.68798828125, 0.78472900390625, 0.8814697265625, 0.97821044921875, 1.074951171875, 1.17169189453125, 1.2684326171875, 1.36517333984375, 1.4619140625, 1.55865478515625, 1.6553955078125, 1.75213623046875, 1.848876953125, 1.94561767578125, 2.0423583984375, 2.13909912109375, 2.23583984375, 2.33258056640625, 2.4293212890625, 2.52606201171875, 2.622802734375, 2.71954345703125, 2.8162841796875, 2.91302490234375, 3.009765625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 6.0, 1.0, 5.0, 3.0, 10.0, 5.0, 12.0, 12.0, 16.0, 12.0, 14.0, 16.0, 21.0, 20.0, 20.0, 27.0, 31.0, 20.0, 38.0, 33.0, 41.0, 33.0, 41.0, 28.0, 35.0, 48.0, 40.0, 29.0, 30.0, 35.0, 37.0, 32.0, 29.0, 21.0, 31.0, 27.0, 22.0, 26.0, 18.0, 21.0, 12.0, 8.0, 13.0, 10.0, 5.0, 6.0, 3.0, 6.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6015625, -10.2242431640625, -9.846923828125, -9.4696044921875, -9.09228515625, -8.7149658203125, -8.337646484375, -7.9603271484375, -7.5830078125, -7.2056884765625, -6.828369140625, -6.4510498046875, -6.07373046875, -5.6964111328125, -5.319091796875, -4.9417724609375, -4.564453125, -4.1871337890625, -3.809814453125, -3.4324951171875, -3.05517578125, -2.6778564453125, -2.300537109375, -1.9232177734375, -1.5458984375, -1.1685791015625, -0.791259765625, -0.4139404296875, -0.03662109375, 0.3406982421875, 0.718017578125, 1.0953369140625, 1.47265625, 1.8499755859375, 2.227294921875, 2.6046142578125, 2.98193359375, 3.3592529296875, 3.736572265625, 4.1138916015625, 4.4912109375, 4.8685302734375, 5.245849609375, 5.6231689453125, 6.00048828125, 6.3778076171875, 6.755126953125, 7.1324462890625, 7.509765625, 7.8870849609375, 8.264404296875, 8.6417236328125, 9.01904296875, 9.3963623046875, 9.773681640625, 10.1510009765625, 10.5283203125, 10.9056396484375, 11.282958984375, 11.6602783203125, 12.03759765625, 12.4149169921875, 12.792236328125, 13.1695556640625, 13.546875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 10.0, 9.0, 15.0, 21.0, 24.0, 60.0, 55.0, 98.0, 144.0, 211.0, 330.0, 422.0, 668.0, 935.0, 1532.0, 2300.0, 3428.0, 5389.0, 8404.0, 13644.0, 22396.0, 38778.0, 69390.0, 138046.0, 267301.0, 224461.0, 109483.0, 57047.0, 31986.0, 19200.0, 11887.0, 7275.0, 4595.0, 3012.0, 1953.0, 1354.0, 823.0, 565.0, 420.0, 254.0, 198.0, 148.0, 96.0, 58.0, 37.0, 21.0, 19.0, 16.0, 17.0, 9.0, 10.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.08367919921875, -0.08105087280273438, -0.07842254638671875, -0.07579421997070312, -0.0731658935546875, -0.07053756713867188, -0.06790924072265625, -0.06528091430664062, -0.062652587890625, -0.060024261474609375, -0.05739593505859375, -0.054767608642578125, -0.0521392822265625, -0.049510955810546875, -0.04688262939453125, -0.044254302978515625, -0.0416259765625, -0.038997650146484375, -0.03636932373046875, -0.033740997314453125, -0.0311126708984375, -0.028484344482421875, -0.02585601806640625, -0.023227691650390625, -0.020599365234375, -0.017971038818359375, -0.01534271240234375, -0.012714385986328125, -0.0100860595703125, -0.007457733154296875, -0.00482940673828125, -0.002201080322265625, 0.00042724609375, 0.003055572509765625, 0.00568389892578125, 0.008312225341796875, 0.0109405517578125, 0.013568878173828125, 0.01619720458984375, 0.018825531005859375, 0.021453857421875, 0.024082183837890625, 0.02671051025390625, 0.029338836669921875, 0.0319671630859375, 0.034595489501953125, 0.03722381591796875, 0.039852142333984375, 0.04248046875, 0.045108795166015625, 0.04773712158203125, 0.050365447998046875, 0.0529937744140625, 0.055622100830078125, 0.05825042724609375, 0.060878753662109375, 0.063507080078125, 0.06613540649414062, 0.06876373291015625, 0.07139205932617188, 0.0740203857421875, 0.07664871215820312, 0.07927703857421875, 0.08190536499023438, 0.08453369140625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 6.0, 4.0, 6.0, 8.0, 9.0, 9.0, 17.0, 19.0, 21.0, 14.0, 19.0, 23.0, 39.0, 22.0, 32.0, 38.0, 46.0, 36.0, 40.0, 37.0, 43.0, 42.0, 50.0, 53.0, 35.0, 25.0, 41.0, 34.0, 26.0, 27.0, 24.0, 31.0, 22.0, 17.0, 18.0, 18.0, 15.0, 10.0, 8.0, 6.0, 3.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.4781951904296875e-05, -1.4321878552436829e-05, -1.3861805200576782e-05, -1.3401731848716736e-05, -1.294165849685669e-05, -1.2481585144996643e-05, -1.2021511793136597e-05, -1.156143844127655e-05, -1.1101365089416504e-05, -1.0641291737556458e-05, -1.0181218385696411e-05, -9.721145033836365e-06, -9.261071681976318e-06, -8.800998330116272e-06, -8.340924978256226e-06, -7.88085162639618e-06, -7.420778274536133e-06, -6.9607049226760864e-06, -6.50063157081604e-06, -6.040558218955994e-06, -5.580484867095947e-06, -5.120411515235901e-06, -4.6603381633758545e-06, -4.200264811515808e-06, -3.7401914596557617e-06, -3.2801181077957153e-06, -2.820044755935669e-06, -2.3599714040756226e-06, -1.8998980522155762e-06, -1.4398247003555298e-06, -9.797513484954834e-07, -5.19677996635437e-07, -5.960464477539063e-08, 4.0046870708465576e-07, 8.605420589447021e-07, 1.3206154108047485e-06, 1.780688762664795e-06, 2.2407621145248413e-06, 2.7008354663848877e-06, 3.160908818244934e-06, 3.6209821701049805e-06, 4.081055521965027e-06, 4.541128873825073e-06, 5.00120222568512e-06, 5.461275577545166e-06, 5.921348929405212e-06, 6.381422281265259e-06, 6.841495633125305e-06, 7.3015689849853516e-06, 7.761642336845398e-06, 8.221715688705444e-06, 8.68178904056549e-06, 9.141862392425537e-06, 9.601935744285583e-06, 1.006200909614563e-05, 1.0522082448005676e-05, 1.0982155799865723e-05, 1.1442229151725769e-05, 1.1902302503585815e-05, 1.2362375855445862e-05, 1.2822449207305908e-05, 1.3282522559165955e-05, 1.3742595911026001e-05, 1.4202669262886047e-05, 1.4662742614746094e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 3.0, 9.0, 5.0, 13.0, 28.0, 40.0, 64.0, 75.0, 121.0, 201.0, 338.0, 383.0, 696.0, 921.0, 1449.0, 2229.0, 3361.0, 5106.0, 7990.0, 12269.0, 19521.0, 32115.0, 54967.0, 100658.0, 207228.0, 279572.0, 138500.0, 72217.0, 40975.0, 24204.0, 15258.0, 9773.0, 6184.0, 4137.0, 2635.0, 1813.0, 1174.0, 718.0, 550.0, 347.0, 247.0, 145.0, 116.0, 65.0, 44.0, 33.0, 21.0, 12.0, 12.0, 3.0, 3.0, 3.0, 2.0, 3.0, 0.0, 4.0, 1.0], "bins": [-0.203369140625, -0.19705963134765625, -0.1907501220703125, -0.18444061279296875, -0.178131103515625, -0.17182159423828125, -0.1655120849609375, -0.15920257568359375, -0.15289306640625, -0.14658355712890625, -0.1402740478515625, -0.13396453857421875, -0.127655029296875, -0.12134552001953125, -0.1150360107421875, -0.10872650146484375, -0.1024169921875, -0.09610748291015625, -0.0897979736328125, -0.08348846435546875, -0.077178955078125, -0.07086944580078125, -0.0645599365234375, -0.05825042724609375, -0.05194091796875, -0.04563140869140625, -0.0393218994140625, -0.03301239013671875, -0.026702880859375, -0.02039337158203125, -0.0140838623046875, -0.00777435302734375, -0.00146484375, 0.00484466552734375, 0.0111541748046875, 0.01746368408203125, 0.023773193359375, 0.03008270263671875, 0.0363922119140625, 0.04270172119140625, 0.04901123046875, 0.05532073974609375, 0.0616302490234375, 0.06793975830078125, 0.074249267578125, 0.08055877685546875, 0.0868682861328125, 0.09317779541015625, 0.0994873046875, 0.10579681396484375, 0.1121063232421875, 0.11841583251953125, 0.124725341796875, 0.13103485107421875, 0.1373443603515625, 0.14365386962890625, 0.14996337890625, 0.15627288818359375, 0.1625823974609375, 0.16889190673828125, 0.175201416015625, 0.18151092529296875, 0.1878204345703125, 0.19412994384765625, 0.200439453125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 9.0, 13.0, 25.0, 19.0, 28.0, 43.0, 50.0, 73.0, 145.0, 216.0, 113.0, 93.0, 59.0, 35.0, 19.0, 21.0, 13.0, 11.0, 6.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11419677734375, -0.1098623275756836, -0.10552787780761719, -0.10119342803955078, -0.09685897827148438, -0.09252452850341797, -0.08819007873535156, -0.08385562896728516, -0.07952117919921875, -0.07518672943115234, -0.07085227966308594, -0.06651782989501953, -0.062183380126953125, -0.05784893035888672, -0.05351448059082031, -0.049180030822753906, -0.0448455810546875, -0.040511131286621094, -0.03617668151855469, -0.03184223175048828, -0.027507781982421875, -0.02317333221435547, -0.018838882446289062, -0.014504432678222656, -0.01016998291015625, -0.005835533142089844, -0.0015010833740234375, 0.0028333663940429688, 0.007167816162109375, 0.011502265930175781, 0.015836715698242188, 0.020171165466308594, 0.024505615234375, 0.028840065002441406, 0.03317451477050781, 0.03750896453857422, 0.041843414306640625, 0.04617786407470703, 0.05051231384277344, 0.054846763610839844, 0.05918121337890625, 0.06351566314697266, 0.06785011291503906, 0.07218456268310547, 0.07651901245117188, 0.08085346221923828, 0.08518791198730469, 0.0895223617553711, 0.0938568115234375, 0.0981912612915039, 0.10252571105957031, 0.10686016082763672, 0.11119461059570312, 0.11552906036376953, 0.11986351013183594, 0.12419795989990234, 0.12853240966796875, 0.13286685943603516, 0.13720130920410156, 0.14153575897216797, 0.14587020874023438, 0.15020465850830078, 0.1545391082763672, 0.1588735580444336, 0.1632080078125]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 8.0, 10.0, 5.0, 7.0, 12.0, 14.0, 25.0, 14.0, 25.0, 20.0, 32.0, 38.0, 46.0, 43.0, 55.0, 57.0, 48.0, 52.0, 40.0, 42.0, 46.0, 36.0, 44.0, 46.0, 33.0, 33.0, 26.0, 24.0, 26.0, 17.0, 12.0, 13.0, 9.0, 6.0, 8.0, 7.0, 4.0, 2.0, 11.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.52010726928711, -13.925849914550781, -13.331592559814453, -12.737336158752441, -12.143078804016113, -11.548821449279785, -10.954565048217773, -10.360307693481445, -9.766050338745117, -9.171792984008789, -8.577535629272461, -7.983279228210449, -7.389021873474121, -6.794764518737793, -6.200507640838623, -5.606250762939453, -5.011993408203125, -4.417736053466797, -3.823479175567627, -3.229222059249878, -2.634964942932129, -2.04070782661438, -1.4464507102966309, -0.8521938323974609, -0.2579364776611328, 0.3363206386566162, 0.9305777549743652, 1.5248348712921143, 2.1190919876098633, 2.7133491039276123, 3.3076062202453613, 3.9018630981445312, 4.496120452880859, 5.0903778076171875, 5.684634685516357, 6.278891563415527, 6.8731489181518555, 7.467406272888184, 8.061662673950195, 8.655920028686523, 9.250177383422852, 9.84443473815918, 10.438692092895508, 11.03294849395752, 11.627205848693848, 12.221463203430176, 12.815719604492188, 13.409976959228516, 14.004234313964844, 14.598491668701172, 15.1927490234375, 15.787005424499512, 16.381263732910156, 16.97551918029785, 17.56977653503418, 18.164033889770508, 18.758291244506836, 19.352548599243164, 19.946805953979492, 20.54106330871582, 21.135318756103516, 21.729576110839844, 22.323833465576172, 22.9180908203125, 23.512348175048828]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 2.0, 6.0, 6.0, 13.0, 3.0, 5.0, 8.0, 9.0, 14.0, 7.0, 23.0, 16.0, 26.0, 27.0, 20.0, 18.0, 36.0, 39.0, 27.0, 33.0, 35.0, 44.0, 39.0, 40.0, 36.0, 39.0, 35.0, 47.0, 36.0, 37.0, 27.0, 32.0, 25.0, 29.0, 15.0, 18.0, 17.0, 17.0, 16.0, 13.0, 15.0, 13.0, 9.0, 10.0, 12.0, 1.0, 4.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-18.767269134521484, -18.201866149902344, -17.636463165283203, -17.071060180664062, -16.505657196044922, -15.940254211425781, -15.37485122680664, -14.8094482421875, -14.24404525756836, -13.678642272949219, -13.113239288330078, -12.547836303710938, -11.982433319091797, -11.417030334472656, -10.851627349853516, -10.286224365234375, -9.720821380615234, -9.155418395996094, -8.590015411376953, -8.024612426757812, -7.459209442138672, -6.893806457519531, -6.328403472900391, -5.76300048828125, -5.197597503662109, -4.632194519042969, -4.066791534423828, -3.5013885498046875, -2.935985565185547, -2.3705825805664062, -1.8051795959472656, -1.239776611328125, -0.6743717193603516, -0.10896873474121094, 0.4564342498779297, 1.0218372344970703, 1.587240219116211, 2.1526432037353516, 2.718046188354492, 3.283449172973633, 3.8488521575927734, 4.414255142211914, 4.979658126831055, 5.545061111450195, 6.110464096069336, 6.675867080688477, 7.241270065307617, 7.806673049926758, 8.372076034545898, 8.937479019165039, 9.50288200378418, 10.06828498840332, 10.633687973022461, 11.199090957641602, 11.764493942260742, 12.329896926879883, 12.895299911499023, 13.460702896118164, 14.026105880737305, 14.591508865356445, 15.156911849975586, 15.722314834594727, 16.287717819213867, 16.853120803833008, 17.41852378845215]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 9.0, 2.0, 13.0, 20.0, 20.0, 63.0, 81.0, 126.0, 201.0, 291.0, 451.0, 730.0, 1119.0, 1842.0, 2843.0, 4440.0, 6764.0, 10286.0, 15381.0, 21942.0, 30911.0, 42621.0, 55021.0, 70343.0, 83260.0, 93571.0, 98372.0, 98063.0, 90277.0, 78822.0, 65236.0, 51410.0, 38328.0, 27369.0, 19691.0, 13159.0, 9023.0, 5951.0, 3802.0, 2446.0, 1540.0, 970.0, 621.0, 400.0, 269.0, 153.0, 119.0, 78.0, 35.0, 30.0, 17.0, 16.0, 11.0, 3.0, 4.0, 2.0, 1.0, 1.0], "bins": [-10.484375, -10.1650390625, -9.845703125, -9.5263671875, -9.20703125, -8.8876953125, -8.568359375, -8.2490234375, -7.9296875, -7.6103515625, -7.291015625, -6.9716796875, -6.65234375, -6.3330078125, -6.013671875, -5.6943359375, -5.375, -5.0556640625, -4.736328125, -4.4169921875, -4.09765625, -3.7783203125, -3.458984375, -3.1396484375, -2.8203125, -2.5009765625, -2.181640625, -1.8623046875, -1.54296875, -1.2236328125, -0.904296875, -0.5849609375, -0.265625, 0.0537109375, 0.373046875, 0.6923828125, 1.01171875, 1.3310546875, 1.650390625, 1.9697265625, 2.2890625, 2.6083984375, 2.927734375, 3.2470703125, 3.56640625, 3.8857421875, 4.205078125, 4.5244140625, 4.84375, 5.1630859375, 5.482421875, 5.8017578125, 6.12109375, 6.4404296875, 6.759765625, 7.0791015625, 7.3984375, 7.7177734375, 8.037109375, 8.3564453125, 8.67578125, 8.9951171875, 9.314453125, 9.6337890625, 9.953125]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 4.0, 3.0, 4.0, 11.0, 6.0, 8.0, 8.0, 5.0, 11.0, 15.0, 17.0, 14.0, 22.0, 25.0, 20.0, 22.0, 20.0, 29.0, 36.0, 34.0, 41.0, 32.0, 46.0, 42.0, 40.0, 32.0, 30.0, 32.0, 32.0, 38.0, 43.0, 34.0, 21.0, 24.0, 23.0, 22.0, 22.0, 18.0, 20.0, 16.0, 9.0, 17.0, 11.0, 6.0, 9.0, 9.0, 5.0, 2.0, 7.0, 3.0, 5.0, 1.0, 0.0, 2.0, 3.0], "bins": [-18.390625, -17.84912109375, -17.3076171875, -16.76611328125, -16.224609375, -15.68310546875, -15.1416015625, -14.60009765625, -14.05859375, -13.51708984375, -12.9755859375, -12.43408203125, -11.892578125, -11.35107421875, -10.8095703125, -10.26806640625, -9.7265625, -9.18505859375, -8.6435546875, -8.10205078125, -7.560546875, -7.01904296875, -6.4775390625, -5.93603515625, -5.39453125, -4.85302734375, -4.3115234375, -3.77001953125, -3.228515625, -2.68701171875, -2.1455078125, -1.60400390625, -1.0625, -0.52099609375, 0.0205078125, 0.56201171875, 1.103515625, 1.64501953125, 2.1865234375, 2.72802734375, 3.26953125, 3.81103515625, 4.3525390625, 4.89404296875, 5.435546875, 5.97705078125, 6.5185546875, 7.06005859375, 7.6015625, 8.14306640625, 8.6845703125, 9.22607421875, 9.767578125, 10.30908203125, 10.8505859375, 11.39208984375, 11.93359375, 12.47509765625, 13.0166015625, 13.55810546875, 14.099609375, 14.64111328125, 15.1826171875, 15.72412109375, 16.265625]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 6.0, 18.0, 27.0, 39.0, 58.0, 101.0, 173.0, 310.0, 490.0, 686.0, 1150.0, 1822.0, 3035.0, 4596.0, 7157.0, 10822.0, 16594.0, 23969.0, 34041.0, 46287.0, 60896.0, 75471.0, 88809.0, 98227.0, 101202.0, 98220.0, 88569.0, 75385.0, 59985.0, 46066.0, 34056.0, 23658.0, 16248.0, 10994.0, 7110.0, 4550.0, 2907.0, 1829.0, 1124.0, 738.0, 419.0, 273.0, 177.0, 95.0, 75.0, 30.0, 22.0, 17.0, 13.0, 9.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-10.6640625, -10.3358154296875, -10.007568359375, -9.6793212890625, -9.35107421875, -9.0228271484375, -8.694580078125, -8.3663330078125, -8.0380859375, -7.7098388671875, -7.381591796875, -7.0533447265625, -6.72509765625, -6.3968505859375, -6.068603515625, -5.7403564453125, -5.412109375, -5.0838623046875, -4.755615234375, -4.4273681640625, -4.09912109375, -3.7708740234375, -3.442626953125, -3.1143798828125, -2.7861328125, -2.4578857421875, -2.129638671875, -1.8013916015625, -1.47314453125, -1.1448974609375, -0.816650390625, -0.4884033203125, -0.16015625, 0.1680908203125, 0.496337890625, 0.8245849609375, 1.15283203125, 1.4810791015625, 1.809326171875, 2.1375732421875, 2.4658203125, 2.7940673828125, 3.122314453125, 3.4505615234375, 3.77880859375, 4.1070556640625, 4.435302734375, 4.7635498046875, 5.091796875, 5.4200439453125, 5.748291015625, 6.0765380859375, 6.40478515625, 6.7330322265625, 7.061279296875, 7.3895263671875, 7.7177734375, 8.0460205078125, 8.374267578125, 8.7025146484375, 9.03076171875, 9.3590087890625, 9.687255859375, 10.0155029296875, 10.34375]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 3.0, 5.0, 8.0, 13.0, 11.0, 3.0, 11.0, 12.0, 16.0, 13.0, 20.0, 34.0, 27.0, 27.0, 33.0, 27.0, 30.0, 25.0, 41.0, 53.0, 40.0, 30.0, 51.0, 33.0, 34.0, 44.0, 30.0, 32.0, 36.0, 31.0, 29.0, 25.0, 28.0, 29.0, 22.0, 21.0, 17.0, 13.0, 6.0, 12.0, 3.0, 2.0, 6.0, 3.0, 4.0, 5.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.8671875, -11.5081787109375, -11.149169921875, -10.7901611328125, -10.43115234375, -10.0721435546875, -9.713134765625, -9.3541259765625, -8.9951171875, -8.6361083984375, -8.277099609375, -7.9180908203125, -7.55908203125, -7.2000732421875, -6.841064453125, -6.4820556640625, -6.123046875, -5.7640380859375, -5.405029296875, -5.0460205078125, -4.68701171875, -4.3280029296875, -3.968994140625, -3.6099853515625, -3.2509765625, -2.8919677734375, -2.532958984375, -2.1739501953125, -1.81494140625, -1.4559326171875, -1.096923828125, -0.7379150390625, -0.37890625, -0.0198974609375, 0.339111328125, 0.6981201171875, 1.05712890625, 1.4161376953125, 1.775146484375, 2.1341552734375, 2.4931640625, 2.8521728515625, 3.211181640625, 3.5701904296875, 3.92919921875, 4.2882080078125, 4.647216796875, 5.0062255859375, 5.365234375, 5.7242431640625, 6.083251953125, 6.4422607421875, 6.80126953125, 7.1602783203125, 7.519287109375, 7.8782958984375, 8.2373046875, 8.5963134765625, 8.955322265625, 9.3143310546875, 9.67333984375, 10.0323486328125, 10.391357421875, 10.7503662109375, 11.109375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 8.0, 4.0, 8.0, 14.0, 23.0, 31.0, 55.0, 88.0, 155.0, 226.0, 344.0, 621.0, 931.0, 1542.0, 2459.0, 3972.0, 6268.0, 9960.0, 15486.0, 23603.0, 35334.0, 49379.0, 67093.0, 86047.0, 101193.0, 110376.0, 111759.0, 102912.0, 88361.0, 70206.0, 52255.0, 37143.0, 25219.0, 16900.0, 10592.0, 6730.0, 4268.0, 2620.0, 1637.0, 1024.0, 675.0, 421.0, 232.0, 151.0, 96.0, 60.0, 31.0, 14.0, 14.0, 11.0, 7.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.572265625, -3.460906982421875, -3.34954833984375, -3.238189697265625, -3.1268310546875, -3.015472412109375, -2.90411376953125, -2.792755126953125, -2.681396484375, -2.570037841796875, -2.45867919921875, -2.347320556640625, -2.2359619140625, -2.124603271484375, -2.01324462890625, -1.901885986328125, -1.79052734375, -1.679168701171875, -1.56781005859375, -1.456451416015625, -1.3450927734375, -1.233734130859375, -1.12237548828125, -1.011016845703125, -0.899658203125, -0.788299560546875, -0.67694091796875, -0.565582275390625, -0.4542236328125, -0.342864990234375, -0.23150634765625, -0.120147705078125, -0.0087890625, 0.102569580078125, 0.21392822265625, 0.325286865234375, 0.4366455078125, 0.548004150390625, 0.65936279296875, 0.770721435546875, 0.882080078125, 0.993438720703125, 1.10479736328125, 1.216156005859375, 1.3275146484375, 1.438873291015625, 1.55023193359375, 1.661590576171875, 1.77294921875, 1.884307861328125, 1.99566650390625, 2.107025146484375, 2.2183837890625, 2.329742431640625, 2.44110107421875, 2.552459716796875, 2.663818359375, 2.775177001953125, 2.88653564453125, 2.997894287109375, 3.1092529296875, 3.220611572265625, 3.33197021484375, 3.443328857421875, 3.5546875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 7.0, 4.0, 10.0, 10.0, 16.0, 16.0, 20.0, 26.0, 23.0, 39.0, 28.0, 37.0, 35.0, 40.0, 39.0, 49.0, 51.0, 47.0, 45.0, 48.0, 59.0, 51.0, 36.0, 35.0, 37.0, 29.0, 23.0, 26.0, 24.0, 16.0, 16.0, 12.0, 9.0, 11.0, 11.0, 6.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003979206085205078, -0.00038371607661247253, -0.00036951154470443726, -0.000355307012796402, -0.0003411024808883667, -0.0003268979489803314, -0.00031269341707229614, -0.00029848888516426086, -0.0002842843532562256, -0.0002700798213481903, -0.00025587528944015503, -0.00024167075753211975, -0.00022746622562408447, -0.0002132616937160492, -0.00019905716180801392, -0.00018485262989997864, -0.00017064809799194336, -0.00015644356608390808, -0.0001422390341758728, -0.00012803450226783752, -0.00011382997035980225, -9.962543845176697e-05, -8.542090654373169e-05, -7.121637463569641e-05, -5.701184272766113e-05, -4.2807310819625854e-05, -2.8602778911590576e-05, -1.4398247003555298e-05, -1.9371509552001953e-07, 1.4010816812515259e-05, 2.8215348720550537e-05, 4.2419880628585815e-05, 5.6624412536621094e-05, 7.082894444465637e-05, 8.503347635269165e-05, 9.923800826072693e-05, 0.00011344254016876221, 0.00012764707207679749, 0.00014185160398483276, 0.00015605613589286804, 0.00017026066780090332, 0.0001844651997089386, 0.00019866973161697388, 0.00021287426352500916, 0.00022707879543304443, 0.0002412833273410797, 0.000255487859249115, 0.00026969239115715027, 0.00028389692306518555, 0.0002981014549732208, 0.0003123059868812561, 0.0003265105187892914, 0.00034071505069732666, 0.00035491958260536194, 0.0003691241145133972, 0.0003833286464214325, 0.0003975331783294678, 0.00041173771023750305, 0.00042594224214553833, 0.0004401467740535736, 0.0004543513059616089, 0.00046855583786964417, 0.00048276036977767944, 0.0004969649016857147, 0.00051116943359375]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 6.0, 13.0, 16.0, 27.0, 33.0, 48.0, 91.0, 128.0, 222.0, 372.0, 573.0, 986.0, 1723.0, 2696.0, 4637.0, 7698.0, 12472.0, 20458.0, 32586.0, 49202.0, 70533.0, 94589.0, 115004.0, 126618.0, 124788.0, 110599.0, 88685.0, 64330.0, 44211.0, 29014.0, 18370.0, 11150.0, 6649.0, 3982.0, 2328.0, 1483.0, 871.0, 535.0, 324.0, 220.0, 101.0, 67.0, 47.0, 28.0, 21.0, 6.0, 4.0, 6.0, 2.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.33984375, -4.20367431640625, -4.0675048828125, -3.93133544921875, -3.795166015625, -3.65899658203125, -3.5228271484375, -3.38665771484375, -3.25048828125, -3.11431884765625, -2.9781494140625, -2.84197998046875, -2.705810546875, -2.56964111328125, -2.4334716796875, -2.29730224609375, -2.1611328125, -2.02496337890625, -1.8887939453125, -1.75262451171875, -1.616455078125, -1.48028564453125, -1.3441162109375, -1.20794677734375, -1.07177734375, -0.93560791015625, -0.7994384765625, -0.66326904296875, -0.527099609375, -0.39093017578125, -0.2547607421875, -0.11859130859375, 0.017578125, 0.15374755859375, 0.2899169921875, 0.42608642578125, 0.562255859375, 0.69842529296875, 0.8345947265625, 0.97076416015625, 1.10693359375, 1.24310302734375, 1.3792724609375, 1.51544189453125, 1.651611328125, 1.78778076171875, 1.9239501953125, 2.06011962890625, 2.1962890625, 2.33245849609375, 2.4686279296875, 2.60479736328125, 2.740966796875, 2.87713623046875, 3.0133056640625, 3.14947509765625, 3.28564453125, 3.42181396484375, 3.5579833984375, 3.69415283203125, 3.830322265625, 3.96649169921875, 4.1026611328125, 4.23883056640625, 4.375]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 3.0, 10.0, 7.0, 2.0, 9.0, 12.0, 11.0, 13.0, 12.0, 23.0, 32.0, 31.0, 49.0, 32.0, 27.0, 38.0, 52.0, 44.0, 56.0, 55.0, 47.0, 47.0, 31.0, 44.0, 41.0, 39.0, 28.0, 28.0, 38.0, 26.0, 27.0, 10.0, 14.0, 11.0, 13.0, 9.0, 8.0, 5.0, 6.0, 6.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.8212890625, -1.7668914794921875, -1.712493896484375, -1.6580963134765625, -1.60369873046875, -1.5493011474609375, -1.494903564453125, -1.4405059814453125, -1.3861083984375, -1.3317108154296875, -1.277313232421875, -1.2229156494140625, -1.16851806640625, -1.1141204833984375, -1.059722900390625, -1.0053253173828125, -0.950927734375, -0.8965301513671875, -0.842132568359375, -0.7877349853515625, -0.73333740234375, -0.6789398193359375, -0.624542236328125, -0.5701446533203125, -0.5157470703125, -0.4613494873046875, -0.406951904296875, -0.3525543212890625, -0.29815673828125, -0.2437591552734375, -0.189361572265625, -0.1349639892578125, -0.08056640625, -0.0261688232421875, 0.028228759765625, 0.0826263427734375, 0.13702392578125, 0.1914215087890625, 0.245819091796875, 0.3002166748046875, 0.3546142578125, 0.4090118408203125, 0.463409423828125, 0.5178070068359375, 0.57220458984375, 0.6266021728515625, 0.680999755859375, 0.7353973388671875, 0.789794921875, 0.8441925048828125, 0.898590087890625, 0.9529876708984375, 1.00738525390625, 1.0617828369140625, 1.116180419921875, 1.1705780029296875, 1.2249755859375, 1.2793731689453125, 1.333770751953125, 1.3881683349609375, 1.44256591796875, 1.4969635009765625, 1.551361083984375, 1.6057586669921875, 1.66015625]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 6.0, 1.0, 7.0, 3.0, 5.0, 7.0, 10.0, 17.0, 14.0, 28.0, 22.0, 26.0, 20.0, 32.0, 34.0, 59.0, 47.0, 49.0, 49.0, 38.0, 52.0, 34.0, 50.0, 46.0, 48.0, 45.0, 41.0, 24.0, 24.0, 36.0, 22.0, 19.0, 16.0, 11.0, 14.0, 16.0, 5.0, 7.0, 6.0, 2.0, 4.0, 8.0, 4.0, 1.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.756897926330566, -13.184160232543945, -12.61142349243164, -12.03868579864502, -11.465949058532715, -10.893211364746094, -10.320474624633789, -9.747736930847168, -9.174999237060547, -8.602261543273926, -8.029524803161621, -7.456787109375, -6.884050369262695, -6.311312675476074, -5.738575458526611, -5.165838241577148, -4.593101501464844, -4.020364284515381, -3.447627067565918, -2.874889612197876, -2.302152395248413, -1.7294151782989502, -1.1566777229309082, -0.5839405059814453, -0.011203289031982422, 0.5615339875221252, 1.134271264076233, 1.7070086002349854, 2.2797458171844482, 2.852483034133911, 3.425220489501953, 3.997957706451416, 4.570695877075195, 5.143433094024658, 5.716170310974121, 6.288908004760742, 6.861644744873047, 7.434382438659668, 8.007120132446289, 8.579856872558594, 9.152593612670898, 9.72533130645752, 10.298068046569824, 10.870805740356445, 11.44354248046875, 12.016280174255371, 12.589017868041992, 13.161754608154297, 13.734492301940918, 14.307229995727539, 14.879966735839844, 15.452704429626465, 16.025442123413086, 16.59817886352539, 17.170915603637695, 17.74365234375, 18.316390991210938, 18.889127731323242, 19.46186637878418, 20.034603118896484, 20.60733985900879, 21.180076599121094, 21.75281524658203, 22.325551986694336, 22.89828872680664]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 2.0, 6.0, 9.0, 9.0, 13.0, 7.0, 11.0, 16.0, 13.0, 25.0, 21.0, 33.0, 28.0, 37.0, 48.0, 41.0, 43.0, 42.0, 39.0, 46.0, 44.0, 53.0, 50.0, 32.0, 39.0, 45.0, 21.0, 41.0, 29.0, 28.0, 22.0, 14.0, 15.0, 16.0, 15.0, 7.0, 8.0, 9.0, 4.0, 7.0, 5.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.40592384338379, -21.72707176208496, -21.048219680786133, -20.369367599487305, -19.690515518188477, -19.01166343688965, -18.33281135559082, -17.653959274291992, -16.975107192993164, -16.296255111694336, -15.617403030395508, -14.93855094909668, -14.259698867797852, -13.580846786499023, -12.901994705200195, -12.223142623901367, -11.544291496276855, -10.865439414978027, -10.1865873336792, -9.507735252380371, -8.828883171081543, -8.150031089782715, -7.471179485321045, -6.792327404022217, -6.113475322723389, -5.4346232414245605, -4.755771160125732, -4.0769195556640625, -3.3980672359466553, -2.719215154647827, -2.040363311767578, -1.36151123046875, -0.6826591491699219, -0.0038071274757385254, 0.6750448942184448, 1.3538968563079834, 2.0327489376068115, 2.7116010189056396, 3.3904528617858887, 4.069304943084717, 4.748157024383545, 5.427009105682373, 6.105861186981201, 6.784712791442871, 7.463564872741699, 8.142416954040527, 8.821269035339355, 9.500121116638184, 10.178973197937012, 10.85782527923584, 11.536677360534668, 12.215529441833496, 12.894381523132324, 13.573233604431152, 14.252084732055664, 14.930936813354492, 15.60978889465332, 16.28864097595215, 16.967493057250977, 17.646345138549805, 18.325197219848633, 19.00404930114746, 19.68290138244629, 20.361753463745117, 21.040605545043945]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 3.0, 10.0, 12.0, 25.0, 37.0, 77.0, 107.0, 133.0, 256.0, 444.0, 697.0, 1116.0, 1762.0, 2828.0, 4540.0, 6871.0, 10968.0, 16674.0, 25120.0, 37819.0, 54640.0, 79577.0, 111668.0, 151646.0, 200545.0, 253125.0, 305414.0, 349525.0, 376537.0, 384452.0, 366839.0, 330109.0, 281540.0, 228147.0, 177269.0, 132956.0, 95805.0, 67636.0, 46852.0, 31462.0, 20872.0, 13715.0, 8933.0, 5744.0, 3638.0, 2323.0, 1458.0, 867.0, 608.0, 349.0, 220.0, 129.0, 82.0, 55.0, 29.0, 16.0, 9.0, 4.0], "bins": [-13.0859375, -12.7149658203125, -12.343994140625, -11.9730224609375, -11.60205078125, -11.2310791015625, -10.860107421875, -10.4891357421875, -10.1181640625, -9.7471923828125, -9.376220703125, -9.0052490234375, -8.63427734375, -8.2633056640625, -7.892333984375, -7.5213623046875, -7.150390625, -6.7794189453125, -6.408447265625, -6.0374755859375, -5.66650390625, -5.2955322265625, -4.924560546875, -4.5535888671875, -4.1826171875, -3.8116455078125, -3.440673828125, -3.0697021484375, -2.69873046875, -2.3277587890625, -1.956787109375, -1.5858154296875, -1.21484375, -0.8438720703125, -0.472900390625, -0.1019287109375, 0.26904296875, 0.6400146484375, 1.010986328125, 1.3819580078125, 1.7529296875, 2.1239013671875, 2.494873046875, 2.8658447265625, 3.23681640625, 3.6077880859375, 3.978759765625, 4.3497314453125, 4.720703125, 5.0916748046875, 5.462646484375, 5.8336181640625, 6.20458984375, 6.5755615234375, 6.946533203125, 7.3175048828125, 7.6884765625, 8.0594482421875, 8.430419921875, 8.8013916015625, 9.17236328125, 9.5433349609375, 9.914306640625, 10.2852783203125, 10.65625]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 4.0, 2.0, 7.0, 3.0, 4.0, 3.0, 6.0, 11.0, 9.0, 16.0, 19.0, 12.0, 18.0, 32.0, 20.0, 35.0, 34.0, 44.0, 33.0, 38.0, 43.0, 41.0, 45.0, 52.0, 41.0, 48.0, 32.0, 45.0, 38.0, 38.0, 33.0, 28.0, 22.0, 23.0, 20.0, 27.0, 16.0, 12.0, 9.0, 7.0, 8.0, 9.0, 7.0, 5.0, 4.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.828125, -17.28125, -16.734375, -16.1875, -15.640625, -15.09375, -14.546875, -14.0, -13.453125, -12.90625, -12.359375, -11.8125, -11.265625, -10.71875, -10.171875, -9.625, -9.078125, -8.53125, -7.984375, -7.4375, -6.890625, -6.34375, -5.796875, -5.25, -4.703125, -4.15625, -3.609375, -3.0625, -2.515625, -1.96875, -1.421875, -0.875, -0.328125, 0.21875, 0.765625, 1.3125, 1.859375, 2.40625, 2.953125, 3.5, 4.046875, 4.59375, 5.140625, 5.6875, 6.234375, 6.78125, 7.328125, 7.875, 8.421875, 8.96875, 9.515625, 10.0625, 10.609375, 11.15625, 11.703125, 12.25, 12.796875, 13.34375, 13.890625, 14.4375, 14.984375, 15.53125, 16.078125, 16.625, 17.171875]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 2.0, 13.0, 13.0, 27.0, 65.0, 98.0, 134.0, 214.0, 422.0, 704.0, 1183.0, 2008.0, 3194.0, 5396.0, 8759.0, 13732.0, 21321.0, 33049.0, 48799.0, 71728.0, 101932.0, 138403.0, 182221.0, 230167.0, 279200.0, 320240.0, 352131.0, 365669.0, 361344.0, 338999.0, 303003.0, 256339.0, 208729.0, 161680.0, 120417.0, 87688.0, 60326.0, 41221.0, 27302.0, 17760.0, 10985.0, 7088.0, 4237.0, 2591.0, 1565.0, 957.0, 483.0, 315.0, 201.0, 104.0, 58.0, 31.0, 17.0, 10.0, 9.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.75, -11.3681640625, -10.986328125, -10.6044921875, -10.22265625, -9.8408203125, -9.458984375, -9.0771484375, -8.6953125, -8.3134765625, -7.931640625, -7.5498046875, -7.16796875, -6.7861328125, -6.404296875, -6.0224609375, -5.640625, -5.2587890625, -4.876953125, -4.4951171875, -4.11328125, -3.7314453125, -3.349609375, -2.9677734375, -2.5859375, -2.2041015625, -1.822265625, -1.4404296875, -1.05859375, -0.6767578125, -0.294921875, 0.0869140625, 0.46875, 0.8505859375, 1.232421875, 1.6142578125, 1.99609375, 2.3779296875, 2.759765625, 3.1416015625, 3.5234375, 3.9052734375, 4.287109375, 4.6689453125, 5.05078125, 5.4326171875, 5.814453125, 6.1962890625, 6.578125, 6.9599609375, 7.341796875, 7.7236328125, 8.10546875, 8.4873046875, 8.869140625, 9.2509765625, 9.6328125, 10.0146484375, 10.396484375, 10.7783203125, 11.16015625, 11.5419921875, 11.923828125, 12.3056640625, 12.6875]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 6.0, 3.0, 8.0, 9.0, 22.0, 12.0, 22.0, 31.0, 21.0, 43.0, 66.0, 64.0, 84.0, 91.0, 87.0, 123.0, 147.0, 144.0, 200.0, 174.0, 198.0, 223.0, 196.0, 186.0, 221.0, 187.0, 167.0, 172.0, 167.0, 160.0, 109.0, 123.0, 103.0, 105.0, 82.0, 58.0, 47.0, 57.0, 49.0, 20.0, 25.0, 17.0, 15.0, 13.0, 5.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-8.109375, -7.8592529296875, -7.609130859375, -7.3590087890625, -7.10888671875, -6.8587646484375, -6.608642578125, -6.3585205078125, -6.1083984375, -5.8582763671875, -5.608154296875, -5.3580322265625, -5.10791015625, -4.8577880859375, -4.607666015625, -4.3575439453125, -4.107421875, -3.8572998046875, -3.607177734375, -3.3570556640625, -3.10693359375, -2.8568115234375, -2.606689453125, -2.3565673828125, -2.1064453125, -1.8563232421875, -1.606201171875, -1.3560791015625, -1.10595703125, -0.8558349609375, -0.605712890625, -0.3555908203125, -0.10546875, 0.1446533203125, 0.394775390625, 0.6448974609375, 0.89501953125, 1.1451416015625, 1.395263671875, 1.6453857421875, 1.8955078125, 2.1456298828125, 2.395751953125, 2.6458740234375, 2.89599609375, 3.1461181640625, 3.396240234375, 3.6463623046875, 3.896484375, 4.1466064453125, 4.396728515625, 4.6468505859375, 4.89697265625, 5.1470947265625, 5.397216796875, 5.6473388671875, 5.8974609375, 6.1475830078125, 6.397705078125, 6.6478271484375, 6.89794921875, 7.1480712890625, 7.398193359375, 7.6483154296875, 7.8984375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 6.0, 10.0, 6.0, 8.0, 17.0, 15.0, 30.0, 23.0, 27.0, 27.0, 41.0, 38.0, 51.0, 43.0, 41.0, 37.0, 54.0, 52.0, 46.0, 47.0, 58.0, 42.0, 43.0, 29.0, 37.0, 33.0, 28.0, 23.0, 16.0, 12.0, 11.0, 8.0, 7.0, 9.0, 7.0, 12.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-20.6616153717041, -20.02762222290039, -19.39362907409668, -18.75963592529297, -18.125642776489258, -17.491649627685547, -16.857656478881836, -16.223663330078125, -15.589670181274414, -14.955677032470703, -14.321683883666992, -13.687690734863281, -13.05369758605957, -12.41970443725586, -11.785711288452148, -11.151718139648438, -10.517724990844727, -9.883731842041016, -9.249738693237305, -8.615745544433594, -7.981752395629883, -7.347759246826172, -6.713766098022461, -6.07977294921875, -5.445779800415039, -4.811786651611328, -4.177793502807617, -3.5438003540039062, -2.9098072052001953, -2.2758140563964844, -1.6418209075927734, -1.0078277587890625, -0.37383270263671875, 0.2601604461669922, 0.8941535949707031, 1.528146743774414, 2.162139892578125, 2.796133041381836, 3.430126190185547, 4.064119338989258, 4.698112487792969, 5.33210563659668, 5.966098785400391, 6.600091934204102, 7.2340850830078125, 7.868078231811523, 8.502071380615234, 9.136064529418945, 9.770057678222656, 10.404050827026367, 11.038043975830078, 11.672037124633789, 12.3060302734375, 12.940023422241211, 13.574016571044922, 14.208009719848633, 14.842002868652344, 15.475996017456055, 16.109989166259766, 16.743982315063477, 17.377975463867188, 18.0119686126709, 18.64596176147461, 19.27995491027832, 19.91394805908203]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 6.0, 6.0, 7.0, 9.0, 12.0, 10.0, 12.0, 8.0, 17.0, 18.0, 24.0, 25.0, 24.0, 20.0, 31.0, 33.0, 34.0, 37.0, 27.0, 47.0, 31.0, 48.0, 48.0, 43.0, 48.0, 37.0, 30.0, 25.0, 22.0, 24.0, 36.0, 29.0, 23.0, 23.0, 16.0, 18.0, 17.0, 10.0, 10.0, 5.0, 11.0, 10.0, 7.0, 6.0, 6.0, 4.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0], "bins": [-18.28009605407715, -17.677419662475586, -17.074743270874023, -16.47206687927246, -15.869390487670898, -15.266714096069336, -14.664037704467773, -14.061361312866211, -13.458684921264648, -12.856008529663086, -12.253332138061523, -11.650655746459961, -11.047979354858398, -10.445302963256836, -9.842626571655273, -9.239950180053711, -8.637274742126465, -8.034598350524902, -7.43192195892334, -6.829245567321777, -6.226569175720215, -5.623892784118652, -5.021216869354248, -4.4185404777526855, -3.815864086151123, -3.2131876945495605, -2.610511302947998, -2.0078351497650146, -1.4051587581634521, -0.8024823665618896, -0.19980621337890625, 0.40287017822265625, 1.0055465698242188, 1.6082229614257812, 2.2108993530273438, 2.813575506210327, 3.4162518978118896, 4.018928527832031, 4.6216044425964355, 5.224280834197998, 5.8269572257995605, 6.429633617401123, 7.0323100090026855, 7.63498592376709, 8.237662315368652, 8.840338706970215, 9.443015098571777, 10.04569149017334, 10.648367881774902, 11.251044273376465, 11.853720664978027, 12.45639705657959, 13.059073448181152, 13.661749839782715, 14.264425277709961, 14.867101669311523, 15.469778060913086, 16.07245445251465, 16.67513084411621, 17.277807235717773, 17.880483627319336, 18.4831600189209, 19.08583641052246, 19.688512802124023, 20.291189193725586]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 2.0, 8.0, 6.0, 11.0, 9.0, 29.0, 29.0, 30.0, 66.0, 107.0, 139.0, 238.0, 350.0, 522.0, 807.0, 1267.0, 2079.0, 3406.0, 5578.0, 9311.0, 15761.0, 28103.0, 49531.0, 89016.0, 162415.0, 246329.0, 188899.0, 106563.0, 58960.0, 32806.0, 18489.0, 10789.0, 6459.0, 3886.0, 2442.0, 1422.0, 947.0, 593.0, 373.0, 263.0, 183.0, 96.0, 84.0, 63.0, 39.0, 22.0, 12.0, 13.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.048828125, -2.94598388671875, -2.8431396484375, -2.74029541015625, -2.637451171875, -2.53460693359375, -2.4317626953125, -2.32891845703125, -2.22607421875, -2.12322998046875, -2.0203857421875, -1.91754150390625, -1.814697265625, -1.71185302734375, -1.6090087890625, -1.50616455078125, -1.4033203125, -1.30047607421875, -1.1976318359375, -1.09478759765625, -0.991943359375, -0.88909912109375, -0.7862548828125, -0.68341064453125, -0.58056640625, -0.47772216796875, -0.3748779296875, -0.27203369140625, -0.169189453125, -0.06634521484375, 0.0364990234375, 0.13934326171875, 0.2421875, 0.34503173828125, 0.4478759765625, 0.55072021484375, 0.653564453125, 0.75640869140625, 0.8592529296875, 0.96209716796875, 1.06494140625, 1.16778564453125, 1.2706298828125, 1.37347412109375, 1.476318359375, 1.57916259765625, 1.6820068359375, 1.78485107421875, 1.8876953125, 1.99053955078125, 2.0933837890625, 2.19622802734375, 2.299072265625, 2.40191650390625, 2.5047607421875, 2.60760498046875, 2.71044921875, 2.81329345703125, 2.9161376953125, 3.01898193359375, 3.121826171875, 3.22467041015625, 3.3275146484375, 3.43035888671875, 3.533203125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 4.0, 3.0, 3.0, 8.0, 6.0, 6.0, 16.0, 9.0, 11.0, 20.0, 11.0, 20.0, 15.0, 32.0, 24.0, 23.0, 39.0, 30.0, 29.0, 31.0, 41.0, 35.0, 45.0, 51.0, 34.0, 41.0, 35.0, 37.0, 30.0, 36.0, 27.0, 27.0, 27.0, 21.0, 25.0, 24.0, 16.0, 15.0, 15.0, 19.0, 8.0, 6.0, 19.0, 5.0, 6.0, 6.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-19.671875, -19.039306640625, -18.40673828125, -17.774169921875, -17.1416015625, -16.509033203125, -15.87646484375, -15.243896484375, -14.611328125, -13.978759765625, -13.34619140625, -12.713623046875, -12.0810546875, -11.448486328125, -10.81591796875, -10.183349609375, -9.55078125, -8.918212890625, -8.28564453125, -7.653076171875, -7.0205078125, -6.387939453125, -5.75537109375, -5.122802734375, -4.490234375, -3.857666015625, -3.22509765625, -2.592529296875, -1.9599609375, -1.327392578125, -0.69482421875, -0.062255859375, 0.5703125, 1.202880859375, 1.83544921875, 2.468017578125, 3.1005859375, 3.733154296875, 4.36572265625, 4.998291015625, 5.630859375, 6.263427734375, 6.89599609375, 7.528564453125, 8.1611328125, 8.793701171875, 9.42626953125, 10.058837890625, 10.69140625, 11.323974609375, 11.95654296875, 12.589111328125, 13.2216796875, 13.854248046875, 14.48681640625, 15.119384765625, 15.751953125, 16.384521484375, 17.01708984375, 17.649658203125, 18.2822265625, 18.914794921875, 19.54736328125, 20.179931640625, 20.8125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 5.0, 5.0, 13.0, 9.0, 12.0, 29.0, 29.0, 44.0, 79.0, 112.0, 173.0, 228.0, 356.0, 487.0, 723.0, 1048.0, 1637.0, 2393.0, 3605.0, 5652.0, 8464.0, 13095.0, 20512.0, 32873.0, 53630.0, 89556.0, 151963.0, 219360.0, 173313.0, 103649.0, 61781.0, 37456.0, 23162.0, 14989.0, 9522.0, 6128.0, 4119.0, 2734.0, 1840.0, 1240.0, 786.0, 557.0, 376.0, 253.0, 180.0, 125.0, 80.0, 67.0, 43.0, 21.0, 16.0, 19.0, 5.0, 6.0, 1.0, 6.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.857421875, -2.76708984375, -2.6767578125, -2.58642578125, -2.49609375, -2.40576171875, -2.3154296875, -2.22509765625, -2.134765625, -2.04443359375, -1.9541015625, -1.86376953125, -1.7734375, -1.68310546875, -1.5927734375, -1.50244140625, -1.412109375, -1.32177734375, -1.2314453125, -1.14111328125, -1.05078125, -0.96044921875, -0.8701171875, -0.77978515625, -0.689453125, -0.59912109375, -0.5087890625, -0.41845703125, -0.328125, -0.23779296875, -0.1474609375, -0.05712890625, 0.033203125, 0.12353515625, 0.2138671875, 0.30419921875, 0.39453125, 0.48486328125, 0.5751953125, 0.66552734375, 0.755859375, 0.84619140625, 0.9365234375, 1.02685546875, 1.1171875, 1.20751953125, 1.2978515625, 1.38818359375, 1.478515625, 1.56884765625, 1.6591796875, 1.74951171875, 1.83984375, 1.93017578125, 2.0205078125, 2.11083984375, 2.201171875, 2.29150390625, 2.3818359375, 2.47216796875, 2.5625, 2.65283203125, 2.7431640625, 2.83349609375, 2.923828125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 6.0, 4.0, 6.0, 11.0, 14.0, 16.0, 6.0, 15.0, 16.0, 19.0, 11.0, 23.0, 20.0, 27.0, 25.0, 29.0, 37.0, 31.0, 47.0, 40.0, 28.0, 49.0, 42.0, 46.0, 34.0, 32.0, 25.0, 29.0, 34.0, 34.0, 21.0, 28.0, 25.0, 23.0, 21.0, 21.0, 20.0, 14.0, 11.0, 9.0, 7.0, 11.0, 11.0, 6.0, 5.0, 6.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-13.109375, -12.7166748046875, -12.323974609375, -11.9312744140625, -11.53857421875, -11.1458740234375, -10.753173828125, -10.3604736328125, -9.9677734375, -9.5750732421875, -9.182373046875, -8.7896728515625, -8.39697265625, -8.0042724609375, -7.611572265625, -7.2188720703125, -6.826171875, -6.4334716796875, -6.040771484375, -5.6480712890625, -5.25537109375, -4.8626708984375, -4.469970703125, -4.0772705078125, -3.6845703125, -3.2918701171875, -2.899169921875, -2.5064697265625, -2.11376953125, -1.7210693359375, -1.328369140625, -0.9356689453125, -0.54296875, -0.1502685546875, 0.242431640625, 0.6351318359375, 1.02783203125, 1.4205322265625, 1.813232421875, 2.2059326171875, 2.5986328125, 2.9913330078125, 3.384033203125, 3.7767333984375, 4.16943359375, 4.5621337890625, 4.954833984375, 5.3475341796875, 5.740234375, 6.1329345703125, 6.525634765625, 6.9183349609375, 7.31103515625, 7.7037353515625, 8.096435546875, 8.4891357421875, 8.8818359375, 9.2745361328125, 9.667236328125, 10.0599365234375, 10.45263671875, 10.8453369140625, 11.238037109375, 11.6307373046875, 12.0234375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 7.0, 11.0, 11.0, 21.0, 36.0, 48.0, 82.0, 96.0, 184.0, 319.0, 589.0, 968.0, 1602.0, 2937.0, 5198.0, 9718.0, 18285.0, 36801.0, 81277.0, 215560.0, 377296.0, 167179.0, 65386.0, 30757.0, 15470.0, 8298.0, 4449.0, 2482.0, 1443.0, 844.0, 475.0, 289.0, 158.0, 101.0, 54.0, 35.0, 27.0, 23.0, 15.0, 7.0, 6.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1182861328125, -0.11463260650634766, -0.11097908020019531, -0.10732555389404297, -0.10367202758789062, -0.10001850128173828, -0.09636497497558594, -0.0927114486694336, -0.08905792236328125, -0.0854043960571289, -0.08175086975097656, -0.07809734344482422, -0.07444381713867188, -0.07079029083251953, -0.06713676452636719, -0.06348323822021484, -0.0598297119140625, -0.056176185607910156, -0.05252265930175781, -0.04886913299560547, -0.045215606689453125, -0.04156208038330078, -0.03790855407714844, -0.034255027770996094, -0.03060150146484375, -0.026947975158691406, -0.023294448852539062, -0.01964092254638672, -0.015987396240234375, -0.012333869934082031, -0.008680343627929688, -0.005026817321777344, -0.001373291015625, 0.0022802352905273438, 0.0059337615966796875, 0.009587287902832031, 0.013240814208984375, 0.01689434051513672, 0.020547866821289062, 0.024201393127441406, 0.02785491943359375, 0.031508445739746094, 0.03516197204589844, 0.03881549835205078, 0.042469024658203125, 0.04612255096435547, 0.04977607727050781, 0.053429603576660156, 0.0570831298828125, 0.060736656188964844, 0.06439018249511719, 0.06804370880126953, 0.07169723510742188, 0.07535076141357422, 0.07900428771972656, 0.0826578140258789, 0.08631134033203125, 0.0899648666381836, 0.09361839294433594, 0.09727191925048828, 0.10092544555664062, 0.10457897186279297, 0.10823249816894531, 0.11188602447509766, 0.11553955078125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 2.0, 5.0, 5.0, 4.0, 7.0, 6.0, 9.0, 12.0, 17.0, 27.0, 20.0, 26.0, 20.0, 27.0, 36.0, 16.0, 40.0, 41.0, 32.0, 41.0, 58.0, 49.0, 39.0, 54.0, 38.0, 49.0, 31.0, 48.0, 32.0, 33.0, 27.0, 25.0, 17.0, 23.0, 15.0, 14.0, 14.0, 7.0, 7.0, 5.0, 8.0, 5.0, 5.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4543533325195312e-05, -1.407042145729065e-05, -1.3597309589385986e-05, -1.3124197721481323e-05, -1.265108585357666e-05, -1.2177973985671997e-05, -1.1704862117767334e-05, -1.1231750249862671e-05, -1.0758638381958008e-05, -1.0285526514053345e-05, -9.812414646148682e-06, -9.339302778244019e-06, -8.866190910339355e-06, -8.393079042434692e-06, -7.91996717453003e-06, -7.446855306625366e-06, -6.973743438720703e-06, -6.50063157081604e-06, -6.027519702911377e-06, -5.554407835006714e-06, -5.081295967102051e-06, -4.608184099197388e-06, -4.135072231292725e-06, -3.6619603633880615e-06, -3.1888484954833984e-06, -2.7157366275787354e-06, -2.2426247596740723e-06, -1.7695128917694092e-06, -1.296401023864746e-06, -8.23289155960083e-07, -3.501772880554199e-07, 1.2293457984924316e-07, 5.960464477539062e-07, 1.0691583156585693e-06, 1.5422701835632324e-06, 2.0153820514678955e-06, 2.4884939193725586e-06, 2.9616057872772217e-06, 3.4347176551818848e-06, 3.907829523086548e-06, 4.380941390991211e-06, 4.854053258895874e-06, 5.327165126800537e-06, 5.8002769947052e-06, 6.273388862609863e-06, 6.746500730514526e-06, 7.2196125984191895e-06, 7.692724466323853e-06, 8.165836334228516e-06, 8.638948202133179e-06, 9.112060070037842e-06, 9.585171937942505e-06, 1.0058283805847168e-05, 1.0531395673751831e-05, 1.1004507541656494e-05, 1.1477619409561157e-05, 1.195073127746582e-05, 1.2423843145370483e-05, 1.2896955013275146e-05, 1.337006688117981e-05, 1.3843178749084473e-05, 1.4316290616989136e-05, 1.4789402484893799e-05, 1.5262514352798462e-05, 1.5735626220703125e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 11.0, 10.0, 14.0, 9.0, 32.0, 24.0, 33.0, 53.0, 82.0, 124.0, 187.0, 303.0, 411.0, 603.0, 924.0, 1337.0, 2085.0, 3218.0, 4944.0, 7723.0, 11815.0, 18429.0, 29428.0, 48457.0, 85628.0, 164317.0, 288222.0, 164875.0, 84852.0, 48510.0, 29335.0, 18523.0, 11870.0, 7689.0, 4946.0, 3310.0, 2136.0, 1330.0, 889.0, 617.0, 409.0, 295.0, 157.0, 119.0, 91.0, 62.0, 27.0, 30.0, 15.0, 12.0, 8.0, 9.0, 9.0, 6.0, 1.0, 1.0, 2.0, 5.0], "bins": [-0.218505859375, -0.21178245544433594, -0.20505905151367188, -0.1983356475830078, -0.19161224365234375, -0.1848888397216797, -0.17816543579101562, -0.17144203186035156, -0.1647186279296875, -0.15799522399902344, -0.15127182006835938, -0.1445484161376953, -0.13782501220703125, -0.1311016082763672, -0.12437820434570312, -0.11765480041503906, -0.110931396484375, -0.10420799255371094, -0.09748458862304688, -0.09076118469238281, -0.08403778076171875, -0.07731437683105469, -0.07059097290039062, -0.06386756896972656, -0.0571441650390625, -0.05042076110839844, -0.043697357177734375, -0.03697395324707031, -0.03025054931640625, -0.023527145385742188, -0.016803741455078125, -0.010080337524414062, -0.00335693359375, 0.0033664703369140625, 0.010089874267578125, 0.016813278198242188, 0.02353668212890625, 0.030260086059570312, 0.036983489990234375, 0.04370689392089844, 0.0504302978515625, 0.05715370178222656, 0.06387710571289062, 0.07060050964355469, 0.07732391357421875, 0.08404731750488281, 0.09077072143554688, 0.09749412536621094, 0.104217529296875, 0.11094093322753906, 0.11766433715820312, 0.12438774108886719, 0.13111114501953125, 0.1378345489501953, 0.14455795288085938, 0.15128135681152344, 0.1580047607421875, 0.16472816467285156, 0.17145156860351562, 0.1781749725341797, 0.18489837646484375, 0.1916217803955078, 0.19834518432617188, 0.20506858825683594, 0.2117919921875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 4.0, 2.0, 4.0, 5.0, 9.0, 9.0, 19.0, 17.0, 40.0, 49.0, 79.0, 88.0, 105.0, 132.0, 114.0, 89.0, 58.0, 54.0, 36.0, 20.0, 17.0, 14.0, 6.0, 5.0, 5.0, 5.0, 8.0, 2.0, 4.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08135986328125, -0.07859420776367188, -0.07582855224609375, -0.07306289672851562, -0.0702972412109375, -0.06753158569335938, -0.06476593017578125, -0.062000274658203125, -0.059234619140625, -0.056468963623046875, -0.05370330810546875, -0.050937652587890625, -0.0481719970703125, -0.045406341552734375, -0.04264068603515625, -0.039875030517578125, -0.037109375, -0.034343719482421875, -0.03157806396484375, -0.028812408447265625, -0.0260467529296875, -0.023281097412109375, -0.02051544189453125, -0.017749786376953125, -0.014984130859375, -0.012218475341796875, -0.00945281982421875, -0.006687164306640625, -0.0039215087890625, -0.001155853271484375, 0.00160980224609375, 0.004375457763671875, 0.00714111328125, 0.009906768798828125, 0.01267242431640625, 0.015438079833984375, 0.0182037353515625, 0.020969390869140625, 0.02373504638671875, 0.026500701904296875, 0.029266357421875, 0.032032012939453125, 0.03479766845703125, 0.037563323974609375, 0.0403289794921875, 0.043094635009765625, 0.04586029052734375, 0.048625946044921875, 0.0513916015625, 0.054157257080078125, 0.05692291259765625, 0.059688568115234375, 0.0624542236328125, 0.06521987915039062, 0.06798553466796875, 0.07075119018554688, 0.073516845703125, 0.07628250122070312, 0.07904815673828125, 0.08181381225585938, 0.0845794677734375, 0.08734512329101562, 0.09011077880859375, 0.09287643432617188, 0.09564208984375]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 5.0, 8.0, 8.0, 6.0, 12.0, 16.0, 21.0, 30.0, 19.0, 27.0, 29.0, 49.0, 39.0, 47.0, 48.0, 32.0, 43.0, 52.0, 55.0, 51.0, 44.0, 54.0, 41.0, 43.0, 37.0, 28.0, 28.0, 28.0, 25.0, 10.0, 8.0, 15.0, 5.0, 10.0, 8.0, 10.0, 6.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.452543258666992, -19.818645477294922, -19.18474578857422, -18.55084800720215, -17.916948318481445, -17.283050537109375, -16.649150848388672, -16.0152530670166, -15.381355285644531, -14.747456550598145, -14.113557815551758, -13.479660034179688, -12.8457612991333, -12.211862564086914, -11.577963829040527, -10.94406509399414, -10.310166358947754, -9.676267623901367, -9.04236888885498, -8.408470153808594, -7.774572372436523, -7.140673637390137, -6.50677490234375, -5.8728766441345215, -5.238977909088135, -4.605079174041748, -3.9711809158325195, -3.337282180786133, -2.703383684158325, -2.0694851875305176, -1.4355864524841309, -0.8016881942749023, -0.16778945922851562, 0.46610909700393677, 1.1000076532363892, 1.7339062690734863, 2.367804765701294, 3.0017032623291016, 3.6356019973754883, 4.269500255584717, 4.9033989906311035, 5.53729772567749, 6.171195983886719, 6.8050947189331055, 7.438993453979492, 8.072891235351562, 8.706790924072266, 9.340688705444336, 9.974587440490723, 10.60848617553711, 11.242384910583496, 11.876283645629883, 12.510181427001953, 13.14408016204834, 13.777978897094727, 14.411876678466797, 15.0457763671875, 15.679675102233887, 16.313573837280273, 16.947471618652344, 17.581371307373047, 18.215269088745117, 18.849166870117188, 19.48306655883789, 20.11696434020996]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 5.0, 8.0, 9.0, 13.0, 10.0, 11.0, 8.0, 16.0, 21.0, 22.0, 26.0, 23.0, 19.0, 32.0, 34.0, 34.0, 36.0, 28.0, 47.0, 32.0, 46.0, 48.0, 45.0, 47.0, 37.0, 30.0, 26.0, 22.0, 24.0, 34.0, 29.0, 24.0, 23.0, 16.0, 17.0, 17.0, 11.0, 9.0, 5.0, 11.0, 10.0, 7.0, 7.0, 5.0, 4.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-18.260574340820312, -17.657394409179688, -17.054214477539062, -16.451034545898438, -15.847855567932129, -15.244675636291504, -14.641495704650879, -14.03831672668457, -13.435136795043945, -12.83195686340332, -12.228776931762695, -11.62559700012207, -11.022418022155762, -10.419238090515137, -9.816058158874512, -9.212879180908203, -8.609698295593262, -8.006518363952637, -7.40333890914917, -6.800158977508545, -6.196979522705078, -5.593799591064453, -4.990619659423828, -4.387440204620361, -3.7842602729797363, -3.1810805797576904, -2.5779008865356445, -1.9747209548950195, -1.3715412616729736, -0.7683615684509277, -0.16518163681030273, 0.43799781799316406, 1.041177749633789, 1.644357442855835, 2.247537136077881, 2.850717067718506, 3.4538967609405518, 4.057076454162598, 4.660256385803223, 5.2634358406066895, 5.8666157722473145, 6.4697957038879395, 7.072975158691406, 7.676155090332031, 8.279335021972656, 8.882514953613281, 9.485694885253906, 10.088873863220215, 10.69205379486084, 11.295233726501465, 11.89841365814209, 12.501592636108398, 13.104772567749023, 13.707952499389648, 14.311132431030273, 14.914312362670898, 15.517492294311523, 16.12067222595215, 16.723852157592773, 17.3270320892334, 17.930212020874023, 18.533390045166016, 19.13656997680664, 19.739749908447266, 20.34292984008789]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 8.0, 9.0, 10.0, 23.0, 34.0, 50.0, 69.0, 151.0, 181.0, 261.0, 459.0, 749.0, 1154.0, 1836.0, 2975.0, 4421.0, 6723.0, 10272.0, 15429.0, 22216.0, 31648.0, 43565.0, 57349.0, 71097.0, 84104.0, 93599.0, 98772.0, 97561.0, 89496.0, 78820.0, 64298.0, 50429.0, 37436.0, 27157.0, 18979.0, 12986.0, 8648.0, 5563.0, 3619.0, 2285.0, 1487.0, 994.0, 589.0, 396.0, 263.0, 157.0, 88.0, 53.0, 37.0, 28.0, 13.0, 8.0, 8.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.6484375, -9.3243408203125, -9.000244140625, -8.6761474609375, -8.35205078125, -8.0279541015625, -7.703857421875, -7.3797607421875, -7.0556640625, -6.7315673828125, -6.407470703125, -6.0833740234375, -5.75927734375, -5.4351806640625, -5.111083984375, -4.7869873046875, -4.462890625, -4.1387939453125, -3.814697265625, -3.4906005859375, -3.16650390625, -2.8424072265625, -2.518310546875, -2.1942138671875, -1.8701171875, -1.5460205078125, -1.221923828125, -0.8978271484375, -0.57373046875, -0.2496337890625, 0.074462890625, 0.3985595703125, 0.72265625, 1.0467529296875, 1.370849609375, 1.6949462890625, 2.01904296875, 2.3431396484375, 2.667236328125, 2.9913330078125, 3.3154296875, 3.6395263671875, 3.963623046875, 4.2877197265625, 4.61181640625, 4.9359130859375, 5.260009765625, 5.5841064453125, 5.908203125, 6.2322998046875, 6.556396484375, 6.8804931640625, 7.20458984375, 7.5286865234375, 7.852783203125, 8.1768798828125, 8.5009765625, 8.8250732421875, 9.149169921875, 9.4732666015625, 9.79736328125, 10.1214599609375, 10.445556640625, 10.7696533203125, 11.09375]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 8.0, 2.0, 3.0, 5.0, 9.0, 12.0, 10.0, 11.0, 16.0, 11.0, 20.0, 19.0, 27.0, 22.0, 33.0, 19.0, 25.0, 50.0, 34.0, 42.0, 38.0, 40.0, 50.0, 49.0, 40.0, 45.0, 40.0, 31.0, 32.0, 38.0, 28.0, 24.0, 24.0, 23.0, 22.0, 18.0, 11.0, 9.0, 15.0, 10.0, 5.0, 10.0, 6.0, 5.0, 7.0, 5.0, 2.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-19.390625, -18.7421875, -18.09375, -17.4453125, -16.796875, -16.1484375, -15.5, -14.8515625, -14.203125, -13.5546875, -12.90625, -12.2578125, -11.609375, -10.9609375, -10.3125, -9.6640625, -9.015625, -8.3671875, -7.71875, -7.0703125, -6.421875, -5.7734375, -5.125, -4.4765625, -3.828125, -3.1796875, -2.53125, -1.8828125, -1.234375, -0.5859375, 0.0625, 0.7109375, 1.359375, 2.0078125, 2.65625, 3.3046875, 3.953125, 4.6015625, 5.25, 5.8984375, 6.546875, 7.1953125, 7.84375, 8.4921875, 9.140625, 9.7890625, 10.4375, 11.0859375, 11.734375, 12.3828125, 13.03125, 13.6796875, 14.328125, 14.9765625, 15.625, 16.2734375, 16.921875, 17.5703125, 18.21875, 18.8671875, 19.515625, 20.1640625, 20.8125, 21.4609375, 22.109375]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 7.0, 10.0, 22.0, 34.0, 50.0, 77.0, 135.0, 203.0, 334.0, 491.0, 755.0, 1236.0, 1889.0, 3075.0, 4719.0, 7170.0, 10596.0, 15605.0, 22155.0, 31162.0, 41546.0, 54069.0, 66906.0, 78954.0, 88064.0, 93815.0, 93835.0, 88793.0, 78993.0, 67329.0, 54220.0, 41852.0, 31104.0, 22717.0, 15488.0, 10787.0, 7211.0, 4784.0, 3022.0, 1988.0, 1214.0, 806.0, 517.0, 308.0, 189.0, 123.0, 83.0, 48.0, 27.0, 22.0, 12.0, 5.0, 5.0, 2.0, 1.0, 3.0, 2.0], "bins": [-10.2109375, -9.901611328125, -9.59228515625, -9.282958984375, -8.9736328125, -8.664306640625, -8.35498046875, -8.045654296875, -7.736328125, -7.427001953125, -7.11767578125, -6.808349609375, -6.4990234375, -6.189697265625, -5.88037109375, -5.571044921875, -5.26171875, -4.952392578125, -4.64306640625, -4.333740234375, -4.0244140625, -3.715087890625, -3.40576171875, -3.096435546875, -2.787109375, -2.477783203125, -2.16845703125, -1.859130859375, -1.5498046875, -1.240478515625, -0.93115234375, -0.621826171875, -0.3125, -0.003173828125, 0.30615234375, 0.615478515625, 0.9248046875, 1.234130859375, 1.54345703125, 1.852783203125, 2.162109375, 2.471435546875, 2.78076171875, 3.090087890625, 3.3994140625, 3.708740234375, 4.01806640625, 4.327392578125, 4.63671875, 4.946044921875, 5.25537109375, 5.564697265625, 5.8740234375, 6.183349609375, 6.49267578125, 6.802001953125, 7.111328125, 7.420654296875, 7.72998046875, 8.039306640625, 8.3486328125, 8.657958984375, 8.96728515625, 9.276611328125, 9.5859375]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 3.0, 0.0, 2.0, 7.0, 5.0, 8.0, 4.0, 6.0, 8.0, 10.0, 7.0, 14.0, 11.0, 20.0, 22.0, 17.0, 19.0, 33.0, 29.0, 31.0, 30.0, 28.0, 29.0, 34.0, 48.0, 35.0, 42.0, 38.0, 32.0, 36.0, 40.0, 36.0, 40.0, 25.0, 33.0, 27.0, 30.0, 19.0, 22.0, 10.0, 16.0, 15.0, 21.0, 17.0, 7.0, 9.0, 11.0, 5.0, 6.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.4140625, -11.03564453125, -10.6572265625, -10.27880859375, -9.900390625, -9.52197265625, -9.1435546875, -8.76513671875, -8.38671875, -8.00830078125, -7.6298828125, -7.25146484375, -6.873046875, -6.49462890625, -6.1162109375, -5.73779296875, -5.359375, -4.98095703125, -4.6025390625, -4.22412109375, -3.845703125, -3.46728515625, -3.0888671875, -2.71044921875, -2.33203125, -1.95361328125, -1.5751953125, -1.19677734375, -0.818359375, -0.43994140625, -0.0615234375, 0.31689453125, 0.6953125, 1.07373046875, 1.4521484375, 1.83056640625, 2.208984375, 2.58740234375, 2.9658203125, 3.34423828125, 3.72265625, 4.10107421875, 4.4794921875, 4.85791015625, 5.236328125, 5.61474609375, 5.9931640625, 6.37158203125, 6.75, 7.12841796875, 7.5068359375, 7.88525390625, 8.263671875, 8.64208984375, 9.0205078125, 9.39892578125, 9.77734375, 10.15576171875, 10.5341796875, 10.91259765625, 11.291015625, 11.66943359375, 12.0478515625, 12.42626953125, 12.8046875]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 7.0, 7.0, 21.0, 31.0, 51.0, 97.0, 129.0, 222.0, 350.0, 540.0, 892.0, 1386.0, 2241.0, 3389.0, 5337.0, 8265.0, 12513.0, 18603.0, 26320.0, 36942.0, 48931.0, 62793.0, 76785.0, 87791.0, 95433.0, 97824.0, 93812.0, 85673.0, 72217.0, 58953.0, 45534.0, 33434.0, 23947.0, 16579.0, 11119.0, 7270.0, 4772.0, 3095.0, 1999.0, 1161.0, 759.0, 499.0, 301.0, 176.0, 144.0, 79.0, 47.0, 40.0, 22.0, 10.0, 8.0, 8.0, 8.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8515625, -2.751007080078125, -2.65045166015625, -2.549896240234375, -2.4493408203125, -2.348785400390625, -2.24822998046875, -2.147674560546875, -2.047119140625, -1.946563720703125, -1.84600830078125, -1.745452880859375, -1.6448974609375, -1.544342041015625, -1.44378662109375, -1.343231201171875, -1.24267578125, -1.142120361328125, -1.04156494140625, -0.941009521484375, -0.8404541015625, -0.739898681640625, -0.63934326171875, -0.538787841796875, -0.438232421875, -0.337677001953125, -0.23712158203125, -0.136566162109375, -0.0360107421875, 0.064544677734375, 0.16510009765625, 0.265655517578125, 0.3662109375, 0.466766357421875, 0.56732177734375, 0.667877197265625, 0.7684326171875, 0.868988037109375, 0.96954345703125, 1.070098876953125, 1.170654296875, 1.271209716796875, 1.37176513671875, 1.472320556640625, 1.5728759765625, 1.673431396484375, 1.77398681640625, 1.874542236328125, 1.97509765625, 2.075653076171875, 2.17620849609375, 2.276763916015625, 2.3773193359375, 2.477874755859375, 2.57843017578125, 2.678985595703125, 2.779541015625, 2.880096435546875, 2.98065185546875, 3.081207275390625, 3.1817626953125, 3.282318115234375, 3.38287353515625, 3.483428955078125, 3.583984375]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 5.0, 3.0, 3.0, 10.0, 5.0, 13.0, 8.0, 15.0, 9.0, 11.0, 17.0, 23.0, 31.0, 28.0, 25.0, 30.0, 41.0, 38.0, 69.0, 42.0, 52.0, 52.0, 41.0, 45.0, 47.0, 66.0, 41.0, 46.0, 42.0, 25.0, 19.0, 27.0, 18.0, 12.0, 13.0, 7.0, 4.0, 8.0, 4.0, 7.0, 2.0, 3.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.0005736351013183594, -0.0005589835345745087, -0.000544331967830658, -0.0005296804010868073, -0.0005150288343429565, -0.0005003772675991058, -0.0004857257008552551, -0.0004710741341114044, -0.0004564225673675537, -0.000441771000623703, -0.0004271194338798523, -0.0004124678671360016, -0.0003978163003921509, -0.00038316473364830017, -0.00036851316690444946, -0.00035386160016059875, -0.00033921003341674805, -0.00032455846667289734, -0.00030990689992904663, -0.0002952553331851959, -0.0002806037664413452, -0.0002659521996974945, -0.0002513006329536438, -0.0002366490662097931, -0.00022199749946594238, -0.00020734593272209167, -0.00019269436597824097, -0.00017804279923439026, -0.00016339123249053955, -0.00014873966574668884, -0.00013408809900283813, -0.00011943653225898743, -0.00010478496551513672, -9.013339877128601e-05, -7.54818320274353e-05, -6.0830265283584595e-05, -4.617869853973389e-05, -3.152713179588318e-05, -1.687556505203247e-05, -2.2239983081817627e-06, 1.2427568435668945e-05, 2.7079135179519653e-05, 4.173070192337036e-05, 5.638226866722107e-05, 7.103383541107178e-05, 8.568540215492249e-05, 0.0001003369688987732, 0.0001149885356426239, 0.0001296401023864746, 0.00014429166913032532, 0.00015894323587417603, 0.00017359480261802673, 0.00018824636936187744, 0.00020289793610572815, 0.00021754950284957886, 0.00023220106959342957, 0.0002468526363372803, 0.000261504203081131, 0.0002761557698249817, 0.0002908073365688324, 0.0003054589033126831, 0.0003201104700565338, 0.0003347620368003845, 0.00034941360354423523, 0.00036406517028808594]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 10.0, 8.0, 34.0, 35.0, 62.0, 97.0, 136.0, 255.0, 421.0, 738.0, 1168.0, 1957.0, 3258.0, 5579.0, 9241.0, 15333.0, 24277.0, 37354.0, 55042.0, 75309.0, 96372.0, 113244.0, 120981.0, 118026.0, 104004.0, 83965.0, 62529.0, 44054.0, 28697.0, 18169.0, 11338.0, 6751.0, 3977.0, 2452.0, 1496.0, 863.0, 494.0, 322.0, 219.0, 108.0, 73.0, 44.0, 30.0, 16.0, 8.0, 5.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.31640625, -4.18438720703125, -4.0523681640625, -3.92034912109375, -3.788330078125, -3.65631103515625, -3.5242919921875, -3.39227294921875, -3.26025390625, -3.12823486328125, -2.9962158203125, -2.86419677734375, -2.732177734375, -2.60015869140625, -2.4681396484375, -2.33612060546875, -2.2041015625, -2.07208251953125, -1.9400634765625, -1.80804443359375, -1.676025390625, -1.54400634765625, -1.4119873046875, -1.27996826171875, -1.14794921875, -1.01593017578125, -0.8839111328125, -0.75189208984375, -0.619873046875, -0.48785400390625, -0.3558349609375, -0.22381591796875, -0.091796875, 0.04022216796875, 0.1722412109375, 0.30426025390625, 0.436279296875, 0.56829833984375, 0.7003173828125, 0.83233642578125, 0.96435546875, 1.09637451171875, 1.2283935546875, 1.36041259765625, 1.492431640625, 1.62445068359375, 1.7564697265625, 1.88848876953125, 2.0205078125, 2.15252685546875, 2.2845458984375, 2.41656494140625, 2.548583984375, 2.68060302734375, 2.8126220703125, 2.94464111328125, 3.07666015625, 3.20867919921875, 3.3406982421875, 3.47271728515625, 3.604736328125, 3.73675537109375, 3.8687744140625, 4.00079345703125, 4.1328125]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 11.0, 6.0, 7.0, 11.0, 17.0, 19.0, 16.0, 22.0, 23.0, 35.0, 34.0, 33.0, 46.0, 53.0, 39.0, 48.0, 47.0, 44.0, 64.0, 49.0, 49.0, 48.0, 41.0, 44.0, 35.0, 33.0, 22.0, 28.0, 17.0, 19.0, 15.0, 4.0, 8.0, 6.0, 4.0, 5.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.87890625, -1.8157958984375, -1.752685546875, -1.6895751953125, -1.62646484375, -1.5633544921875, -1.500244140625, -1.4371337890625, -1.3740234375, -1.3109130859375, -1.247802734375, -1.1846923828125, -1.12158203125, -1.0584716796875, -0.995361328125, -0.9322509765625, -0.869140625, -0.8060302734375, -0.742919921875, -0.6798095703125, -0.61669921875, -0.5535888671875, -0.490478515625, -0.4273681640625, -0.3642578125, -0.3011474609375, -0.238037109375, -0.1749267578125, -0.11181640625, -0.0487060546875, 0.014404296875, 0.0775146484375, 0.140625, 0.2037353515625, 0.266845703125, 0.3299560546875, 0.39306640625, 0.4561767578125, 0.519287109375, 0.5823974609375, 0.6455078125, 0.7086181640625, 0.771728515625, 0.8348388671875, 0.89794921875, 0.9610595703125, 1.024169921875, 1.0872802734375, 1.150390625, 1.2135009765625, 1.276611328125, 1.3397216796875, 1.40283203125, 1.4659423828125, 1.529052734375, 1.5921630859375, 1.6552734375, 1.7183837890625, 1.781494140625, 1.8446044921875, 1.90771484375, 1.9708251953125, 2.033935546875, 2.0970458984375, 2.16015625]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 8.0, 5.0, 4.0, 10.0, 5.0, 12.0, 15.0, 18.0, 27.0, 26.0, 44.0, 40.0, 25.0, 33.0, 48.0, 47.0, 48.0, 51.0, 49.0, 47.0, 61.0, 45.0, 36.0, 49.0, 32.0, 31.0, 31.0, 31.0, 32.0, 21.0, 9.0, 10.0, 19.0, 12.0, 6.0, 7.0, 1.0, 3.0, 4.0, 2.0, 0.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.989988327026367, -19.344646453857422, -18.699304580688477, -18.05396270751953, -17.408620834350586, -16.76327896118164, -16.117937088012695, -15.472594261169434, -14.827252388000488, -14.181910514831543, -13.536568641662598, -12.891226768493652, -12.24588394165039, -11.600542068481445, -10.9552001953125, -10.309858322143555, -9.66451644897461, -9.019174575805664, -8.373832702636719, -7.728490352630615, -7.08314847946167, -6.437806606292725, -5.792464256286621, -5.147122383117676, -4.5017805099487305, -3.856438636779785, -3.2110965251922607, -2.5657544136047363, -1.920412540435791, -1.2750706672668457, -0.6297285556793213, 0.015613555908203125, 0.6609535217285156, 1.3062955141067505, 1.9516375064849854, 2.5969796180725098, 3.242321491241455, 3.8876633644104004, 4.533005714416504, 5.178347587585449, 5.8236894607543945, 6.46903133392334, 7.114373207092285, 7.759715557098389, 8.405057907104492, 9.050399780273438, 9.695741653442383, 10.341083526611328, 10.986425399780273, 11.631767272949219, 12.277109146118164, 12.92245101928711, 13.567792892456055, 14.213134765625, 14.858477592468262, 15.503819465637207, 16.14916229248047, 16.794504165649414, 17.43984603881836, 18.085187911987305, 18.73052978515625, 19.375871658325195, 20.02121353149414, 20.66655731201172, 21.31189727783203]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 5.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 12.0, 11.0, 14.0, 9.0, 12.0, 15.0, 17.0, 18.0, 20.0, 14.0, 32.0, 30.0, 29.0, 47.0, 43.0, 47.0, 32.0, 35.0, 41.0, 48.0, 29.0, 48.0, 40.0, 26.0, 35.0, 37.0, 27.0, 34.0, 17.0, 20.0, 21.0, 16.0, 16.0, 17.0, 11.0, 25.0, 14.0, 7.0, 6.0, 8.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.22197151184082, -19.555076599121094, -18.88818359375, -18.221288681030273, -17.554393768310547, -16.887500762939453, -16.220605850219727, -15.553711891174316, -14.886817932128906, -14.219923973083496, -13.553030014038086, -12.88613510131836, -12.21924114227295, -11.552347183227539, -10.885452270507812, -10.218558311462402, -9.551664352416992, -8.884770393371582, -8.217876434326172, -7.550981521606445, -6.884087562561035, -6.217193603515625, -5.550299167633057, -4.883404731750488, -4.216510772705078, -3.549616575241089, -2.8827223777770996, -2.2158281803131104, -1.548933982849121, -0.8820397853851318, -0.21514558792114258, 0.4517488479614258, 1.1186408996582031, 1.7855350971221924, 2.4524292945861816, 3.119323492050171, 3.78621768951416, 4.45311164855957, 5.120006084442139, 5.786900520324707, 6.453794479370117, 7.120688438415527, 7.787582874298096, 8.454477310180664, 9.121371269226074, 9.788265228271484, 10.455160140991211, 11.122054100036621, 11.788948059082031, 12.455842018127441, 13.122735977172852, 13.789630889892578, 14.456524848937988, 15.123418807983398, 15.790313720703125, 16.45720672607422, 17.124101638793945, 17.790996551513672, 18.457889556884766, 19.124784469604492, 19.79167938232422, 20.458572387695312, 21.12546730041504, 21.792362213134766, 22.45925521850586]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 6.0, 15.0, 16.0, 46.0, 56.0, 110.0, 188.0, 366.0, 596.0, 952.0, 1572.0, 2625.0, 4359.0, 7012.0, 11319.0, 17769.0, 28193.0, 42912.0, 64469.0, 94063.0, 132491.0, 180098.0, 235211.0, 293162.0, 344353.0, 381701.0, 397313.0, 388896.0, 357033.0, 306639.0, 251062.0, 195067.0, 144705.0, 103399.0, 71660.0, 48613.0, 32050.0, 20479.0, 12857.0, 8134.0, 4933.0, 3115.0, 1851.0, 1170.0, 652.0, 390.0, 246.0, 161.0, 82.0, 47.0, 36.0, 25.0, 10.0, 3.0, 3.0, 1.0, 1.0, 1.0], "bins": [-14.25, -13.8131103515625, -13.376220703125, -12.9393310546875, -12.50244140625, -12.0655517578125, -11.628662109375, -11.1917724609375, -10.7548828125, -10.3179931640625, -9.881103515625, -9.4442138671875, -9.00732421875, -8.5704345703125, -8.133544921875, -7.6966552734375, -7.259765625, -6.8228759765625, -6.385986328125, -5.9490966796875, -5.51220703125, -5.0753173828125, -4.638427734375, -4.2015380859375, -3.7646484375, -3.3277587890625, -2.890869140625, -2.4539794921875, -2.01708984375, -1.5802001953125, -1.143310546875, -0.7064208984375, -0.26953125, 0.1673583984375, 0.604248046875, 1.0411376953125, 1.47802734375, 1.9149169921875, 2.351806640625, 2.7886962890625, 3.2255859375, 3.6624755859375, 4.099365234375, 4.5362548828125, 4.97314453125, 5.4100341796875, 5.846923828125, 6.2838134765625, 6.720703125, 7.1575927734375, 7.594482421875, 8.0313720703125, 8.46826171875, 8.9051513671875, 9.342041015625, 9.7789306640625, 10.2158203125, 10.6527099609375, 11.089599609375, 11.5264892578125, 11.96337890625, 12.4002685546875, 12.837158203125, 13.2740478515625, 13.7109375]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 3.0, 4.0, 5.0, 5.0, 13.0, 19.0, 10.0, 15.0, 20.0, 14.0, 21.0, 37.0, 23.0, 31.0, 34.0, 42.0, 40.0, 49.0, 46.0, 42.0, 40.0, 43.0, 44.0, 43.0, 35.0, 36.0, 32.0, 24.0, 23.0, 28.0, 18.0, 26.0, 16.0, 15.0, 19.0, 22.0, 9.0, 15.0, 7.0, 9.0, 11.0, 4.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-18.890625, -18.296875, -17.703125, -17.109375, -16.515625, -15.921875, -15.328125, -14.734375, -14.140625, -13.546875, -12.953125, -12.359375, -11.765625, -11.171875, -10.578125, -9.984375, -9.390625, -8.796875, -8.203125, -7.609375, -7.015625, -6.421875, -5.828125, -5.234375, -4.640625, -4.046875, -3.453125, -2.859375, -2.265625, -1.671875, -1.078125, -0.484375, 0.109375, 0.703125, 1.296875, 1.890625, 2.484375, 3.078125, 3.671875, 4.265625, 4.859375, 5.453125, 6.046875, 6.640625, 7.234375, 7.828125, 8.421875, 9.015625, 9.609375, 10.203125, 10.796875, 11.390625, 11.984375, 12.578125, 13.171875, 13.765625, 14.359375, 14.953125, 15.546875, 16.140625, 16.734375, 17.328125, 17.921875, 18.515625, 19.109375]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 5.0, 6.0, 20.0, 40.0, 46.0, 90.0, 158.0, 263.0, 440.0, 827.0, 1429.0, 2386.0, 4064.0, 6565.0, 10685.0, 17287.0, 27561.0, 42406.0, 63990.0, 91809.0, 127833.0, 173735.0, 224113.0, 275350.0, 322707.0, 358214.0, 378509.0, 375501.0, 353580.0, 315210.0, 266247.0, 214497.0, 165281.0, 120972.0, 86945.0, 59416.0, 39239.0, 25756.0, 15999.0, 10050.0, 6170.0, 3643.0, 2207.0, 1301.0, 754.0, 405.0, 281.0, 132.0, 78.0, 36.0, 26.0, 13.0, 8.0, 5.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.7734375, -14.3245849609375, -13.875732421875, -13.4268798828125, -12.97802734375, -12.5291748046875, -12.080322265625, -11.6314697265625, -11.1826171875, -10.7337646484375, -10.284912109375, -9.8360595703125, -9.38720703125, -8.9383544921875, -8.489501953125, -8.0406494140625, -7.591796875, -7.1429443359375, -6.694091796875, -6.2452392578125, -5.79638671875, -5.3475341796875, -4.898681640625, -4.4498291015625, -4.0009765625, -3.5521240234375, -3.103271484375, -2.6544189453125, -2.20556640625, -1.7567138671875, -1.307861328125, -0.8590087890625, -0.41015625, 0.0386962890625, 0.487548828125, 0.9364013671875, 1.38525390625, 1.8341064453125, 2.282958984375, 2.7318115234375, 3.1806640625, 3.6295166015625, 4.078369140625, 4.5272216796875, 4.97607421875, 5.4249267578125, 5.873779296875, 6.3226318359375, 6.771484375, 7.2203369140625, 7.669189453125, 8.1180419921875, 8.56689453125, 9.0157470703125, 9.464599609375, 9.9134521484375, 10.3623046875, 10.8111572265625, 11.260009765625, 11.7088623046875, 12.15771484375, 12.6065673828125, 13.055419921875, 13.5042724609375, 13.953125]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 9.0, 9.0, 3.0, 12.0, 12.0, 19.0, 21.0, 41.0, 50.0, 51.0, 73.0, 88.0, 91.0, 110.0, 110.0, 157.0, 165.0, 185.0, 203.0, 212.0, 225.0, 212.0, 214.0, 222.0, 192.0, 181.0, 178.0, 160.0, 152.0, 122.0, 114.0, 85.0, 79.0, 75.0, 55.0, 48.0, 40.0, 31.0, 22.0, 19.0, 12.0, 4.0, 4.0, 4.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.5546875, -8.2589111328125, -7.963134765625, -7.6673583984375, -7.37158203125, -7.0758056640625, -6.780029296875, -6.4842529296875, -6.1884765625, -5.8927001953125, -5.596923828125, -5.3011474609375, -5.00537109375, -4.7095947265625, -4.413818359375, -4.1180419921875, -3.822265625, -3.5264892578125, -3.230712890625, -2.9349365234375, -2.63916015625, -2.3433837890625, -2.047607421875, -1.7518310546875, -1.4560546875, -1.1602783203125, -0.864501953125, -0.5687255859375, -0.27294921875, 0.0228271484375, 0.318603515625, 0.6143798828125, 0.91015625, 1.2059326171875, 1.501708984375, 1.7974853515625, 2.09326171875, 2.3890380859375, 2.684814453125, 2.9805908203125, 3.2763671875, 3.5721435546875, 3.867919921875, 4.1636962890625, 4.45947265625, 4.7552490234375, 5.051025390625, 5.3468017578125, 5.642578125, 5.9383544921875, 6.234130859375, 6.5299072265625, 6.82568359375, 7.1214599609375, 7.417236328125, 7.7130126953125, 8.0087890625, 8.3045654296875, 8.600341796875, 8.8961181640625, 9.19189453125, 9.4876708984375, 9.783447265625, 10.0792236328125, 10.375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 5.0, 6.0, 3.0, 4.0, 12.0, 9.0, 13.0, 20.0, 27.0, 37.0, 18.0, 42.0, 35.0, 35.0, 37.0, 44.0, 54.0, 40.0, 43.0, 50.0, 47.0, 58.0, 45.0, 31.0, 31.0, 35.0, 27.0, 25.0, 23.0, 29.0, 24.0, 21.0, 12.0, 18.0, 13.0, 7.0, 10.0, 1.0, 5.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-19.590007781982422, -18.876171112060547, -18.162334442138672, -17.448497772216797, -16.734661102294922, -16.020822525024414, -15.306985855102539, -14.593149185180664, -13.879312515258789, -13.165475845336914, -12.451639175415039, -11.737801551818848, -11.023964881896973, -10.310128211975098, -9.596290588378906, -8.882453918457031, -8.168617248535156, -7.454780578613281, -6.740943431854248, -6.027106285095215, -5.31326961517334, -4.599432945251465, -3.8855957984924316, -3.1717586517333984, -2.4579219818115234, -1.7440850734710693, -1.0302481651306152, -0.31641125679016113, 0.39742565155029297, 1.111262559890747, 1.8250994682312012, 2.5389366149902344, 3.2527732849121094, 3.9666101932525635, 4.680447101593018, 5.394284248352051, 6.108120918273926, 6.821957588195801, 7.535794734954834, 8.249631881713867, 8.963468551635742, 9.677305221557617, 10.391141891479492, 11.104979515075684, 11.818816184997559, 12.532652854919434, 13.246490478515625, 13.9603271484375, 14.674163818359375, 15.38800048828125, 16.101837158203125, 16.815673828125, 17.529510498046875, 18.243349075317383, 18.957185745239258, 19.671022415161133, 20.384859085083008, 21.098695755004883, 21.812532424926758, 22.526369094848633, 23.24020767211914, 23.954044342041016, 24.66788101196289, 25.381717681884766, 26.09555435180664]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 4.0, 1.0, 2.0, 6.0, 2.0, 4.0, 2.0, 6.0, 9.0, 10.0, 13.0, 13.0, 10.0, 15.0, 22.0, 22.0, 27.0, 28.0, 22.0, 41.0, 28.0, 55.0, 41.0, 45.0, 46.0, 43.0, 41.0, 52.0, 38.0, 41.0, 42.0, 32.0, 26.0, 22.0, 22.0, 29.0, 27.0, 16.0, 14.0, 20.0, 13.0, 10.0, 12.0, 6.0, 12.0, 9.0, 1.0, 6.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.28847312927246, -21.549365997314453, -20.810258865356445, -20.071151733398438, -19.33204460144043, -18.592937469482422, -17.853830337524414, -17.114723205566406, -16.3756160736084, -15.63650894165039, -14.897401809692383, -14.158294677734375, -13.419187545776367, -12.68008041381836, -11.940973281860352, -11.201866149902344, -10.46275806427002, -9.723650932312012, -8.984543800354004, -8.245436668395996, -7.506329536437988, -6.7672224044799805, -6.0281147956848145, -5.289007663726807, -4.549900531768799, -3.810793399810791, -3.071686267852783, -2.3325788974761963, -1.5934717655181885, -0.8543646335601807, -0.11525726318359375, 0.6238498687744141, 1.3629570007324219, 2.1020641326904297, 2.8411712646484375, 3.5802786350250244, 4.319385528564453, 5.058492660522461, 5.797600269317627, 6.536707401275635, 7.275814533233643, 8.014922142028809, 8.754029273986816, 9.493136405944824, 10.232243537902832, 10.97135066986084, 11.710457801818848, 12.449564933776855, 13.188672065734863, 13.927779197692871, 14.666886329650879, 15.405993461608887, 16.14510154724121, 16.88420867919922, 17.623315811157227, 18.362422943115234, 19.101530075073242, 19.84063720703125, 20.579744338989258, 21.318851470947266, 22.057958602905273, 22.79706573486328, 23.53617286682129, 24.275279998779297, 25.014387130737305]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 4.0, 4.0, 8.0, 15.0, 18.0, 27.0, 34.0, 45.0, 71.0, 108.0, 147.0, 212.0, 245.0, 447.0, 613.0, 931.0, 1247.0, 1954.0, 2591.0, 3904.0, 5790.0, 8406.0, 12391.0, 19033.0, 29377.0, 46311.0, 74246.0, 118934.0, 176743.0, 186000.0, 130437.0, 81535.0, 51017.0, 31895.0, 21077.0, 13825.0, 9105.0, 6336.0, 4155.0, 2867.0, 1944.0, 1356.0, 977.0, 662.0, 489.0, 315.0, 210.0, 162.0, 119.0, 74.0, 41.0, 39.0, 22.0, 20.0, 16.0, 7.0, 5.0, 3.0, 1.0, 0.0, 2.0, 2.0], "bins": [-2.60546875, -2.521697998046875, -2.43792724609375, -2.354156494140625, -2.2703857421875, -2.186614990234375, -2.10284423828125, -2.019073486328125, -1.935302734375, -1.851531982421875, -1.76776123046875, -1.683990478515625, -1.6002197265625, -1.516448974609375, -1.43267822265625, -1.348907470703125, -1.26513671875, -1.181365966796875, -1.09759521484375, -1.013824462890625, -0.9300537109375, -0.846282958984375, -0.76251220703125, -0.678741455078125, -0.594970703125, -0.511199951171875, -0.42742919921875, -0.343658447265625, -0.2598876953125, -0.176116943359375, -0.09234619140625, -0.008575439453125, 0.0751953125, 0.158966064453125, 0.24273681640625, 0.326507568359375, 0.4102783203125, 0.494049072265625, 0.57781982421875, 0.661590576171875, 0.745361328125, 0.829132080078125, 0.91290283203125, 0.996673583984375, 1.0804443359375, 1.164215087890625, 1.24798583984375, 1.331756591796875, 1.41552734375, 1.499298095703125, 1.58306884765625, 1.666839599609375, 1.7506103515625, 1.834381103515625, 1.91815185546875, 2.001922607421875, 2.085693359375, 2.169464111328125, 2.25323486328125, 2.337005615234375, 2.4207763671875, 2.504547119140625, 2.58831787109375, 2.672088623046875, 2.755859375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 1.0, 4.0, 0.0, 4.0, 3.0, 3.0, 3.0, 10.0, 13.0, 14.0, 8.0, 9.0, 20.0, 22.0, 27.0, 22.0, 14.0, 23.0, 38.0, 35.0, 44.0, 45.0, 38.0, 34.0, 47.0, 45.0, 45.0, 44.0, 34.0, 45.0, 29.0, 34.0, 27.0, 30.0, 34.0, 13.0, 24.0, 22.0, 14.0, 13.0, 13.0, 15.0, 6.0, 14.0, 7.0, 6.0, 6.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.21875, -20.475341796875, -19.73193359375, -18.988525390625, -18.2451171875, -17.501708984375, -16.75830078125, -16.014892578125, -15.271484375, -14.528076171875, -13.78466796875, -13.041259765625, -12.2978515625, -11.554443359375, -10.81103515625, -10.067626953125, -9.32421875, -8.580810546875, -7.83740234375, -7.093994140625, -6.3505859375, -5.607177734375, -4.86376953125, -4.120361328125, -3.376953125, -2.633544921875, -1.89013671875, -1.146728515625, -0.4033203125, 0.340087890625, 1.08349609375, 1.826904296875, 2.5703125, 3.313720703125, 4.05712890625, 4.800537109375, 5.5439453125, 6.287353515625, 7.03076171875, 7.774169921875, 8.517578125, 9.260986328125, 10.00439453125, 10.747802734375, 11.4912109375, 12.234619140625, 12.97802734375, 13.721435546875, 14.46484375, 15.208251953125, 15.95166015625, 16.695068359375, 17.4384765625, 18.181884765625, 18.92529296875, 19.668701171875, 20.412109375, 21.155517578125, 21.89892578125, 22.642333984375, 23.3857421875, 24.129150390625, 24.87255859375, 25.615966796875, 26.359375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 4.0, 4.0, 7.0, 10.0, 13.0, 13.0, 19.0, 30.0, 48.0, 81.0, 132.0, 155.0, 240.0, 346.0, 454.0, 726.0, 1085.0, 1655.0, 2320.0, 3721.0, 5524.0, 8723.0, 13824.0, 21598.0, 34891.0, 58063.0, 99014.0, 170657.0, 230253.0, 159601.0, 91282.0, 54080.0, 32858.0, 20258.0, 12959.0, 8172.0, 5308.0, 3401.0, 2301.0, 1511.0, 1024.0, 665.0, 484.0, 338.0, 205.0, 165.0, 116.0, 67.0, 43.0, 41.0, 17.0, 22.0, 11.0, 8.0, 7.0, 6.0, 5.0, 1.0, 3.0, 0.0, 2.0], "bins": [-3.302734375, -3.197662353515625, -3.09259033203125, -2.987518310546875, -2.8824462890625, -2.777374267578125, -2.67230224609375, -2.567230224609375, -2.462158203125, -2.357086181640625, -2.25201416015625, -2.146942138671875, -2.0418701171875, -1.936798095703125, -1.83172607421875, -1.726654052734375, -1.62158203125, -1.516510009765625, -1.41143798828125, -1.306365966796875, -1.2012939453125, -1.096221923828125, -0.99114990234375, -0.886077880859375, -0.781005859375, -0.675933837890625, -0.57086181640625, -0.465789794921875, -0.3607177734375, -0.255645751953125, -0.15057373046875, -0.045501708984375, 0.0595703125, 0.164642333984375, 0.26971435546875, 0.374786376953125, 0.4798583984375, 0.584930419921875, 0.69000244140625, 0.795074462890625, 0.900146484375, 1.005218505859375, 1.11029052734375, 1.215362548828125, 1.3204345703125, 1.425506591796875, 1.53057861328125, 1.635650634765625, 1.74072265625, 1.845794677734375, 1.95086669921875, 2.055938720703125, 2.1610107421875, 2.266082763671875, 2.37115478515625, 2.476226806640625, 2.581298828125, 2.686370849609375, 2.79144287109375, 2.896514892578125, 3.0015869140625, 3.106658935546875, 3.21173095703125, 3.316802978515625, 3.421875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 2.0, 3.0, 5.0, 6.0, 5.0, 14.0, 11.0, 4.0, 16.0, 19.0, 18.0, 20.0, 27.0, 19.0, 25.0, 23.0, 30.0, 35.0, 27.0, 41.0, 34.0, 35.0, 53.0, 29.0, 48.0, 41.0, 38.0, 26.0, 33.0, 33.0, 31.0, 31.0, 26.0, 35.0, 14.0, 20.0, 21.0, 16.0, 11.0, 8.0, 11.0, 12.0, 5.0, 8.0, 8.0, 8.0, 7.0, 1.0, 5.0, 0.0, 4.0, 1.0, 0.0, 3.0, 1.0], "bins": [-14.125, -13.695556640625, -13.26611328125, -12.836669921875, -12.4072265625, -11.977783203125, -11.54833984375, -11.118896484375, -10.689453125, -10.260009765625, -9.83056640625, -9.401123046875, -8.9716796875, -8.542236328125, -8.11279296875, -7.683349609375, -7.25390625, -6.824462890625, -6.39501953125, -5.965576171875, -5.5361328125, -5.106689453125, -4.67724609375, -4.247802734375, -3.818359375, -3.388916015625, -2.95947265625, -2.530029296875, -2.1005859375, -1.671142578125, -1.24169921875, -0.812255859375, -0.3828125, 0.046630859375, 0.47607421875, 0.905517578125, 1.3349609375, 1.764404296875, 2.19384765625, 2.623291015625, 3.052734375, 3.482177734375, 3.91162109375, 4.341064453125, 4.7705078125, 5.199951171875, 5.62939453125, 6.058837890625, 6.48828125, 6.917724609375, 7.34716796875, 7.776611328125, 8.2060546875, 8.635498046875, 9.06494140625, 9.494384765625, 9.923828125, 10.353271484375, 10.78271484375, 11.212158203125, 11.6416015625, 12.071044921875, 12.50048828125, 12.929931640625, 13.359375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 2.0, 5.0, 10.0, 11.0, 11.0, 22.0, 23.0, 34.0, 46.0, 70.0, 97.0, 139.0, 213.0, 280.0, 385.0, 614.0, 865.0, 1332.0, 1921.0, 2871.0, 4410.0, 6969.0, 11026.0, 17740.0, 29094.0, 49672.0, 89861.0, 177785.0, 262300.0, 175076.0, 89554.0, 48744.0, 28882.0, 17623.0, 10672.0, 6842.0, 4462.0, 2849.0, 1988.0, 1238.0, 873.0, 612.0, 430.0, 272.0, 189.0, 125.0, 98.0, 53.0, 69.0, 37.0, 18.0, 16.0, 10.0, 10.0, 5.0, 4.0, 1.0, 3.0, 3.0, 0.0, 2.0], "bins": [-0.0770263671875, -0.07458019256591797, -0.07213401794433594, -0.0696878433227539, -0.06724166870117188, -0.06479549407958984, -0.06234931945800781, -0.05990314483642578, -0.05745697021484375, -0.05501079559326172, -0.05256462097167969, -0.050118446350097656, -0.047672271728515625, -0.045226097106933594, -0.04277992248535156, -0.04033374786376953, -0.0378875732421875, -0.03544139862060547, -0.03299522399902344, -0.030549049377441406, -0.028102874755859375, -0.025656700134277344, -0.023210525512695312, -0.02076435089111328, -0.01831817626953125, -0.01587200164794922, -0.013425827026367188, -0.010979652404785156, -0.008533477783203125, -0.006087303161621094, -0.0036411285400390625, -0.0011949539184570312, 0.001251220703125, 0.0036973953247070312, 0.0061435699462890625, 0.008589744567871094, 0.011035919189453125, 0.013482093811035156, 0.015928268432617188, 0.01837444305419922, 0.02082061767578125, 0.02326679229736328, 0.025712966918945312, 0.028159141540527344, 0.030605316162109375, 0.033051490783691406, 0.03549766540527344, 0.03794384002685547, 0.0403900146484375, 0.04283618927001953, 0.04528236389160156, 0.047728538513183594, 0.050174713134765625, 0.052620887756347656, 0.05506706237792969, 0.05751323699951172, 0.05995941162109375, 0.06240558624267578, 0.06485176086425781, 0.06729793548583984, 0.06974411010742188, 0.0721902847290039, 0.07463645935058594, 0.07708263397216797, 0.07952880859375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 9.0, 7.0, 10.0, 3.0, 17.0, 14.0, 19.0, 14.0, 26.0, 24.0, 31.0, 29.0, 43.0, 29.0, 47.0, 46.0, 46.0, 50.0, 35.0, 38.0, 41.0, 48.0, 36.0, 37.0, 45.0, 33.0, 27.0, 16.0, 31.0, 14.0, 22.0, 16.0, 23.0, 9.0, 7.0, 8.0, 11.0, 7.0, 10.0, 4.0, 3.0, 2.0, 2.0, 6.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.4424324035644531e-05, -1.3940967619419098e-05, -1.3457611203193665e-05, -1.2974254786968231e-05, -1.2490898370742798e-05, -1.2007541954517365e-05, -1.1524185538291931e-05, -1.1040829122066498e-05, -1.0557472705841064e-05, -1.0074116289615631e-05, -9.590759873390198e-06, -9.107403457164764e-06, -8.624047040939331e-06, -8.140690624713898e-06, -7.657334208488464e-06, -7.173977792263031e-06, -6.690621376037598e-06, -6.207264959812164e-06, -5.723908543586731e-06, -5.240552127361298e-06, -4.757195711135864e-06, -4.273839294910431e-06, -3.7904828786849976e-06, -3.307126462459564e-06, -2.823770046234131e-06, -2.3404136300086975e-06, -1.8570572137832642e-06, -1.3737007975578308e-06, -8.903443813323975e-07, -4.069879651069641e-07, 7.636845111846924e-08, 5.597248673439026e-07, 1.043081283569336e-06, 1.5264376997947693e-06, 2.0097941160202026e-06, 2.493150532245636e-06, 2.9765069484710693e-06, 3.4598633646965027e-06, 3.943219780921936e-06, 4.426576197147369e-06, 4.909932613372803e-06, 5.393289029598236e-06, 5.8766454458236694e-06, 6.360001862049103e-06, 6.843358278274536e-06, 7.3267146944999695e-06, 7.810071110725403e-06, 8.293427526950836e-06, 8.77678394317627e-06, 9.260140359401703e-06, 9.743496775627136e-06, 1.022685319185257e-05, 1.0710209608078003e-05, 1.1193566024303436e-05, 1.167692244052887e-05, 1.2160278856754303e-05, 1.2643635272979736e-05, 1.312699168920517e-05, 1.3610348105430603e-05, 1.4093704521656036e-05, 1.457706093788147e-05, 1.5060417354106903e-05, 1.5543773770332336e-05, 1.602713018655777e-05, 1.6510486602783203e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 13.0, 27.0, 20.0, 37.0, 52.0, 81.0, 143.0, 198.0, 294.0, 442.0, 725.0, 1058.0, 1592.0, 2426.0, 3573.0, 5215.0, 7941.0, 12221.0, 18810.0, 28798.0, 46825.0, 76914.0, 139697.0, 262414.0, 185715.0, 96349.0, 56844.0, 35226.0, 22391.0, 14451.0, 9378.0, 6246.0, 4219.0, 2651.0, 1863.0, 1243.0, 822.0, 560.0, 386.0, 257.0, 155.0, 98.0, 66.0, 41.0, 38.0, 18.0, 15.0, 8.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1578369140625, -0.15252304077148438, -0.14720916748046875, -0.14189529418945312, -0.1365814208984375, -0.13126754760742188, -0.12595367431640625, -0.12063980102539062, -0.115325927734375, -0.11001205444335938, -0.10469818115234375, -0.09938430786132812, -0.0940704345703125, -0.08875656127929688, -0.08344268798828125, -0.07812881469726562, -0.07281494140625, -0.06750106811523438, -0.06218719482421875, -0.056873321533203125, -0.0515594482421875, -0.046245574951171875, -0.04093170166015625, -0.035617828369140625, -0.030303955078125, -0.024990081787109375, -0.01967620849609375, -0.014362335205078125, -0.0090484619140625, -0.003734588623046875, 0.00157928466796875, 0.006893157958984375, 0.01220703125, 0.017520904541015625, 0.02283477783203125, 0.028148651123046875, 0.0334625244140625, 0.038776397705078125, 0.04409027099609375, 0.049404144287109375, 0.054718017578125, 0.060031890869140625, 0.06534576416015625, 0.07065963745117188, 0.0759735107421875, 0.08128738403320312, 0.08660125732421875, 0.09191513061523438, 0.09722900390625, 0.10254287719726562, 0.10785675048828125, 0.11317062377929688, 0.1184844970703125, 0.12379837036132812, 0.12911224365234375, 0.13442611694335938, 0.139739990234375, 0.14505386352539062, 0.15036773681640625, 0.15568161010742188, 0.1609954833984375, 0.16630935668945312, 0.17162322998046875, 0.17693710327148438, 0.1822509765625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 2.0, 3.0, 5.0, 6.0, 5.0, 7.0, 4.0, 9.0, 11.0, 9.0, 11.0, 10.0, 20.0, 19.0, 15.0, 23.0, 25.0, 28.0, 39.0, 56.0, 72.0, 71.0, 70.0, 62.0, 68.0, 53.0, 45.0, 43.0, 25.0, 28.0, 21.0, 22.0, 22.0, 13.0, 11.0, 12.0, 2.0, 12.0, 7.0, 11.0, 5.0, 2.0, 4.0, 3.0, 3.0, 3.0, 0.0, 4.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.06622314453125, -0.06420516967773438, -0.06218719482421875, -0.060169219970703125, -0.0581512451171875, -0.056133270263671875, -0.05411529541015625, -0.052097320556640625, -0.050079345703125, -0.048061370849609375, -0.04604339599609375, -0.044025421142578125, -0.0420074462890625, -0.039989471435546875, -0.03797149658203125, -0.035953521728515625, -0.033935546875, -0.031917572021484375, -0.02989959716796875, -0.027881622314453125, -0.0258636474609375, -0.023845672607421875, -0.02182769775390625, -0.019809722900390625, -0.017791748046875, -0.015773773193359375, -0.01375579833984375, -0.011737823486328125, -0.0097198486328125, -0.007701873779296875, -0.00568389892578125, -0.003665924072265625, -0.00164794921875, 0.000370025634765625, 0.00238800048828125, 0.004405975341796875, 0.0064239501953125, 0.008441925048828125, 0.01045989990234375, 0.012477874755859375, 0.014495849609375, 0.016513824462890625, 0.01853179931640625, 0.020549774169921875, 0.0225677490234375, 0.024585723876953125, 0.02660369873046875, 0.028621673583984375, 0.0306396484375, 0.032657623291015625, 0.03467559814453125, 0.036693572998046875, 0.0387115478515625, 0.040729522705078125, 0.04274749755859375, 0.044765472412109375, 0.046783447265625, 0.048801422119140625, 0.05081939697265625, 0.052837371826171875, 0.0548553466796875, 0.056873321533203125, 0.05889129638671875, 0.060909271240234375, 0.06292724609375]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 0.0, 3.0, 5.0, 7.0, 3.0, 3.0, 10.0, 6.0, 13.0, 18.0, 23.0, 31.0, 29.0, 41.0, 37.0, 29.0, 40.0, 44.0, 45.0, 49.0, 42.0, 50.0, 35.0, 65.0, 51.0, 34.0, 30.0, 38.0, 30.0, 21.0, 25.0, 33.0, 20.0, 18.0, 20.0, 14.0, 14.0, 9.0, 10.0, 2.0, 4.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-20.10551643371582, -19.38246726989746, -18.6594181060791, -17.936370849609375, -17.213321685791016, -16.490272521972656, -15.767223358154297, -15.044174194335938, -14.321125030517578, -13.598075866699219, -12.875027656555176, -12.151978492736816, -11.428929328918457, -10.705881118774414, -9.982831954956055, -9.259782791137695, -8.536734580993652, -7.813685894012451, -7.090636730194092, -6.367588043212891, -5.644538879394531, -4.92149019241333, -4.198441505432129, -3.4753923416137695, -2.7523436546325684, -2.029294729232788, -1.3062459230422974, -0.5831971168518066, 0.13985180854797363, 0.8629007339477539, 1.585949420928955, 2.3089985847473145, 3.0320472717285156, 3.755096197128296, 4.478145122528076, 5.201193809509277, 5.924242973327637, 6.647291660308838, 7.370340347290039, 8.093389511108398, 8.816438674926758, 9.539487838745117, 10.26253604888916, 10.98558521270752, 11.708634376525879, 12.431682586669922, 13.154731750488281, 13.87778091430664, 14.600829124450684, 15.323878288269043, 16.046926498413086, 16.769975662231445, 17.493024826049805, 18.216073989868164, 18.93912124633789, 19.66217041015625, 20.38521957397461, 21.10826873779297, 21.831317901611328, 22.554367065429688, 23.277414321899414, 24.000463485717773, 24.723512649536133, 25.446561813354492, 26.16961097717285]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 4.0, 1.0, 2.0, 6.0, 2.0, 4.0, 2.0, 6.0, 9.0, 10.0, 12.0, 14.0, 10.0, 15.0, 22.0, 23.0, 25.0, 29.0, 23.0, 39.0, 30.0, 54.0, 40.0, 47.0, 43.0, 43.0, 40.0, 54.0, 39.0, 41.0, 40.0, 34.0, 26.0, 24.0, 20.0, 30.0, 26.0, 16.0, 13.0, 23.0, 11.0, 10.0, 12.0, 6.0, 12.0, 9.0, 1.0, 6.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.158723831176758, -21.42060089111328, -20.682476043701172, -19.944353103637695, -19.20623016357422, -18.468107223510742, -17.729984283447266, -16.991859436035156, -16.25373649597168, -15.515613555908203, -14.77748966217041, -14.039365768432617, -13.30124282836914, -12.563119888305664, -11.824995994567871, -11.086872100830078, -10.348749160766602, -9.610626220703125, -8.872502326965332, -8.134378433227539, -7.3962554931640625, -6.658132076263428, -5.920008659362793, -5.181885242462158, -4.443761825561523, -3.7056384086608887, -2.967514991760254, -2.229391574859619, -1.4912681579589844, -0.7531447410583496, -0.015021324157714844, 0.7231020927429199, 1.4612255096435547, 2.1993489265441895, 2.937472343444824, 3.675595760345459, 4.413719177246094, 5.1518425941467285, 5.889966011047363, 6.628089427947998, 7.366212844848633, 8.10433578491211, 8.842459678649902, 9.580583572387695, 10.318706512451172, 11.056829452514648, 11.794953346252441, 12.533077239990234, 13.271200180053711, 14.009323120117188, 14.74744701385498, 15.485570907592773, 16.22369384765625, 16.961816787719727, 17.699939727783203, 18.438064575195312, 19.17618751525879, 19.914310455322266, 20.652435302734375, 21.39055824279785, 22.128681182861328, 22.866804122924805, 23.60492706298828, 24.34305191040039, 25.081174850463867]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 5.0, 6.0, 10.0, 10.0, 15.0, 31.0, 46.0, 79.0, 100.0, 176.0, 275.0, 411.0, 597.0, 916.0, 1393.0, 2175.0, 3399.0, 5116.0, 7483.0, 10902.0, 15609.0, 22301.0, 30108.0, 39969.0, 51153.0, 62981.0, 74414.0, 83290.0, 88463.0, 89884.0, 86221.0, 79110.0, 69167.0, 56856.0, 45747.0, 35079.0, 25935.0, 18854.0, 13153.0, 9047.0, 5989.0, 4114.0, 2729.0, 1808.0, 1176.0, 778.0, 509.0, 354.0, 200.0, 162.0, 98.0, 67.0, 42.0, 22.0, 16.0, 11.0, 1.0, 4.0, 2.0, 1.0, 1.0], "bins": [-10.046875, -9.7353515625, -9.423828125, -9.1123046875, -8.80078125, -8.4892578125, -8.177734375, -7.8662109375, -7.5546875, -7.2431640625, -6.931640625, -6.6201171875, -6.30859375, -5.9970703125, -5.685546875, -5.3740234375, -5.0625, -4.7509765625, -4.439453125, -4.1279296875, -3.81640625, -3.5048828125, -3.193359375, -2.8818359375, -2.5703125, -2.2587890625, -1.947265625, -1.6357421875, -1.32421875, -1.0126953125, -0.701171875, -0.3896484375, -0.078125, 0.2333984375, 0.544921875, 0.8564453125, 1.16796875, 1.4794921875, 1.791015625, 2.1025390625, 2.4140625, 2.7255859375, 3.037109375, 3.3486328125, 3.66015625, 3.9716796875, 4.283203125, 4.5947265625, 4.90625, 5.2177734375, 5.529296875, 5.8408203125, 6.15234375, 6.4638671875, 6.775390625, 7.0869140625, 7.3984375, 7.7099609375, 8.021484375, 8.3330078125, 8.64453125, 8.9560546875, 9.267578125, 9.5791015625, 9.890625]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 4.0, 2.0, 5.0, 3.0, 4.0, 7.0, 8.0, 5.0, 7.0, 7.0, 13.0, 14.0, 15.0, 16.0, 19.0, 23.0, 25.0, 39.0, 30.0, 43.0, 38.0, 45.0, 35.0, 42.0, 39.0, 45.0, 47.0, 42.0, 36.0, 39.0, 31.0, 35.0, 29.0, 25.0, 27.0, 16.0, 14.0, 25.0, 16.0, 13.0, 15.0, 11.0, 12.0, 14.0, 7.0, 4.0, 4.0, 9.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.125, -20.4111328125, -19.697265625, -18.9833984375, -18.26953125, -17.5556640625, -16.841796875, -16.1279296875, -15.4140625, -14.7001953125, -13.986328125, -13.2724609375, -12.55859375, -11.8447265625, -11.130859375, -10.4169921875, -9.703125, -8.9892578125, -8.275390625, -7.5615234375, -6.84765625, -6.1337890625, -5.419921875, -4.7060546875, -3.9921875, -3.2783203125, -2.564453125, -1.8505859375, -1.13671875, -0.4228515625, 0.291015625, 1.0048828125, 1.71875, 2.4326171875, 3.146484375, 3.8603515625, 4.57421875, 5.2880859375, 6.001953125, 6.7158203125, 7.4296875, 8.1435546875, 8.857421875, 9.5712890625, 10.28515625, 10.9990234375, 11.712890625, 12.4267578125, 13.140625, 13.8544921875, 14.568359375, 15.2822265625, 15.99609375, 16.7099609375, 17.423828125, 18.1376953125, 18.8515625, 19.5654296875, 20.279296875, 20.9931640625, 21.70703125, 22.4208984375, 23.134765625, 23.8486328125, 24.5625]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 4.0, 6.0, 8.0, 20.0, 24.0, 47.0, 54.0, 122.0, 164.0, 290.0, 462.0, 651.0, 1026.0, 1613.0, 2617.0, 3843.0, 5898.0, 8552.0, 12361.0, 17456.0, 24564.0, 32697.0, 43540.0, 54014.0, 65667.0, 75435.0, 83939.0, 88095.0, 87830.0, 84123.0, 76186.0, 65817.0, 54223.0, 43426.0, 33667.0, 24565.0, 17656.0, 12363.0, 8650.0, 5820.0, 3925.0, 2584.0, 1623.0, 1069.0, 698.0, 422.0, 299.0, 169.0, 112.0, 63.0, 41.0, 28.0, 17.0, 13.0, 7.0, 2.0, 0.0, 3.0, 0.0, 1.0], "bins": [-9.953125, -9.6422119140625, -9.331298828125, -9.0203857421875, -8.70947265625, -8.3985595703125, -8.087646484375, -7.7767333984375, -7.4658203125, -7.1549072265625, -6.843994140625, -6.5330810546875, -6.22216796875, -5.9112548828125, -5.600341796875, -5.2894287109375, -4.978515625, -4.6676025390625, -4.356689453125, -4.0457763671875, -3.73486328125, -3.4239501953125, -3.113037109375, -2.8021240234375, -2.4912109375, -2.1802978515625, -1.869384765625, -1.5584716796875, -1.24755859375, -0.9366455078125, -0.625732421875, -0.3148193359375, -0.00390625, 0.3070068359375, 0.617919921875, 0.9288330078125, 1.23974609375, 1.5506591796875, 1.861572265625, 2.1724853515625, 2.4833984375, 2.7943115234375, 3.105224609375, 3.4161376953125, 3.72705078125, 4.0379638671875, 4.348876953125, 4.6597900390625, 4.970703125, 5.2816162109375, 5.592529296875, 5.9034423828125, 6.21435546875, 6.5252685546875, 6.836181640625, 7.1470947265625, 7.4580078125, 7.7689208984375, 8.079833984375, 8.3907470703125, 8.70166015625, 9.0125732421875, 9.323486328125, 9.6343994140625, 9.9453125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 2.0, 2.0, 6.0, 7.0, 9.0, 13.0, 12.0, 14.0, 12.0, 21.0, 27.0, 31.0, 21.0, 30.0, 32.0, 31.0, 34.0, 42.0, 27.0, 51.0, 40.0, 39.0, 43.0, 38.0, 43.0, 31.0, 38.0, 39.0, 41.0, 46.0, 33.0, 15.0, 23.0, 17.0, 16.0, 13.0, 9.0, 15.0, 9.0, 6.0, 10.0, 5.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.7421875, -14.2747802734375, -13.807373046875, -13.3399658203125, -12.87255859375, -12.4051513671875, -11.937744140625, -11.4703369140625, -11.0029296875, -10.5355224609375, -10.068115234375, -9.6007080078125, -9.13330078125, -8.6658935546875, -8.198486328125, -7.7310791015625, -7.263671875, -6.7962646484375, -6.328857421875, -5.8614501953125, -5.39404296875, -4.9266357421875, -4.459228515625, -3.9918212890625, -3.5244140625, -3.0570068359375, -2.589599609375, -2.1221923828125, -1.65478515625, -1.1873779296875, -0.719970703125, -0.2525634765625, 0.21484375, 0.6822509765625, 1.149658203125, 1.6170654296875, 2.08447265625, 2.5518798828125, 3.019287109375, 3.4866943359375, 3.9541015625, 4.4215087890625, 4.888916015625, 5.3563232421875, 5.82373046875, 6.2911376953125, 6.758544921875, 7.2259521484375, 7.693359375, 8.1607666015625, 8.628173828125, 9.0955810546875, 9.56298828125, 10.0303955078125, 10.497802734375, 10.9652099609375, 11.4326171875, 11.9000244140625, 12.367431640625, 12.8348388671875, 13.30224609375, 13.7696533203125, 14.237060546875, 14.7044677734375, 15.171875]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [5.0, 2.0, 5.0, 14.0, 24.0, 25.0, 44.0, 86.0, 122.0, 215.0, 290.0, 461.0, 716.0, 1074.0, 1619.0, 2473.0, 3763.0, 5699.0, 8408.0, 12067.0, 17170.0, 24080.0, 32373.0, 42910.0, 54419.0, 66560.0, 77498.0, 85459.0, 89858.0, 89547.0, 85013.0, 76595.0, 65909.0, 53675.0, 42497.0, 32089.0, 23264.0, 16877.0, 11540.0, 8063.0, 5500.0, 3532.0, 2377.0, 1579.0, 1096.0, 709.0, 437.0, 301.0, 186.0, 120.0, 89.0, 62.0, 31.0, 15.0, 11.0, 11.0, 5.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.111328125, -3.00390625, -2.896484375, -2.7890625, -2.681640625, -2.57421875, -2.466796875, -2.359375, -2.251953125, -2.14453125, -2.037109375, -1.9296875, -1.822265625, -1.71484375, -1.607421875, -1.5, -1.392578125, -1.28515625, -1.177734375, -1.0703125, -0.962890625, -0.85546875, -0.748046875, -0.640625, -0.533203125, -0.42578125, -0.318359375, -0.2109375, -0.103515625, 0.00390625, 0.111328125, 0.21875, 0.326171875, 0.43359375, 0.541015625, 0.6484375, 0.755859375, 0.86328125, 0.970703125, 1.078125, 1.185546875, 1.29296875, 1.400390625, 1.5078125, 1.615234375, 1.72265625, 1.830078125, 1.9375, 2.044921875, 2.15234375, 2.259765625, 2.3671875, 2.474609375, 2.58203125, 2.689453125, 2.796875, 2.904296875, 3.01171875, 3.119140625, 3.2265625, 3.333984375, 3.44140625, 3.548828125, 3.65625, 3.763671875]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 5.0, 2.0, 6.0, 8.0, 7.0, 13.0, 15.0, 14.0, 25.0, 26.0, 25.0, 33.0, 34.0, 45.0, 35.0, 43.0, 26.0, 51.0, 47.0, 48.0, 47.0, 38.0, 42.0, 44.0, 38.0, 41.0, 48.0, 23.0, 26.0, 21.0, 19.0, 18.0, 16.0, 14.0, 10.0, 7.0, 10.0, 4.0, 4.0, 10.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0004868507385253906, -0.0004713982343673706, -0.0004559457302093506, -0.00044049322605133057, -0.00042504072189331055, -0.00040958821773529053, -0.0003941357135772705, -0.0003786832094192505, -0.00036323070526123047, -0.00034777820110321045, -0.00033232569694519043, -0.0003168731927871704, -0.0003014206886291504, -0.00028596818447113037, -0.00027051568031311035, -0.00025506317615509033, -0.0002396106719970703, -0.0002241581678390503, -0.00020870566368103027, -0.00019325315952301025, -0.00017780065536499023, -0.00016234815120697021, -0.0001468956470489502, -0.00013144314289093018, -0.00011599063873291016, -0.00010053813457489014, -8.508563041687012e-05, -6.96331262588501e-05, -5.418062210083008e-05, -3.872811794281006e-05, -2.327561378479004e-05, -7.82310962677002e-06, 7.62939453125e-06, 2.308189868927002e-05, 3.853440284729004e-05, 5.398690700531006e-05, 6.943941116333008e-05, 8.48919153213501e-05, 0.00010034441947937012, 0.00011579692363739014, 0.00013124942779541016, 0.00014670193195343018, 0.0001621544361114502, 0.00017760694026947021, 0.00019305944442749023, 0.00020851194858551025, 0.00022396445274353027, 0.0002394169569015503, 0.0002548694610595703, 0.00027032196521759033, 0.00028577446937561035, 0.00030122697353363037, 0.0003166794776916504, 0.0003321319818496704, 0.00034758448600769043, 0.00036303699016571045, 0.00037848949432373047, 0.0003939419984817505, 0.0004093945026397705, 0.00042484700679779053, 0.00044029951095581055, 0.00045575201511383057, 0.0004712045192718506, 0.0004866570234298706, 0.0005021095275878906]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 4.0, 1.0, 3.0, 2.0, 10.0, 11.0, 17.0, 34.0, 52.0, 76.0, 101.0, 161.0, 302.0, 479.0, 832.0, 1381.0, 2392.0, 4307.0, 7805.0, 13999.0, 24599.0, 41411.0, 65032.0, 93728.0, 122966.0, 140101.0, 140356.0, 123849.0, 96135.0, 66904.0, 42881.0, 25460.0, 14630.0, 8067.0, 4425.0, 2544.0, 1383.0, 837.0, 474.0, 307.0, 188.0, 115.0, 63.0, 40.0, 34.0, 16.0, 15.0, 11.0, 5.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.73828125, -5.55914306640625, -5.3800048828125, -5.20086669921875, -5.021728515625, -4.84259033203125, -4.6634521484375, -4.48431396484375, -4.30517578125, -4.12603759765625, -3.9468994140625, -3.76776123046875, -3.588623046875, -3.40948486328125, -3.2303466796875, -3.05120849609375, -2.8720703125, -2.69293212890625, -2.5137939453125, -2.33465576171875, -2.155517578125, -1.97637939453125, -1.7972412109375, -1.61810302734375, -1.43896484375, -1.25982666015625, -1.0806884765625, -0.90155029296875, -0.722412109375, -0.54327392578125, -0.3641357421875, -0.18499755859375, -0.005859375, 0.17327880859375, 0.3524169921875, 0.53155517578125, 0.710693359375, 0.88983154296875, 1.0689697265625, 1.24810791015625, 1.42724609375, 1.60638427734375, 1.7855224609375, 1.96466064453125, 2.143798828125, 2.32293701171875, 2.5020751953125, 2.68121337890625, 2.8603515625, 3.03948974609375, 3.2186279296875, 3.39776611328125, 3.576904296875, 3.75604248046875, 3.9351806640625, 4.11431884765625, 4.29345703125, 4.47259521484375, 4.6517333984375, 4.83087158203125, 5.010009765625, 5.18914794921875, 5.3682861328125, 5.54742431640625, 5.7265625]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 8.0, 11.0, 12.0, 16.0, 28.0, 35.0, 52.0, 50.0, 73.0, 66.0, 77.0, 71.0, 86.0, 79.0, 57.0, 53.0, 50.0, 39.0, 34.0, 18.0, 21.0, 14.0, 9.0, 7.0, 10.0, 4.0, 2.0, 5.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6484375, -2.54962158203125, -2.4508056640625, -2.35198974609375, -2.253173828125, -2.15435791015625, -2.0555419921875, -1.95672607421875, -1.85791015625, -1.75909423828125, -1.6602783203125, -1.56146240234375, -1.462646484375, -1.36383056640625, -1.2650146484375, -1.16619873046875, -1.0673828125, -0.96856689453125, -0.8697509765625, -0.77093505859375, -0.672119140625, -0.57330322265625, -0.4744873046875, -0.37567138671875, -0.27685546875, -0.17803955078125, -0.0792236328125, 0.01959228515625, 0.118408203125, 0.21722412109375, 0.3160400390625, 0.41485595703125, 0.513671875, 0.61248779296875, 0.7113037109375, 0.81011962890625, 0.908935546875, 1.00775146484375, 1.1065673828125, 1.20538330078125, 1.30419921875, 1.40301513671875, 1.5018310546875, 1.60064697265625, 1.699462890625, 1.79827880859375, 1.8970947265625, 1.99591064453125, 2.0947265625, 2.19354248046875, 2.2923583984375, 2.39117431640625, 2.489990234375, 2.58880615234375, 2.6876220703125, 2.78643798828125, 2.88525390625, 2.98406982421875, 3.0828857421875, 3.18170166015625, 3.280517578125, 3.37933349609375, 3.4781494140625, 3.57696533203125, 3.67578125]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 3.0, 5.0, 3.0, 10.0, 4.0, 8.0, 15.0, 14.0, 16.0, 20.0, 24.0, 31.0, 31.0, 34.0, 38.0, 49.0, 44.0, 34.0, 50.0, 46.0, 43.0, 60.0, 50.0, 54.0, 34.0, 34.0, 29.0, 38.0, 25.0, 35.0, 26.0, 16.0, 18.0, 17.0, 13.0, 11.0, 4.0, 9.0, 3.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-21.055950164794922, -20.318437576293945, -19.580923080444336, -18.84341049194336, -18.10589599609375, -17.368383407592773, -16.630870819091797, -15.893357276916504, -15.155843734741211, -14.418330192565918, -13.680816650390625, -12.943304061889648, -12.205790519714355, -11.468276977539062, -10.730764389038086, -9.993250846862793, -9.2557373046875, -8.518223762512207, -7.780710697174072, -7.0431976318359375, -6.3056840896606445, -5.568170547485352, -4.830657482147217, -4.093144416809082, -3.355630874633789, -2.618117570877075, -1.8806042671203613, -1.1430909633636475, -0.4055776596069336, 0.3319356441497803, 1.0694489479064941, 1.806962013244629, 2.544473648071289, 3.281986951828003, 4.019500255584717, 4.757013320922852, 5.4945268630981445, 6.2320404052734375, 6.969553470611572, 7.707066535949707, 8.444580078125, 9.182093620300293, 9.919607162475586, 10.657119750976562, 11.394633293151855, 12.132146835327148, 12.869659423828125, 13.607172966003418, 14.344686508178711, 15.082200050354004, 15.819713592529297, 16.557226181030273, 17.29473876953125, 18.03225326538086, 18.769765853881836, 19.507278442382812, 20.244792938232422, 20.9823055267334, 21.719820022583008, 22.457332611083984, 23.194847106933594, 23.93235969543457, 24.669872283935547, 25.407386779785156, 26.144899368286133]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 6.0, 1.0, 1.0, 1.0, 3.0, 6.0, 4.0, 6.0, 9.0, 5.0, 11.0, 15.0, 12.0, 17.0, 19.0, 17.0, 19.0, 16.0, 20.0, 20.0, 26.0, 41.0, 33.0, 42.0, 37.0, 33.0, 41.0, 41.0, 29.0, 42.0, 27.0, 30.0, 36.0, 31.0, 28.0, 32.0, 36.0, 33.0, 23.0, 20.0, 17.0, 18.0, 12.0, 14.0, 14.0, 14.0, 10.0, 7.0, 8.0, 5.0, 2.0, 1.0, 6.0, 4.0, 8.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-21.244949340820312, -20.54758644104004, -19.8502254486084, -19.152862548828125, -18.455501556396484, -17.75813865661621, -17.060775756835938, -16.363414764404297, -15.666051864624023, -14.968689918518066, -14.27132797241211, -13.573965072631836, -12.876603126525879, -12.179241180419922, -11.481878280639648, -10.784516334533691, -10.087154388427734, -9.389792442321777, -8.69243049621582, -7.995067596435547, -7.29770565032959, -6.600343704223633, -5.902981281280518, -5.205618858337402, -4.508256912231445, -3.810894727706909, -3.113532543182373, -2.416170358657837, -1.7188081741333008, -1.0214459896087646, -0.3240838050842285, 0.3732786178588867, 1.0706405639648438, 1.7680027484893799, 2.465364933013916, 3.162727117538452, 3.8600893020629883, 4.557451248168945, 5.2548136711120605, 5.952176094055176, 6.649538040161133, 7.34689998626709, 8.044261932373047, 8.74162483215332, 9.438986778259277, 10.136348724365234, 10.833711624145508, 11.531073570251465, 12.228435516357422, 12.925797462463379, 13.623159408569336, 14.32052230834961, 15.017884254455566, 15.715246200561523, 16.412609100341797, 17.109970092773438, 17.80733299255371, 18.504695892333984, 19.202056884765625, 19.8994197845459, 20.596782684326172, 21.294143676757812, 21.991506576538086, 22.68886947631836, 23.38623046875]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [3.0, 4.0, 5.0, 9.0, 13.0, 25.0, 32.0, 61.0, 85.0, 150.0, 231.0, 388.0, 637.0, 1021.0, 1711.0, 2809.0, 4456.0, 7241.0, 11192.0, 17135.0, 26202.0, 40102.0, 57452.0, 82096.0, 114521.0, 154157.0, 200747.0, 249627.0, 299891.0, 339749.0, 364447.0, 371885.0, 359539.0, 328077.0, 283398.0, 233772.0, 183669.0, 139324.0, 101167.0, 72459.0, 49494.0, 33328.0, 22198.0, 14603.0, 9298.0, 5978.0, 3786.0, 2335.0, 1468.0, 981.0, 565.0, 341.0, 177.0, 100.0, 65.0, 36.0, 29.0, 10.0, 13.0, 4.0, 4.0, 0.0, 1.0, 1.0], "bins": [-15.3203125, -14.8309326171875, -14.341552734375, -13.8521728515625, -13.36279296875, -12.8734130859375, -12.384033203125, -11.8946533203125, -11.4052734375, -10.9158935546875, -10.426513671875, -9.9371337890625, -9.44775390625, -8.9583740234375, -8.468994140625, -7.9796142578125, -7.490234375, -7.0008544921875, -6.511474609375, -6.0220947265625, -5.53271484375, -5.0433349609375, -4.553955078125, -4.0645751953125, -3.5751953125, -3.0858154296875, -2.596435546875, -2.1070556640625, -1.61767578125, -1.1282958984375, -0.638916015625, -0.1495361328125, 0.33984375, 0.8292236328125, 1.318603515625, 1.8079833984375, 2.29736328125, 2.7867431640625, 3.276123046875, 3.7655029296875, 4.2548828125, 4.7442626953125, 5.233642578125, 5.7230224609375, 6.21240234375, 6.7017822265625, 7.191162109375, 7.6805419921875, 8.169921875, 8.6593017578125, 9.148681640625, 9.6380615234375, 10.12744140625, 10.6168212890625, 11.106201171875, 11.5955810546875, 12.0849609375, 12.5743408203125, 13.063720703125, 13.5531005859375, 14.04248046875, 14.5318603515625, 15.021240234375, 15.5106201171875, 16.0]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 4.0, 3.0, 6.0, 8.0, 11.0, 8.0, 11.0, 14.0, 25.0, 16.0, 14.0, 17.0, 23.0, 23.0, 33.0, 25.0, 31.0, 29.0, 41.0, 32.0, 34.0, 34.0, 36.0, 32.0, 42.0, 38.0, 30.0, 28.0, 38.0, 36.0, 29.0, 34.0, 22.0, 25.0, 17.0, 17.0, 16.0, 18.0, 17.0, 20.0, 12.0, 9.0, 5.0, 2.0, 4.0, 5.0, 5.0, 2.0, 4.0, 3.0, 4.0, 6.0, 1.0, 3.0, 1.0, 1.0], "bins": [-19.265625, -18.6513671875, -18.037109375, -17.4228515625, -16.80859375, -16.1943359375, -15.580078125, -14.9658203125, -14.3515625, -13.7373046875, -13.123046875, -12.5087890625, -11.89453125, -11.2802734375, -10.666015625, -10.0517578125, -9.4375, -8.8232421875, -8.208984375, -7.5947265625, -6.98046875, -6.3662109375, -5.751953125, -5.1376953125, -4.5234375, -3.9091796875, -3.294921875, -2.6806640625, -2.06640625, -1.4521484375, -0.837890625, -0.2236328125, 0.390625, 1.0048828125, 1.619140625, 2.2333984375, 2.84765625, 3.4619140625, 4.076171875, 4.6904296875, 5.3046875, 5.9189453125, 6.533203125, 7.1474609375, 7.76171875, 8.3759765625, 8.990234375, 9.6044921875, 10.21875, 10.8330078125, 11.447265625, 12.0615234375, 12.67578125, 13.2900390625, 13.904296875, 14.5185546875, 15.1328125, 15.7470703125, 16.361328125, 16.9755859375, 17.58984375, 18.2041015625, 18.818359375, 19.4326171875, 20.046875]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 9.0, 9.0, 28.0, 44.0, 71.0, 115.0, 284.0, 406.0, 759.0, 1326.0, 2446.0, 4342.0, 7719.0, 13263.0, 22447.0, 37630.0, 60941.0, 95656.0, 142795.0, 201659.0, 270704.0, 341678.0, 401014.0, 437632.0, 440497.0, 411464.0, 357677.0, 289614.0, 219212.0, 155765.0, 105152.0, 68496.0, 42410.0, 25610.0, 15166.0, 8918.0, 5138.0, 2782.0, 1523.0, 822.0, 478.0, 267.0, 132.0, 80.0, 44.0, 32.0, 14.0, 9.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-21.21875, -20.578125, -19.9375, -19.296875, -18.65625, -18.015625, -17.375, -16.734375, -16.09375, -15.453125, -14.8125, -14.171875, -13.53125, -12.890625, -12.25, -11.609375, -10.96875, -10.328125, -9.6875, -9.046875, -8.40625, -7.765625, -7.125, -6.484375, -5.84375, -5.203125, -4.5625, -3.921875, -3.28125, -2.640625, -2.0, -1.359375, -0.71875, -0.078125, 0.5625, 1.203125, 1.84375, 2.484375, 3.125, 3.765625, 4.40625, 5.046875, 5.6875, 6.328125, 6.96875, 7.609375, 8.25, 8.890625, 9.53125, 10.171875, 10.8125, 11.453125, 12.09375, 12.734375, 13.375, 14.015625, 14.65625, 15.296875, 15.9375, 16.578125, 17.21875, 17.859375, 18.5, 19.140625, 19.78125]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 4.0, 4.0, 9.0, 12.0, 10.0, 21.0, 25.0, 37.0, 36.0, 49.0, 47.0, 62.0, 94.0, 71.0, 101.0, 105.0, 109.0, 140.0, 137.0, 158.0, 161.0, 179.0, 191.0, 194.0, 193.0, 186.0, 172.0, 169.0, 166.0, 170.0, 157.0, 129.0, 117.0, 103.0, 105.0, 70.0, 64.0, 63.0, 50.0, 52.0, 27.0, 33.0, 27.0, 16.0, 13.0, 13.0, 6.0, 7.0, 5.0, 2.0, 4.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.484375, -9.1710205078125, -8.857666015625, -8.5443115234375, -8.23095703125, -7.9176025390625, -7.604248046875, -7.2908935546875, -6.9775390625, -6.6641845703125, -6.350830078125, -6.0374755859375, -5.72412109375, -5.4107666015625, -5.097412109375, -4.7840576171875, -4.470703125, -4.1573486328125, -3.843994140625, -3.5306396484375, -3.21728515625, -2.9039306640625, -2.590576171875, -2.2772216796875, -1.9638671875, -1.6505126953125, -1.337158203125, -1.0238037109375, -0.71044921875, -0.3970947265625, -0.083740234375, 0.2296142578125, 0.54296875, 0.8563232421875, 1.169677734375, 1.4830322265625, 1.79638671875, 2.1097412109375, 2.423095703125, 2.7364501953125, 3.0498046875, 3.3631591796875, 3.676513671875, 3.9898681640625, 4.30322265625, 4.6165771484375, 4.929931640625, 5.2432861328125, 5.556640625, 5.8699951171875, 6.183349609375, 6.4967041015625, 6.81005859375, 7.1234130859375, 7.436767578125, 7.7501220703125, 8.0634765625, 8.3768310546875, 8.690185546875, 9.0035400390625, 9.31689453125, 9.6302490234375, 9.943603515625, 10.2569580078125, 10.5703125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 4.0, 2.0, 2.0, 8.0, 7.0, 8.0, 17.0, 13.0, 26.0, 22.0, 33.0, 38.0, 30.0, 39.0, 45.0, 38.0, 61.0, 57.0, 51.0, 58.0, 46.0, 38.0, 52.0, 42.0, 33.0, 56.0, 32.0, 19.0, 24.0, 26.0, 16.0, 13.0, 18.0, 8.0, 11.0, 5.0, 7.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.26637840270996, -27.259370803833008, -26.252361297607422, -25.24535369873047, -24.238344192504883, -23.23133659362793, -22.224327087402344, -21.21731948852539, -20.210311889648438, -19.203304290771484, -18.1962947845459, -17.189287185668945, -16.18227767944336, -15.175270080566406, -14.168261528015137, -13.161252975463867, -12.154243469238281, -11.147234916687012, -10.140226364135742, -9.133218765258789, -8.126209259033203, -7.119201183319092, -6.1121931076049805, -5.105184555053711, -4.098176002502441, -3.091167449951172, -2.0841591358184814, -1.077150821685791, -0.07014226913452148, 0.936866283416748, 1.9438743591308594, 2.950882911682129, 3.9578933715820312, 4.964901924133301, 5.97191047668457, 6.978918552398682, 7.985927104949951, 8.992935180664062, 9.999943733215332, 11.006952285766602, 12.013960838317871, 13.02096939086914, 14.02797794342041, 15.03498649597168, 16.041994094848633, 17.04900360107422, 18.056011199951172, 19.063018798828125, 20.07002830505371, 21.077035903930664, 22.08404541015625, 23.091053009033203, 24.09806251525879, 25.105070114135742, 26.112079620361328, 27.11908721923828, 28.126094818115234, 29.133102416992188, 30.140111923217773, 31.147119522094727, 32.15412902832031, 33.161136627197266, 34.16814422607422, 35.17515563964844, 36.18216323852539]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 6.0, 9.0, 7.0, 5.0, 4.0, 11.0, 15.0, 13.0, 14.0, 25.0, 19.0, 21.0, 18.0, 12.0, 30.0, 35.0, 31.0, 44.0, 31.0, 38.0, 35.0, 40.0, 40.0, 39.0, 44.0, 41.0, 50.0, 32.0, 26.0, 31.0, 36.0, 18.0, 25.0, 32.0, 18.0, 19.0, 17.0, 11.0, 9.0, 13.0, 5.0, 13.0, 3.0, 5.0, 4.0, 3.0, 5.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 3.0], "bins": [-28.070402145385742, -27.211172103881836, -26.35194206237793, -25.492712020874023, -24.633481979370117, -23.77425193786621, -22.915021896362305, -22.0557918548584, -21.196561813354492, -20.337331771850586, -19.47810173034668, -18.618871688842773, -17.759641647338867, -16.90041160583496, -16.041181564331055, -15.181951522827148, -14.322720527648926, -13.46349048614502, -12.604260444641113, -11.745030403137207, -10.8858003616333, -10.026569366455078, -9.167339324951172, -8.308109283447266, -7.448879718780518, -6.589649677276611, -5.730419635772705, -4.871189117431641, -4.011959075927734, -3.152729034423828, -2.293498992919922, -1.4342689514160156, -0.5750389099121094, 0.28419119119644165, 1.1434212923049927, 2.0026514530181885, 2.8618814945220947, 3.72111177444458, 4.580341815948486, 5.439571857452393, 6.298801898956299, 7.158031940460205, 8.01726245880127, 8.876492500305176, 9.735722541809082, 10.594952583312988, 11.454182624816895, 12.3134126663208, 13.172642707824707, 14.031872749328613, 14.89110279083252, 15.750332832336426, 16.60956382751465, 17.468793869018555, 18.32802391052246, 19.187253952026367, 20.046483993530273, 20.90571403503418, 21.764944076538086, 22.624174118041992, 23.4834041595459, 24.342634201049805, 25.20186424255371, 26.061094284057617, 26.920324325561523]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 0.0, 2.0, 3.0, 4.0, 8.0, 8.0, 20.0, 21.0, 56.0, 66.0, 86.0, 126.0, 204.0, 356.0, 576.0, 954.0, 1395.0, 2301.0, 3779.0, 6312.0, 10820.0, 18362.0, 31755.0, 58266.0, 108795.0, 204253.0, 257945.0, 155121.0, 82188.0, 44520.0, 24596.0, 14141.0, 8419.0, 5016.0, 3109.0, 1855.0, 1136.0, 682.0, 468.0, 316.0, 200.0, 118.0, 60.0, 52.0, 32.0, 20.0, 12.0, 11.0, 9.0, 7.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.05078125, -3.91241455078125, -3.7740478515625, -3.63568115234375, -3.497314453125, -3.35894775390625, -3.2205810546875, -3.08221435546875, -2.94384765625, -2.80548095703125, -2.6671142578125, -2.52874755859375, -2.390380859375, -2.25201416015625, -2.1136474609375, -1.97528076171875, -1.8369140625, -1.69854736328125, -1.5601806640625, -1.42181396484375, -1.283447265625, -1.14508056640625, -1.0067138671875, -0.86834716796875, -0.72998046875, -0.59161376953125, -0.4532470703125, -0.31488037109375, -0.176513671875, -0.03814697265625, 0.1002197265625, 0.23858642578125, 0.376953125, 0.51531982421875, 0.6536865234375, 0.79205322265625, 0.930419921875, 1.06878662109375, 1.2071533203125, 1.34552001953125, 1.48388671875, 1.62225341796875, 1.7606201171875, 1.89898681640625, 2.037353515625, 2.17572021484375, 2.3140869140625, 2.45245361328125, 2.5908203125, 2.72918701171875, 2.8675537109375, 3.00592041015625, 3.144287109375, 3.28265380859375, 3.4210205078125, 3.55938720703125, 3.69775390625, 3.83612060546875, 3.9744873046875, 4.11285400390625, 4.251220703125, 4.38958740234375, 4.5279541015625, 4.66632080078125, 4.8046875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 8.0, 8.0, 4.0, 8.0, 13.0, 8.0, 19.0, 15.0, 24.0, 18.0, 19.0, 18.0, 28.0, 44.0, 30.0, 39.0, 38.0, 54.0, 53.0, 41.0, 37.0, 40.0, 45.0, 46.0, 49.0, 37.0, 27.0, 38.0, 26.0, 30.0, 22.0, 19.0, 15.0, 17.0, 18.0, 10.0, 10.0, 5.0, 7.0, 4.0, 2.0, 2.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-34.6875, -33.70654296875, -32.7255859375, -31.74462890625, -30.763671875, -29.78271484375, -28.8017578125, -27.82080078125, -26.83984375, -25.85888671875, -24.8779296875, -23.89697265625, -22.916015625, -21.93505859375, -20.9541015625, -19.97314453125, -18.9921875, -18.01123046875, -17.0302734375, -16.04931640625, -15.068359375, -14.08740234375, -13.1064453125, -12.12548828125, -11.14453125, -10.16357421875, -9.1826171875, -8.20166015625, -7.220703125, -6.23974609375, -5.2587890625, -4.27783203125, -3.296875, -2.31591796875, -1.3349609375, -0.35400390625, 0.626953125, 1.60791015625, 2.5888671875, 3.56982421875, 4.55078125, 5.53173828125, 6.5126953125, 7.49365234375, 8.474609375, 9.45556640625, 10.4365234375, 11.41748046875, 12.3984375, 13.37939453125, 14.3603515625, 15.34130859375, 16.322265625, 17.30322265625, 18.2841796875, 19.26513671875, 20.24609375, 21.22705078125, 22.2080078125, 23.18896484375, 24.169921875, 25.15087890625, 26.1318359375, 27.11279296875, 28.09375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 4.0, 4.0, 6.0, 17.0, 21.0, 16.0, 27.0, 38.0, 71.0, 95.0, 110.0, 171.0, 259.0, 344.0, 465.0, 699.0, 961.0, 1470.0, 2173.0, 3041.0, 4595.0, 6919.0, 10136.0, 15297.0, 23584.0, 36700.0, 58502.0, 96715.0, 158424.0, 209388.0, 157166.0, 95521.0, 58112.0, 37101.0, 23659.0, 15355.0, 10170.0, 6702.0, 4554.0, 3019.0, 2141.0, 1491.0, 1005.0, 707.0, 478.0, 365.0, 221.0, 169.0, 129.0, 77.0, 53.0, 34.0, 22.0, 26.0, 12.0, 8.0, 7.0, 9.0, 1.0, 1.0, 3.0], "bins": [-3.857421875, -3.73870849609375, -3.6199951171875, -3.50128173828125, -3.382568359375, -3.26385498046875, -3.1451416015625, -3.02642822265625, -2.90771484375, -2.78900146484375, -2.6702880859375, -2.55157470703125, -2.432861328125, -2.31414794921875, -2.1954345703125, -2.07672119140625, -1.9580078125, -1.83929443359375, -1.7205810546875, -1.60186767578125, -1.483154296875, -1.36444091796875, -1.2457275390625, -1.12701416015625, -1.00830078125, -0.88958740234375, -0.7708740234375, -0.65216064453125, -0.533447265625, -0.41473388671875, -0.2960205078125, -0.17730712890625, -0.05859375, 0.06011962890625, 0.1788330078125, 0.29754638671875, 0.416259765625, 0.53497314453125, 0.6536865234375, 0.77239990234375, 0.89111328125, 1.00982666015625, 1.1285400390625, 1.24725341796875, 1.365966796875, 1.48468017578125, 1.6033935546875, 1.72210693359375, 1.8408203125, 1.95953369140625, 2.0782470703125, 2.19696044921875, 2.315673828125, 2.43438720703125, 2.5531005859375, 2.67181396484375, 2.79052734375, 2.90924072265625, 3.0279541015625, 3.14666748046875, 3.265380859375, 3.38409423828125, 3.5028076171875, 3.62152099609375, 3.740234375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 4.0, 5.0, 6.0, 5.0, 9.0, 6.0, 9.0, 19.0, 8.0, 18.0, 18.0, 23.0, 19.0, 22.0, 22.0, 27.0, 34.0, 29.0, 34.0, 35.0, 44.0, 32.0, 32.0, 46.0, 40.0, 28.0, 41.0, 39.0, 37.0, 28.0, 29.0, 27.0, 29.0, 29.0, 27.0, 18.0, 26.0, 10.0, 17.0, 15.0, 15.0, 7.0, 11.0, 6.0, 1.0, 6.0, 3.0, 8.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-18.328125, -17.8021240234375, -17.276123046875, -16.7501220703125, -16.22412109375, -15.6981201171875, -15.172119140625, -14.6461181640625, -14.1201171875, -13.5941162109375, -13.068115234375, -12.5421142578125, -12.01611328125, -11.4901123046875, -10.964111328125, -10.4381103515625, -9.912109375, -9.3861083984375, -8.860107421875, -8.3341064453125, -7.80810546875, -7.2821044921875, -6.756103515625, -6.2301025390625, -5.7041015625, -5.1781005859375, -4.652099609375, -4.1260986328125, -3.60009765625, -3.0740966796875, -2.548095703125, -2.0220947265625, -1.49609375, -0.9700927734375, -0.444091796875, 0.0819091796875, 0.60791015625, 1.1339111328125, 1.659912109375, 2.1859130859375, 2.7119140625, 3.2379150390625, 3.763916015625, 4.2899169921875, 4.81591796875, 5.3419189453125, 5.867919921875, 6.3939208984375, 6.919921875, 7.4459228515625, 7.971923828125, 8.4979248046875, 9.02392578125, 9.5499267578125, 10.075927734375, 10.6019287109375, 11.1279296875, 11.6539306640625, 12.179931640625, 12.7059326171875, 13.23193359375, 13.7579345703125, 14.283935546875, 14.8099365234375, 15.3359375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 4.0, 7.0, 7.0, 6.0, 8.0, 5.0, 21.0, 24.0, 26.0, 53.0, 66.0, 97.0, 116.0, 162.0, 241.0, 345.0, 452.0, 676.0, 979.0, 1433.0, 2041.0, 3064.0, 4681.0, 7105.0, 11019.0, 17985.0, 29494.0, 51211.0, 95765.0, 186598.0, 260988.0, 167439.0, 85691.0, 46642.0, 27348.0, 16501.0, 10103.0, 6595.0, 4355.0, 2807.0, 1953.0, 1325.0, 919.0, 624.0, 441.0, 307.0, 252.0, 177.0, 113.0, 87.0, 59.0, 37.0, 29.0, 25.0, 18.0, 12.0, 9.0, 5.0, 11.0, 1.0, 2.0, 5.0], "bins": [-0.09564208984375, -0.09269142150878906, -0.08974075317382812, -0.08679008483886719, -0.08383941650390625, -0.08088874816894531, -0.07793807983398438, -0.07498741149902344, -0.0720367431640625, -0.06908607482910156, -0.06613540649414062, -0.06318473815917969, -0.06023406982421875, -0.05728340148925781, -0.054332733154296875, -0.05138206481933594, -0.048431396484375, -0.04548072814941406, -0.042530059814453125, -0.03957939147949219, -0.03662872314453125, -0.03367805480957031, -0.030727386474609375, -0.027776718139648438, -0.0248260498046875, -0.021875381469726562, -0.018924713134765625, -0.015974044799804688, -0.01302337646484375, -0.010072708129882812, -0.007122039794921875, -0.0041713714599609375, -0.001220703125, 0.0017299652099609375, 0.004680633544921875, 0.0076313018798828125, 0.01058197021484375, 0.013532638549804688, 0.016483306884765625, 0.019433975219726562, 0.0223846435546875, 0.025335311889648438, 0.028285980224609375, 0.031236648559570312, 0.03418731689453125, 0.03713798522949219, 0.040088653564453125, 0.04303932189941406, 0.045989990234375, 0.04894065856933594, 0.051891326904296875, 0.05484199523925781, 0.05779266357421875, 0.06074333190917969, 0.06369400024414062, 0.06664466857910156, 0.0695953369140625, 0.07254600524902344, 0.07549667358398438, 0.07844734191894531, 0.08139801025390625, 0.08434867858886719, 0.08729934692382812, 0.09025001525878906, 0.09320068359375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 1.0, 2.0, 5.0, 9.0, 1.0, 8.0, 10.0, 14.0, 14.0, 10.0, 14.0, 22.0, 17.0, 33.0, 22.0, 26.0, 39.0, 24.0, 42.0, 31.0, 41.0, 38.0, 44.0, 41.0, 50.0, 46.0, 34.0, 40.0, 36.0, 33.0, 43.0, 30.0, 20.0, 25.0, 19.0, 13.0, 24.0, 18.0, 12.0, 18.0, 9.0, 8.0, 6.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8298625946044922e-05, -1.7726793885231018e-05, -1.7154961824417114e-05, -1.658312976360321e-05, -1.6011297702789307e-05, -1.5439465641975403e-05, -1.4867633581161499e-05, -1.4295801520347595e-05, -1.3723969459533691e-05, -1.3152137398719788e-05, -1.2580305337905884e-05, -1.200847327709198e-05, -1.1436641216278076e-05, -1.0864809155464172e-05, -1.0292977094650269e-05, -9.721145033836365e-06, -9.149312973022461e-06, -8.577480912208557e-06, -8.005648851394653e-06, -7.4338167905807495e-06, -6.861984729766846e-06, -6.290152668952942e-06, -5.718320608139038e-06, -5.146488547325134e-06, -4.5746564865112305e-06, -4.002824425697327e-06, -3.430992364883423e-06, -2.859160304069519e-06, -2.2873282432556152e-06, -1.7154961824417114e-06, -1.1436641216278076e-06, -5.718320608139038e-07, 0.0, 5.718320608139038e-07, 1.1436641216278076e-06, 1.7154961824417114e-06, 2.2873282432556152e-06, 2.859160304069519e-06, 3.430992364883423e-06, 4.002824425697327e-06, 4.5746564865112305e-06, 5.146488547325134e-06, 5.718320608139038e-06, 6.290152668952942e-06, 6.861984729766846e-06, 7.4338167905807495e-06, 8.005648851394653e-06, 8.577480912208557e-06, 9.149312973022461e-06, 9.721145033836365e-06, 1.0292977094650269e-05, 1.0864809155464172e-05, 1.1436641216278076e-05, 1.200847327709198e-05, 1.2580305337905884e-05, 1.3152137398719788e-05, 1.3723969459533691e-05, 1.4295801520347595e-05, 1.4867633581161499e-05, 1.5439465641975403e-05, 1.6011297702789307e-05, 1.658312976360321e-05, 1.7154961824417114e-05, 1.7726793885231018e-05, 1.8298625946044922e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 7.0, 6.0, 18.0, 17.0, 49.0, 62.0, 79.0, 109.0, 179.0, 271.0, 397.0, 598.0, 868.0, 1358.0, 1848.0, 2811.0, 3928.0, 6028.0, 8896.0, 12914.0, 19369.0, 29786.0, 46232.0, 75647.0, 133030.0, 242290.0, 188768.0, 101790.0, 59434.0, 37352.0, 24237.0, 16120.0, 10996.0, 7430.0, 5004.0, 3379.0, 2377.0, 1610.0, 1043.0, 733.0, 516.0, 362.0, 211.0, 135.0, 78.0, 73.0, 50.0, 27.0, 19.0, 8.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2054443359375, -0.1991748809814453, -0.19290542602539062, -0.18663597106933594, -0.18036651611328125, -0.17409706115722656, -0.16782760620117188, -0.1615581512451172, -0.1552886962890625, -0.1490192413330078, -0.14274978637695312, -0.13648033142089844, -0.13021087646484375, -0.12394142150878906, -0.11767196655273438, -0.11140251159667969, -0.105133056640625, -0.09886360168457031, -0.09259414672851562, -0.08632469177246094, -0.08005523681640625, -0.07378578186035156, -0.06751632690429688, -0.06124687194824219, -0.0549774169921875, -0.04870796203613281, -0.042438507080078125, -0.03616905212402344, -0.02989959716796875, -0.023630142211914062, -0.017360687255859375, -0.011091232299804688, -0.00482177734375, 0.0014476776123046875, 0.007717132568359375, 0.013986587524414062, 0.02025604248046875, 0.026525497436523438, 0.032794952392578125, 0.03906440734863281, 0.0453338623046875, 0.05160331726074219, 0.057872772216796875, 0.06414222717285156, 0.07041168212890625, 0.07668113708496094, 0.08295059204101562, 0.08922004699707031, 0.095489501953125, 0.10175895690917969, 0.10802841186523438, 0.11429786682128906, 0.12056732177734375, 0.12683677673339844, 0.13310623168945312, 0.1393756866455078, 0.1456451416015625, 0.1519145965576172, 0.15818405151367188, 0.16445350646972656, 0.17072296142578125, 0.17699241638183594, 0.18326187133789062, 0.1895313262939453, 0.19580078125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 4.0, 6.0, 3.0, 5.0, 2.0, 2.0, 8.0, 12.0, 8.0, 16.0, 22.0, 38.0, 37.0, 49.0, 61.0, 79.0, 109.0, 102.0, 97.0, 80.0, 63.0, 53.0, 34.0, 25.0, 20.0, 16.0, 10.0, 5.0, 8.0, 4.0, 8.0, 6.0, 5.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10296630859375, -0.09957218170166016, -0.09617805480957031, -0.09278392791748047, -0.08938980102539062, -0.08599567413330078, -0.08260154724121094, -0.0792074203491211, -0.07581329345703125, -0.0724191665649414, -0.06902503967285156, -0.06563091278076172, -0.062236785888671875, -0.05884265899658203, -0.05544853210449219, -0.052054405212402344, -0.0486602783203125, -0.045266151428222656, -0.04187202453613281, -0.03847789764404297, -0.035083770751953125, -0.03168964385986328, -0.028295516967773438, -0.024901390075683594, -0.02150726318359375, -0.018113136291503906, -0.014719009399414062, -0.011324882507324219, -0.007930755615234375, -0.004536628723144531, -0.0011425018310546875, 0.0022516250610351562, 0.005645751953125, 0.009039878845214844, 0.012434005737304688, 0.01582813262939453, 0.019222259521484375, 0.02261638641357422, 0.026010513305664062, 0.029404640197753906, 0.03279876708984375, 0.036192893981933594, 0.03958702087402344, 0.04298114776611328, 0.046375274658203125, 0.04976940155029297, 0.05316352844238281, 0.056557655334472656, 0.0599517822265625, 0.06334590911865234, 0.06674003601074219, 0.07013416290283203, 0.07352828979492188, 0.07692241668701172, 0.08031654357910156, 0.0837106704711914, 0.08710479736328125, 0.0904989242553711, 0.09389305114746094, 0.09728717803955078, 0.10068130493164062, 0.10407543182373047, 0.10746955871582031, 0.11086368560791016, 0.1142578125]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 2.0, 3.0, 5.0, 9.0, 9.0, 9.0, 18.0, 20.0, 29.0, 29.0, 36.0, 33.0, 41.0, 38.0, 42.0, 60.0, 57.0, 51.0, 52.0, 44.0, 48.0, 51.0, 37.0, 38.0, 45.0, 42.0, 24.0, 21.0, 27.0, 19.0, 12.0, 15.0, 12.0, 11.0, 5.0, 5.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.633695602416992, -27.625804901123047, -26.6179141998291, -25.610023498535156, -24.60213279724121, -23.594242095947266, -22.586349487304688, -21.578460693359375, -20.570568084716797, -19.56267738342285, -18.554786682128906, -17.54689598083496, -16.539005279541016, -15.53111457824707, -14.523222923278809, -13.515332221984863, -12.507442474365234, -11.499551773071289, -10.491661071777344, -9.483770370483398, -8.475879669189453, -7.46798849105835, -6.460097312927246, -5.452206611633301, -4.4443159103393555, -3.43642520904541, -2.4285342693328857, -1.4206433296203613, -0.412752628326416, 0.5951380729675293, 1.6030292510986328, 2.610919952392578, 3.6188087463378906, 4.626699447631836, 5.634590148925781, 6.642481327056885, 7.65037202835083, 8.658262252807617, 9.666153907775879, 10.674044609069824, 11.68193531036377, 12.689826011657715, 13.69771671295166, 14.705608367919922, 15.713499069213867, 16.721389770507812, 17.729280471801758, 18.737171173095703, 19.74506187438965, 20.752952575683594, 21.76084327697754, 22.768733978271484, 23.77662467956543, 24.784515380859375, 25.792407989501953, 26.800296783447266, 27.808189392089844, 28.81608009338379, 29.823970794677734, 30.83186149597168, 31.839752197265625, 32.8476448059082, 33.855533599853516, 34.863426208496094, 35.871315002441406]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 7.0, 9.0, 8.0, 3.0, 5.0, 10.0, 14.0, 12.0, 16.0, 25.0, 17.0, 24.0, 14.0, 15.0, 29.0, 34.0, 29.0, 41.0, 37.0, 37.0, 36.0, 38.0, 36.0, 42.0, 46.0, 43.0, 47.0, 37.0, 23.0, 31.0, 38.0, 17.0, 27.0, 29.0, 19.0, 20.0, 17.0, 12.0, 8.0, 14.0, 5.0, 13.0, 3.0, 4.0, 5.0, 3.0, 5.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 3.0], "bins": [-28.29906463623047, -27.437580108642578, -26.576095581054688, -25.714611053466797, -24.85312843322754, -23.99164390563965, -23.130159378051758, -22.268674850463867, -21.407190322875977, -20.545705795288086, -19.684221267700195, -18.822738647460938, -17.961254119873047, -17.099769592285156, -16.238285064697266, -15.376800537109375, -14.5153169631958, -13.65383243560791, -12.792348861694336, -11.930864334106445, -11.069379806518555, -10.207895278930664, -9.34641170501709, -8.4849271774292, -7.623443126678467, -6.761959075927734, -5.900474548339844, -5.038990497589111, -4.177506446838379, -3.3160219192504883, -2.454537868499756, -1.5930533409118652, -0.7315692901611328, 0.12991493940353394, 0.9913991689682007, 1.8528833389282227, 2.714367628097534, 3.5758519172668457, 4.437335968017578, 5.298820495605469, 6.160304546356201, 7.021788597106934, 7.883273124694824, 8.744756698608398, 9.606241226196289, 10.46772575378418, 11.32921028137207, 12.190694808959961, 13.052178382873535, 13.913662910461426, 14.775146484375, 15.63663101196289, 16.49811553955078, 17.359600067138672, 18.221084594726562, 19.082569122314453, 19.94405174255371, 20.8055362701416, 21.667020797729492, 22.52850341796875, 23.38998794555664, 24.25147247314453, 25.112957000732422, 25.974441528320312, 26.835926055908203]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 4.0, 13.0, 25.0, 38.0, 57.0, 109.0, 170.0, 258.0, 441.0, 590.0, 994.0, 1599.0, 2522.0, 3797.0, 5779.0, 8728.0, 12719.0, 18121.0, 25311.0, 34461.0, 45586.0, 57916.0, 69734.0, 80731.0, 87501.0, 92296.0, 90354.0, 84688.0, 74589.0, 63614.0, 50849.0, 39687.0, 29082.0, 21265.0, 14922.0, 10267.0, 6936.0, 4566.0, 2971.0, 1974.0, 1203.0, 848.0, 502.0, 298.0, 191.0, 104.0, 55.0, 41.0, 30.0, 12.0, 7.0, 6.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.1640625, -10.7884521484375, -10.412841796875, -10.0372314453125, -9.66162109375, -9.2860107421875, -8.910400390625, -8.5347900390625, -8.1591796875, -7.7835693359375, -7.407958984375, -7.0323486328125, -6.65673828125, -6.2811279296875, -5.905517578125, -5.5299072265625, -5.154296875, -4.7786865234375, -4.403076171875, -4.0274658203125, -3.65185546875, -3.2762451171875, -2.900634765625, -2.5250244140625, -2.1494140625, -1.7738037109375, -1.398193359375, -1.0225830078125, -0.64697265625, -0.2713623046875, 0.104248046875, 0.4798583984375, 0.85546875, 1.2310791015625, 1.606689453125, 1.9822998046875, 2.35791015625, 2.7335205078125, 3.109130859375, 3.4847412109375, 3.8603515625, 4.2359619140625, 4.611572265625, 4.9871826171875, 5.36279296875, 5.7384033203125, 6.114013671875, 6.4896240234375, 6.865234375, 7.2408447265625, 7.616455078125, 7.9920654296875, 8.36767578125, 8.7432861328125, 9.118896484375, 9.4945068359375, 9.8701171875, 10.2457275390625, 10.621337890625, 10.9969482421875, 11.37255859375, 11.7481689453125, 12.123779296875, 12.4993896484375, 12.875]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 7.0, 3.0, 9.0, 4.0, 8.0, 8.0, 7.0, 10.0, 14.0, 26.0, 21.0, 17.0, 20.0, 19.0, 36.0, 42.0, 24.0, 34.0, 45.0, 37.0, 43.0, 40.0, 45.0, 38.0, 43.0, 41.0, 30.0, 34.0, 45.0, 27.0, 19.0, 18.0, 32.0, 21.0, 24.0, 17.0, 15.0, 22.0, 10.0, 10.0, 10.0, 7.0, 5.0, 4.0, 5.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-29.34375, -28.453125, -27.5625, -26.671875, -25.78125, -24.890625, -24.0, -23.109375, -22.21875, -21.328125, -20.4375, -19.546875, -18.65625, -17.765625, -16.875, -15.984375, -15.09375, -14.203125, -13.3125, -12.421875, -11.53125, -10.640625, -9.75, -8.859375, -7.96875, -7.078125, -6.1875, -5.296875, -4.40625, -3.515625, -2.625, -1.734375, -0.84375, 0.046875, 0.9375, 1.828125, 2.71875, 3.609375, 4.5, 5.390625, 6.28125, 7.171875, 8.0625, 8.953125, 9.84375, 10.734375, 11.625, 12.515625, 13.40625, 14.296875, 15.1875, 16.078125, 16.96875, 17.859375, 18.75, 19.640625, 20.53125, 21.421875, 22.3125, 23.203125, 24.09375, 24.984375, 25.875, 26.765625, 27.65625]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 8.0, 22.0, 36.0, 31.0, 42.0, 88.0, 95.0, 199.0, 274.0, 435.0, 626.0, 1042.0, 1472.0, 2335.0, 3635.0, 5457.0, 7933.0, 12018.0, 17351.0, 23914.0, 32922.0, 43761.0, 55470.0, 68137.0, 78875.0, 87156.0, 91882.0, 91311.0, 85479.0, 76497.0, 65190.0, 52594.0, 40918.0, 30787.0, 22418.0, 15833.0, 10819.0, 7382.0, 4814.0, 3277.0, 2113.0, 1370.0, 917.0, 589.0, 358.0, 239.0, 167.0, 87.0, 65.0, 45.0, 21.0, 24.0, 13.0, 4.0, 7.0, 3.0, 1.0, 3.0], "bins": [-12.6953125, -12.3092041015625, -11.923095703125, -11.5369873046875, -11.15087890625, -10.7647705078125, -10.378662109375, -9.9925537109375, -9.6064453125, -9.2203369140625, -8.834228515625, -8.4481201171875, -8.06201171875, -7.6759033203125, -7.289794921875, -6.9036865234375, -6.517578125, -6.1314697265625, -5.745361328125, -5.3592529296875, -4.97314453125, -4.5870361328125, -4.200927734375, -3.8148193359375, -3.4287109375, -3.0426025390625, -2.656494140625, -2.2703857421875, -1.88427734375, -1.4981689453125, -1.112060546875, -0.7259521484375, -0.33984375, 0.0462646484375, 0.432373046875, 0.8184814453125, 1.20458984375, 1.5906982421875, 1.976806640625, 2.3629150390625, 2.7490234375, 3.1351318359375, 3.521240234375, 3.9073486328125, 4.29345703125, 4.6795654296875, 5.065673828125, 5.4517822265625, 5.837890625, 6.2239990234375, 6.610107421875, 6.9962158203125, 7.38232421875, 7.7684326171875, 8.154541015625, 8.5406494140625, 8.9267578125, 9.3128662109375, 9.698974609375, 10.0850830078125, 10.47119140625, 10.8572998046875, 11.243408203125, 11.6295166015625, 12.015625]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 6.0, 6.0, 5.0, 9.0, 13.0, 12.0, 21.0, 19.0, 28.0, 20.0, 26.0, 36.0, 29.0, 34.0, 41.0, 28.0, 41.0, 45.0, 43.0, 53.0, 46.0, 49.0, 43.0, 34.0, 51.0, 31.0, 37.0, 27.0, 30.0, 22.0, 19.0, 12.0, 16.0, 20.0, 13.0, 4.0, 5.0, 5.0, 7.0, 3.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-20.140625, -19.5078125, -18.875, -18.2421875, -17.609375, -16.9765625, -16.34375, -15.7109375, -15.078125, -14.4453125, -13.8125, -13.1796875, -12.546875, -11.9140625, -11.28125, -10.6484375, -10.015625, -9.3828125, -8.75, -8.1171875, -7.484375, -6.8515625, -6.21875, -5.5859375, -4.953125, -4.3203125, -3.6875, -3.0546875, -2.421875, -1.7890625, -1.15625, -0.5234375, 0.109375, 0.7421875, 1.375, 2.0078125, 2.640625, 3.2734375, 3.90625, 4.5390625, 5.171875, 5.8046875, 6.4375, 7.0703125, 7.703125, 8.3359375, 8.96875, 9.6015625, 10.234375, 10.8671875, 11.5, 12.1328125, 12.765625, 13.3984375, 14.03125, 14.6640625, 15.296875, 15.9296875, 16.5625, 17.1953125, 17.828125, 18.4609375, 19.09375, 19.7265625, 20.359375]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 6.0, 8.0, 8.0, 18.0, 22.0, 68.0, 67.0, 147.0, 189.0, 344.0, 580.0, 955.0, 1576.0, 2506.0, 4077.0, 6622.0, 10471.0, 15996.0, 24542.0, 35758.0, 49828.0, 66169.0, 81875.0, 94818.0, 103823.0, 104753.0, 99991.0, 88025.0, 73230.0, 56871.0, 41748.0, 29156.0, 20029.0, 12811.0, 8289.0, 5105.0, 3173.0, 1864.0, 1194.0, 713.0, 446.0, 241.0, 155.0, 116.0, 58.0, 40.0, 25.0, 19.0, 20.0, 8.0, 8.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.65625, -4.4969482421875, -4.337646484375, -4.1783447265625, -4.01904296875, -3.8597412109375, -3.700439453125, -3.5411376953125, -3.3818359375, -3.2225341796875, -3.063232421875, -2.9039306640625, -2.74462890625, -2.5853271484375, -2.426025390625, -2.2667236328125, -2.107421875, -1.9481201171875, -1.788818359375, -1.6295166015625, -1.47021484375, -1.3109130859375, -1.151611328125, -0.9923095703125, -0.8330078125, -0.6737060546875, -0.514404296875, -0.3551025390625, -0.19580078125, -0.0364990234375, 0.122802734375, 0.2821044921875, 0.44140625, 0.6007080078125, 0.760009765625, 0.9193115234375, 1.07861328125, 1.2379150390625, 1.397216796875, 1.5565185546875, 1.7158203125, 1.8751220703125, 2.034423828125, 2.1937255859375, 2.35302734375, 2.5123291015625, 2.671630859375, 2.8309326171875, 2.990234375, 3.1495361328125, 3.308837890625, 3.4681396484375, 3.62744140625, 3.7867431640625, 3.946044921875, 4.1053466796875, 4.2646484375, 4.4239501953125, 4.583251953125, 4.7425537109375, 4.90185546875, 5.0611572265625, 5.220458984375, 5.3797607421875, 5.5390625]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 5.0, 3.0, 3.0, 7.0, 4.0, 8.0, 7.0, 14.0, 19.0, 13.0, 31.0, 11.0, 39.0, 28.0, 33.0, 53.0, 42.0, 41.0, 39.0, 51.0, 56.0, 38.0, 45.0, 43.0, 41.0, 35.0, 29.0, 28.0, 31.0, 35.0, 35.0, 21.0, 17.0, 18.0, 15.0, 18.0, 10.0, 8.0, 6.0, 6.0, 9.0, 0.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0006251335144042969, -0.0006050616502761841, -0.0005849897861480713, -0.0005649179220199585, -0.0005448460578918457, -0.0005247741937637329, -0.0005047023296356201, -0.0004846304655075073, -0.00046455860137939453, -0.00044448673725128174, -0.00042441487312316895, -0.00040434300899505615, -0.00038427114486694336, -0.00036419928073883057, -0.0003441274166107178, -0.000324055552482605, -0.0003039836883544922, -0.0002839118242263794, -0.0002638399600982666, -0.0002437680959701538, -0.00022369623184204102, -0.00020362436771392822, -0.00018355250358581543, -0.00016348063945770264, -0.00014340877532958984, -0.00012333691120147705, -0.00010326504707336426, -8.319318294525146e-05, -6.312131881713867e-05, -4.304945468902588e-05, -2.2977590560913086e-05, -2.905726432800293e-06, 1.71661376953125e-05, 3.723800182342529e-05, 5.7309865951538086e-05, 7.738173007965088e-05, 9.745359420776367e-05, 0.00011752545833587646, 0.00013759732246398926, 0.00015766918659210205, 0.00017774105072021484, 0.00019781291484832764, 0.00021788477897644043, 0.00023795664310455322, 0.000258028507232666, 0.0002781003713607788, 0.0002981722354888916, 0.0003182440996170044, 0.0003383159637451172, 0.00035838782787323, 0.0003784596920013428, 0.00039853155612945557, 0.00041860342025756836, 0.00043867528438568115, 0.00045874714851379395, 0.00047881901264190674, 0.0004988908767700195, 0.0005189627408981323, 0.0005390346050262451, 0.0005591064691543579, 0.0005791783332824707, 0.0005992501974105835, 0.0006193220615386963, 0.0006393939256668091, 0.0006594657897949219]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 3.0, 7.0, 4.0, 6.0, 6.0, 19.0, 21.0, 27.0, 47.0, 79.0, 148.0, 208.0, 354.0, 528.0, 926.0, 1456.0, 2433.0, 4226.0, 6729.0, 11386.0, 18063.0, 27982.0, 42246.0, 59558.0, 80044.0, 99224.0, 112139.0, 118207.0, 111845.0, 97762.0, 79215.0, 58755.0, 41604.0, 27771.0, 17612.0, 10927.0, 6787.0, 3950.0, 2524.0, 1472.0, 873.0, 523.0, 310.0, 213.0, 135.0, 76.0, 53.0, 36.0, 15.0, 15.0, 6.0, 6.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.76953125, -5.58624267578125, -5.4029541015625, -5.21966552734375, -5.036376953125, -4.85308837890625, -4.6697998046875, -4.48651123046875, -4.30322265625, -4.11993408203125, -3.9366455078125, -3.75335693359375, -3.570068359375, -3.38677978515625, -3.2034912109375, -3.02020263671875, -2.8369140625, -2.65362548828125, -2.4703369140625, -2.28704833984375, -2.103759765625, -1.92047119140625, -1.7371826171875, -1.55389404296875, -1.37060546875, -1.18731689453125, -1.0040283203125, -0.82073974609375, -0.637451171875, -0.45416259765625, -0.2708740234375, -0.08758544921875, 0.095703125, 0.27899169921875, 0.4622802734375, 0.64556884765625, 0.828857421875, 1.01214599609375, 1.1954345703125, 1.37872314453125, 1.56201171875, 1.74530029296875, 1.9285888671875, 2.11187744140625, 2.295166015625, 2.47845458984375, 2.6617431640625, 2.84503173828125, 3.0283203125, 3.21160888671875, 3.3948974609375, 3.57818603515625, 3.761474609375, 3.94476318359375, 4.1280517578125, 4.31134033203125, 4.49462890625, 4.67791748046875, 4.8612060546875, 5.04449462890625, 5.227783203125, 5.41107177734375, 5.5943603515625, 5.77764892578125, 5.9609375]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 6.0, 6.0, 8.0, 8.0, 12.0, 17.0, 24.0, 13.0, 15.0, 20.0, 27.0, 35.0, 33.0, 47.0, 52.0, 57.0, 60.0, 57.0, 52.0, 48.0, 45.0, 52.0, 35.0, 37.0, 47.0, 29.0, 31.0, 22.0, 20.0, 19.0, 19.0, 12.0, 10.0, 7.0, 6.0, 9.0, 2.0, 2.0, 3.0, 1.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.630859375, -2.540985107421875, -2.45111083984375, -2.361236572265625, -2.2713623046875, -2.181488037109375, -2.09161376953125, -2.001739501953125, -1.911865234375, -1.821990966796875, -1.73211669921875, -1.642242431640625, -1.5523681640625, -1.462493896484375, -1.37261962890625, -1.282745361328125, -1.19287109375, -1.102996826171875, -1.01312255859375, -0.923248291015625, -0.8333740234375, -0.743499755859375, -0.65362548828125, -0.563751220703125, -0.473876953125, -0.384002685546875, -0.29412841796875, -0.204254150390625, -0.1143798828125, -0.024505615234375, 0.06536865234375, 0.155242919921875, 0.2451171875, 0.334991455078125, 0.42486572265625, 0.514739990234375, 0.6046142578125, 0.694488525390625, 0.78436279296875, 0.874237060546875, 0.964111328125, 1.053985595703125, 1.14385986328125, 1.233734130859375, 1.3236083984375, 1.413482666015625, 1.50335693359375, 1.593231201171875, 1.68310546875, 1.772979736328125, 1.86285400390625, 1.952728271484375, 2.0426025390625, 2.132476806640625, 2.22235107421875, 2.312225341796875, 2.402099609375, 2.491973876953125, 2.58184814453125, 2.671722412109375, 2.7615966796875, 2.851470947265625, 2.94134521484375, 3.031219482421875, 3.12109375]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 3.0, 4.0, 9.0, 7.0, 8.0, 17.0, 20.0, 23.0, 25.0, 29.0, 34.0, 35.0, 44.0, 43.0, 38.0, 65.0, 47.0, 41.0, 51.0, 34.0, 58.0, 45.0, 43.0, 43.0, 35.0, 35.0, 30.0, 24.0, 25.0, 18.0, 17.0, 12.0, 11.0, 7.0, 7.0, 6.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-29.038381576538086, -28.069211959838867, -27.10004425048828, -26.130874633789062, -25.161705017089844, -24.192535400390625, -23.223365783691406, -22.25419807434082, -21.2850284576416, -20.315858840942383, -19.346691131591797, -18.377521514892578, -17.40835189819336, -16.43918228149414, -15.470013618469238, -14.500844955444336, -13.531675338745117, -12.562505722045898, -11.593337059020996, -10.624168395996094, -9.654998779296875, -8.685829162597656, -7.716660499572754, -6.747491359710693, -5.778322219848633, -4.809153079986572, -3.8399839401245117, -2.870814800262451, -1.9016456604003906, -0.9324765205383301, 0.03669261932373047, 1.005861759185791, 1.9750328063964844, 2.944201946258545, 3.9133710861206055, 4.882540225982666, 5.851709365844727, 6.820878505706787, 7.790047645568848, 8.75921630859375, 9.728385925292969, 10.697555541992188, 11.66672420501709, 12.635892868041992, 13.605062484741211, 14.57423210144043, 15.543400764465332, 16.512569427490234, 17.481739044189453, 18.450908660888672, 19.42007827758789, 20.389245986938477, 21.358415603637695, 22.327585220336914, 23.2967529296875, 24.26592254638672, 25.235092163085938, 26.204261779785156, 27.173431396484375, 28.14259910583496, 29.11176872253418, 30.0809383392334, 31.050106048583984, 32.0192756652832, 32.98844528198242]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 12.0, 8.0, 16.0, 18.0, 12.0, 11.0, 19.0, 14.0, 23.0, 37.0, 23.0, 30.0, 38.0, 37.0, 34.0, 44.0, 38.0, 50.0, 35.0, 46.0, 43.0, 34.0, 38.0, 40.0, 41.0, 29.0, 33.0, 26.0, 24.0, 24.0, 27.0, 13.0, 11.0, 14.0, 10.0, 13.0, 7.0, 5.0, 4.0, 5.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-36.32804489135742, -35.28412628173828, -34.24020767211914, -33.196285247802734, -32.152366638183594, -31.108448028564453, -30.064529418945312, -29.02060890197754, -27.976688385009766, -26.932769775390625, -25.88884925842285, -24.84493064880371, -23.801010131835938, -22.757091522216797, -21.713172912597656, -20.669252395629883, -19.625333786010742, -18.5814151763916, -17.537494659423828, -16.493576049804688, -15.449655532836914, -14.405736923217773, -13.361817359924316, -12.31789779663086, -11.273978233337402, -10.230058670043945, -9.186139106750488, -8.142219543457031, -7.098300457000732, -6.054380893707275, -5.010461807250977, -3.9665422439575195, -2.9226226806640625, -1.878703236579895, -0.8347837924957275, 0.2091355323791504, 1.2530550956726074, 2.2969746589660645, 3.3408937454223633, 4.38481330871582, 5.428732872009277, 6.472652435302734, 7.516571998596191, 8.560491561889648, 9.604410171508789, 10.648330688476562, 11.692249298095703, 12.73616886138916, 13.780088424682617, 14.824007987976074, 15.867927551269531, 16.911846160888672, 17.955766677856445, 18.999685287475586, 20.04360580444336, 21.0875244140625, 22.13144302368164, 23.17536163330078, 24.219282150268555, 25.263200759887695, 26.30712127685547, 27.35103988647461, 28.39495849609375, 29.438879013061523, 30.482799530029297]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 6.0, 8.0, 22.0, 32.0, 36.0, 83.0, 160.0, 249.0, 369.0, 678.0, 1120.0, 1734.0, 2893.0, 4851.0, 7642.0, 12161.0, 19829.0, 30566.0, 46333.0, 70380.0, 102451.0, 144796.0, 196940.0, 256585.0, 316472.0, 370762.0, 403870.0, 411042.0, 389506.0, 345703.0, 290207.0, 227561.0, 170103.0, 122646.0, 84954.0, 57589.0, 37960.0, 24651.0, 15775.0, 9783.0, 6066.0, 3751.0, 2239.0, 1521.0, 877.0, 573.0, 298.0, 195.0, 113.0, 70.0, 32.0, 26.0, 10.0, 9.0, 3.0, 3.0, 1.0, 1.0, 1.0], "bins": [-22.65625, -21.9541015625, -21.251953125, -20.5498046875, -19.84765625, -19.1455078125, -18.443359375, -17.7412109375, -17.0390625, -16.3369140625, -15.634765625, -14.9326171875, -14.23046875, -13.5283203125, -12.826171875, -12.1240234375, -11.421875, -10.7197265625, -10.017578125, -9.3154296875, -8.61328125, -7.9111328125, -7.208984375, -6.5068359375, -5.8046875, -5.1025390625, -4.400390625, -3.6982421875, -2.99609375, -2.2939453125, -1.591796875, -0.8896484375, -0.1875, 0.5146484375, 1.216796875, 1.9189453125, 2.62109375, 3.3232421875, 4.025390625, 4.7275390625, 5.4296875, 6.1318359375, 6.833984375, 7.5361328125, 8.23828125, 8.9404296875, 9.642578125, 10.3447265625, 11.046875, 11.7490234375, 12.451171875, 13.1533203125, 13.85546875, 14.5576171875, 15.259765625, 15.9619140625, 16.6640625, 17.3662109375, 18.068359375, 18.7705078125, 19.47265625, 20.1748046875, 20.876953125, 21.5791015625, 22.28125]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 1.0, 5.0, 3.0, 6.0, 12.0, 7.0, 9.0, 13.0, 10.0, 11.0, 14.0, 19.0, 25.0, 35.0, 30.0, 37.0, 30.0, 31.0, 40.0, 45.0, 39.0, 49.0, 37.0, 41.0, 37.0, 37.0, 46.0, 33.0, 35.0, 31.0, 32.0, 36.0, 31.0, 21.0, 22.0, 18.0, 15.0, 13.0, 10.0, 5.0, 11.0, 4.0, 6.0, 5.0, 3.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-33.0, -32.027587890625, -31.05517578125, -30.082763671875, -29.1103515625, -28.137939453125, -27.16552734375, -26.193115234375, -25.220703125, -24.248291015625, -23.27587890625, -22.303466796875, -21.3310546875, -20.358642578125, -19.38623046875, -18.413818359375, -17.44140625, -16.468994140625, -15.49658203125, -14.524169921875, -13.5517578125, -12.579345703125, -11.60693359375, -10.634521484375, -9.662109375, -8.689697265625, -7.71728515625, -6.744873046875, -5.7724609375, -4.800048828125, -3.82763671875, -2.855224609375, -1.8828125, -0.910400390625, 0.06201171875, 1.034423828125, 2.0068359375, 2.979248046875, 3.95166015625, 4.924072265625, 5.896484375, 6.868896484375, 7.84130859375, 8.813720703125, 9.7861328125, 10.758544921875, 11.73095703125, 12.703369140625, 13.67578125, 14.648193359375, 15.62060546875, 16.593017578125, 17.5654296875, 18.537841796875, 19.51025390625, 20.482666015625, 21.455078125, 22.427490234375, 23.39990234375, 24.372314453125, 25.3447265625, 26.317138671875, 27.28955078125, 28.261962890625, 29.234375]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 2.0, 8.0, 14.0, 18.0, 29.0, 46.0, 87.0, 122.0, 202.0, 320.0, 565.0, 845.0, 1269.0, 2259.0, 3583.0, 5981.0, 9259.0, 14895.0, 23113.0, 35322.0, 53428.0, 79082.0, 112495.0, 156054.0, 206316.0, 261005.0, 314570.0, 359178.0, 384947.0, 388824.0, 370778.0, 333052.0, 281312.0, 226414.0, 174213.0, 127608.0, 90093.0, 61735.0, 41263.0, 26717.0, 17652.0, 11074.0, 7156.0, 4447.0, 2619.0, 1670.0, 1079.0, 605.0, 359.0, 236.0, 156.0, 92.0, 56.0, 29.0, 17.0, 8.0, 7.0, 5.0, 2.0, 3.0, 2.0], "bins": [-24.5625, -23.79931640625, -23.0361328125, -22.27294921875, -21.509765625, -20.74658203125, -19.9833984375, -19.22021484375, -18.45703125, -17.69384765625, -16.9306640625, -16.16748046875, -15.404296875, -14.64111328125, -13.8779296875, -13.11474609375, -12.3515625, -11.58837890625, -10.8251953125, -10.06201171875, -9.298828125, -8.53564453125, -7.7724609375, -7.00927734375, -6.24609375, -5.48291015625, -4.7197265625, -3.95654296875, -3.193359375, -2.43017578125, -1.6669921875, -0.90380859375, -0.140625, 0.62255859375, 1.3857421875, 2.14892578125, 2.912109375, 3.67529296875, 4.4384765625, 5.20166015625, 5.96484375, 6.72802734375, 7.4912109375, 8.25439453125, 9.017578125, 9.78076171875, 10.5439453125, 11.30712890625, 12.0703125, 12.83349609375, 13.5966796875, 14.35986328125, 15.123046875, 15.88623046875, 16.6494140625, 17.41259765625, 18.17578125, 18.93896484375, 19.7021484375, 20.46533203125, 21.228515625, 21.99169921875, 22.7548828125, 23.51806640625, 24.28125]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 4.0, 3.0, 1.0, 5.0, 8.0, 12.0, 18.0, 17.0, 24.0, 23.0, 36.0, 45.0, 37.0, 48.0, 84.0, 64.0, 81.0, 109.0, 108.0, 157.0, 162.0, 166.0, 174.0, 186.0, 191.0, 182.0, 212.0, 196.0, 167.0, 178.0, 176.0, 170.0, 141.0, 137.0, 121.0, 96.0, 88.0, 79.0, 64.0, 60.0, 53.0, 38.0, 46.0, 32.0, 23.0, 16.0, 10.0, 5.0, 7.0, 6.0, 6.0, 4.0, 1.0, 6.0, 0.0, 0.0, 3.0], "bins": [-14.6875, -14.2421875, -13.796875, -13.3515625, -12.90625, -12.4609375, -12.015625, -11.5703125, -11.125, -10.6796875, -10.234375, -9.7890625, -9.34375, -8.8984375, -8.453125, -8.0078125, -7.5625, -7.1171875, -6.671875, -6.2265625, -5.78125, -5.3359375, -4.890625, -4.4453125, -4.0, -3.5546875, -3.109375, -2.6640625, -2.21875, -1.7734375, -1.328125, -0.8828125, -0.4375, 0.0078125, 0.453125, 0.8984375, 1.34375, 1.7890625, 2.234375, 2.6796875, 3.125, 3.5703125, 4.015625, 4.4609375, 4.90625, 5.3515625, 5.796875, 6.2421875, 6.6875, 7.1328125, 7.578125, 8.0234375, 8.46875, 8.9140625, 9.359375, 9.8046875, 10.25, 10.6953125, 11.140625, 11.5859375, 12.03125, 12.4765625, 12.921875, 13.3671875, 13.8125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 6.0, 3.0, 10.0, 14.0, 14.0, 16.0, 23.0, 35.0, 23.0, 31.0, 39.0, 46.0, 51.0, 38.0, 43.0, 55.0, 60.0, 65.0, 51.0, 39.0, 49.0, 44.0, 32.0, 38.0, 26.0, 27.0, 24.0, 21.0, 15.0, 12.0, 8.0, 6.0, 6.0, 6.0, 4.0, 7.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-45.22449493408203, -43.83989715576172, -42.455299377441406, -41.07070541381836, -39.68610763549805, -38.301509857177734, -36.91691589355469, -35.532318115234375, -34.14772033691406, -32.76312255859375, -31.37852668762207, -29.99393081665039, -28.609333038330078, -27.224735260009766, -25.840139389038086, -24.455543518066406, -23.070945739746094, -21.68634796142578, -20.3017520904541, -18.917156219482422, -17.53255844116211, -16.147960662841797, -14.763364791870117, -13.378767967224121, -11.994171142578125, -10.609574317932129, -9.224977493286133, -7.840380668640137, -6.455783843994141, -5.0711870193481445, -3.6865901947021484, -2.3019933700561523, -0.9173927307128906, 0.46720409393310547, 1.8518009185791016, 3.2363977432250977, 4.620994567871094, 6.00559139251709, 7.390188217163086, 8.774785041809082, 10.159381866455078, 11.543978691101074, 12.92857551574707, 14.313172340393066, 15.697769165039062, 17.082366943359375, 18.466962814331055, 19.851558685302734, 21.236156463623047, 22.62075424194336, 24.00535011291504, 25.38994598388672, 26.77454376220703, 28.159141540527344, 29.543737411499023, 30.928333282470703, 32.312931060791016, 33.69752883911133, 35.082122802734375, 36.46672058105469, 37.851318359375, 39.23591613769531, 40.620513916015625, 42.00510787963867, 43.389705657958984]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 5.0, 4.0, 8.0, 6.0, 8.0, 11.0, 10.0, 14.0, 13.0, 15.0, 16.0, 21.0, 24.0, 21.0, 44.0, 30.0, 25.0, 33.0, 45.0, 37.0, 42.0, 40.0, 49.0, 41.0, 33.0, 43.0, 32.0, 31.0, 32.0, 36.0, 24.0, 31.0, 24.0, 22.0, 31.0, 19.0, 18.0, 17.0, 6.0, 8.0, 6.0, 6.0, 7.0, 3.0, 4.0, 3.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-41.9935188293457, -40.708412170410156, -39.42330551147461, -38.13820266723633, -36.85309600830078, -35.567989349365234, -34.28288269042969, -32.99777603149414, -31.712671279907227, -30.42756462097168, -29.142459869384766, -27.85735321044922, -26.572246551513672, -25.287141799926758, -24.00203514099121, -22.716930389404297, -21.43182373046875, -20.146717071533203, -18.86161231994629, -17.576505661010742, -16.291400909423828, -15.006294250488281, -13.721187591552734, -12.436081886291504, -11.150976181030273, -9.865870475769043, -8.580764770507812, -7.295658111572266, -6.010552406311035, -4.725446701049805, -3.440340518951416, -2.1552343368530273, -0.8701324462890625, 0.41497349739074707, 1.7000794410705566, 2.985185384750366, 4.270291328430176, 5.555397033691406, 6.840503215789795, 8.125609397888184, 9.410715103149414, 10.695820808410645, 11.980926513671875, 13.266033172607422, 14.551138877868652, 15.836244583129883, 17.12135124206543, 18.406455993652344, 19.69156265258789, 20.976669311523438, 22.26177406311035, 23.5468807220459, 24.831985473632812, 26.11709213256836, 27.402198791503906, 28.687305450439453, 29.972410202026367, 31.257516860961914, 32.54262161254883, 33.827728271484375, 35.11283493041992, 36.39794158935547, 37.68304443359375, 38.9681510925293, 40.253257751464844]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 4.0, 5.0, 9.0, 11.0, 22.0, 27.0, 36.0, 65.0, 83.0, 172.0, 230.0, 356.0, 606.0, 934.0, 1616.0, 2764.0, 4866.0, 8639.0, 16234.0, 31448.0, 62997.0, 130136.0, 251858.0, 259758.0, 137760.0, 66476.0, 32979.0, 16869.0, 9083.0, 5171.0, 2927.0, 1716.0, 1023.0, 630.0, 365.0, 229.0, 150.0, 104.0, 59.0, 59.0, 26.0, 21.0, 18.0, 8.0, 8.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.90625, -6.690673828125, -6.47509765625, -6.259521484375, -6.0439453125, -5.828369140625, -5.61279296875, -5.397216796875, -5.181640625, -4.966064453125, -4.75048828125, -4.534912109375, -4.3193359375, -4.103759765625, -3.88818359375, -3.672607421875, -3.45703125, -3.241455078125, -3.02587890625, -2.810302734375, -2.5947265625, -2.379150390625, -2.16357421875, -1.947998046875, -1.732421875, -1.516845703125, -1.30126953125, -1.085693359375, -0.8701171875, -0.654541015625, -0.43896484375, -0.223388671875, -0.0078125, 0.207763671875, 0.42333984375, 0.638916015625, 0.8544921875, 1.070068359375, 1.28564453125, 1.501220703125, 1.716796875, 1.932373046875, 2.14794921875, 2.363525390625, 2.5791015625, 2.794677734375, 3.01025390625, 3.225830078125, 3.44140625, 3.656982421875, 3.87255859375, 4.088134765625, 4.3037109375, 4.519287109375, 4.73486328125, 4.950439453125, 5.166015625, 5.381591796875, 5.59716796875, 5.812744140625, 6.0283203125, 6.243896484375, 6.45947265625, 6.675048828125, 6.890625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 5.0, 4.0, 5.0, 3.0, 6.0, 9.0, 13.0, 7.0, 9.0, 18.0, 18.0, 14.0, 23.0, 23.0, 32.0, 21.0, 25.0, 31.0, 34.0, 33.0, 45.0, 44.0, 47.0, 34.0, 41.0, 46.0, 31.0, 34.0, 36.0, 33.0, 37.0, 26.0, 31.0, 26.0, 29.0, 28.0, 19.0, 21.0, 7.0, 15.0, 13.0, 6.0, 5.0, 4.0, 7.0, 1.0, 6.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0], "bins": [-43.09375, -41.74951171875, -40.4052734375, -39.06103515625, -37.716796875, -36.37255859375, -35.0283203125, -33.68408203125, -32.33984375, -30.99560546875, -29.6513671875, -28.30712890625, -26.962890625, -25.61865234375, -24.2744140625, -22.93017578125, -21.5859375, -20.24169921875, -18.8974609375, -17.55322265625, -16.208984375, -14.86474609375, -13.5205078125, -12.17626953125, -10.83203125, -9.48779296875, -8.1435546875, -6.79931640625, -5.455078125, -4.11083984375, -2.7666015625, -1.42236328125, -0.078125, 1.26611328125, 2.6103515625, 3.95458984375, 5.298828125, 6.64306640625, 7.9873046875, 9.33154296875, 10.67578125, 12.02001953125, 13.3642578125, 14.70849609375, 16.052734375, 17.39697265625, 18.7412109375, 20.08544921875, 21.4296875, 22.77392578125, 24.1181640625, 25.46240234375, 26.806640625, 28.15087890625, 29.4951171875, 30.83935546875, 32.18359375, 33.52783203125, 34.8720703125, 36.21630859375, 37.560546875, 38.90478515625, 40.2490234375, 41.59326171875, 42.9375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 6.0, 0.0, 2.0, 5.0, 11.0, 25.0, 27.0, 39.0, 42.0, 64.0, 105.0, 167.0, 203.0, 316.0, 429.0, 710.0, 1030.0, 1538.0, 2304.0, 3376.0, 5246.0, 8066.0, 12678.0, 20587.0, 34526.0, 58954.0, 108722.0, 199327.0, 241067.0, 150994.0, 80698.0, 45206.0, 26529.0, 16204.0, 10233.0, 6544.0, 4140.0, 2838.0, 1819.0, 1214.0, 826.0, 558.0, 404.0, 288.0, 170.0, 100.0, 66.0, 52.0, 38.0, 28.0, 14.0, 13.0, 11.0, 8.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.4609375, -6.26666259765625, -6.0723876953125, -5.87811279296875, -5.683837890625, -5.48956298828125, -5.2952880859375, -5.10101318359375, -4.90673828125, -4.71246337890625, -4.5181884765625, -4.32391357421875, -4.129638671875, -3.93536376953125, -3.7410888671875, -3.54681396484375, -3.3525390625, -3.15826416015625, -2.9639892578125, -2.76971435546875, -2.575439453125, -2.38116455078125, -2.1868896484375, -1.99261474609375, -1.79833984375, -1.60406494140625, -1.4097900390625, -1.21551513671875, -1.021240234375, -0.82696533203125, -0.6326904296875, -0.43841552734375, -0.244140625, -0.04986572265625, 0.1444091796875, 0.33868408203125, 0.532958984375, 0.72723388671875, 0.9215087890625, 1.11578369140625, 1.31005859375, 1.50433349609375, 1.6986083984375, 1.89288330078125, 2.087158203125, 2.28143310546875, 2.4757080078125, 2.66998291015625, 2.8642578125, 3.05853271484375, 3.2528076171875, 3.44708251953125, 3.641357421875, 3.83563232421875, 4.0299072265625, 4.22418212890625, 4.41845703125, 4.61273193359375, 4.8070068359375, 5.00128173828125, 5.195556640625, 5.38983154296875, 5.5841064453125, 5.77838134765625, 5.97265625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 1.0, 7.0, 13.0, 12.0, 13.0, 15.0, 21.0, 21.0, 25.0, 21.0, 23.0, 33.0, 34.0, 41.0, 42.0, 45.0, 39.0, 41.0, 46.0, 45.0, 32.0, 44.0, 50.0, 44.0, 42.0, 35.0, 40.0, 29.0, 33.0, 18.0, 16.0, 17.0, 14.0, 9.0, 16.0, 10.0, 5.0, 8.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-34.96875, -34.03271484375, -33.0966796875, -32.16064453125, -31.224609375, -30.28857421875, -29.3525390625, -28.41650390625, -27.48046875, -26.54443359375, -25.6083984375, -24.67236328125, -23.736328125, -22.80029296875, -21.8642578125, -20.92822265625, -19.9921875, -19.05615234375, -18.1201171875, -17.18408203125, -16.248046875, -15.31201171875, -14.3759765625, -13.43994140625, -12.50390625, -11.56787109375, -10.6318359375, -9.69580078125, -8.759765625, -7.82373046875, -6.8876953125, -5.95166015625, -5.015625, -4.07958984375, -3.1435546875, -2.20751953125, -1.271484375, -0.33544921875, 0.6005859375, 1.53662109375, 2.47265625, 3.40869140625, 4.3447265625, 5.28076171875, 6.216796875, 7.15283203125, 8.0888671875, 9.02490234375, 9.9609375, 10.89697265625, 11.8330078125, 12.76904296875, 13.705078125, 14.64111328125, 15.5771484375, 16.51318359375, 17.44921875, 18.38525390625, 19.3212890625, 20.25732421875, 21.193359375, 22.12939453125, 23.0654296875, 24.00146484375, 24.9375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 7.0, 5.0, 8.0, 10.0, 12.0, 32.0, 46.0, 41.0, 93.0, 113.0, 174.0, 227.0, 374.0, 517.0, 790.0, 1177.0, 1731.0, 2803.0, 4372.0, 6968.0, 11353.0, 19527.0, 34824.0, 66068.0, 141298.0, 290024.0, 237924.0, 105662.0, 51991.0, 27903.0, 16200.0, 9591.0, 6025.0, 3656.0, 2378.0, 1510.0, 995.0, 665.0, 424.0, 325.0, 221.0, 145.0, 104.0, 72.0, 54.0, 36.0, 26.0, 14.0, 13.0, 9.0, 8.0, 6.0, 1.0, 4.0, 1.0, 0.0, 2.0, 3.0], "bins": [-0.163330078125, -0.15819740295410156, -0.15306472778320312, -0.1479320526123047, -0.14279937744140625, -0.1376667022705078, -0.13253402709960938, -0.12740135192871094, -0.1222686767578125, -0.11713600158691406, -0.11200332641601562, -0.10687065124511719, -0.10173797607421875, -0.09660530090332031, -0.09147262573242188, -0.08633995056152344, -0.081207275390625, -0.07607460021972656, -0.07094192504882812, -0.06580924987792969, -0.06067657470703125, -0.05554389953613281, -0.050411224365234375, -0.04527854919433594, -0.0401458740234375, -0.03501319885253906, -0.029880523681640625, -0.024747848510742188, -0.01961517333984375, -0.014482498168945312, -0.009349822998046875, -0.0042171478271484375, 0.00091552734375, 0.0060482025146484375, 0.011180877685546875, 0.016313552856445312, 0.02144622802734375, 0.026578903198242188, 0.031711578369140625, 0.03684425354003906, 0.0419769287109375, 0.04710960388183594, 0.052242279052734375, 0.05737495422363281, 0.06250762939453125, 0.06764030456542969, 0.07277297973632812, 0.07790565490722656, 0.083038330078125, 0.08817100524902344, 0.09330368041992188, 0.09843635559082031, 0.10356903076171875, 0.10870170593261719, 0.11383438110351562, 0.11896705627441406, 0.1240997314453125, 0.12923240661621094, 0.13436508178710938, 0.1394977569580078, 0.14463043212890625, 0.1497631072998047, 0.15489578247070312, 0.16002845764160156, 0.1651611328125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 6.0, 6.0, 14.0, 7.0, 6.0, 15.0, 20.0, 17.0, 19.0, 26.0, 26.0, 42.0, 34.0, 39.0, 52.0, 46.0, 46.0, 49.0, 65.0, 47.0, 42.0, 44.0, 47.0, 36.0, 29.0, 34.0, 32.0, 16.0, 24.0, 16.0, 16.0, 15.0, 12.0, 11.0, 7.0, 9.0, 6.0, 4.0, 9.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.236532211303711e-05, -3.1412579119205475e-05, -3.045983612537384e-05, -2.9507093131542206e-05, -2.855435013771057e-05, -2.7601607143878937e-05, -2.6648864150047302e-05, -2.5696121156215668e-05, -2.4743378162384033e-05, -2.37906351685524e-05, -2.2837892174720764e-05, -2.188514918088913e-05, -2.0932406187057495e-05, -1.997966319322586e-05, -1.9026920199394226e-05, -1.807417720556259e-05, -1.7121434211730957e-05, -1.6168691217899323e-05, -1.5215948224067688e-05, -1.4263205230236053e-05, -1.3310462236404419e-05, -1.2357719242572784e-05, -1.140497624874115e-05, -1.0452233254909515e-05, -9.499490261077881e-06, -8.546747267246246e-06, -7.594004273414612e-06, -6.641261279582977e-06, -5.688518285751343e-06, -4.735775291919708e-06, -3.7830322980880737e-06, -2.830289304256439e-06, -1.8775463104248047e-06, -9.248033165931702e-07, 2.7939677238464355e-08, 9.806826710700989e-07, 1.9334256649017334e-06, 2.886168658733368e-06, 3.8389116525650024e-06, 4.791654646396637e-06, 5.7443976402282715e-06, 6.697140634059906e-06, 7.64988362789154e-06, 8.602626621723175e-06, 9.55536961555481e-06, 1.0508112609386444e-05, 1.1460855603218079e-05, 1.2413598597049713e-05, 1.3366341590881348e-05, 1.4319084584712982e-05, 1.5271827578544617e-05, 1.622457057237625e-05, 1.7177313566207886e-05, 1.813005656003952e-05, 1.9082799553871155e-05, 2.003554254770279e-05, 2.0988285541534424e-05, 2.194102853536606e-05, 2.2893771529197693e-05, 2.3846514523029327e-05, 2.4799257516860962e-05, 2.5752000510692596e-05, 2.670474350452423e-05, 2.7657486498355865e-05, 2.86102294921875e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 5.0, 5.0, 8.0, 15.0, 19.0, 28.0, 49.0, 63.0, 113.0, 161.0, 228.0, 321.0, 558.0, 870.0, 1358.0, 2209.0, 3300.0, 5314.0, 8135.0, 13083.0, 21016.0, 33844.0, 59174.0, 112898.0, 258060.0, 261651.0, 114712.0, 59333.0, 34620.0, 21215.0, 13107.0, 8367.0, 5342.0, 3327.0, 2181.0, 1422.0, 857.0, 573.0, 337.0, 228.0, 155.0, 113.0, 64.0, 41.0, 34.0, 19.0, 13.0, 5.0, 9.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.40185546875, -0.3893013000488281, -0.37674713134765625, -0.3641929626464844, -0.3516387939453125, -0.3390846252441406, -0.32653045654296875, -0.3139762878417969, -0.301422119140625, -0.2888679504394531, -0.27631378173828125, -0.2637596130371094, -0.2512054443359375, -0.23865127563476562, -0.22609710693359375, -0.21354293823242188, -0.20098876953125, -0.18843460083007812, -0.17588043212890625, -0.16332626342773438, -0.1507720947265625, -0.13821792602539062, -0.12566375732421875, -0.11310958862304688, -0.100555419921875, -0.08800125122070312, -0.07544708251953125, -0.06289291381835938, -0.0503387451171875, -0.037784576416015625, -0.02523040771484375, -0.012676239013671875, -0.0001220703125, 0.012432098388671875, 0.02498626708984375, 0.037540435791015625, 0.0500946044921875, 0.06264877319335938, 0.07520294189453125, 0.08775711059570312, 0.100311279296875, 0.11286544799804688, 0.12541961669921875, 0.13797378540039062, 0.1505279541015625, 0.16308212280273438, 0.17563629150390625, 0.18819046020507812, 0.20074462890625, 0.21329879760742188, 0.22585296630859375, 0.23840713500976562, 0.2509613037109375, 0.2635154724121094, 0.27606964111328125, 0.2886238098144531, 0.301177978515625, 0.3137321472167969, 0.32628631591796875, 0.3388404846191406, 0.3513946533203125, 0.3639488220214844, 0.37650299072265625, 0.3890571594238281, 0.401611328125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 5.0, 1.0, 2.0, 2.0, 2.0, 4.0, 7.0, 5.0, 2.0, 9.0, 8.0, 12.0, 15.0, 19.0, 24.0, 55.0, 64.0, 93.0, 138.0, 133.0, 117.0, 75.0, 51.0, 46.0, 24.0, 18.0, 16.0, 19.0, 9.0, 6.0, 8.0, 1.0, 3.0, 6.0, 1.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.144287109375, -0.13939666748046875, -0.1345062255859375, -0.12961578369140625, -0.124725341796875, -0.11983489990234375, -0.1149444580078125, -0.11005401611328125, -0.10516357421875, -0.10027313232421875, -0.0953826904296875, -0.09049224853515625, -0.085601806640625, -0.08071136474609375, -0.0758209228515625, -0.07093048095703125, -0.0660400390625, -0.06114959716796875, -0.0562591552734375, -0.05136871337890625, -0.046478271484375, -0.04158782958984375, -0.0366973876953125, -0.03180694580078125, -0.02691650390625, -0.02202606201171875, -0.0171356201171875, -0.01224517822265625, -0.007354736328125, -0.00246429443359375, 0.0024261474609375, 0.00731658935546875, 0.01220703125, 0.01709747314453125, 0.0219879150390625, 0.02687835693359375, 0.031768798828125, 0.03665924072265625, 0.0415496826171875, 0.04644012451171875, 0.05133056640625, 0.05622100830078125, 0.0611114501953125, 0.06600189208984375, 0.070892333984375, 0.07578277587890625, 0.0806732177734375, 0.08556365966796875, 0.0904541015625, 0.09534454345703125, 0.1002349853515625, 0.10512542724609375, 0.110015869140625, 0.11490631103515625, 0.1197967529296875, 0.12468719482421875, 0.12957763671875, 0.13446807861328125, 0.1393585205078125, 0.14424896240234375, 0.149139404296875, 0.15402984619140625, 0.1589202880859375, 0.16381072998046875, 0.168701171875]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 5.0, 3.0, 6.0, 3.0, 8.0, 12.0, 19.0, 17.0, 24.0, 26.0, 28.0, 31.0, 44.0, 40.0, 52.0, 39.0, 45.0, 53.0, 66.0, 53.0, 49.0, 44.0, 52.0, 38.0, 31.0, 41.0, 30.0, 24.0, 25.0, 20.0, 15.0, 13.0, 7.0, 8.0, 5.0, 7.0, 3.0, 8.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0], "bins": [-45.227149963378906, -43.85004425048828, -42.47293472290039, -41.095829010009766, -39.718719482421875, -38.34161376953125, -36.964508056640625, -35.587398529052734, -34.21029281616211, -32.833187103271484, -31.456077575683594, -30.07897186279297, -28.70186424255371, -27.324756622314453, -25.947649002075195, -24.570541381835938, -23.19343376159668, -21.816326141357422, -20.439218521118164, -19.062110900878906, -17.68500518798828, -16.307897567749023, -14.930789947509766, -13.553683280944824, -12.176575660705566, -10.799468040466309, -9.422361373901367, -8.04525375366211, -6.66814661026001, -5.29103946685791, -3.9139318466186523, -2.536825180053711, -1.1597175598144531, 0.21738970279693604, 1.5944969654083252, 2.971604347229004, 4.3487114906311035, 5.725818634033203, 7.102926254272461, 8.480032920837402, 9.85714054107666, 11.234248161315918, 12.61135482788086, 13.988462448120117, 15.365570068359375, 16.74267578125, 18.11978530883789, 19.496891021728516, 20.873998641967773, 22.25110626220703, 23.62821388244629, 25.005321502685547, 26.382427215576172, 27.75953483581543, 29.136642456054688, 30.513748168945312, 31.890857696533203, 33.26796340942383, 34.64507293701172, 36.022178649902344, 37.399288177490234, 38.77639389038086, 40.15350341796875, 41.530609130859375, 42.90771484375]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 5.0, 4.0, 8.0, 5.0, 8.0, 11.0, 11.0, 14.0, 13.0, 15.0, 16.0, 22.0, 21.0, 22.0, 42.0, 32.0, 26.0, 33.0, 43.0, 33.0, 47.0, 38.0, 50.0, 42.0, 31.0, 47.0, 31.0, 29.0, 31.0, 39.0, 25.0, 28.0, 25.0, 23.0, 31.0, 17.0, 20.0, 16.0, 6.0, 10.0, 5.0, 5.0, 8.0, 3.0, 4.0, 3.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-42.083160400390625, -40.79657745361328, -39.50999450683594, -38.223411560058594, -36.936832427978516, -35.65024948120117, -34.36366653442383, -33.077083587646484, -31.79050064086914, -30.503917694091797, -29.217336654663086, -27.930753707885742, -26.6441707611084, -25.357589721679688, -24.071006774902344, -22.784423828125, -21.49784278869629, -20.211259841918945, -18.924678802490234, -17.63809585571289, -16.351512908935547, -15.06493091583252, -13.778348922729492, -12.491765975952148, -11.205183982849121, -9.918601989746094, -8.63201904296875, -7.345437049865723, -6.058854579925537, -4.772272109985352, -3.485690116882324, -2.1991071701049805, -0.9125251770019531, 0.37405717372894287, 1.6606395244598389, 2.9472217559814453, 4.233804225921631, 5.520386695861816, 6.806968688964844, 8.093551635742188, 9.380133628845215, 10.666715621948242, 11.953298568725586, 13.239880561828613, 14.52646255493164, 15.813045501708984, 17.099628448486328, 18.386211395263672, 19.672792434692383, 20.959375381469727, 22.245956420898438, 23.53253936767578, 24.819122314453125, 26.10570526123047, 27.39228630065918, 28.678869247436523, 29.965450286865234, 31.252033233642578, 32.53861618041992, 33.8251953125, 35.111778259277344, 36.39836120605469, 37.68494415283203, 38.971527099609375, 40.25811004638672]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 8.0, 13.0, 14.0, 34.0, 45.0, 65.0, 145.0, 198.0, 300.0, 467.0, 747.0, 1161.0, 1929.0, 3117.0, 4886.0, 7866.0, 12285.0, 18455.0, 28095.0, 40426.0, 55823.0, 72772.0, 90057.0, 104180.0, 110282.0, 108074.0, 97672.0, 81825.0, 63566.0, 47125.0, 33310.0, 22457.0, 14951.0, 9620.0, 6072.0, 3906.0, 2386.0, 1573.0, 934.0, 648.0, 366.0, 259.0, 154.0, 116.0, 65.0, 40.0, 29.0, 14.0, 7.0, 9.0, 4.0, 4.0, 4.0, 0.0, 2.0], "bins": [-21.390625, -20.756591796875, -20.12255859375, -19.488525390625, -18.8544921875, -18.220458984375, -17.58642578125, -16.952392578125, -16.318359375, -15.684326171875, -15.05029296875, -14.416259765625, -13.7822265625, -13.148193359375, -12.51416015625, -11.880126953125, -11.24609375, -10.612060546875, -9.97802734375, -9.343994140625, -8.7099609375, -8.075927734375, -7.44189453125, -6.807861328125, -6.173828125, -5.539794921875, -4.90576171875, -4.271728515625, -3.6376953125, -3.003662109375, -2.36962890625, -1.735595703125, -1.1015625, -0.467529296875, 0.16650390625, 0.800537109375, 1.4345703125, 2.068603515625, 2.70263671875, 3.336669921875, 3.970703125, 4.604736328125, 5.23876953125, 5.872802734375, 6.5068359375, 7.140869140625, 7.77490234375, 8.408935546875, 9.04296875, 9.677001953125, 10.31103515625, 10.945068359375, 11.5791015625, 12.213134765625, 12.84716796875, 13.481201171875, 14.115234375, 14.749267578125, 15.38330078125, 16.017333984375, 16.6513671875, 17.285400390625, 17.91943359375, 18.553466796875, 19.1875]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 0.0, 4.0, 1.0, 6.0, 2.0, 3.0, 9.0, 8.0, 11.0, 7.0, 13.0, 11.0, 16.0, 20.0, 13.0, 25.0, 23.0, 24.0, 37.0, 31.0, 25.0, 46.0, 33.0, 38.0, 34.0, 41.0, 34.0, 37.0, 42.0, 40.0, 36.0, 33.0, 33.0, 26.0, 25.0, 25.0, 22.0, 27.0, 30.0, 23.0, 20.0, 11.0, 15.0, 8.0, 9.0, 7.0, 6.0, 4.0, 2.0, 7.0, 2.0, 1.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.6875, -36.46533203125, -35.2431640625, -34.02099609375, -32.798828125, -31.57666015625, -30.3544921875, -29.13232421875, -27.91015625, -26.68798828125, -25.4658203125, -24.24365234375, -23.021484375, -21.79931640625, -20.5771484375, -19.35498046875, -18.1328125, -16.91064453125, -15.6884765625, -14.46630859375, -13.244140625, -12.02197265625, -10.7998046875, -9.57763671875, -8.35546875, -7.13330078125, -5.9111328125, -4.68896484375, -3.466796875, -2.24462890625, -1.0224609375, 0.19970703125, 1.421875, 2.64404296875, 3.8662109375, 5.08837890625, 6.310546875, 7.53271484375, 8.7548828125, 9.97705078125, 11.19921875, 12.42138671875, 13.6435546875, 14.86572265625, 16.087890625, 17.31005859375, 18.5322265625, 19.75439453125, 20.9765625, 22.19873046875, 23.4208984375, 24.64306640625, 25.865234375, 27.08740234375, 28.3095703125, 29.53173828125, 30.75390625, 31.97607421875, 33.1982421875, 34.42041015625, 35.642578125, 36.86474609375, 38.0869140625, 39.30908203125, 40.53125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 13.0, 13.0, 26.0, 41.0, 58.0, 110.0, 135.0, 210.0, 360.0, 542.0, 922.0, 1534.0, 2318.0, 3911.0, 6405.0, 10348.0, 16782.0, 26181.0, 40350.0, 59108.0, 81375.0, 103945.0, 121262.0, 126213.0, 117517.0, 99174.0, 76516.0, 54365.0, 36461.0, 23420.0, 15042.0, 9033.0, 5686.0, 3562.0, 2176.0, 1325.0, 787.0, 504.0, 282.0, 204.0, 141.0, 73.0, 44.0, 31.0, 21.0, 13.0, 10.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-25.875, -25.075927734375, -24.27685546875, -23.477783203125, -22.6787109375, -21.879638671875, -21.08056640625, -20.281494140625, -19.482421875, -18.683349609375, -17.88427734375, -17.085205078125, -16.2861328125, -15.487060546875, -14.68798828125, -13.888916015625, -13.08984375, -12.290771484375, -11.49169921875, -10.692626953125, -9.8935546875, -9.094482421875, -8.29541015625, -7.496337890625, -6.697265625, -5.898193359375, -5.09912109375, -4.300048828125, -3.5009765625, -2.701904296875, -1.90283203125, -1.103759765625, -0.3046875, 0.494384765625, 1.29345703125, 2.092529296875, 2.8916015625, 3.690673828125, 4.48974609375, 5.288818359375, 6.087890625, 6.886962890625, 7.68603515625, 8.485107421875, 9.2841796875, 10.083251953125, 10.88232421875, 11.681396484375, 12.48046875, 13.279541015625, 14.07861328125, 14.877685546875, 15.6767578125, 16.475830078125, 17.27490234375, 18.073974609375, 18.873046875, 19.672119140625, 20.47119140625, 21.270263671875, 22.0693359375, 22.868408203125, 23.66748046875, 24.466552734375, 25.265625]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 9.0, 8.0, 5.0, 13.0, 19.0, 18.0, 20.0, 20.0, 31.0, 20.0, 36.0, 32.0, 46.0, 49.0, 49.0, 51.0, 44.0, 42.0, 33.0, 46.0, 45.0, 45.0, 45.0, 41.0, 32.0, 24.0, 27.0, 28.0, 17.0, 24.0, 19.0, 18.0, 6.0, 10.0, 4.0, 13.0, 7.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.734375, -30.772705078125, -29.81103515625, -28.849365234375, -27.8876953125, -26.926025390625, -25.96435546875, -25.002685546875, -24.041015625, -23.079345703125, -22.11767578125, -21.156005859375, -20.1943359375, -19.232666015625, -18.27099609375, -17.309326171875, -16.34765625, -15.385986328125, -14.42431640625, -13.462646484375, -12.5009765625, -11.539306640625, -10.57763671875, -9.615966796875, -8.654296875, -7.692626953125, -6.73095703125, -5.769287109375, -4.8076171875, -3.845947265625, -2.88427734375, -1.922607421875, -0.9609375, 0.000732421875, 0.96240234375, 1.924072265625, 2.8857421875, 3.847412109375, 4.80908203125, 5.770751953125, 6.732421875, 7.694091796875, 8.65576171875, 9.617431640625, 10.5791015625, 11.540771484375, 12.50244140625, 13.464111328125, 14.42578125, 15.387451171875, 16.34912109375, 17.310791015625, 18.2724609375, 19.234130859375, 20.19580078125, 21.157470703125, 22.119140625, 23.080810546875, 24.04248046875, 25.004150390625, 25.9658203125, 26.927490234375, 27.88916015625, 28.850830078125, 29.8125]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 11.0, 9.0, 11.0, 23.0, 31.0, 54.0, 69.0, 137.0, 183.0, 341.0, 532.0, 830.0, 1340.0, 2282.0, 3739.0, 5865.0, 9020.0, 13954.0, 21132.0, 30813.0, 42983.0, 56647.0, 72083.0, 84917.0, 95283.0, 100906.0, 99130.0, 92779.0, 80467.0, 65859.0, 51375.0, 37956.0, 26725.0, 18190.0, 12127.0, 7771.0, 4987.0, 3092.0, 1788.0, 1168.0, 731.0, 428.0, 273.0, 200.0, 111.0, 67.0, 48.0, 32.0, 22.0, 17.0, 8.0, 3.0, 4.0, 3.0, 0.0, 1.0, 4.0, 1.0], "bins": [-7.32421875, -7.093994140625, -6.86376953125, -6.633544921875, -6.4033203125, -6.173095703125, -5.94287109375, -5.712646484375, -5.482421875, -5.252197265625, -5.02197265625, -4.791748046875, -4.5615234375, -4.331298828125, -4.10107421875, -3.870849609375, -3.640625, -3.410400390625, -3.18017578125, -2.949951171875, -2.7197265625, -2.489501953125, -2.25927734375, -2.029052734375, -1.798828125, -1.568603515625, -1.33837890625, -1.108154296875, -0.8779296875, -0.647705078125, -0.41748046875, -0.187255859375, 0.04296875, 0.273193359375, 0.50341796875, 0.733642578125, 0.9638671875, 1.194091796875, 1.42431640625, 1.654541015625, 1.884765625, 2.114990234375, 2.34521484375, 2.575439453125, 2.8056640625, 3.035888671875, 3.26611328125, 3.496337890625, 3.7265625, 3.956787109375, 4.18701171875, 4.417236328125, 4.6474609375, 4.877685546875, 5.10791015625, 5.338134765625, 5.568359375, 5.798583984375, 6.02880859375, 6.259033203125, 6.4892578125, 6.719482421875, 6.94970703125, 7.179931640625, 7.41015625]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 5.0, 8.0, 6.0, 12.0, 9.0, 12.0, 22.0, 12.0, 20.0, 23.0, 27.0, 28.0, 25.0, 46.0, 42.0, 41.0, 45.0, 57.0, 50.0, 47.0, 41.0, 37.0, 44.0, 49.0, 32.0, 37.0, 24.0, 37.0, 30.0, 25.0, 18.0, 13.0, 19.0, 13.0, 12.0, 9.0, 3.0, 6.0, 8.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009937286376953125, -0.0009638965129852295, -0.0009340643882751465, -0.0009042322635650635, -0.0008744001388549805, -0.0008445680141448975, -0.0008147358894348145, -0.0007849037647247314, -0.0007550716400146484, -0.0007252395153045654, -0.0006954073905944824, -0.0006655752658843994, -0.0006357431411743164, -0.0006059110164642334, -0.0005760788917541504, -0.0005462467670440674, -0.0005164146423339844, -0.00048658251762390137, -0.00045675039291381836, -0.00042691826820373535, -0.00039708614349365234, -0.00036725401878356934, -0.00033742189407348633, -0.0003075897693634033, -0.0002777576446533203, -0.0002479255199432373, -0.0002180933952331543, -0.0001882612705230713, -0.00015842914581298828, -0.00012859702110290527, -9.876489639282227e-05, -6.893277168273926e-05, -3.910064697265625e-05, -9.268522262573242e-06, 2.0563602447509766e-05, 5.0395727157592773e-05, 8.022785186767578e-05, 0.00011005997657775879, 0.0001398921012878418, 0.0001697242259979248, 0.0001995563507080078, 0.00022938847541809082, 0.00025922060012817383, 0.00028905272483825684, 0.00031888484954833984, 0.00034871697425842285, 0.00037854909896850586, 0.00040838122367858887, 0.0004382133483886719, 0.0004680454730987549, 0.0004978775978088379, 0.0005277097225189209, 0.0005575418472290039, 0.0005873739719390869, 0.0006172060966491699, 0.0006470382213592529, 0.0006768703460693359, 0.0007067024707794189, 0.000736534595489502, 0.000766366720199585, 0.000796198844909668, 0.000826030969619751, 0.000855863094329834, 0.000885695219039917, 0.00091552734375]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 5.0, 10.0, 17.0, 34.0, 60.0, 75.0, 122.0, 202.0, 340.0, 614.0, 1033.0, 1958.0, 3367.0, 5888.0, 10587.0, 18266.0, 29873.0, 47009.0, 68841.0, 92840.0, 114779.0, 128422.0, 128186.0, 114211.0, 93827.0, 68804.0, 46731.0, 30006.0, 17863.0, 10673.0, 6067.0, 3324.0, 1961.0, 1065.0, 622.0, 357.0, 195.0, 132.0, 77.0, 36.0, 28.0, 17.0, 16.0, 6.0, 7.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-10.0234375, -9.710205078125, -9.39697265625, -9.083740234375, -8.7705078125, -8.457275390625, -8.14404296875, -7.830810546875, -7.517578125, -7.204345703125, -6.89111328125, -6.577880859375, -6.2646484375, -5.951416015625, -5.63818359375, -5.324951171875, -5.01171875, -4.698486328125, -4.38525390625, -4.072021484375, -3.7587890625, -3.445556640625, -3.13232421875, -2.819091796875, -2.505859375, -2.192626953125, -1.87939453125, -1.566162109375, -1.2529296875, -0.939697265625, -0.62646484375, -0.313232421875, 0.0, 0.313232421875, 0.62646484375, 0.939697265625, 1.2529296875, 1.566162109375, 1.87939453125, 2.192626953125, 2.505859375, 2.819091796875, 3.13232421875, 3.445556640625, 3.7587890625, 4.072021484375, 4.38525390625, 4.698486328125, 5.01171875, 5.324951171875, 5.63818359375, 5.951416015625, 6.2646484375, 6.577880859375, 6.89111328125, 7.204345703125, 7.517578125, 7.830810546875, 8.14404296875, 8.457275390625, 8.7705078125, 9.083740234375, 9.39697265625, 9.710205078125, 10.0234375]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 3.0, 7.0, 5.0, 3.0, 1.0, 8.0, 5.0, 7.0, 6.0, 13.0, 15.0, 7.0, 13.0, 17.0, 13.0, 27.0, 28.0, 25.0, 24.0, 32.0, 54.0, 43.0, 35.0, 33.0, 46.0, 38.0, 37.0, 37.0, 34.0, 23.0, 33.0, 47.0, 35.0, 23.0, 24.0, 32.0, 20.0, 22.0, 21.0, 15.0, 14.0, 12.0, 14.0, 14.0, 8.0, 4.0, 7.0, 3.0, 4.0, 5.0, 6.0, 2.0, 4.0, 1.0], "bins": [-3.4296875, -3.334259033203125, -3.23883056640625, -3.143402099609375, -3.0479736328125, -2.952545166015625, -2.85711669921875, -2.761688232421875, -2.666259765625, -2.570831298828125, -2.47540283203125, -2.379974365234375, -2.2845458984375, -2.189117431640625, -2.09368896484375, -1.998260498046875, -1.90283203125, -1.807403564453125, -1.71197509765625, -1.616546630859375, -1.5211181640625, -1.425689697265625, -1.33026123046875, -1.234832763671875, -1.139404296875, -1.043975830078125, -0.94854736328125, -0.853118896484375, -0.7576904296875, -0.662261962890625, -0.56683349609375, -0.471405029296875, -0.3759765625, -0.280548095703125, -0.18511962890625, -0.089691162109375, 0.0057373046875, 0.101165771484375, 0.19659423828125, 0.292022705078125, 0.387451171875, 0.482879638671875, 0.57830810546875, 0.673736572265625, 0.7691650390625, 0.864593505859375, 0.96002197265625, 1.055450439453125, 1.15087890625, 1.246307373046875, 1.34173583984375, 1.437164306640625, 1.5325927734375, 1.628021240234375, 1.72344970703125, 1.818878173828125, 1.914306640625, 2.009735107421875, 2.10516357421875, 2.200592041015625, 2.2960205078125, 2.391448974609375, 2.48687744140625, 2.582305908203125, 2.677734375]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 5.0, 2.0, 4.0, 4.0, 11.0, 11.0, 14.0, 21.0, 28.0, 39.0, 39.0, 32.0, 34.0, 42.0, 42.0, 61.0, 54.0, 71.0, 57.0, 56.0, 46.0, 50.0, 40.0, 37.0, 30.0, 28.0, 37.0, 15.0, 22.0, 11.0, 10.0, 11.0, 6.0, 9.0, 8.0, 2.0, 4.0, 4.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-46.339393615722656, -44.845157623291016, -43.350921630859375, -41.856689453125, -40.36245346069336, -38.86821746826172, -37.373985290527344, -35.8797492980957, -34.38551330566406, -32.89127731323242, -31.397043228149414, -29.902809143066406, -28.408573150634766, -26.914337158203125, -25.420103073120117, -23.92586898803711, -22.43163299560547, -20.937397003173828, -19.44316291809082, -17.948928833007812, -16.454692840576172, -14.960457801818848, -13.466222763061523, -11.9719877243042, -10.477752685546875, -8.98351764678955, -7.489282608032227, -5.995047569274902, -4.500812530517578, -3.006577491760254, -1.5123424530029297, -0.01810741424560547, 1.4761276245117188, 2.970362663269043, 4.464597702026367, 5.958832740783691, 7.453067779541016, 8.94730281829834, 10.441537857055664, 11.935772895812988, 13.430007934570312, 14.924242973327637, 16.41847801208496, 17.91271209716797, 19.40694808959961, 20.90118408203125, 22.395418167114258, 23.889652252197266, 25.383888244628906, 26.878124237060547, 28.372358322143555, 29.866592407226562, 31.360828399658203, 32.855064392089844, 34.34929656982422, 35.84353256225586, 37.3377685546875, 38.83200454711914, 40.32624053955078, 41.820472717285156, 43.3147087097168, 44.80894470214844, 46.30317687988281, 47.79741287231445, 49.291648864746094]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 7.0, 5.0, 5.0, 7.0, 11.0, 14.0, 10.0, 18.0, 19.0, 21.0, 22.0, 25.0, 35.0, 39.0, 49.0, 37.0, 42.0, 25.0, 39.0, 39.0, 36.0, 33.0, 39.0, 38.0, 41.0, 40.0, 33.0, 40.0, 26.0, 22.0, 24.0, 27.0, 21.0, 27.0, 18.0, 13.0, 11.0, 11.0, 8.0, 9.0, 4.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-48.7633171081543, -47.23638916015625, -45.7094612121582, -44.182533264160156, -42.65560531616211, -41.12867736816406, -39.60174560546875, -38.07482147216797, -36.547889709472656, -35.02096176147461, -33.49403381347656, -31.967105865478516, -30.44017791748047, -28.913249969482422, -27.386320114135742, -25.859392166137695, -24.33246612548828, -22.805538177490234, -21.278610229492188, -19.75168228149414, -18.224754333496094, -16.697826385498047, -15.170896530151367, -13.64396858215332, -12.117040634155273, -10.590112686157227, -9.06318473815918, -7.536255836486816, -6.0093278884887695, -4.482399940490723, -2.9554710388183594, -1.4285430908203125, 0.09838104248046875, 1.6253092288970947, 3.1522374153137207, 4.679165840148926, 6.206093788146973, 7.7330217361450195, 9.259950637817383, 10.78687858581543, 12.313806533813477, 13.840734481811523, 15.36766242980957, 16.89459228515625, 18.421520233154297, 19.948448181152344, 21.47537612915039, 23.002304077148438, 24.529232025146484, 26.05615997314453, 27.583087921142578, 29.110015869140625, 30.636943817138672, 32.16387176513672, 33.69080352783203, 35.21772766113281, 36.744659423828125, 38.27158737182617, 39.79851531982422, 41.325443267822266, 42.85237121582031, 44.37929916381836, 45.906227111816406, 47.43315887451172, 48.9600830078125]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 1.0, 5.0, 4.0, 8.0, 7.0, 15.0, 8.0, 16.0, 30.0, 37.0, 59.0, 99.0, 96.0, 166.0, 230.0, 301.0, 447.0, 567.0, 741.0, 1040.0, 1346.0, 1710.0, 2185.0, 2887.0, 3518.0, 4230.0, 5094.0, 1001540.0, 5034.0, 4219.0, 3486.0, 2780.0, 2117.0, 1637.0, 1288.0, 961.0, 693.0, 537.0, 375.0, 269.0, 221.0, 164.0, 118.0, 93.0, 67.0, 46.0, 35.0, 25.0, 21.0, 18.0, 6.0, 5.0, 5.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0], "bins": [-338.8955993652344, -328.1161804199219, -317.3367614746094, -306.5573425292969, -295.7779541015625, -284.99853515625, -274.2191162109375, -263.439697265625, -252.6602783203125, -241.880859375, -231.1014404296875, -220.32203674316406, -209.54261779785156, -198.76319885253906, -187.98379516601562, -177.20437622070312, -166.42495727539062, -155.64553833007812, -144.86611938476562, -134.0867156982422, -123.30729675292969, -112.52787780761719, -101.74846649169922, -90.96905517578125, -80.18963623046875, -69.41021728515625, -58.63080596923828, -47.85139083862305, -37.07197570800781, -26.292560577392578, -15.513145446777344, -4.733734130859375, 6.04571533203125, 16.825130462646484, 27.60454559326172, 38.38396072387695, 49.16337585449219, 59.94279098510742, 70.72220611572266, 81.50161743164062, 92.28103637695312, 103.06045532226562, 113.8398666381836, 124.61927795410156, 135.39869689941406, 146.17811584472656, 156.95751953125, 167.7369384765625, 178.516357421875, 189.2957763671875, 200.0751953125, 210.85459899902344, 221.63401794433594, 232.41343688964844, 243.19284057617188, 253.97225952148438, 264.7516784667969, 275.5310974121094, 286.3105163574219, 297.0899353027344, 307.86932373046875, 318.64874267578125, 329.42816162109375, 340.20758056640625, 350.98699951171875]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 14.0, 8.0, 12.0, 14.0, 7.0, 19.0, 19.0, 24.0, 26.0, 24.0, 35.0, 39.0, 48.0, 60.0, 78.0, 117.0, 179.0, 280.0, 570.0, 1124.0, 2216.0, 4607.0, 10240.0, 22296.0, 42994.0, 51226108.0, 95861.0, 33024.0, 16678.0, 7467.0, 3282.0, 1636.0, 842.0, 473.0, 266.0, 148.0, 99.0, 64.0, 59.0, 45.0, 41.0, 42.0, 27.0, 21.0, 23.0, 18.0, 9.0, 14.0, 8.0, 12.0, 2.0, 7.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0], "bins": [-934.5, -905.109375, -875.71875, -846.328125, -816.9375, -787.546875, -758.15625, -728.765625, -699.375, -669.984375, -640.59375, -611.203125, -581.8125, -552.421875, -523.03125, -493.640625, -464.25, -434.859375, -405.46875, -376.078125, -346.6875, -317.296875, -287.90625, -258.515625, -229.125, -199.734375, -170.34375, -140.953125, -111.5625, -82.171875, -52.78125, -23.390625, 6.0, 35.390625, 64.78125, 94.171875, 123.5625, 152.953125, 182.34375, 211.734375, 241.125, 270.515625, 299.90625, 329.296875, 358.6875, 388.078125, 417.46875, 446.859375, 476.25, 505.640625, 535.03125, 564.421875, 593.8125, 623.203125, 652.59375, 681.984375, 711.375, 740.765625, 770.15625, 799.546875, 828.9375, 858.328125, 887.71875, 917.109375, 946.5]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 1.0, 6.0, 16.0, 19.0, 17.0, 23.0, 27.0, 53.0, 47.0, 60.0, 143.0, 171.0, 248.0, 382.0, 557.0, 750.0, 1029.0, 1463.0, 2337.0, 3524.0, 5503.0, 8557.0, 14017.0, 23501.0, 42019.0, 78435.0, 158892.0, 358761.0, 1391899.0, 3376041.0, 432828.0, 184749.0, 89384.0, 47153.0, 25931.0, 15591.0, 9394.0, 5938.0, 3764.0, 2607.0, 1747.0, 1124.0, 800.0, 569.0, 442.0, 259.0, 215.0, 115.0, 109.0, 78.0, 33.0, 28.0, 26.0, 26.0, 15.0, 7.0, 4.0, 10.0, 2.0, 4.0], "bins": [-8.515625, -8.25836181640625, -8.0010986328125, -7.74383544921875, -7.486572265625, -7.22930908203125, -6.9720458984375, -6.71478271484375, -6.45751953125, -6.20025634765625, -5.9429931640625, -5.68572998046875, -5.428466796875, -5.17120361328125, -4.9139404296875, -4.65667724609375, -4.3994140625, -4.14215087890625, -3.8848876953125, -3.62762451171875, -3.370361328125, -3.11309814453125, -2.8558349609375, -2.59857177734375, -2.34130859375, -2.08404541015625, -1.8267822265625, -1.56951904296875, -1.312255859375, -1.05499267578125, -0.7977294921875, -0.54046630859375, -0.283203125, -0.02593994140625, 0.2313232421875, 0.48858642578125, 0.745849609375, 1.00311279296875, 1.2603759765625, 1.51763916015625, 1.77490234375, 2.03216552734375, 2.2894287109375, 2.54669189453125, 2.803955078125, 3.06121826171875, 3.3184814453125, 3.57574462890625, 3.8330078125, 4.09027099609375, 4.3475341796875, 4.60479736328125, 4.862060546875, 5.11932373046875, 5.3765869140625, 5.63385009765625, 5.89111328125, 6.14837646484375, 6.4056396484375, 6.66290283203125, 6.920166015625, 7.17742919921875, 7.4346923828125, 7.69195556640625, 7.94921875]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 4.0, 8.0, 5.0, 6.0, 11.0, 14.0, 7.0, 12.0, 12.0, 19.0, 21.0, 14.0, 18.0, 26.0, 19.0, 33.0, 29.0, 37.0, 39.0, 29.0, 32.0, 38.0, 65.0, 425.0, 456.0, 171.0, 78.0, 45.0, 43.0, 37.0, 28.0, 25.0, 27.0, 25.0, 27.0, 18.0, 22.0, 16.0, 10.0, 12.0, 14.0, 4.0, 7.0, 6.0, 10.0, 4.0, 7.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-21.671875, -20.991943359375, -20.31201171875, -19.632080078125, -18.9521484375, -18.272216796875, -17.59228515625, -16.912353515625, -16.232421875, -15.552490234375, -14.87255859375, -14.192626953125, -13.5126953125, -12.832763671875, -12.15283203125, -11.472900390625, -10.79296875, -10.113037109375, -9.43310546875, -8.753173828125, -8.0732421875, -7.393310546875, -6.71337890625, -6.033447265625, -5.353515625, -4.673583984375, -3.99365234375, -3.313720703125, -2.6337890625, -1.953857421875, -1.27392578125, -0.593994140625, 0.0859375, 0.765869140625, 1.44580078125, 2.125732421875, 2.8056640625, 3.485595703125, 4.16552734375, 4.845458984375, 5.525390625, 6.205322265625, 6.88525390625, 7.565185546875, 8.2451171875, 8.925048828125, 9.60498046875, 10.284912109375, 10.96484375, 11.644775390625, 12.32470703125, 13.004638671875, 13.6845703125, 14.364501953125, 15.04443359375, 15.724365234375, 16.404296875, 17.084228515625, 17.76416015625, 18.444091796875, 19.1240234375, 19.803955078125, 20.48388671875, 21.163818359375, 21.84375]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 2.0, 7.0, 2.0, 1.0, 2.0, 1.0, 1.0, 9.0, 8.0, 12.0, 14.0, 22.0, 35.0, 34.0, 57.0, 62.0, 105.0, 197.0, 231.0, 362.0, 569.0, 954.0, 1500.0, 2759.0, 4552.0, 8159.0, 15161.0, 28617.0, 57942.0, 126658.0, 362904.0, 4103543.0, 1139322.0, 244589.0, 94490.0, 45332.0, 23592.0, 12770.0, 6898.0, 4097.0, 2321.0, 1313.0, 725.0, 504.0, 368.0, 199.0, 128.0, 91.0, 78.0, 42.0, 38.0, 25.0, 13.0, 10.0, 5.0, 4.0, 7.0, 5.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-14.2265625, -13.7933349609375, -13.360107421875, -12.9268798828125, -12.49365234375, -12.0604248046875, -11.627197265625, -11.1939697265625, -10.7607421875, -10.3275146484375, -9.894287109375, -9.4610595703125, -9.02783203125, -8.5946044921875, -8.161376953125, -7.7281494140625, -7.294921875, -6.8616943359375, -6.428466796875, -5.9952392578125, -5.56201171875, -5.1287841796875, -4.695556640625, -4.2623291015625, -3.8291015625, -3.3958740234375, -2.962646484375, -2.5294189453125, -2.09619140625, -1.6629638671875, -1.229736328125, -0.7965087890625, -0.36328125, 0.0699462890625, 0.503173828125, 0.9364013671875, 1.36962890625, 1.8028564453125, 2.236083984375, 2.6693115234375, 3.1025390625, 3.5357666015625, 3.968994140625, 4.4022216796875, 4.83544921875, 5.2686767578125, 5.701904296875, 6.1351318359375, 6.568359375, 7.0015869140625, 7.434814453125, 7.8680419921875, 8.30126953125, 8.7344970703125, 9.167724609375, 9.6009521484375, 10.0341796875, 10.4674072265625, 10.900634765625, 11.3338623046875, 11.76708984375, 12.2003173828125, 12.633544921875, 13.0667724609375, 13.5]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 4.0, 1.0, 7.0, 6.0, 8.0, 14.0, 17.0, 21.0, 17.0, 28.0, 20.0, 29.0, 17.0, 31.0, 27.0, 39.0, 35.0, 41.0, 44.0, 59.0, 255.0, 652.0, 155.0, 108.0, 60.0, 42.0, 44.0, 30.0, 31.0, 29.0, 26.0, 32.0, 22.0, 14.0, 11.0, 13.0, 8.0, 5.0, 4.0, 6.0, 5.0, 3.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.046875, -19.33203125, -18.6171875, -17.90234375, -17.1875, -16.47265625, -15.7578125, -15.04296875, -14.328125, -13.61328125, -12.8984375, -12.18359375, -11.46875, -10.75390625, -10.0390625, -9.32421875, -8.609375, -7.89453125, -7.1796875, -6.46484375, -5.75, -5.03515625, -4.3203125, -3.60546875, -2.890625, -2.17578125, -1.4609375, -0.74609375, -0.03125, 0.68359375, 1.3984375, 2.11328125, 2.828125, 3.54296875, 4.2578125, 4.97265625, 5.6875, 6.40234375, 7.1171875, 7.83203125, 8.546875, 9.26171875, 9.9765625, 10.69140625, 11.40625, 12.12109375, 12.8359375, 13.55078125, 14.265625, 14.98046875, 15.6953125, 16.41015625, 17.125, 17.83984375, 18.5546875, 19.26953125, 19.984375, 20.69921875, 21.4140625, 22.12890625, 22.84375, 23.55859375, 24.2734375, 24.98828125, 25.703125]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [6.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 12.0, 9.0, 9.0, 7.0, 18.0, 35.0, 30.0, 59.0, 65.0, 100.0, 110.0, 130.0, 224.0, 322.0, 479.0, 787.0, 1224.0, 2166.0, 4295.0, 10111.0, 33290.0, 5707690.0, 478841.0, 31677.0, 9832.0, 4116.0, 2193.0, 1295.0, 703.0, 429.0, 346.0, 221.0, 170.0, 125.0, 57.0, 66.0, 42.0, 30.0, 26.0, 16.0, 22.0, 9.0, 10.0, 5.0, 7.0, 8.0, 2.0, 8.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-81.0625, -78.3583984375, -75.654296875, -72.9501953125, -70.24609375, -67.5419921875, -64.837890625, -62.1337890625, -59.4296875, -56.7255859375, -54.021484375, -51.3173828125, -48.61328125, -45.9091796875, -43.205078125, -40.5009765625, -37.796875, -35.0927734375, -32.388671875, -29.6845703125, -26.98046875, -24.2763671875, -21.572265625, -18.8681640625, -16.1640625, -13.4599609375, -10.755859375, -8.0517578125, -5.34765625, -2.6435546875, 0.060546875, 2.7646484375, 5.46875, 8.1728515625, 10.876953125, 13.5810546875, 16.28515625, 18.9892578125, 21.693359375, 24.3974609375, 27.1015625, 29.8056640625, 32.509765625, 35.2138671875, 37.91796875, 40.6220703125, 43.326171875, 46.0302734375, 48.734375, 51.4384765625, 54.142578125, 56.8466796875, 59.55078125, 62.2548828125, 64.958984375, 67.6630859375, 70.3671875, 73.0712890625, 75.775390625, 78.4794921875, 81.18359375, 83.8876953125, 86.591796875, 89.2958984375, 92.0]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 5.0, 3.0, 4.0, 2.0, 10.0, 10.0, 10.0, 13.0, 17.0, 20.0, 21.0, 38.0, 41.0, 40.0, 62.0, 54.0, 162.0, 790.0, 225.0, 130.0, 75.0, 70.0, 49.0, 37.0, 35.0, 22.0, 20.0, 17.0, 13.0, 8.0, 8.0, 3.0, 4.0, 2.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.34375, -30.30908203125, -29.2744140625, -28.23974609375, -27.205078125, -26.17041015625, -25.1357421875, -24.10107421875, -23.06640625, -22.03173828125, -20.9970703125, -19.96240234375, -18.927734375, -17.89306640625, -16.8583984375, -15.82373046875, -14.7890625, -13.75439453125, -12.7197265625, -11.68505859375, -10.650390625, -9.61572265625, -8.5810546875, -7.54638671875, -6.51171875, -5.47705078125, -4.4423828125, -3.40771484375, -2.373046875, -1.33837890625, -0.3037109375, 0.73095703125, 1.765625, 2.80029296875, 3.8349609375, 4.86962890625, 5.904296875, 6.93896484375, 7.9736328125, 9.00830078125, 10.04296875, 11.07763671875, 12.1123046875, 13.14697265625, 14.181640625, 15.21630859375, 16.2509765625, 17.28564453125, 18.3203125, 19.35498046875, 20.3896484375, 21.42431640625, 22.458984375, 23.49365234375, 24.5283203125, 25.56298828125, 26.59765625, 27.63232421875, 28.6669921875, 29.70166015625, 30.736328125, 31.77099609375, 32.8056640625, 33.84033203125, 34.875]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 9.0, 73.0, 838.0, 55.0, 16.0, 12.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-104.84063720703125, -92.20392608642578, -79.56720733642578, -66.93049621582031, -54.29378128051758, -41.657066345214844, -29.020355224609375, -16.383636474609375, -3.7469253540039062, 8.889788627624512, 21.52650260925293, 34.16321563720703, 46.799930572509766, 59.4366455078125, 72.07335662841797, 84.71007537841797, 97.34678649902344, 109.9834976196289, 122.6202163696289, 135.25692749023438, 147.89364624023438, 160.53036499023438, 173.1670684814453, 185.8037872314453, 198.44049072265625, 211.07720947265625, 223.7139129638672, 236.3506317138672, 248.9873504638672, 261.6240539550781, 274.2607727050781, 286.8974914550781, 299.5342102050781, 312.1709289550781, 324.8076477050781, 337.4443359375, 350.0810546875, 362.7177734375, 375.3544921875, 387.9912109375, 400.6279296875, 413.2646484375, 425.9013671875, 438.5380859375, 451.1747741699219, 463.8114929199219, 476.4482116699219, 489.0849304199219, 501.72161865234375, 514.3583374023438, 526.9950561523438, 539.6317749023438, 552.2684936523438, 564.9052124023438, 577.5418701171875, 590.1785888671875, 602.8153686523438, 615.4520874023438, 628.0888061523438, 640.7255249023438, 653.3622436523438, 665.9989624023438, 678.6356201171875, 691.2723388671875, 703.9090576171875]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [7.0, 1.0, 6.0, 6.0, 24.0, 44.0, 154.0, 324.0, 275.0, 89.0, 34.0, 21.0, 15.0, 8.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.29730224609375, -42.16850280761719, -36.039703369140625, -29.91090202331543, -23.782102584838867, -17.653303146362305, -11.52450180053711, -5.395702362060547, 0.7330970764160156, 6.861896991729736, 12.990696907043457, 19.119497299194336, 25.2482967376709, 31.37709617614746, 37.505897521972656, 43.63469696044922, 49.76349639892578, 55.892295837402344, 62.021095275878906, 68.14989471435547, 74.27869415283203, 80.4074935913086, 86.53630065917969, 92.66510009765625, 98.79389953613281, 104.92269897460938, 111.05149841308594, 117.1802978515625, 123.30909729003906, 129.43789672851562, 135.5666961669922, 141.69549560546875, 147.8242950439453, 153.95309448242188, 160.08189392089844, 166.210693359375, 172.33949279785156, 178.46829223632812, 184.5970916748047, 190.72589111328125, 196.8546905517578, 202.98348999023438, 209.11228942871094, 215.2410888671875, 221.36988830566406, 227.49868774414062, 233.6274871826172, 239.75628662109375, 245.88510131835938, 252.01390075683594, 258.1427001953125, 264.2715148925781, 270.4002990722656, 276.52911376953125, 282.65789794921875, 288.7867126464844, 294.9154968261719, 301.0443115234375, 307.173095703125, 313.3019104003906, 319.4306945800781, 325.55950927734375, 331.68829345703125, 337.8171081542969, 343.9458923339844]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 6.0, 3.0, 7.0, 6.0, 9.0, 8.0, 14.0, 13.0, 16.0, 24.0, 28.0, 39.0, 63.0, 92.0, 112.0, 170.0, 276.0, 393.0, 614.0, 1018.0, 1756.0, 3191.0, 6666.0, 16799.0, 74917.0, 3971473.0, 85694.0, 16641.0, 6363.0, 3094.0, 1638.0, 1098.0, 632.0, 413.0, 273.0, 198.0, 140.0, 95.0, 79.0, 48.0, 28.0, 28.0, 27.0, 18.0, 12.0, 12.0, 12.0, 9.0, 8.0, 8.0, 2.0, 5.0, 1.0, 2.0, 3.0, 2.0], "bins": [-1.2822265625, -1.243988037109375, -1.20574951171875, -1.167510986328125, -1.1292724609375, -1.091033935546875, -1.05279541015625, -1.014556884765625, -0.976318359375, -0.938079833984375, -0.89984130859375, -0.861602783203125, -0.8233642578125, -0.785125732421875, -0.74688720703125, -0.708648681640625, -0.67041015625, -0.632171630859375, -0.59393310546875, -0.555694580078125, -0.5174560546875, -0.479217529296875, -0.44097900390625, -0.402740478515625, -0.364501953125, -0.326263427734375, -0.28802490234375, -0.249786376953125, -0.2115478515625, -0.173309326171875, -0.13507080078125, -0.096832275390625, -0.05859375, -0.020355224609375, 0.01788330078125, 0.056121826171875, 0.0943603515625, 0.132598876953125, 0.17083740234375, 0.209075927734375, 0.247314453125, 0.285552978515625, 0.32379150390625, 0.362030029296875, 0.4002685546875, 0.438507080078125, 0.47674560546875, 0.514984130859375, 0.55322265625, 0.591461181640625, 0.62969970703125, 0.667938232421875, 0.7061767578125, 0.744415283203125, 0.78265380859375, 0.820892333984375, 0.859130859375, 0.897369384765625, 0.93560791015625, 0.973846435546875, 1.0120849609375, 1.050323486328125, 1.08856201171875, 1.126800537109375, 1.1650390625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 2.0, 4.0, 8.0, 9.0, 9.0, 7.0, 5.0, 18.0, 20.0, 56.0, 368.0, 374.0, 56.0, 22.0, 13.0, 7.0, 5.0, 5.0, 5.0, 2.0, 2.0, 2.0, 4.0, 0.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.186279296875, -0.18062591552734375, -0.1749725341796875, -0.16931915283203125, -0.163665771484375, -0.15801239013671875, -0.1523590087890625, -0.14670562744140625, -0.14105224609375, -0.13539886474609375, -0.1297454833984375, -0.12409210205078125, -0.118438720703125, -0.11278533935546875, -0.1071319580078125, -0.10147857666015625, -0.0958251953125, -0.09017181396484375, -0.0845184326171875, -0.07886505126953125, -0.073211669921875, -0.06755828857421875, -0.0619049072265625, -0.05625152587890625, -0.05059814453125, -0.04494476318359375, -0.0392913818359375, -0.03363800048828125, -0.027984619140625, -0.02233123779296875, -0.0166778564453125, -0.01102447509765625, -0.00537109375, 0.00028228759765625, 0.0059356689453125, 0.01158905029296875, 0.017242431640625, 0.02289581298828125, 0.0285491943359375, 0.03420257568359375, 0.03985595703125, 0.04550933837890625, 0.0511627197265625, 0.05681610107421875, 0.062469482421875, 0.06812286376953125, 0.0737762451171875, 0.07942962646484375, 0.0850830078125, 0.09073638916015625, 0.0963897705078125, 0.10204315185546875, 0.107696533203125, 0.11334991455078125, 0.1190032958984375, 0.12465667724609375, 0.13031005859375, 0.13596343994140625, 0.1416168212890625, 0.14727020263671875, 0.152923583984375, 0.15857696533203125, 0.1642303466796875, 0.16988372802734375, 0.175537109375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 5.0, 2.0, 14.0, 15.0, 12.0, 16.0, 23.0, 55.0, 54.0, 92.0, 149.0, 239.0, 440.0, 732.0, 1396.0, 2973.0, 6920.0, 21056.0, 104301.0, 3267454.0, 704266.0, 58243.0, 15228.0, 5479.0, 2328.0, 1189.0, 644.0, 335.0, 198.0, 153.0, 74.0, 63.0, 37.0, 26.0, 16.0, 15.0, 12.0, 12.0, 6.0, 0.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1904296875, -1.1530303955078125, -1.115631103515625, -1.0782318115234375, -1.04083251953125, -1.0034332275390625, -0.966033935546875, -0.9286346435546875, -0.8912353515625, -0.8538360595703125, -0.816436767578125, -0.7790374755859375, -0.74163818359375, -0.7042388916015625, -0.666839599609375, -0.6294403076171875, -0.592041015625, -0.5546417236328125, -0.517242431640625, -0.4798431396484375, -0.44244384765625, -0.4050445556640625, -0.367645263671875, -0.3302459716796875, -0.2928466796875, -0.2554473876953125, -0.218048095703125, -0.1806488037109375, -0.14324951171875, -0.1058502197265625, -0.068450927734375, -0.0310516357421875, 0.00634765625, 0.0437469482421875, 0.081146240234375, 0.1185455322265625, 0.15594482421875, 0.1933441162109375, 0.230743408203125, 0.2681427001953125, 0.3055419921875, 0.3429412841796875, 0.380340576171875, 0.4177398681640625, 0.45513916015625, 0.4925384521484375, 0.529937744140625, 0.5673370361328125, 0.604736328125, 0.6421356201171875, 0.679534912109375, 0.7169342041015625, 0.75433349609375, 0.7917327880859375, 0.829132080078125, 0.8665313720703125, 0.9039306640625, 0.9413299560546875, 0.978729248046875, 1.0161285400390625, 1.05352783203125, 1.0909271240234375, 1.128326416015625, 1.1657257080078125, 1.203125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 1.0, 4.0, 2.0, 6.0, 6.0, 10.0, 14.0, 24.0, 20.0, 30.0, 52.0, 63.0, 87.0, 134.0, 215.0, 505.0, 1220.0, 696.0, 330.0, 181.0, 136.0, 91.0, 54.0, 38.0, 44.0, 23.0, 19.0, 12.0, 6.0, 17.0, 5.0, 5.0, 6.0, 3.0, 8.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.25732421875, -0.24895095825195312, -0.24057769775390625, -0.23220443725585938, -0.2238311767578125, -0.21545791625976562, -0.20708465576171875, -0.19871139526367188, -0.190338134765625, -0.18196487426757812, -0.17359161376953125, -0.16521835327148438, -0.1568450927734375, -0.14847183227539062, -0.14009857177734375, -0.13172531127929688, -0.12335205078125, -0.11497879028320312, -0.10660552978515625, -0.09823226928710938, -0.0898590087890625, -0.08148574829101562, -0.07311248779296875, -0.06473922729492188, -0.056365966796875, -0.047992706298828125, -0.03961944580078125, -0.031246185302734375, -0.0228729248046875, -0.014499664306640625, -0.00612640380859375, 0.002246856689453125, 0.0106201171875, 0.018993377685546875, 0.02736663818359375, 0.035739898681640625, 0.0441131591796875, 0.052486419677734375, 0.06085968017578125, 0.06923294067382812, 0.077606201171875, 0.08597946166992188, 0.09435272216796875, 0.10272598266601562, 0.1110992431640625, 0.11947250366210938, 0.12784576416015625, 0.13621902465820312, 0.14459228515625, 0.15296554565429688, 0.16133880615234375, 0.16971206665039062, 0.1780853271484375, 0.18645858764648438, 0.19483184814453125, 0.20320510864257812, 0.211578369140625, 0.21995162963867188, 0.22832489013671875, 0.23669815063476562, 0.2450714111328125, 0.2534446716308594, 0.26181793212890625, 0.2701911926269531, 0.278564453125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 5.0, 16.0, 44.0, 170.0, 357.0, 248.0, 83.0, 46.0, 12.0, 13.0, 6.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7438559532165527, -3.5920450687408447, -3.4402341842651367, -3.288423538208008, -3.1366126537323, -2.984801769256592, -2.832991123199463, -2.681180238723755, -2.529369354248047, -2.377558469772339, -2.225747585296631, -2.073936939239502, -1.922126054763794, -1.770315170288086, -1.6185044050216675, -1.466693639755249, -1.314882755279541, -1.163071870803833, -1.0112611055374146, -0.8594502806663513, -0.7076394557952881, -0.5558286309242249, -0.4040178060531616, -0.25220704078674316, -0.10039615631103516, 0.051414668560028076, 0.2032254934310913, 0.35503631830215454, 0.5068471431732178, 0.658657968044281, 0.8104687929153442, 0.9622795581817627, 1.1140904426574707, 1.2659013271331787, 1.4177120923995972, 1.5695228576660156, 1.7213337421417236, 1.8731446266174316, 2.0249552726745605, 2.1767661571502686, 2.3285770416259766, 2.4803879261016846, 2.6321988105773926, 2.7840094566345215, 2.9358203411102295, 3.0876312255859375, 3.2394418716430664, 3.3912527561187744, 3.5430636405944824, 3.6948745250701904, 3.8466854095458984, 3.9984960556030273, 4.150306701660156, 4.302117824554443, 4.453928470611572, 4.605739593505859, 4.757550239562988, 4.909360885620117, 5.061172008514404, 5.212982654571533, 5.36479377746582, 5.516604423522949, 5.668415069580078, 5.820225715637207, 5.972036838531494]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 7.0, 7.0, 15.0, 12.0, 15.0, 20.0, 29.0, 36.0, 47.0, 46.0, 44.0, 52.0, 43.0, 50.0, 60.0, 63.0, 62.0, 60.0, 54.0, 46.0, 44.0, 46.0, 34.0, 26.0, 17.0, 19.0, 17.0, 5.0, 5.0, 13.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2556431293487549, -1.2096362113952637, -1.163629174232483, -1.1176222562789917, -1.0716153383255005, -1.0256083011627197, -0.9796013832092285, -0.9335944056510925, -0.8875874280929565, -0.8415804505348206, -0.7955735325813293, -0.7495665550231934, -0.7035595774650574, -0.6575525999069214, -0.6115456819534302, -0.5655387043952942, -0.519531786441803, -0.4735248386859894, -0.4275178611278534, -0.3815109133720398, -0.3355039358139038, -0.2894969880580902, -0.2434900403022766, -0.19748306274414062, -0.15147611498832703, -0.10546915233135223, -0.05946219712495804, -0.013455241918563843, 0.03255172073841095, 0.07855868339538574, 0.12456563115119934, 0.17057260870933533, 0.21657955646514893, 0.2625865042209625, 0.3085934817790985, 0.3546004295349121, 0.4006074070930481, 0.4466143548488617, 0.4926213026046753, 0.5386282801628113, 0.5846352577209473, 0.6306422352790833, 0.6766491532325745, 0.7226561307907104, 0.7686631083488464, 0.8146700859069824, 0.8606770038604736, 0.9066839814186096, 0.9526908993721008, 0.9986978769302368, 1.044704794883728, 1.0907118320465088, 1.13671875, 1.1827256679534912, 1.2287325859069824, 1.2747396230697632, 1.3207465410232544, 1.3667534589767456, 1.4127604961395264, 1.4587674140930176, 1.5047743320465088, 1.5507813692092896, 1.5967882871627808, 1.6427953243255615, 1.6888022422790527]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 5.0, 2.0, 5.0, 3.0, 6.0, 13.0, 14.0, 18.0, 43.0, 41.0, 74.0, 107.0, 138.0, 223.0, 360.0, 619.0, 1200.0, 2417.0, 6019.0, 19430.0, 386716.0, 597847.0, 21279.0, 6375.0, 2543.0, 1273.0, 691.0, 362.0, 228.0, 163.0, 97.0, 73.0, 57.0, 30.0, 32.0, 13.0, 10.0, 6.0, 6.0, 4.0, 2.0, 6.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5, -1.4500579833984375, -1.400115966796875, -1.3501739501953125, -1.30023193359375, -1.2502899169921875, -1.200347900390625, -1.1504058837890625, -1.1004638671875, -1.0505218505859375, -1.000579833984375, -0.9506378173828125, -0.90069580078125, -0.8507537841796875, -0.800811767578125, -0.7508697509765625, -0.700927734375, -0.6509857177734375, -0.601043701171875, -0.5511016845703125, -0.50115966796875, -0.4512176513671875, -0.401275634765625, -0.3513336181640625, -0.3013916015625, -0.2514495849609375, -0.201507568359375, -0.1515655517578125, -0.10162353515625, -0.0516815185546875, -0.001739501953125, 0.0482025146484375, 0.09814453125, 0.1480865478515625, 0.198028564453125, 0.2479705810546875, 0.29791259765625, 0.3478546142578125, 0.397796630859375, 0.4477386474609375, 0.4976806640625, 0.5476226806640625, 0.597564697265625, 0.6475067138671875, 0.69744873046875, 0.7473907470703125, 0.797332763671875, 0.8472747802734375, 0.897216796875, 0.9471588134765625, 0.997100830078125, 1.0470428466796875, 1.09698486328125, 1.1469268798828125, 1.196868896484375, 1.2468109130859375, 1.2967529296875, 1.3466949462890625, 1.396636962890625, 1.4465789794921875, 1.49652099609375, 1.5464630126953125, 1.596405029296875, 1.6463470458984375, 1.6962890625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 6.0, 13.0, 11.0, 14.0, 26.0, 77.0, 199.0, 317.0, 201.0, 68.0, 22.0, 11.0, 6.0, 6.0, 2.0, 6.0, 5.0, 2.0, 0.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.186279296875, -0.1799640655517578, -0.17364883422851562, -0.16733360290527344, -0.16101837158203125, -0.15470314025878906, -0.14838790893554688, -0.1420726776123047, -0.1357574462890625, -0.1294422149658203, -0.12312698364257812, -0.11681175231933594, -0.11049652099609375, -0.10418128967285156, -0.09786605834960938, -0.09155082702636719, -0.085235595703125, -0.07892036437988281, -0.07260513305664062, -0.06628990173339844, -0.05997467041015625, -0.05365943908691406, -0.047344207763671875, -0.04102897644042969, -0.0347137451171875, -0.028398513793945312, -0.022083282470703125, -0.015768051147460938, -0.00945281982421875, -0.0031375885009765625, 0.003177642822265625, 0.009492874145507812, 0.01580810546875, 0.022123336791992188, 0.028438568115234375, 0.03475379943847656, 0.04106903076171875, 0.04738426208496094, 0.053699493408203125, 0.06001472473144531, 0.0663299560546875, 0.07264518737792969, 0.07896041870117188, 0.08527565002441406, 0.09159088134765625, 0.09790611267089844, 0.10422134399414062, 0.11053657531738281, 0.116851806640625, 0.12316703796386719, 0.12948226928710938, 0.13579750061035156, 0.14211273193359375, 0.14842796325683594, 0.15474319458007812, 0.1610584259033203, 0.1673736572265625, 0.1736888885498047, 0.18000411987304688, 0.18631935119628906, 0.19263458251953125, 0.19894981384277344, 0.20526504516601562, 0.2115802764892578, 0.2178955078125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 6.0, 5.0, 10.0, 9.0, 21.0, 27.0, 27.0, 43.0, 79.0, 105.0, 220.0, 409.0, 910.0, 2454.0, 9221.0, 76196.0, 859168.0, 85317.0, 10073.0, 2422.0, 868.0, 420.0, 215.0, 114.0, 62.0, 45.0, 30.0, 22.0, 10.0, 16.0, 5.0, 5.0, 5.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.03125, -1.964691162109375, -1.89813232421875, -1.831573486328125, -1.7650146484375, -1.698455810546875, -1.63189697265625, -1.565338134765625, -1.498779296875, -1.432220458984375, -1.36566162109375, -1.299102783203125, -1.2325439453125, -1.165985107421875, -1.09942626953125, -1.032867431640625, -0.96630859375, -0.899749755859375, -0.83319091796875, -0.766632080078125, -0.7000732421875, -0.633514404296875, -0.56695556640625, -0.500396728515625, -0.433837890625, -0.367279052734375, -0.30072021484375, -0.234161376953125, -0.1676025390625, -0.101043701171875, -0.03448486328125, 0.032073974609375, 0.0986328125, 0.165191650390625, 0.23175048828125, 0.298309326171875, 0.3648681640625, 0.431427001953125, 0.49798583984375, 0.564544677734375, 0.631103515625, 0.697662353515625, 0.76422119140625, 0.830780029296875, 0.8973388671875, 0.963897705078125, 1.03045654296875, 1.097015380859375, 1.16357421875, 1.230133056640625, 1.29669189453125, 1.363250732421875, 1.4298095703125, 1.496368408203125, 1.56292724609375, 1.629486083984375, 1.696044921875, 1.762603759765625, 1.82916259765625, 1.895721435546875, 1.9622802734375, 2.028839111328125, 2.09539794921875, 2.161956787109375, 2.228515625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 6.0, 11.0, 4.0, 6.0, 14.0, 14.0, 14.0, 19.0, 26.0, 16.0, 31.0, 37.0, 34.0, 28.0, 34.0, 43.0, 33.0, 43.0, 35.0, 33.0, 43.0, 33.0, 47.0, 39.0, 36.0, 40.0, 51.0, 30.0, 26.0, 31.0, 19.0, 27.0, 19.0, 14.0, 17.0, 12.0, 7.0, 6.0, 5.0, 3.0, 4.0, 4.0, 1.0, 3.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.5263671875, -0.5092697143554688, -0.4921722412109375, -0.47507476806640625, -0.457977294921875, -0.44087982177734375, -0.4237823486328125, -0.40668487548828125, -0.38958740234375, -0.37248992919921875, -0.3553924560546875, -0.33829498291015625, -0.321197509765625, -0.30410003662109375, -0.2870025634765625, -0.26990509033203125, -0.2528076171875, -0.23571014404296875, -0.2186126708984375, -0.20151519775390625, -0.184417724609375, -0.16732025146484375, -0.1502227783203125, -0.13312530517578125, -0.11602783203125, -0.09893035888671875, -0.0818328857421875, -0.06473541259765625, -0.047637939453125, -0.03054046630859375, -0.0134429931640625, 0.00365447998046875, 0.020751953125, 0.03784942626953125, 0.0549468994140625, 0.07204437255859375, 0.089141845703125, 0.10623931884765625, 0.1233367919921875, 0.14043426513671875, 0.15753173828125, 0.17462921142578125, 0.1917266845703125, 0.20882415771484375, 0.225921630859375, 0.24301910400390625, 0.2601165771484375, 0.27721405029296875, 0.2943115234375, 0.31140899658203125, 0.3285064697265625, 0.34560394287109375, 0.362701416015625, 0.37979888916015625, 0.3968963623046875, 0.41399383544921875, 0.43109130859375, 0.44818878173828125, 0.4652862548828125, 0.48238372802734375, 0.499481201171875, 0.5165786743164062, 0.5336761474609375, 0.5507736206054688, 0.56787109375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 1.0, 4.0, 8.0, 1.0, 2.0, 1.0, 3.0, 6.0, 15.0, 11.0, 25.0, 30.0, 39.0, 66.0, 93.0, 152.0, 231.0, 423.0, 844.0, 2071.0, 8647.0, 696025.0, 328447.0, 7624.0, 1947.0, 803.0, 374.0, 224.0, 145.0, 93.0, 51.0, 45.0, 32.0, 26.0, 20.0, 9.0, 7.0, 5.0, 1.0, 5.0, 2.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.60546875, -2.505126953125, -2.40478515625, -2.304443359375, -2.2041015625, -2.103759765625, -2.00341796875, -1.903076171875, -1.802734375, -1.702392578125, -1.60205078125, -1.501708984375, -1.4013671875, -1.301025390625, -1.20068359375, -1.100341796875, -1.0, -0.899658203125, -0.79931640625, -0.698974609375, -0.5986328125, -0.498291015625, -0.39794921875, -0.297607421875, -0.197265625, -0.096923828125, 0.00341796875, 0.103759765625, 0.2041015625, 0.304443359375, 0.40478515625, 0.505126953125, 0.60546875, 0.705810546875, 0.80615234375, 0.906494140625, 1.0068359375, 1.107177734375, 1.20751953125, 1.307861328125, 1.408203125, 1.508544921875, 1.60888671875, 1.709228515625, 1.8095703125, 1.909912109375, 2.01025390625, 2.110595703125, 2.2109375, 2.311279296875, 2.41162109375, 2.511962890625, 2.6123046875, 2.712646484375, 2.81298828125, 2.913330078125, 3.013671875, 3.114013671875, 3.21435546875, 3.314697265625, 3.4150390625, 3.515380859375, 3.61572265625, 3.716064453125, 3.81640625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 5.0, 10.0, 10.0, 5.0, 5.0, 11.0, 13.0, 23.0, 32.0, 34.0, 53.0, 79.0, 149.0, 208.0, 119.0, 58.0, 46.0, 22.0, 27.0, 20.0, 14.0, 9.0, 6.0, 7.0, 6.0, 5.0, 6.0, 7.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000457763671875, -0.0004362165927886963, -0.0004146695137023926, -0.00039312243461608887, -0.00037157535552978516, -0.00035002827644348145, -0.00032848119735717773, -0.000306934118270874, -0.0002853870391845703, -0.0002638399600982666, -0.0002422928810119629, -0.00022074580192565918, -0.00019919872283935547, -0.00017765164375305176, -0.00015610456466674805, -0.00013455748558044434, -0.00011301040649414062, -9.146332740783691e-05, -6.99162483215332e-05, -4.836916923522949e-05, -2.682209014892578e-05, -5.27501106262207e-06, 1.627206802368164e-05, 3.781914710998535e-05, 5.936622619628906e-05, 8.091330528259277e-05, 0.00010246038436889648, 0.0001240074634552002, 0.0001455545425415039, 0.00016710162162780762, 0.00018864870071411133, 0.00021019577980041504, 0.00023174285888671875, 0.00025328993797302246, 0.00027483701705932617, 0.0002963840961456299, 0.0003179311752319336, 0.0003394782543182373, 0.000361025333404541, 0.0003825724124908447, 0.00040411949157714844, 0.00042566657066345215, 0.00044721364974975586, 0.00046876072883605957, 0.0004903078079223633, 0.000511854887008667, 0.0005334019660949707, 0.0005549490451812744, 0.0005764961242675781, 0.0005980432033538818, 0.0006195902824401855, 0.0006411373615264893, 0.000662684440612793, 0.0006842315196990967, 0.0007057785987854004, 0.0007273256778717041, 0.0007488727569580078, 0.0007704198360443115, 0.0007919669151306152, 0.0008135139942169189, 0.0008350610733032227, 0.0008566081523895264, 0.0008781552314758301, 0.0008997023105621338, 0.0009212493896484375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 7.0, 8.0, 10.0, 10.0, 19.0, 24.0, 38.0, 58.0, 65.0, 106.0, 174.0, 271.0, 491.0, 826.0, 1593.0, 3587.0, 10628.0, 52261.0, 911997.0, 49037.0, 10243.0, 3539.0, 1551.0, 776.0, 451.0, 256.0, 179.0, 106.0, 71.0, 49.0, 24.0, 30.0, 14.0, 15.0, 8.0, 9.0, 5.0, 2.0, 4.0, 2.0, 8.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.693359375, -2.607818603515625, -2.52227783203125, -2.436737060546875, -2.3511962890625, -2.265655517578125, -2.18011474609375, -2.094573974609375, -2.009033203125, -1.923492431640625, -1.83795166015625, -1.752410888671875, -1.6668701171875, -1.581329345703125, -1.49578857421875, -1.410247802734375, -1.32470703125, -1.239166259765625, -1.15362548828125, -1.068084716796875, -0.9825439453125, -0.897003173828125, -0.81146240234375, -0.725921630859375, -0.640380859375, -0.554840087890625, -0.46929931640625, -0.383758544921875, -0.2982177734375, -0.212677001953125, -0.12713623046875, -0.041595458984375, 0.0439453125, 0.129486083984375, 0.21502685546875, 0.300567626953125, 0.3861083984375, 0.471649169921875, 0.55718994140625, 0.642730712890625, 0.728271484375, 0.813812255859375, 0.89935302734375, 0.984893798828125, 1.0704345703125, 1.155975341796875, 1.24151611328125, 1.327056884765625, 1.41259765625, 1.498138427734375, 1.58367919921875, 1.669219970703125, 1.7547607421875, 1.840301513671875, 1.92584228515625, 2.011383056640625, 2.096923828125, 2.182464599609375, 2.26800537109375, 2.353546142578125, 2.4390869140625, 2.524627685546875, 2.61016845703125, 2.695709228515625, 2.78125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 1.0, 2.0, 4.0, 5.0, 7.0, 23.0, 21.0, 32.0, 77.0, 172.0, 302.0, 186.0, 88.0, 23.0, 16.0, 11.0, 9.0, 4.0, 7.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.078125, -2.0160980224609375, -1.954071044921875, -1.8920440673828125, -1.83001708984375, -1.7679901123046875, -1.705963134765625, -1.6439361572265625, -1.5819091796875, -1.5198822021484375, -1.457855224609375, -1.3958282470703125, -1.33380126953125, -1.2717742919921875, -1.209747314453125, -1.1477203369140625, -1.085693359375, -1.0236663818359375, -0.961639404296875, -0.8996124267578125, -0.83758544921875, -0.7755584716796875, -0.713531494140625, -0.6515045166015625, -0.5894775390625, -0.5274505615234375, -0.465423583984375, -0.4033966064453125, -0.34136962890625, -0.2793426513671875, -0.217315673828125, -0.1552886962890625, -0.09326171875, -0.0312347412109375, 0.030792236328125, 0.0928192138671875, 0.15484619140625, 0.2168731689453125, 0.278900146484375, 0.3409271240234375, 0.4029541015625, 0.4649810791015625, 0.527008056640625, 0.5890350341796875, 0.65106201171875, 0.7130889892578125, 0.775115966796875, 0.8371429443359375, 0.899169921875, 0.9611968994140625, 1.023223876953125, 1.0852508544921875, 1.14727783203125, 1.2093048095703125, 1.271331787109375, 1.3333587646484375, 1.3953857421875, 1.4574127197265625, 1.519439697265625, 1.5814666748046875, 1.64349365234375, 1.7055206298828125, 1.767547607421875, 1.8295745849609375, 1.8916015625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 19.0, 55.0, 141.0, 361.0, 205.0, 88.0, 56.0, 32.0, 9.0, 12.0, 7.0, 5.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.705343246459961, -12.226470947265625, -11.747598648071289, -11.268726348876953, -10.789855003356934, -10.310982704162598, -9.832110404968262, -9.353238105773926, -8.87436580657959, -8.395493507385254, -7.916621685028076, -7.43774938583374, -6.958877086639404, -6.480005264282227, -6.001132965087891, -5.522260665893555, -5.043388843536377, -4.564516544342041, -4.085644721984863, -3.6067724227905273, -3.1279001235961914, -2.6490280628204346, -2.1701560020446777, -1.6912837028503418, -1.212411642074585, -0.7335394620895386, -0.25466734170913696, 0.22420477867126465, 0.703076958656311, 1.1819491386413574, 1.6608211994171143, 2.13969349861145, 2.618565559387207, 3.097437620162964, 3.5763099193573, 4.055181980133057, 4.534054279327393, 5.01292610168457, 5.491798400878906, 5.970670700073242, 6.449542999267578, 6.928415298461914, 7.407287120819092, 7.886159420013428, 8.365031242370605, 8.843903541564941, 9.322775840759277, 9.801648139953613, 10.280519485473633, 10.759391784667969, 11.238264083862305, 11.71713638305664, 12.19600772857666, 12.674880027770996, 13.153752326965332, 13.632624626159668, 14.111496925354004, 14.59036922454834, 15.069241523742676, 15.548112869262695, 16.02698516845703, 16.505857467651367, 16.984729766845703, 17.46360206604004, 17.942474365234375]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 6.0, 4.0, 7.0, 3.0, 6.0, 13.0, 12.0, 13.0, 31.0, 32.0, 52.0, 85.0, 108.0, 102.0, 114.0, 105.0, 85.0, 76.0, 36.0, 39.0, 20.0, 15.0, 12.0, 9.0, 3.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0], "bins": [-14.027713775634766, -13.679011344909668, -13.330307960510254, -12.981605529785156, -12.632903099060059, -12.284200668334961, -11.935497283935547, -11.58679485321045, -11.238092422485352, -10.889389991760254, -10.54068660736084, -10.191984176635742, -9.843281745910645, -9.494579315185547, -9.145875930786133, -8.797173500061035, -8.448471069335938, -8.09976863861084, -7.751065731048584, -7.402362823486328, -7.0536603927612305, -6.704957485198975, -6.356254577636719, -6.007552146911621, -5.658848762512207, -5.310145854949951, -4.9614434242248535, -4.612740516662598, -4.2640380859375, -3.915335178375244, -3.5666325092315674, -3.2179298400878906, -2.869227409362793, -2.520524740219116, -2.1718220710754395, -1.8231192827224731, -1.4744166135787964, -1.1257139444351196, -0.7770111560821533, -0.42830848693847656, -0.0796058177947998, 0.26909688115119934, 0.6177995800971985, 0.96650230884552, 1.3152049779891968, 1.6639076471328735, 2.01261043548584, 2.3613131046295166, 2.7100157737731934, 3.05871844291687, 3.407421112060547, 3.7561240196228027, 4.1048264503479, 4.453529357910156, 4.802231788635254, 5.15093469619751, 5.499637603759766, 5.8483405113220215, 6.197042942047119, 6.545745849609375, 6.894448280334473, 7.2431511878967285, 7.591854095458984, 7.940556526184082, 8.28925895690918]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 8.0, 6.0, 15.0, 22.0, 62.0, 292.0, 153654.0, 4039112.0, 807.0, 180.0, 46.0, 30.0, 14.0, 11.0, 6.0, 7.0, 4.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.515625, -19.378662109375, -18.24169921875, -17.104736328125, -15.9677734375, -14.830810546875, -13.69384765625, -12.556884765625, -11.419921875, -10.282958984375, -9.14599609375, -8.009033203125, -6.8720703125, -5.735107421875, -4.59814453125, -3.461181640625, -2.32421875, -1.187255859375, -0.05029296875, 1.086669921875, 2.2236328125, 3.360595703125, 4.49755859375, 5.634521484375, 6.771484375, 7.908447265625, 9.04541015625, 10.182373046875, 11.3193359375, 12.456298828125, 13.59326171875, 14.730224609375, 15.8671875, 17.004150390625, 18.14111328125, 19.278076171875, 20.4150390625, 21.552001953125, 22.68896484375, 23.825927734375, 24.962890625, 26.099853515625, 27.23681640625, 28.373779296875, 29.5107421875, 30.647705078125, 31.78466796875, 32.921630859375, 34.05859375, 35.195556640625, 36.33251953125, 37.469482421875, 38.6064453125, 39.743408203125, 40.88037109375, 42.017333984375, 43.154296875, 44.291259765625, 45.42822265625, 46.565185546875, 47.7021484375, 48.839111328125, 49.97607421875, 51.113037109375, 52.25]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 3.0, 0.0, 7.0, 10.0, 4.0, 7.0, 5.0, 14.0, 11.0, 25.0, 34.0, 69.0, 100.0, 138.0, 181.0, 143.0, 84.0, 68.0, 32.0, 22.0, 9.0, 13.0, 4.0, 4.0, 3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16455078125, -0.15960121154785156, -0.15465164184570312, -0.1497020721435547, -0.14475250244140625, -0.1398029327392578, -0.13485336303710938, -0.12990379333496094, -0.1249542236328125, -0.12000465393066406, -0.11505508422851562, -0.11010551452636719, -0.10515594482421875, -0.10020637512207031, -0.09525680541992188, -0.09030723571777344, -0.085357666015625, -0.08040809631347656, -0.07545852661132812, -0.07050895690917969, -0.06555938720703125, -0.06060981750488281, -0.055660247802734375, -0.05071067810058594, -0.0457611083984375, -0.04081153869628906, -0.035861968994140625, -0.030912399291992188, -0.02596282958984375, -0.021013259887695312, -0.016063690185546875, -0.011114120483398438, -0.00616455078125, -0.0012149810791015625, 0.003734588623046875, 0.008684158325195312, 0.01363372802734375, 0.018583297729492188, 0.023532867431640625, 0.028482437133789062, 0.0334320068359375, 0.03838157653808594, 0.043331146240234375, 0.04828071594238281, 0.05323028564453125, 0.05817985534667969, 0.06312942504882812, 0.06807899475097656, 0.073028564453125, 0.07797813415527344, 0.08292770385742188, 0.08787727355957031, 0.09282684326171875, 0.09777641296386719, 0.10272598266601562, 0.10767555236816406, 0.1126251220703125, 0.11757469177246094, 0.12252426147460938, 0.1274738311767578, 0.13242340087890625, 0.1373729705810547, 0.14232254028320312, 0.14727210998535156, 0.1522216796875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 5.0, 9.0, 19.0, 27.0, 43.0, 54.0, 90.0, 127.0, 210.0, 405.0, 1498.0, 52023.0, 4131180.0, 7771.0, 619.0, 138.0, 44.0, 15.0, 6.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-14.546875, -14.26873779296875, -13.9906005859375, -13.71246337890625, -13.434326171875, -13.15618896484375, -12.8780517578125, -12.59991455078125, -12.32177734375, -12.04364013671875, -11.7655029296875, -11.48736572265625, -11.209228515625, -10.93109130859375, -10.6529541015625, -10.37481689453125, -10.0966796875, -9.81854248046875, -9.5404052734375, -9.26226806640625, -8.984130859375, -8.70599365234375, -8.4278564453125, -8.14971923828125, -7.87158203125, -7.59344482421875, -7.3153076171875, -7.03717041015625, -6.759033203125, -6.48089599609375, -6.2027587890625, -5.92462158203125, -5.646484375, -5.36834716796875, -5.0902099609375, -4.81207275390625, -4.533935546875, -4.25579833984375, -3.9776611328125, -3.69952392578125, -3.42138671875, -3.14324951171875, -2.8651123046875, -2.58697509765625, -2.308837890625, -2.03070068359375, -1.7525634765625, -1.47442626953125, -1.1962890625, -0.91815185546875, -0.6400146484375, -0.36187744140625, -0.083740234375, 0.19439697265625, 0.4725341796875, 0.75067138671875, 1.02880859375, 1.30694580078125, 1.5850830078125, 1.86322021484375, 2.141357421875, 2.41949462890625, 2.6976318359375, 2.97576904296875, 3.25390625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 6.0, 6.0, 5.0, 9.0, 12.0, 19.0, 25.0, 42.0, 69.0, 114.0, 269.0, 586.0, 1502.0, 896.0, 227.0, 89.0, 48.0, 31.0, 27.0, 15.0, 20.0, 17.0, 14.0, 5.0, 5.0, 4.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.25, -0.24102783203125, -0.2320556640625, -0.22308349609375, -0.214111328125, -0.20513916015625, -0.1961669921875, -0.18719482421875, -0.17822265625, -0.16925048828125, -0.1602783203125, -0.15130615234375, -0.142333984375, -0.13336181640625, -0.1243896484375, -0.11541748046875, -0.1064453125, -0.09747314453125, -0.0885009765625, -0.07952880859375, -0.070556640625, -0.06158447265625, -0.0526123046875, -0.04364013671875, -0.03466796875, -0.02569580078125, -0.0167236328125, -0.00775146484375, 0.001220703125, 0.01019287109375, 0.0191650390625, 0.02813720703125, 0.037109375, 0.04608154296875, 0.0550537109375, 0.06402587890625, 0.072998046875, 0.08197021484375, 0.0909423828125, 0.09991455078125, 0.10888671875, 0.11785888671875, 0.1268310546875, 0.13580322265625, 0.144775390625, 0.15374755859375, 0.1627197265625, 0.17169189453125, 0.1806640625, 0.18963623046875, 0.1986083984375, 0.20758056640625, 0.216552734375, 0.22552490234375, 0.2344970703125, 0.24346923828125, 0.25244140625, 0.26141357421875, 0.2703857421875, 0.27935791015625, 0.288330078125, 0.29730224609375, 0.3062744140625, 0.31524658203125, 0.32421875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 12.0, 64.0, 911.0, 26.0, 5.0], "bins": [-70.32695770263672, -69.18630981445312, -68.045654296875, -66.9050064086914, -65.76435852050781, -64.62370300292969, -63.483055114746094, -62.342403411865234, -61.201751708984375, -60.061100006103516, -58.92045211791992, -57.77980041503906, -56.6391487121582, -55.498497009277344, -54.35784912109375, -53.21719741821289, -52.07654571533203, -50.93589401245117, -49.79524612426758, -48.65459442138672, -47.51394271850586, -46.373291015625, -45.232643127441406, -44.09199142456055, -42.95134353637695, -41.810691833496094, -40.6700439453125, -39.52939224243164, -38.38874053955078, -37.24808883666992, -36.10744094848633, -34.96678924560547, -33.826133728027344, -32.685482025146484, -31.544832229614258, -30.40418243408203, -29.263530731201172, -28.122880935668945, -26.98223114013672, -25.84157943725586, -24.700929641723633, -23.560279846191406, -22.419628143310547, -21.27897834777832, -20.13832664489746, -18.997676849365234, -17.857025146484375, -16.71637535095215, -15.575724601745605, -14.435073852539062, -13.29442310333252, -12.153772354125977, -11.01312255859375, -9.87247085571289, -8.731821060180664, -7.591170310974121, -6.450519561767578, -5.309868812561035, -4.169218063354492, -3.0285677909851074, -1.8879170417785645, -0.7472662925720215, 0.3933839797973633, 1.5340347290039062, 2.67468523979187]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 6.0, 6.0, 9.0, 7.0, 24.0, 39.0, 54.0, 83.0, 87.0, 127.0, 128.0, 116.0, 109.0, 74.0, 56.0, 30.0, 20.0, 14.0, 14.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-7.321140289306641, -7.164836883544922, -7.008533477783203, -6.852229595184326, -6.695926189422607, -6.539622783660889, -6.383318901062012, -6.227015495300293, -6.070712089538574, -5.9144086837768555, -5.758105278015137, -5.60180139541626, -5.445497989654541, -5.289194583892822, -5.132890701293945, -4.976587295532227, -4.820283889770508, -4.663980484008789, -4.50767707824707, -4.351373195648193, -4.195069789886475, -4.038766384124756, -3.882462739944458, -3.72615909576416, -3.5698556900024414, -3.4135522842407227, -3.257248640060425, -3.100944995880127, -2.944641590118408, -2.7883381843566895, -2.6320345401763916, -2.4757308959960938, -2.319427490234375, -2.1631240844726562, -2.0068204402923584, -1.85051691532135, -1.6942133903503418, -1.5379098653793335, -1.3816063404083252, -1.225302815437317, -1.0689992904663086, -0.9126957654953003, -0.756392240524292, -0.6000887155532837, -0.4437851905822754, -0.2874816656112671, -0.1311781406402588, 0.02512538433074951, 0.1814289093017578, 0.3377324342727661, 0.4940359592437744, 0.6503394842147827, 0.806643009185791, 0.9629465341567993, 1.1192500591278076, 1.275553584098816, 1.4318571090698242, 1.5881606340408325, 1.7444641590118408, 1.9007676839828491, 2.0570712089538574, 2.213374614715576, 2.369678258895874, 2.525981903076172, 2.6822853088378906]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 3.0, 4.0, 8.0, 9.0, 23.0, 11.0, 24.0, 21.0, 30.0, 38.0, 54.0, 83.0, 180.0, 600.0, 3403.0, 34635.0, 878186.0, 122119.0, 7463.0, 1051.0, 243.0, 96.0, 58.0, 36.0, 37.0, 34.0, 23.0, 21.0, 18.0, 8.0, 9.0, 3.0, 7.0, 7.0, 2.0, 1.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.375, -3.2777099609375, -3.180419921875, -3.0831298828125, -2.98583984375, -2.8885498046875, -2.791259765625, -2.6939697265625, -2.5966796875, -2.4993896484375, -2.402099609375, -2.3048095703125, -2.20751953125, -2.1102294921875, -2.012939453125, -1.9156494140625, -1.818359375, -1.7210693359375, -1.623779296875, -1.5264892578125, -1.42919921875, -1.3319091796875, -1.234619140625, -1.1373291015625, -1.0400390625, -0.9427490234375, -0.845458984375, -0.7481689453125, -0.65087890625, -0.5535888671875, -0.456298828125, -0.3590087890625, -0.26171875, -0.1644287109375, -0.067138671875, 0.0301513671875, 0.12744140625, 0.2247314453125, 0.322021484375, 0.4193115234375, 0.5166015625, 0.6138916015625, 0.711181640625, 0.8084716796875, 0.90576171875, 1.0030517578125, 1.100341796875, 1.1976318359375, 1.294921875, 1.3922119140625, 1.489501953125, 1.5867919921875, 1.68408203125, 1.7813720703125, 1.878662109375, 1.9759521484375, 2.0732421875, 2.1705322265625, 2.267822265625, 2.3651123046875, 2.46240234375, 2.5596923828125, 2.656982421875, 2.7542724609375, 2.8515625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 7.0, 8.0, 6.0, 12.0, 40.0, 73.0, 122.0, 198.0, 233.0, 170.0, 74.0, 32.0, 23.0, 3.0, 7.0, 5.0, 3.0, 1.0, 2.0], "bins": [-0.451416015625, -0.4429044723510742, -0.43439292907714844, -0.42588138580322266, -0.4173698425292969, -0.4088582992553711, -0.4003467559814453, -0.39183521270751953, -0.38332366943359375, -0.37481212615966797, -0.3663005828857422, -0.3577890396118164, -0.3492774963378906, -0.34076595306396484, -0.33225440979003906, -0.3237428665161133, -0.3152313232421875, -0.3067197799682617, -0.29820823669433594, -0.28969669342041016, -0.2811851501464844, -0.2726736068725586, -0.2641620635986328, -0.25565052032470703, -0.24713897705078125, -0.23862743377685547, -0.2301158905029297, -0.2216043472290039, -0.21309280395507812, -0.20458126068115234, -0.19606971740722656, -0.18755817413330078, -0.179046630859375, -0.17053508758544922, -0.16202354431152344, -0.15351200103759766, -0.14500045776367188, -0.1364889144897461, -0.1279773712158203, -0.11946582794189453, -0.11095428466796875, -0.10244274139404297, -0.09393119812011719, -0.0854196548461914, -0.07690811157226562, -0.06839656829833984, -0.05988502502441406, -0.05137348175048828, -0.0428619384765625, -0.03435039520263672, -0.025838851928710938, -0.017327308654785156, -0.008815765380859375, -0.00030422210693359375, 0.008207321166992188, 0.01671886444091797, 0.02523040771484375, 0.03374195098876953, 0.04225349426269531, 0.050765037536621094, 0.059276580810546875, 0.06778812408447266, 0.07629966735839844, 0.08481121063232422, 0.09332275390625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 7.0, 5.0, 7.0, 6.0, 11.0, 15.0, 31.0, 35.0, 67.0, 112.0, 250.0, 580.0, 1564.0, 5066.0, 18994.0, 91692.0, 594034.0, 278195.0, 42973.0, 10093.0, 2979.0, 1044.0, 420.0, 168.0, 95.0, 41.0, 19.0, 18.0, 11.0, 6.0, 7.0, 5.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2529296875, -1.2108612060546875, -1.168792724609375, -1.1267242431640625, -1.08465576171875, -1.0425872802734375, -1.000518798828125, -0.9584503173828125, -0.9163818359375, -0.8743133544921875, -0.832244873046875, -0.7901763916015625, -0.74810791015625, -0.7060394287109375, -0.663970947265625, -0.6219024658203125, -0.579833984375, -0.5377655029296875, -0.495697021484375, -0.4536285400390625, -0.41156005859375, -0.3694915771484375, -0.327423095703125, -0.2853546142578125, -0.2432861328125, -0.2012176513671875, -0.159149169921875, -0.1170806884765625, -0.07501220703125, -0.0329437255859375, 0.009124755859375, 0.0511932373046875, 0.09326171875, 0.1353302001953125, 0.177398681640625, 0.2194671630859375, 0.26153564453125, 0.3036041259765625, 0.345672607421875, 0.3877410888671875, 0.4298095703125, 0.4718780517578125, 0.513946533203125, 0.5560150146484375, 0.59808349609375, 0.6401519775390625, 0.682220458984375, 0.7242889404296875, 0.766357421875, 0.8084259033203125, 0.850494384765625, 0.8925628662109375, 0.93463134765625, 0.9766998291015625, 1.018768310546875, 1.0608367919921875, 1.1029052734375, 1.1449737548828125, 1.187042236328125, 1.2291107177734375, 1.27117919921875, 1.3132476806640625, 1.355316162109375, 1.3973846435546875, 1.439453125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 2.0, 0.0, 3.0, 4.0, 5.0, 8.0, 2.0, 9.0, 6.0, 7.0, 13.0, 18.0, 12.0, 20.0, 25.0, 28.0, 21.0, 22.0, 30.0, 23.0, 29.0, 39.0, 41.0, 40.0, 40.0, 38.0, 40.0, 44.0, 35.0, 39.0, 42.0, 40.0, 26.0, 35.0, 33.0, 21.0, 28.0, 26.0, 17.0, 17.0, 22.0, 10.0, 11.0, 6.0, 11.0, 8.0, 4.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.385986328125, -0.3734169006347656, -0.36084747314453125, -0.3482780456542969, -0.3357086181640625, -0.3231391906738281, -0.31056976318359375, -0.2980003356933594, -0.285430908203125, -0.2728614807128906, -0.26029205322265625, -0.24772262573242188, -0.2351531982421875, -0.22258377075195312, -0.21001434326171875, -0.19744491577148438, -0.18487548828125, -0.17230606079101562, -0.15973663330078125, -0.14716720581054688, -0.1345977783203125, -0.12202835083007812, -0.10945892333984375, -0.09688949584960938, -0.084320068359375, -0.07175064086914062, -0.05918121337890625, -0.046611785888671875, -0.0340423583984375, -0.021472930908203125, -0.00890350341796875, 0.003665924072265625, 0.0162353515625, 0.028804779052734375, 0.04137420654296875, 0.053943634033203125, 0.0665130615234375, 0.07908248901367188, 0.09165191650390625, 0.10422134399414062, 0.116790771484375, 0.12936019897460938, 0.14192962646484375, 0.15449905395507812, 0.1670684814453125, 0.17963790893554688, 0.19220733642578125, 0.20477676391601562, 0.21734619140625, 0.22991561889648438, 0.24248504638671875, 0.2550544738769531, 0.2676239013671875, 0.2801933288574219, 0.29276275634765625, 0.3053321838378906, 0.317901611328125, 0.3304710388183594, 0.34304046630859375, 0.3556098937988281, 0.3681793212890625, 0.3807487487792969, 0.39331817626953125, 0.4058876037597656, 0.41845703125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 3.0, 3.0, 8.0, 6.0, 4.0, 10.0, 12.0, 22.0, 23.0, 24.0, 62.0, 91.0, 166.0, 288.0, 529.0, 1107.0, 2810.0, 10186.0, 125511.0, 879993.0, 20091.0, 4253.0, 1622.0, 703.0, 394.0, 239.0, 128.0, 82.0, 58.0, 38.0, 25.0, 13.0, 16.0, 12.0, 2.0, 5.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.5, -6.33416748046875, -6.1683349609375, -6.00250244140625, -5.836669921875, -5.67083740234375, -5.5050048828125, -5.33917236328125, -5.17333984375, -5.00750732421875, -4.8416748046875, -4.67584228515625, -4.510009765625, -4.34417724609375, -4.1783447265625, -4.01251220703125, -3.8466796875, -3.68084716796875, -3.5150146484375, -3.34918212890625, -3.183349609375, -3.01751708984375, -2.8516845703125, -2.68585205078125, -2.52001953125, -2.35418701171875, -2.1883544921875, -2.02252197265625, -1.856689453125, -1.69085693359375, -1.5250244140625, -1.35919189453125, -1.193359375, -1.02752685546875, -0.8616943359375, -0.69586181640625, -0.530029296875, -0.36419677734375, -0.1983642578125, -0.03253173828125, 0.13330078125, 0.29913330078125, 0.4649658203125, 0.63079833984375, 0.796630859375, 0.96246337890625, 1.1282958984375, 1.29412841796875, 1.4599609375, 1.62579345703125, 1.7916259765625, 1.95745849609375, 2.123291015625, 2.28912353515625, 2.4549560546875, 2.62078857421875, 2.78662109375, 2.95245361328125, 3.1182861328125, 3.28411865234375, 3.449951171875, 3.61578369140625, 3.7816162109375, 3.94744873046875, 4.11328125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 3.0, 2.0, 0.0, 4.0, 5.0, 6.0, 5.0, 12.0, 12.0, 31.0, 37.0, 65.0, 86.0, 166.0, 223.0, 133.0, 62.0, 36.0, 28.0, 24.0, 9.0, 12.0, 10.0, 4.0, 11.0, 4.0, 5.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006322860717773438, -0.0006138309836387634, -0.0005953758955001831, -0.0005769208073616028, -0.0005584657192230225, -0.0005400106310844421, -0.0005215555429458618, -0.0005031004548072815, -0.00048464536666870117, -0.00046619027853012085, -0.00044773519039154053, -0.0004292801022529602, -0.0004108250141143799, -0.00039236992597579956, -0.00037391483783721924, -0.0003554597496986389, -0.0003370046615600586, -0.00031854957342147827, -0.00030009448528289795, -0.0002816393971443176, -0.0002631843090057373, -0.000244729220867157, -0.00022627413272857666, -0.00020781904458999634, -0.00018936395645141602, -0.0001709088683128357, -0.00015245378017425537, -0.00013399869203567505, -0.00011554360389709473, -9.70885157585144e-05, -7.863342761993408e-05, -6.017833948135376e-05, -4.172325134277344e-05, -2.3268163204193115e-05, -4.813075065612793e-06, 1.364201307296753e-05, 3.209710121154785e-05, 5.0552189350128174e-05, 6.90072774887085e-05, 8.746236562728882e-05, 0.00010591745376586914, 0.00012437254190444946, 0.00014282763004302979, 0.0001612827181816101, 0.00017973780632019043, 0.00019819289445877075, 0.00021664798259735107, 0.0002351030707359314, 0.0002535581588745117, 0.00027201324701309204, 0.00029046833515167236, 0.0003089234232902527, 0.000327378511428833, 0.00034583359956741333, 0.00036428868770599365, 0.000382743775844574, 0.0004011988639831543, 0.0004196539521217346, 0.00043810904026031494, 0.00045656412839889526, 0.0004750192165374756, 0.0004934743046760559, 0.0005119293928146362, 0.0005303844809532166, 0.0005488395690917969]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 6.0, 2.0, 8.0, 8.0, 15.0, 16.0, 27.0, 49.0, 85.0, 176.0, 337.0, 822.0, 2122.0, 6915.0, 33008.0, 810810.0, 170826.0, 16253.0, 4365.0, 1460.0, 615.0, 269.0, 114.0, 86.0, 51.0, 46.0, 21.0, 12.0, 8.0, 4.0, 6.0, 2.0, 7.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.267578125, -3.135772705078125, -3.00396728515625, -2.872161865234375, -2.7403564453125, -2.608551025390625, -2.47674560546875, -2.344940185546875, -2.213134765625, -2.081329345703125, -1.94952392578125, -1.817718505859375, -1.6859130859375, -1.554107666015625, -1.42230224609375, -1.290496826171875, -1.15869140625, -1.026885986328125, -0.89508056640625, -0.763275146484375, -0.6314697265625, -0.499664306640625, -0.36785888671875, -0.236053466796875, -0.104248046875, 0.027557373046875, 0.15936279296875, 0.291168212890625, 0.4229736328125, 0.554779052734375, 0.68658447265625, 0.818389892578125, 0.9501953125, 1.082000732421875, 1.21380615234375, 1.345611572265625, 1.4774169921875, 1.609222412109375, 1.74102783203125, 1.872833251953125, 2.004638671875, 2.136444091796875, 2.26824951171875, 2.400054931640625, 2.5318603515625, 2.663665771484375, 2.79547119140625, 2.927276611328125, 3.05908203125, 3.190887451171875, 3.32269287109375, 3.454498291015625, 3.5863037109375, 3.718109130859375, 3.84991455078125, 3.981719970703125, 4.113525390625, 4.245330810546875, 4.37713623046875, 4.508941650390625, 4.6407470703125, 4.772552490234375, 4.90435791015625, 5.036163330078125, 5.16796875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 6.0, 6.0, 2.0, 10.0, 14.0, 23.0, 30.0, 47.0, 83.0, 168.0, 226.0, 152.0, 87.0, 48.0, 34.0, 23.0, 16.0, 11.0, 8.0, 3.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5732421875, -1.5060272216796875, -1.438812255859375, -1.3715972900390625, -1.30438232421875, -1.2371673583984375, -1.169952392578125, -1.1027374267578125, -1.0355224609375, -0.9683074951171875, -0.901092529296875, -0.8338775634765625, -0.76666259765625, -0.6994476318359375, -0.632232666015625, -0.5650177001953125, -0.497802734375, -0.4305877685546875, -0.363372802734375, -0.2961578369140625, -0.22894287109375, -0.1617279052734375, -0.094512939453125, -0.0272979736328125, 0.0399169921875, 0.1071319580078125, 0.174346923828125, 0.2415618896484375, 0.30877685546875, 0.3759918212890625, 0.443206787109375, 0.5104217529296875, 0.57763671875, 0.6448516845703125, 0.712066650390625, 0.7792816162109375, 0.84649658203125, 0.9137115478515625, 0.980926513671875, 1.0481414794921875, 1.1153564453125, 1.1825714111328125, 1.249786376953125, 1.3170013427734375, 1.38421630859375, 1.4514312744140625, 1.518646240234375, 1.5858612060546875, 1.653076171875, 1.7202911376953125, 1.787506103515625, 1.8547210693359375, 1.92193603515625, 1.9891510009765625, 2.056365966796875, 2.1235809326171875, 2.1907958984375, 2.2580108642578125, 2.325225830078125, 2.3924407958984375, 2.45965576171875, 2.5268707275390625, 2.594085693359375, 2.6613006591796875, 2.728515625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 8.0, 11.0, 29.0, 64.0, 133.0, 261.0, 227.0, 131.0, 57.0, 36.0, 19.0, 15.0, 5.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.015359878540039, -7.662660598754883, -7.309961318969727, -6.95726203918457, -6.604562759399414, -6.251863479614258, -5.899164199829102, -5.546464920043945, -5.193765640258789, -4.841066360473633, -4.488367080688477, -4.13566780090332, -3.782968521118164, -3.430269241333008, -3.0775701999664307, -2.7248709201812744, -2.3721718788146973, -2.019472599029541, -1.6667733192443848, -1.314074158668518, -0.9613748788833618, -0.6086755990982056, -0.25597643852233887, 0.09672284126281738, 0.44942212104797363, 0.8021214008331299, 1.1548206806182861, 1.5075198411941528, 1.860219120979309, 2.212918281555176, 2.565617561340332, 2.9183168411254883, 3.2710161209106445, 3.623715400695801, 3.976414680480957, 4.329113960266113, 4.6818132400512695, 5.034512519836426, 5.387211799621582, 5.739911079406738, 6.0926103591918945, 6.445309638977051, 6.798008918762207, 7.150708198547363, 7.5034074783325195, 7.856106758117676, 8.208806037902832, 8.561505317687988, 8.914203643798828, 9.266902923583984, 9.61960220336914, 9.972301483154297, 10.325000762939453, 10.67770004272461, 11.030399322509766, 11.383098602294922, 11.735797882080078, 12.088497161865234, 12.44119644165039, 12.793895721435547, 13.146595001220703, 13.49929428100586, 13.851993560791016, 14.204692840576172, 14.557392120361328]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 12.0, 9.0, 14.0, 22.0, 27.0, 39.0, 52.0, 65.0, 91.0, 106.0, 109.0, 108.0, 94.0, 78.0, 51.0, 47.0, 26.0, 18.0, 22.0, 6.0, 4.0, 5.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.437831878662109, -4.1784749031066895, -3.9191179275512695, -3.6597609519958496, -3.4004039764404297, -3.1410470008850098, -2.88169002532959, -2.62233304977417, -2.36297607421875, -2.10361909866333, -1.8442621231079102, -1.5849051475524902, -1.3255481719970703, -1.0661911964416504, -0.8068342208862305, -0.5474772453308105, -0.2881202697753906, -0.028763294219970703, 0.23059368133544922, 0.48995065689086914, 0.7493076324462891, 1.008664608001709, 1.268021583557129, 1.5273785591125488, 1.7867355346679688, 2.0460925102233887, 2.3054494857788086, 2.5648064613342285, 2.8241634368896484, 3.0835204124450684, 3.3428773880004883, 3.602234363555908, 3.8615903854370117, 4.120947360992432, 4.380304336547852, 4.6396613121032715, 4.899018287658691, 5.158375263214111, 5.417732238769531, 5.677089214324951, 5.936446189880371, 6.195803165435791, 6.455160140991211, 6.714517116546631, 6.973874092102051, 7.233231067657471, 7.492588043212891, 7.7519450187683105, 8.01130199432373, 8.270658493041992, 8.53001594543457, 8.789373397827148, 9.04872989654541, 9.308086395263672, 9.56744384765625, 9.826801300048828, 10.08615779876709, 10.345514297485352, 10.60487174987793, 10.864229202270508, 11.12358570098877, 11.382942199707031, 11.64229965209961, 11.901657104492188, 12.16101360321045]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 8.0, 5.0, 7.0, 7.0, 16.0, 9.0, 9.0, 20.0, 9.0, 42.0, 74.0, 349.0, 4069.0, 4100126.0, 87727.0, 1425.0, 191.0, 47.0, 20.0, 20.0, 12.0, 20.0, 9.0, 13.0, 6.0, 2.0, 7.0, 8.0, 6.0, 3.0, 8.0, 4.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.0546875, -13.6265869140625, -13.198486328125, -12.7703857421875, -12.34228515625, -11.9141845703125, -11.486083984375, -11.0579833984375, -10.6298828125, -10.2017822265625, -9.773681640625, -9.3455810546875, -8.91748046875, -8.4893798828125, -8.061279296875, -7.6331787109375, -7.205078125, -6.7769775390625, -6.348876953125, -5.9207763671875, -5.49267578125, -5.0645751953125, -4.636474609375, -4.2083740234375, -3.7802734375, -3.3521728515625, -2.924072265625, -2.4959716796875, -2.06787109375, -1.6397705078125, -1.211669921875, -0.7835693359375, -0.35546875, 0.0726318359375, 0.500732421875, 0.9288330078125, 1.35693359375, 1.7850341796875, 2.213134765625, 2.6412353515625, 3.0693359375, 3.4974365234375, 3.925537109375, 4.3536376953125, 4.78173828125, 5.2098388671875, 5.637939453125, 6.0660400390625, 6.494140625, 6.9222412109375, 7.350341796875, 7.7784423828125, 8.20654296875, 8.6346435546875, 9.062744140625, 9.4908447265625, 9.9189453125, 10.3470458984375, 10.775146484375, 11.2032470703125, 11.63134765625, 12.0594482421875, 12.487548828125, 12.9156494140625, 13.34375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 4.0, 3.0, 4.0, 3.0, 10.0, 4.0, 6.0, 10.0, 9.0, 19.0, 19.0, 21.0, 17.0, 23.0, 32.0, 31.0, 41.0, 47.0, 50.0, 52.0, 57.0, 52.0, 56.0, 54.0, 43.0, 52.0, 37.0, 40.0, 30.0, 35.0, 26.0, 24.0, 22.0, 13.0, 10.0, 8.0, 7.0, 3.0, 4.0, 2.0, 4.0, 2.0, 5.0, 0.0, 5.0, 1.0, 1.0, 4.0, 2.0, 3.0, 1.0, 1.0], "bins": [-0.0797119140625, -0.07734107971191406, -0.07497024536132812, -0.07259941101074219, -0.07022857666015625, -0.06785774230957031, -0.06548690795898438, -0.06311607360839844, -0.0607452392578125, -0.05837440490722656, -0.056003570556640625, -0.05363273620605469, -0.05126190185546875, -0.04889106750488281, -0.046520233154296875, -0.04414939880371094, -0.041778564453125, -0.03940773010253906, -0.037036895751953125, -0.03466606140136719, -0.03229522705078125, -0.029924392700195312, -0.027553558349609375, -0.025182723999023438, -0.0228118896484375, -0.020441055297851562, -0.018070220947265625, -0.015699386596679688, -0.01332855224609375, -0.010957717895507812, -0.008586883544921875, -0.0062160491943359375, -0.00384521484375, -0.0014743804931640625, 0.000896453857421875, 0.0032672882080078125, 0.00563812255859375, 0.008008956909179688, 0.010379791259765625, 0.012750625610351562, 0.0151214599609375, 0.017492294311523438, 0.019863128662109375, 0.022233963012695312, 0.02460479736328125, 0.026975631713867188, 0.029346466064453125, 0.03171730041503906, 0.034088134765625, 0.03645896911621094, 0.038829803466796875, 0.04120063781738281, 0.04357147216796875, 0.04594230651855469, 0.048313140869140625, 0.05068397521972656, 0.0530548095703125, 0.05542564392089844, 0.057796478271484375, 0.06016731262207031, 0.06253814697265625, 0.06490898132324219, 0.06727981567382812, 0.06965065002441406, 0.072021484375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 6.0, 14.0, 32.0, 46.0, 170.0, 25568.0, 4167964.0, 364.0, 85.0, 31.0, 12.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.28125, -7.4658203125, -6.650390625, -5.8349609375, -5.01953125, -4.2041015625, -3.388671875, -2.5732421875, -1.7578125, -0.9423828125, -0.126953125, 0.6884765625, 1.50390625, 2.3193359375, 3.134765625, 3.9501953125, 4.765625, 5.5810546875, 6.396484375, 7.2119140625, 8.02734375, 8.8427734375, 9.658203125, 10.4736328125, 11.2890625, 12.1044921875, 12.919921875, 13.7353515625, 14.55078125, 15.3662109375, 16.181640625, 16.9970703125, 17.8125, 18.6279296875, 19.443359375, 20.2587890625, 21.07421875, 21.8896484375, 22.705078125, 23.5205078125, 24.3359375, 25.1513671875, 25.966796875, 26.7822265625, 27.59765625, 28.4130859375, 29.228515625, 30.0439453125, 30.859375, 31.6748046875, 32.490234375, 33.3056640625, 34.12109375, 34.9365234375, 35.751953125, 36.5673828125, 37.3828125, 38.1982421875, 39.013671875, 39.8291015625, 40.64453125, 41.4599609375, 42.275390625, 43.0908203125, 43.90625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 7.0, 2.0, 10.0, 21.0, 20.0, 16.0, 44.0, 47.0, 90.0, 190.0, 411.0, 1420.0, 1048.0, 313.0, 143.0, 95.0, 56.0, 37.0, 32.0, 20.0, 13.0, 11.0, 9.0, 4.0, 7.0, 6.0, 5.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.255126953125, -0.24488449096679688, -0.23464202880859375, -0.22439956665039062, -0.2141571044921875, -0.20391464233398438, -0.19367218017578125, -0.18342971801757812, -0.173187255859375, -0.16294479370117188, -0.15270233154296875, -0.14245986938476562, -0.1322174072265625, -0.12197494506835938, -0.11173248291015625, -0.10149002075195312, -0.09124755859375, -0.08100509643554688, -0.07076263427734375, -0.060520172119140625, -0.0502777099609375, -0.040035247802734375, -0.02979278564453125, -0.019550323486328125, -0.009307861328125, 0.000934600830078125, 0.01117706298828125, 0.021419525146484375, 0.0316619873046875, 0.041904449462890625, 0.05214691162109375, 0.062389373779296875, 0.0726318359375, 0.08287429809570312, 0.09311676025390625, 0.10335922241210938, 0.1136016845703125, 0.12384414672851562, 0.13408660888671875, 0.14432907104492188, 0.154571533203125, 0.16481399536132812, 0.17505645751953125, 0.18529891967773438, 0.1955413818359375, 0.20578384399414062, 0.21602630615234375, 0.22626876831054688, 0.23651123046875, 0.24675369262695312, 0.25699615478515625, 0.2672386169433594, 0.2774810791015625, 0.2877235412597656, 0.29796600341796875, 0.3082084655761719, 0.318450927734375, 0.3286933898925781, 0.33893585205078125, 0.3491783142089844, 0.3594207763671875, 0.3696632385253906, 0.37990570068359375, 0.3901481628417969, 0.400390625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 5.0, 862.0, 154.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9658284187316895, -3.255408525466919, -1.5449886322021484, 0.16543149948120117, 1.8758511543273926, 3.586270809173584, 5.296691417694092, 7.007111072540283, 8.717531204223633, 10.427950859069824, 12.138370513916016, 13.848791122436523, 15.559210777282715, 17.269630432128906, 18.980051040649414, 20.690471649169922, 22.400890350341797, 24.111310958862305, 25.82172966003418, 27.532150268554688, 29.242568969726562, 30.95298957824707, 32.66341018676758, 34.37382888793945, 36.08424758911133, 37.7946662902832, 39.505088806152344, 41.21550750732422, 42.925926208496094, 44.63634490966797, 46.34676742553711, 48.057186126708984, 49.767608642578125, 51.47802734375, 53.18844985961914, 54.898868560791016, 56.60928726196289, 58.31970977783203, 60.030128479003906, 61.74054718017578, 63.450965881347656, 65.16138458251953, 66.8718032836914, 68.58222961425781, 70.29264831542969, 72.00306701660156, 73.71348571777344, 75.42390441894531, 77.13432312011719, 78.84474182128906, 80.55516052246094, 82.26557922363281, 83.97600555419922, 85.6864242553711, 87.39684295654297, 89.10726165771484, 90.81768798828125, 92.52810668945312, 94.238525390625, 95.94894409179688, 97.65937042236328, 99.36978912353516, 101.08020782470703, 102.7906265258789, 104.50104522705078]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 15.0, 29.0, 68.0, 117.0, 162.0, 184.0, 209.0, 111.0, 60.0, 33.0, 19.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3870370388031006, -2.258721113204956, -2.1304049491882324, -2.002089023590088, -1.8737730979919434, -1.7454570531845093, -1.6171410083770752, -1.4888250827789307, -1.3605090379714966, -1.2321929931640625, -1.103877067565918, -0.9755610227584839, -0.8472450375556946, -0.7189290523529053, -0.5906130075454712, -0.4622970223426819, -0.3339810371398926, -0.20566503703594208, -0.07734903693199158, 0.05096697807312012, 0.17928296327590942, 0.30759894847869873, 0.4359149932861328, 0.5642309784889221, 0.6925469636917114, 0.8208629488945007, 0.94917893409729, 1.0774949789047241, 1.2058110237121582, 1.3341269493103027, 1.4624429941177368, 1.590759038925171, 1.7190752029418945, 1.8473912477493286, 1.9757071733474731, 2.1040232181549072, 2.2323391437530518, 2.3606553077697754, 2.48897123336792, 2.6172871589660645, 2.745603084564209, 2.8739190101623535, 3.002235174179077, 3.1305510997772217, 3.258867025375366, 3.38718318939209, 3.5154991149902344, 3.643815040588379, 3.7721312046051025, 3.900447130203247, 4.028763294219971, 4.157079219818115, 4.28539514541626, 4.413711071014404, 4.542027473449707, 4.670343399047852, 4.798659324645996, 4.926975250244141, 5.055291175842285, 5.18360710144043, 5.311923503875732, 5.440239429473877, 5.5685553550720215, 5.696871280670166, 5.8251872062683105]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 7.0, 6.0, 3.0, 8.0, 19.0, 16.0, 24.0, 25.0, 28.0, 25.0, 52.0, 55.0, 55.0, 41.0, 63.0, 1206.0, 1041327.0, 5173.0, 64.0, 50.0, 45.0, 41.0, 47.0, 29.0, 23.0, 29.0, 25.0, 13.0, 14.0, 10.0, 7.0, 9.0, 7.0, 5.0, 5.0, 1.0, 3.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.2421875, -7.8773193359375, -7.512451171875, -7.1475830078125, -6.78271484375, -6.4178466796875, -6.052978515625, -5.6881103515625, -5.3232421875, -4.9583740234375, -4.593505859375, -4.2286376953125, -3.86376953125, -3.4989013671875, -3.134033203125, -2.7691650390625, -2.404296875, -2.0394287109375, -1.674560546875, -1.3096923828125, -0.94482421875, -0.5799560546875, -0.215087890625, 0.1497802734375, 0.5146484375, 0.8795166015625, 1.244384765625, 1.6092529296875, 1.97412109375, 2.3389892578125, 2.703857421875, 3.0687255859375, 3.43359375, 3.7984619140625, 4.163330078125, 4.5281982421875, 4.89306640625, 5.2579345703125, 5.622802734375, 5.9876708984375, 6.3525390625, 6.7174072265625, 7.082275390625, 7.4471435546875, 7.81201171875, 8.1768798828125, 8.541748046875, 8.9066162109375, 9.271484375, 9.6363525390625, 10.001220703125, 10.3660888671875, 10.73095703125, 11.0958251953125, 11.460693359375, 11.8255615234375, 12.1904296875, 12.5552978515625, 12.920166015625, 13.2850341796875, 13.64990234375, 14.0147705078125, 14.379638671875, 14.7445068359375, 15.109375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 30.0, 124.0, 253.0, 327.0, 209.0, 63.0, 11.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13720703125, -0.11553192138671875, -0.0938568115234375, -0.07218170166015625, -0.050506591796875, -0.02883148193359375, -0.0071563720703125, 0.01451873779296875, 0.03619384765625, 0.05786895751953125, 0.0795440673828125, 0.10121917724609375, 0.122894287109375, 0.14456939697265625, 0.1662445068359375, 0.18791961669921875, 0.2095947265625, 0.23126983642578125, 0.2529449462890625, 0.27462005615234375, 0.296295166015625, 0.31797027587890625, 0.3396453857421875, 0.36132049560546875, 0.38299560546875, 0.40467071533203125, 0.4263458251953125, 0.44802093505859375, 0.469696044921875, 0.49137115478515625, 0.5130462646484375, 0.5347213745117188, 0.556396484375, 0.5780715942382812, 0.5997467041015625, 0.6214218139648438, 0.643096923828125, 0.6647720336914062, 0.6864471435546875, 0.7081222534179688, 0.72979736328125, 0.7514724731445312, 0.7731475830078125, 0.7948226928710938, 0.816497802734375, 0.8381729125976562, 0.8598480224609375, 0.8815231323242188, 0.9031982421875, 0.9248733520507812, 0.9465484619140625, 0.9682235717773438, 0.989898681640625, 1.0115737915039062, 1.0332489013671875, 1.0549240112304688, 1.07659912109375, 1.0982742309570312, 1.1199493408203125, 1.1416244506835938, 1.163299560546875, 1.1849746704101562, 1.2066497802734375, 1.2283248901367188, 1.25]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 5.0, 6.0, 7.0, 7.0, 25.0, 21.0, 26.0, 63.0, 69.0, 126.0, 260.0, 504.0, 1356.0, 4680.0, 25804.0, 227652.0, 669614.0, 99928.0, 13624.0, 2933.0, 915.0, 378.0, 208.0, 114.0, 66.0, 40.0, 20.0, 23.0, 13.0, 14.0, 14.0, 9.0, 9.0, 2.0, 6.0, 4.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4296875, -3.323577880859375, -3.21746826171875, -3.111358642578125, -3.0052490234375, -2.899139404296875, -2.79302978515625, -2.686920166015625, -2.580810546875, -2.474700927734375, -2.36859130859375, -2.262481689453125, -2.1563720703125, -2.050262451171875, -1.94415283203125, -1.838043212890625, -1.73193359375, -1.625823974609375, -1.51971435546875, -1.413604736328125, -1.3074951171875, -1.201385498046875, -1.09527587890625, -0.989166259765625, -0.883056640625, -0.776947021484375, -0.67083740234375, -0.564727783203125, -0.4586181640625, -0.352508544921875, -0.24639892578125, -0.140289306640625, -0.0341796875, 0.071929931640625, 0.17803955078125, 0.284149169921875, 0.3902587890625, 0.496368408203125, 0.60247802734375, 0.708587646484375, 0.814697265625, 0.920806884765625, 1.02691650390625, 1.133026123046875, 1.2391357421875, 1.345245361328125, 1.45135498046875, 1.557464599609375, 1.66357421875, 1.769683837890625, 1.87579345703125, 1.981903076171875, 2.0880126953125, 2.194122314453125, 2.30023193359375, 2.406341552734375, 2.512451171875, 2.618560791015625, 2.72467041015625, 2.830780029296875, 2.9368896484375, 3.042999267578125, 3.14910888671875, 3.255218505859375, 3.361328125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 6.0, 4.0, 3.0, 8.0, 7.0, 14.0, 22.0, 18.0, 22.0, 20.0, 34.0, 25.0, 30.0, 54.0, 41.0, 52.0, 53.0, 49.0, 51.0, 51.0, 47.0, 48.0, 49.0, 47.0, 43.0, 35.0, 35.0, 27.0, 20.0, 16.0, 13.0, 13.0, 8.0, 12.0, 9.0, 8.0, 3.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1689453125, -1.133148193359375, -1.09735107421875, -1.061553955078125, -1.0257568359375, -0.989959716796875, -0.95416259765625, -0.918365478515625, -0.882568359375, -0.846771240234375, -0.81097412109375, -0.775177001953125, -0.7393798828125, -0.703582763671875, -0.66778564453125, -0.631988525390625, -0.59619140625, -0.560394287109375, -0.52459716796875, -0.488800048828125, -0.4530029296875, -0.417205810546875, -0.38140869140625, -0.345611572265625, -0.309814453125, -0.274017333984375, -0.23822021484375, -0.202423095703125, -0.1666259765625, -0.130828857421875, -0.09503173828125, -0.059234619140625, -0.0234375, 0.012359619140625, 0.04815673828125, 0.083953857421875, 0.1197509765625, 0.155548095703125, 0.19134521484375, 0.227142333984375, 0.262939453125, 0.298736572265625, 0.33453369140625, 0.370330810546875, 0.4061279296875, 0.441925048828125, 0.47772216796875, 0.513519287109375, 0.54931640625, 0.585113525390625, 0.62091064453125, 0.656707763671875, 0.6925048828125, 0.728302001953125, 0.76409912109375, 0.799896240234375, 0.835693359375, 0.871490478515625, 0.90728759765625, 0.943084716796875, 0.9788818359375, 1.014678955078125, 1.05047607421875, 1.086273193359375, 1.1220703125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 4.0, 5.0, 3.0, 5.0, 12.0, 11.0, 9.0, 21.0, 24.0, 33.0, 49.0, 92.0, 148.0, 310.0, 914.0, 3000.0, 14311.0, 170372.0, 778015.0, 69400.0, 8487.0, 2031.0, 653.0, 282.0, 144.0, 67.0, 36.0, 29.0, 20.0, 21.0, 8.0, 11.0, 10.0, 7.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-5.4296875, -5.2716064453125, -5.113525390625, -4.9554443359375, -4.79736328125, -4.6392822265625, -4.481201171875, -4.3231201171875, -4.1650390625, -4.0069580078125, -3.848876953125, -3.6907958984375, -3.53271484375, -3.3746337890625, -3.216552734375, -3.0584716796875, -2.900390625, -2.7423095703125, -2.584228515625, -2.4261474609375, -2.26806640625, -2.1099853515625, -1.951904296875, -1.7938232421875, -1.6357421875, -1.4776611328125, -1.319580078125, -1.1614990234375, -1.00341796875, -0.8453369140625, -0.687255859375, -0.5291748046875, -0.37109375, -0.2130126953125, -0.054931640625, 0.1031494140625, 0.26123046875, 0.4193115234375, 0.577392578125, 0.7354736328125, 0.8935546875, 1.0516357421875, 1.209716796875, 1.3677978515625, 1.52587890625, 1.6839599609375, 1.842041015625, 2.0001220703125, 2.158203125, 2.3162841796875, 2.474365234375, 2.6324462890625, 2.79052734375, 2.9486083984375, 3.106689453125, 3.2647705078125, 3.4228515625, 3.5809326171875, 3.739013671875, 3.8970947265625, 4.05517578125, 4.2132568359375, 4.371337890625, 4.5294189453125, 4.6875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 5.0, 5.0, 3.0, 6.0, 11.0, 12.0, 14.0, 14.0, 32.0, 39.0, 47.0, 56.0, 76.0, 121.0, 121.0, 86.0, 90.0, 44.0, 41.0, 36.0, 28.0, 27.0, 17.0, 10.0, 11.0, 12.0, 3.0, 6.0, 6.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.0004756450653076172, -0.0004621855914592743, -0.0004487261176109314, -0.0004352666437625885, -0.0004218071699142456, -0.0004083476960659027, -0.0003948882222175598, -0.0003814287483692169, -0.000367969274520874, -0.00035450980067253113, -0.00034105032682418823, -0.00032759085297584534, -0.00031413137912750244, -0.00030067190527915955, -0.00028721243143081665, -0.00027375295758247375, -0.00026029348373413086, -0.00024683400988578796, -0.00023337453603744507, -0.00021991506218910217, -0.00020645558834075928, -0.00019299611449241638, -0.00017953664064407349, -0.0001660771667957306, -0.0001526176929473877, -0.0001391582190990448, -0.0001256987452507019, -0.00011223927140235901, -9.877979755401611e-05, -8.532032370567322e-05, -7.186084985733032e-05, -5.840137600898743e-05, -4.494190216064453e-05, -3.1482428312301636e-05, -1.802295446395874e-05, -4.563480615615845e-06, 8.89599323272705e-06, 2.2355467081069946e-05, 3.581494092941284e-05, 4.927441477775574e-05, 6.273388862609863e-05, 7.619336247444153e-05, 8.965283632278442e-05, 0.00010311231017112732, 0.00011657178401947021, 0.0001300312578678131, 0.000143490731716156, 0.0001569502055644989, 0.0001704096794128418, 0.0001838691532611847, 0.0001973286271095276, 0.00021078810095787048, 0.00022424757480621338, 0.00023770704865455627, 0.00025116652250289917, 0.00026462599635124207, 0.00027808547019958496, 0.00029154494404792786, 0.00030500441789627075, 0.00031846389174461365, 0.00033192336559295654, 0.00034538283944129944, 0.00035884231328964233, 0.00037230178713798523, 0.0003857612609863281]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 4.0, 7.0, 5.0, 7.0, 11.0, 15.0, 18.0, 41.0, 35.0, 86.0, 130.0, 271.0, 659.0, 1833.0, 6844.0, 40326.0, 784787.0, 193897.0, 14473.0, 3224.0, 1059.0, 392.0, 184.0, 107.0, 56.0, 24.0, 15.0, 18.0, 5.0, 9.0, 6.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.7890625, -6.587890625, -6.38671875, -6.185546875, -5.984375, -5.783203125, -5.58203125, -5.380859375, -5.1796875, -4.978515625, -4.77734375, -4.576171875, -4.375, -4.173828125, -3.97265625, -3.771484375, -3.5703125, -3.369140625, -3.16796875, -2.966796875, -2.765625, -2.564453125, -2.36328125, -2.162109375, -1.9609375, -1.759765625, -1.55859375, -1.357421875, -1.15625, -0.955078125, -0.75390625, -0.552734375, -0.3515625, -0.150390625, 0.05078125, 0.251953125, 0.453125, 0.654296875, 0.85546875, 1.056640625, 1.2578125, 1.458984375, 1.66015625, 1.861328125, 2.0625, 2.263671875, 2.46484375, 2.666015625, 2.8671875, 3.068359375, 3.26953125, 3.470703125, 3.671875, 3.873046875, 4.07421875, 4.275390625, 4.4765625, 4.677734375, 4.87890625, 5.080078125, 5.28125, 5.482421875, 5.68359375, 5.884765625, 6.0859375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 7.0, 3.0, 7.0, 2.0, 5.0, 6.0, 8.0, 9.0, 33.0, 46.0, 72.0, 120.0, 146.0, 148.0, 150.0, 87.0, 52.0, 35.0, 18.0, 13.0, 4.0, 5.0, 5.0, 4.0, 8.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.94921875, -3.848602294921875, -3.74798583984375, -3.647369384765625, -3.5467529296875, -3.446136474609375, -3.34552001953125, -3.244903564453125, -3.144287109375, -3.043670654296875, -2.94305419921875, -2.842437744140625, -2.7418212890625, -2.641204833984375, -2.54058837890625, -2.439971923828125, -2.33935546875, -2.238739013671875, -2.13812255859375, -2.037506103515625, -1.9368896484375, -1.836273193359375, -1.73565673828125, -1.635040283203125, -1.534423828125, -1.433807373046875, -1.33319091796875, -1.232574462890625, -1.1319580078125, -1.031341552734375, -0.93072509765625, -0.830108642578125, -0.7294921875, -0.628875732421875, -0.52825927734375, -0.427642822265625, -0.3270263671875, -0.226409912109375, -0.12579345703125, -0.025177001953125, 0.075439453125, 0.176055908203125, 0.27667236328125, 0.377288818359375, 0.4779052734375, 0.578521728515625, 0.67913818359375, 0.779754638671875, 0.88037109375, 0.980987548828125, 1.08160400390625, 1.182220458984375, 1.2828369140625, 1.383453369140625, 1.48406982421875, 1.584686279296875, 1.685302734375, 1.785919189453125, 1.88653564453125, 1.987152099609375, 2.0877685546875, 2.188385009765625, 2.28900146484375, 2.389617919921875, 2.490234375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 7.0, 18.0, 982.0, 8.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.80794143676758, -49.115779876708984, -40.423622131347656, -31.731460571289062, -23.03929901123047, -14.347137451171875, -5.654979705810547, 3.037181854248047, 11.72934341430664, 20.421504974365234, 29.113664627075195, 37.805824279785156, 46.49798583984375, 55.190147399902344, 63.88230514526367, 72.574462890625, 81.26663208007812, 89.95879364013672, 98.65095520019531, 107.34310913085938, 116.0352783203125, 124.72743225097656, 133.41958618164062, 142.11175537109375, 150.8039093017578, 159.49606323242188, 168.188232421875, 176.88038635253906, 185.5725555419922, 194.26470947265625, 202.95687866210938, 211.64903259277344, 220.34121704101562, 229.0333709716797, 237.7255401611328, 246.41769409179688, 255.10986328125, 263.8020324707031, 272.4941711425781, 281.18634033203125, 289.8785095214844, 298.5706787109375, 307.2628173828125, 315.9549865722656, 324.64715576171875, 333.3393249511719, 342.0314636230469, 350.7236328125, 359.415771484375, 368.1079406738281, 376.8000793457031, 385.49224853515625, 394.1844177246094, 402.8765869140625, 411.5687255859375, 420.2608947753906, 428.95306396484375, 437.6452331542969, 446.3373718261719, 455.029541015625, 463.7217102050781, 472.41387939453125, 481.10601806640625, 489.7981872558594, 498.4903564453125]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 7.0, 14.0, 32.0, 46.0, 97.0, 137.0, 156.0, 169.0, 144.0, 101.0, 63.0, 29.0, 7.0, 7.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.47555160522461, -12.563921928405762, -11.652291297912598, -10.74066162109375, -9.829030990600586, -8.917401313781738, -8.00577163696289, -7.094141483306885, -6.182511329650879, -5.270881175994873, -4.359251022338867, -3.4476213455200195, -2.5359911918640137, -1.6243610382080078, -0.7127313613891602, 0.1988987922668457, 1.1105289459228516, 2.0221590995788574, 2.933789014816284, 3.845418930053711, 4.757049083709717, 5.668679237365723, 6.58030891418457, 7.491939067840576, 8.403569221496582, 9.31519889831543, 10.226829528808594, 11.138459205627441, 12.050088882446289, 12.961719512939453, 13.8733491897583, 14.784978866577148, 15.696609497070312, 16.608240127563477, 17.519868850708008, 18.431499481201172, 19.343130111694336, 20.2547607421875, 21.16638946533203, 22.078020095825195, 22.98965072631836, 23.901281356811523, 24.812910079956055, 25.72454071044922, 26.636171340942383, 27.547801971435547, 28.459430694580078, 29.371061325073242, 30.282690048217773, 31.194320678710938, 32.10594940185547, 33.017578125, 33.9292106628418, 34.84083938598633, 35.752471923828125, 36.664100646972656, 37.57572937011719, 38.48735809326172, 39.398990631103516, 40.31061935424805, 41.22224807739258, 42.133880615234375, 43.045509338378906, 43.95713806152344, 44.868770599365234]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [6.0, 4.0, 10.0, 9.0, 29.0, 47.0, 81.0, 145.0, 1149.0, 4172780.0, 19007.0, 586.0, 197.0, 112.0, 58.0, 33.0, 16.0, 13.0, 7.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.0546875, -9.0220947265625, -7.989501953125, -6.9569091796875, -5.92431640625, -4.8917236328125, -3.859130859375, -2.8265380859375, -1.7939453125, -0.7613525390625, 0.271240234375, 1.3038330078125, 2.33642578125, 3.3690185546875, 4.401611328125, 5.4342041015625, 6.466796875, 7.4993896484375, 8.531982421875, 9.5645751953125, 10.59716796875, 11.6297607421875, 12.662353515625, 13.6949462890625, 14.7275390625, 15.7601318359375, 16.792724609375, 17.8253173828125, 18.85791015625, 19.8905029296875, 20.923095703125, 21.9556884765625, 22.98828125, 24.0208740234375, 25.053466796875, 26.0860595703125, 27.11865234375, 28.1512451171875, 29.183837890625, 30.2164306640625, 31.2490234375, 32.2816162109375, 33.314208984375, 34.3468017578125, 35.37939453125, 36.4119873046875, 37.444580078125, 38.4771728515625, 39.509765625, 40.5423583984375, 41.574951171875, 42.6075439453125, 43.64013671875, 44.6727294921875, 45.705322265625, 46.7379150390625, 47.7705078125, 48.8031005859375, 49.835693359375, 50.8682861328125, 51.90087890625, 52.9334716796875, 53.966064453125, 54.9986572265625, 56.03125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 6.0, 6.0, 31.0, 81.0, 190.0, 289.0, 254.0, 118.0, 35.0, 6.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2225341796875, -0.1893024444580078, -0.15607070922851562, -0.12283897399902344, -0.08960723876953125, -0.05637550354003906, -0.023143768310546875, 0.010087966918945312, 0.0433197021484375, 0.07655143737792969, 0.10978317260742188, 0.14301490783691406, 0.17624664306640625, 0.20947837829589844, 0.24271011352539062, 0.2759418487548828, 0.309173583984375, 0.3424053192138672, 0.3756370544433594, 0.40886878967285156, 0.44210052490234375, 0.47533226013183594, 0.5085639953613281, 0.5417957305908203, 0.5750274658203125, 0.6082592010498047, 0.6414909362792969, 0.6747226715087891, 0.7079544067382812, 0.7411861419677734, 0.7744178771972656, 0.8076496124267578, 0.84088134765625, 0.8741130828857422, 0.9073448181152344, 0.9405765533447266, 0.9738082885742188, 1.007040023803711, 1.0402717590332031, 1.0735034942626953, 1.1067352294921875, 1.1399669647216797, 1.1731986999511719, 1.206430435180664, 1.2396621704101562, 1.2728939056396484, 1.3061256408691406, 1.3393573760986328, 1.372589111328125, 1.4058208465576172, 1.4390525817871094, 1.4722843170166016, 1.5055160522460938, 1.538747787475586, 1.5719795227050781, 1.6052112579345703, 1.6384429931640625, 1.6716747283935547, 1.7049064636230469, 1.738138198852539, 1.7713699340820312, 1.8046016693115234, 1.8378334045410156, 1.8710651397705078, 1.904296875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 19.0, 59.0, 114.0, 230.0, 2209.0, 4190100.0, 976.0, 299.0, 170.0, 75.0, 28.0, 8.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-30.5, -28.224609375, -25.94921875, -23.673828125, -21.3984375, -19.123046875, -16.84765625, -14.572265625, -12.296875, -10.021484375, -7.74609375, -5.470703125, -3.1953125, -0.919921875, 1.35546875, 3.630859375, 5.90625, 8.181640625, 10.45703125, 12.732421875, 15.0078125, 17.283203125, 19.55859375, 21.833984375, 24.109375, 26.384765625, 28.66015625, 30.935546875, 33.2109375, 35.486328125, 37.76171875, 40.037109375, 42.3125, 44.587890625, 46.86328125, 49.138671875, 51.4140625, 53.689453125, 55.96484375, 58.240234375, 60.515625, 62.791015625, 65.06640625, 67.341796875, 69.6171875, 71.892578125, 74.16796875, 76.443359375, 78.71875, 80.994140625, 83.26953125, 85.544921875, 87.8203125, 90.095703125, 92.37109375, 94.646484375, 96.921875, 99.197265625, 101.47265625, 103.748046875, 106.0234375, 108.298828125, 110.57421875, 112.849609375, 115.125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 12.0, 51.0, 1640.0, 2316.0, 55.0, 8.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.38671875, -2.20343017578125, -2.0201416015625, -1.83685302734375, -1.653564453125, -1.47027587890625, -1.2869873046875, -1.10369873046875, -0.92041015625, -0.73712158203125, -0.5538330078125, -0.37054443359375, -0.187255859375, -0.00396728515625, 0.1793212890625, 0.36260986328125, 0.5458984375, 0.72918701171875, 0.9124755859375, 1.09576416015625, 1.279052734375, 1.46234130859375, 1.6456298828125, 1.82891845703125, 2.01220703125, 2.19549560546875, 2.3787841796875, 2.56207275390625, 2.745361328125, 2.92864990234375, 3.1119384765625, 3.29522705078125, 3.478515625, 3.66180419921875, 3.8450927734375, 4.02838134765625, 4.211669921875, 4.39495849609375, 4.5782470703125, 4.76153564453125, 4.94482421875, 5.12811279296875, 5.3114013671875, 5.49468994140625, 5.677978515625, 5.86126708984375, 6.0445556640625, 6.22784423828125, 6.4111328125, 6.59442138671875, 6.7777099609375, 6.96099853515625, 7.144287109375, 7.32757568359375, 7.5108642578125, 7.69415283203125, 7.87744140625, 8.06072998046875, 8.2440185546875, 8.42730712890625, 8.610595703125, 8.79388427734375, 8.9771728515625, 9.16046142578125, 9.34375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 12.0, 591.0, 396.0, 10.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.34315490722656, -90.70955657958984, -87.0759506225586, -83.44235229492188, -79.80874633789062, -76.1751480102539, -72.54154968261719, -68.90794372558594, -65.27434539794922, -61.640743255615234, -58.00714111328125, -54.37354278564453, -50.73994064331055, -47.10633850097656, -43.472740173339844, -39.83913803100586, -36.205535888671875, -32.57193374633789, -28.93833351135254, -25.304733276367188, -21.671131134033203, -18.03752899169922, -14.403928756713867, -10.770328521728516, -7.136726379394531, -3.5031251907348633, 0.1304759979248047, 3.7640771865844727, 7.397678375244141, 11.031280517578125, 14.664880752563477, 18.298480987548828, 21.932083129882812, 25.565685272216797, 29.19928550720215, 32.8328857421875, 36.466487884521484, 40.10009002685547, 43.73368835449219, 47.36729049682617, 51.000892639160156, 54.63449478149414, 58.268096923828125, 61.901695251464844, 65.53529357910156, 69.16889953613281, 72.80249786376953, 76.43609619140625, 80.0697021484375, 83.70330047607422, 87.33690643310547, 90.97050476074219, 94.60411071777344, 98.23770904541016, 101.87130737304688, 105.50491333007812, 109.13851165771484, 112.77210998535156, 116.40571594238281, 120.03931427001953, 123.67291259765625, 127.3065185546875, 130.94012451171875, 134.57371520996094, 138.2073211669922]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 17.0, 28.0, 53.0, 80.0, 112.0, 148.0, 148.0, 141.0, 119.0, 71.0, 34.0, 27.0, 10.0, 5.0, 0.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.74961853027344, -32.71575927734375, -31.681903839111328, -30.648046493530273, -29.61418914794922, -28.580331802368164, -27.54647445678711, -26.512615203857422, -25.478759765625, -24.444902420043945, -23.41104507446289, -22.377187728881836, -21.34333038330078, -20.309473037719727, -19.275615692138672, -18.241756439208984, -17.20789909362793, -16.174041748046875, -15.14018440246582, -14.106327056884766, -13.072469711303711, -12.038612365722656, -11.004754066467285, -9.97089672088623, -8.937039375305176, -7.903182029724121, -6.869324684143066, -5.8354668617248535, -4.801609516143799, -3.767752170562744, -2.7338943481445312, -1.7000370025634766, -0.6661796569824219, 0.36767780780792236, 1.4015352725982666, 2.4353928565979004, 3.469250202178955, 4.50310754776001, 5.536965370178223, 6.570822715759277, 7.604680061340332, 8.638537406921387, 9.672394752502441, 10.706253051757812, 11.740110397338867, 12.773967742919922, 13.807825088500977, 14.841682434082031, 15.875539779663086, 16.90939712524414, 17.943254470825195, 18.97711181640625, 20.010969161987305, 21.04482650756836, 22.078685760498047, 23.11254119873047, 24.146400451660156, 25.18025779724121, 26.214115142822266, 27.24797248840332, 28.281829833984375, 29.31568717956543, 30.349544525146484, 31.383403778076172, 32.417259216308594]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 7.0, 0.0, 6.0, 7.0, 13.0, 20.0, 18.0, 19.0, 34.0, 52.0, 70.0, 119.0, 225.0, 522.0, 1568.0, 8601.0, 253752.0, 762753.0, 17036.0, 2373.0, 664.0, 278.0, 134.0, 77.0, 56.0, 50.0, 23.0, 19.0, 11.0, 18.0, 6.0, 7.0, 7.0, 3.0, 7.0, 3.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.9921875, -13.5823974609375, -13.172607421875, -12.7628173828125, -12.35302734375, -11.9432373046875, -11.533447265625, -11.1236572265625, -10.7138671875, -10.3040771484375, -9.894287109375, -9.4844970703125, -9.07470703125, -8.6649169921875, -8.255126953125, -7.8453369140625, -7.435546875, -7.0257568359375, -6.615966796875, -6.2061767578125, -5.79638671875, -5.3865966796875, -4.976806640625, -4.5670166015625, -4.1572265625, -3.7474365234375, -3.337646484375, -2.9278564453125, -2.51806640625, -2.1082763671875, -1.698486328125, -1.2886962890625, -0.87890625, -0.4691162109375, -0.059326171875, 0.3504638671875, 0.76025390625, 1.1700439453125, 1.579833984375, 1.9896240234375, 2.3994140625, 2.8092041015625, 3.218994140625, 3.6287841796875, 4.03857421875, 4.4483642578125, 4.858154296875, 5.2679443359375, 5.677734375, 6.0875244140625, 6.497314453125, 6.9071044921875, 7.31689453125, 7.7266845703125, 8.136474609375, 8.5462646484375, 8.9560546875, 9.3658447265625, 9.775634765625, 10.1854248046875, 10.59521484375, 11.0050048828125, 11.414794921875, 11.8245849609375, 12.234375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 9.0, 27.0, 49.0, 65.0, 101.0, 110.0, 140.0, 131.0, 126.0, 100.0, 67.0, 26.0, 27.0, 11.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1259765625, -1.0771026611328125, -1.028228759765625, -0.9793548583984375, -0.93048095703125, -0.8816070556640625, -0.832733154296875, -0.7838592529296875, -0.7349853515625, -0.6861114501953125, -0.637237548828125, -0.5883636474609375, -0.53948974609375, -0.4906158447265625, -0.441741943359375, -0.3928680419921875, -0.343994140625, -0.2951202392578125, -0.246246337890625, -0.1973724365234375, -0.14849853515625, -0.0996246337890625, -0.050750732421875, -0.0018768310546875, 0.0469970703125, 0.0958709716796875, 0.144744873046875, 0.1936187744140625, 0.24249267578125, 0.2913665771484375, 0.340240478515625, 0.3891143798828125, 0.43798828125, 0.4868621826171875, 0.535736083984375, 0.5846099853515625, 0.63348388671875, 0.6823577880859375, 0.731231689453125, 0.7801055908203125, 0.8289794921875, 0.8778533935546875, 0.926727294921875, 0.9756011962890625, 1.02447509765625, 1.0733489990234375, 1.122222900390625, 1.1710968017578125, 1.219970703125, 1.2688446044921875, 1.317718505859375, 1.3665924072265625, 1.41546630859375, 1.4643402099609375, 1.513214111328125, 1.5620880126953125, 1.6109619140625, 1.6598358154296875, 1.708709716796875, 1.7575836181640625, 1.80645751953125, 1.8553314208984375, 1.904205322265625, 1.9530792236328125, 2.001953125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 1.0, 6.0, 4.0, 12.0, 5.0, 10.0, 13.0, 9.0, 14.0, 30.0, 42.0, 88.0, 153.0, 533.0, 3338.0, 75704.0, 933930.0, 31729.0, 2162.0, 423.0, 140.0, 64.0, 32.0, 24.0, 13.0, 16.0, 14.0, 13.0, 9.0, 3.0, 5.0, 2.0, 8.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-11.140625, -10.8070068359375, -10.473388671875, -10.1397705078125, -9.80615234375, -9.4725341796875, -9.138916015625, -8.8052978515625, -8.4716796875, -8.1380615234375, -7.804443359375, -7.4708251953125, -7.13720703125, -6.8035888671875, -6.469970703125, -6.1363525390625, -5.802734375, -5.4691162109375, -5.135498046875, -4.8018798828125, -4.46826171875, -4.1346435546875, -3.801025390625, -3.4674072265625, -3.1337890625, -2.8001708984375, -2.466552734375, -2.1329345703125, -1.79931640625, -1.4656982421875, -1.132080078125, -0.7984619140625, -0.46484375, -0.1312255859375, 0.202392578125, 0.5360107421875, 0.86962890625, 1.2032470703125, 1.536865234375, 1.8704833984375, 2.2041015625, 2.5377197265625, 2.871337890625, 3.2049560546875, 3.53857421875, 3.8721923828125, 4.205810546875, 4.5394287109375, 4.873046875, 5.2066650390625, 5.540283203125, 5.8739013671875, 6.20751953125, 6.5411376953125, 6.874755859375, 7.2083740234375, 7.5419921875, 7.8756103515625, 8.209228515625, 8.5428466796875, 8.87646484375, 9.2100830078125, 9.543701171875, 9.8773193359375, 10.2109375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 2.0, 2.0, 5.0, 4.0, 6.0, 13.0, 18.0, 17.0, 17.0, 30.0, 32.0, 33.0, 42.0, 51.0, 70.0, 44.0, 69.0, 68.0, 56.0, 66.0, 60.0, 68.0, 48.0, 28.0, 34.0, 22.0, 26.0, 13.0, 10.0, 11.0, 10.0, 4.0, 6.0, 1.0, 6.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0], "bins": [-4.01953125, -3.907257080078125, -3.79498291015625, -3.682708740234375, -3.5704345703125, -3.458160400390625, -3.34588623046875, -3.233612060546875, -3.121337890625, -3.009063720703125, -2.89678955078125, -2.784515380859375, -2.6722412109375, -2.559967041015625, -2.44769287109375, -2.335418701171875, -2.22314453125, -2.110870361328125, -1.99859619140625, -1.886322021484375, -1.7740478515625, -1.661773681640625, -1.54949951171875, -1.437225341796875, -1.324951171875, -1.212677001953125, -1.10040283203125, -0.988128662109375, -0.8758544921875, -0.763580322265625, -0.65130615234375, -0.539031982421875, -0.4267578125, -0.314483642578125, -0.20220947265625, -0.089935302734375, 0.0223388671875, 0.134613037109375, 0.24688720703125, 0.359161376953125, 0.471435546875, 0.583709716796875, 0.69598388671875, 0.808258056640625, 0.9205322265625, 1.032806396484375, 1.14508056640625, 1.257354736328125, 1.36962890625, 1.481903076171875, 1.59417724609375, 1.706451416015625, 1.8187255859375, 1.930999755859375, 2.04327392578125, 2.155548095703125, 2.267822265625, 2.380096435546875, 2.49237060546875, 2.604644775390625, 2.7169189453125, 2.829193115234375, 2.94146728515625, 3.053741455078125, 3.166015625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 0.0, 1.0, 5.0, 2.0, 8.0, 16.0, 12.0, 25.0, 36.0, 66.0, 99.0, 243.0, 477.0, 1438.0, 6175.0, 98703.0, 887463.0, 47421.0, 4371.0, 1137.0, 429.0, 197.0, 88.0, 54.0, 31.0, 22.0, 11.0, 5.0, 5.0, 8.0, 1.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-8.0078125, -7.82330322265625, -7.6387939453125, -7.45428466796875, -7.269775390625, -7.08526611328125, -6.9007568359375, -6.71624755859375, -6.53173828125, -6.34722900390625, -6.1627197265625, -5.97821044921875, -5.793701171875, -5.60919189453125, -5.4246826171875, -5.24017333984375, -5.0556640625, -4.87115478515625, -4.6866455078125, -4.50213623046875, -4.317626953125, -4.13311767578125, -3.9486083984375, -3.76409912109375, -3.57958984375, -3.39508056640625, -3.2105712890625, -3.02606201171875, -2.841552734375, -2.65704345703125, -2.4725341796875, -2.28802490234375, -2.103515625, -1.91900634765625, -1.7344970703125, -1.54998779296875, -1.365478515625, -1.18096923828125, -0.9964599609375, -0.81195068359375, -0.62744140625, -0.44293212890625, -0.2584228515625, -0.07391357421875, 0.110595703125, 0.29510498046875, 0.4796142578125, 0.66412353515625, 0.8486328125, 1.03314208984375, 1.2176513671875, 1.40216064453125, 1.586669921875, 1.77117919921875, 1.9556884765625, 2.14019775390625, 2.32470703125, 2.50921630859375, 2.6937255859375, 2.87823486328125, 3.062744140625, 3.24725341796875, 3.4317626953125, 3.61627197265625, 3.80078125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 3.0, 4.0, 4.0, 6.0, 6.0, 6.0, 9.0, 12.0, 13.0, 13.0, 17.0, 20.0, 30.0, 47.0, 27.0, 47.0, 52.0, 67.0, 61.0, 65.0, 51.0, 66.0, 64.0, 47.0, 51.0, 41.0, 32.0, 22.0, 17.0, 22.0, 13.0, 15.0, 8.0, 11.0, 6.0, 3.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00022935867309570312, -0.00022200867533683777, -0.0002146586775779724, -0.00020730867981910706, -0.0001999586820602417, -0.00019260868430137634, -0.00018525868654251099, -0.00017790868878364563, -0.00017055869102478027, -0.00016320869326591492, -0.00015585869550704956, -0.0001485086977481842, -0.00014115869998931885, -0.0001338087022304535, -0.00012645870447158813, -0.00011910870671272278, -0.00011175870895385742, -0.00010440871119499207, -9.705871343612671e-05, -8.970871567726135e-05, -8.2358717918396e-05, -7.500872015953064e-05, -6.765872240066528e-05, -6.030872464179993e-05, -5.295872688293457e-05, -4.5608729124069214e-05, -3.825873136520386e-05, -3.09087336063385e-05, -2.3558735847473145e-05, -1.6208738088607788e-05, -8.858740329742432e-06, -1.5087425708770752e-06, 5.841255187988281e-06, 1.3191252946853638e-05, 2.0541250705718994e-05, 2.789124846458435e-05, 3.524124622344971e-05, 4.2591243982315063e-05, 4.994124174118042e-05, 5.7291239500045776e-05, 6.464123725891113e-05, 7.199123501777649e-05, 7.934123277664185e-05, 8.66912305355072e-05, 9.404122829437256e-05, 0.00010139122605323792, 0.00010874122381210327, 0.00011609122157096863, 0.00012344121932983398, 0.00013079121708869934, 0.0001381412148475647, 0.00014549121260643005, 0.0001528412103652954, 0.00016019120812416077, 0.00016754120588302612, 0.00017489120364189148, 0.00018224120140075684, 0.0001895911991596222, 0.00019694119691848755, 0.0002042911946773529, 0.00021164119243621826, 0.00021899119019508362, 0.00022634118795394897, 0.00023369118571281433, 0.0002410411834716797]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 8.0, 15.0, 5.0, 15.0, 25.0, 57.0, 110.0, 297.0, 1147.0, 8511.0, 537031.0, 491897.0, 7938.0, 1035.0, 239.0, 97.0, 58.0, 28.0, 15.0, 8.0, 5.0, 8.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-10.484375, -10.23468017578125, -9.9849853515625, -9.73529052734375, -9.485595703125, -9.23590087890625, -8.9862060546875, -8.73651123046875, -8.48681640625, -8.23712158203125, -7.9874267578125, -7.73773193359375, -7.488037109375, -7.23834228515625, -6.9886474609375, -6.73895263671875, -6.4892578125, -6.23956298828125, -5.9898681640625, -5.74017333984375, -5.490478515625, -5.24078369140625, -4.9910888671875, -4.74139404296875, -4.49169921875, -4.24200439453125, -3.9923095703125, -3.74261474609375, -3.492919921875, -3.24322509765625, -2.9935302734375, -2.74383544921875, -2.494140625, -2.24444580078125, -1.9947509765625, -1.74505615234375, -1.495361328125, -1.24566650390625, -0.9959716796875, -0.74627685546875, -0.49658203125, -0.24688720703125, 0.0028076171875, 0.25250244140625, 0.502197265625, 0.75189208984375, 1.0015869140625, 1.25128173828125, 1.5009765625, 1.75067138671875, 2.0003662109375, 2.25006103515625, 2.499755859375, 2.74945068359375, 2.9991455078125, 3.24884033203125, 3.49853515625, 3.74822998046875, 3.9979248046875, 4.24761962890625, 4.497314453125, 4.74700927734375, 4.9967041015625, 5.24639892578125, 5.49609375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 7.0, 3.0, 8.0, 12.0, 17.0, 22.0, 36.0, 44.0, 81.0, 95.0, 120.0, 123.0, 120.0, 107.0, 74.0, 45.0, 21.0, 18.0, 12.0, 14.0, 11.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-3.615234375, -3.5300140380859375, -3.444793701171875, -3.3595733642578125, -3.27435302734375, -3.1891326904296875, -3.103912353515625, -3.0186920166015625, -2.9334716796875, -2.8482513427734375, -2.763031005859375, -2.6778106689453125, -2.59259033203125, -2.5073699951171875, -2.422149658203125, -2.3369293212890625, -2.251708984375, -2.1664886474609375, -2.081268310546875, -1.9960479736328125, -1.91082763671875, -1.8256072998046875, -1.740386962890625, -1.6551666259765625, -1.5699462890625, -1.4847259521484375, -1.399505615234375, -1.3142852783203125, -1.22906494140625, -1.1438446044921875, -1.058624267578125, -0.9734039306640625, -0.88818359375, -0.8029632568359375, -0.717742919921875, -0.6325225830078125, -0.54730224609375, -0.4620819091796875, -0.376861572265625, -0.2916412353515625, -0.2064208984375, -0.1212005615234375, -0.035980224609375, 0.0492401123046875, 0.13446044921875, 0.2196807861328125, 0.304901123046875, 0.3901214599609375, 0.475341796875, 0.5605621337890625, 0.645782470703125, 0.7310028076171875, 0.81622314453125, 0.9014434814453125, 0.986663818359375, 1.0718841552734375, 1.1571044921875, 1.2423248291015625, 1.327545166015625, 1.4127655029296875, 1.49798583984375, 1.5832061767578125, 1.668426513671875, 1.7536468505859375, 1.8388671875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 10.0, 21.0, 87.0, 577.0, 298.0, 16.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-160.97378540039062, -157.81253051757812, -154.65127563476562, -151.49002075195312, -148.3287811279297, -145.1675262451172, -142.0062713623047, -138.8450164794922, -135.6837615966797, -132.5225067138672, -129.3612518310547, -126.20000457763672, -123.03874969482422, -119.87750244140625, -116.71624755859375, -113.55499267578125, -110.39374542236328, -107.23249053955078, -104.07124328613281, -100.90998840332031, -97.74873352050781, -94.58747863769531, -91.42623138427734, -88.26497650146484, -85.10372924804688, -81.94247436523438, -78.7812271118164, -75.6199722290039, -72.4587173461914, -69.29747009277344, -66.13621520996094, -62.97496032714844, -59.81371307373047, -56.652462005615234, -53.491207122802734, -50.3299560546875, -47.168701171875, -44.007450103759766, -40.84619903564453, -37.68494415283203, -34.5236930847168, -31.36244010925293, -28.201187133789062, -25.039936065673828, -21.87868309020996, -18.717430114746094, -15.55617904663086, -12.394926071166992, -9.233673095703125, -6.072420597076416, -2.911168098449707, 0.25008392333984375, 3.411336898803711, 6.572589874267578, 9.733840942382812, 12.89509391784668, 16.056346893310547, 19.217599868774414, 22.37885284423828, 25.540103912353516, 28.701356887817383, 31.86260986328125, 35.023860931396484, 38.18511199951172, 41.34636688232422]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 7.0, 7.0, 10.0, 10.0, 16.0, 27.0, 28.0, 32.0, 35.0, 49.0, 57.0, 66.0, 71.0, 67.0, 73.0, 70.0, 75.0, 69.0, 50.0, 46.0, 29.0, 32.0, 21.0, 17.0, 5.0, 8.0, 11.0, 5.0, 6.0, 2.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.6370849609375, -34.68000030517578, -33.7229118347168, -32.76582717895508, -31.808738708496094, -30.851654052734375, -29.894567489624023, -28.937480926513672, -27.98039436340332, -27.02330780029297, -26.066221237182617, -25.109134674072266, -24.152050018310547, -23.194961547851562, -22.237876892089844, -21.280790328979492, -20.32370376586914, -19.36661720275879, -18.409530639648438, -17.452444076538086, -16.495357513427734, -15.5382719039917, -14.581186294555664, -13.624099731445312, -12.667013168334961, -11.70992660522461, -10.752840042114258, -9.795754432678223, -8.838667869567871, -7.8815813064575195, -6.924495220184326, -5.967409133911133, -5.010322570800781, -4.05323600769043, -3.0961499214172363, -2.139063596725464, -1.1819772720336914, -0.22489070892333984, 0.7321953773498535, 1.6892814636230469, 2.6463680267333984, 3.603454351425171, 4.560540676116943, 5.517626762390137, 6.474713325500488, 7.43179988861084, 8.388885498046875, 9.345972061157227, 10.303058624267578, 11.26014518737793, 12.217231750488281, 13.174317359924316, 14.131403923034668, 15.08849048614502, 16.045576095581055, 17.002662658691406, 17.959749221801758, 18.91683578491211, 19.87392234802246, 20.831008911132812, 21.78809356689453, 22.745182037353516, 23.702266693115234, 24.659353256225586, 25.616439819335938]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 1.0, 5.0, 7.0, 13.0, 25.0, 63.0, 115.0, 384.0, 1955.0, 24075.0, 4062819.0, 99153.0, 4136.0, 810.0, 327.0, 141.0, 93.0, 49.0, 37.0, 24.0, 18.0, 9.0, 10.0, 7.0, 2.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4140625, -7.7989501953125, -7.183837890625, -6.5687255859375, -5.95361328125, -5.3385009765625, -4.723388671875, -4.1082763671875, -3.4931640625, -2.8780517578125, -2.262939453125, -1.6478271484375, -1.03271484375, -0.4176025390625, 0.197509765625, 0.8126220703125, 1.427734375, 2.0428466796875, 2.657958984375, 3.2730712890625, 3.88818359375, 4.5032958984375, 5.118408203125, 5.7335205078125, 6.3486328125, 6.9637451171875, 7.578857421875, 8.1939697265625, 8.80908203125, 9.4241943359375, 10.039306640625, 10.6544189453125, 11.26953125, 11.8846435546875, 12.499755859375, 13.1148681640625, 13.72998046875, 14.3450927734375, 14.960205078125, 15.5753173828125, 16.1904296875, 16.8055419921875, 17.420654296875, 18.0357666015625, 18.65087890625, 19.2659912109375, 19.881103515625, 20.4962158203125, 21.111328125, 21.7264404296875, 22.341552734375, 22.9566650390625, 23.57177734375, 24.1868896484375, 24.802001953125, 25.4171142578125, 26.0322265625, 26.6473388671875, 27.262451171875, 27.8775634765625, 28.49267578125, 29.1077880859375, 29.722900390625, 30.3380126953125, 30.953125]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 2.0, 3.0, 5.0, 10.0, 18.0, 22.0, 34.0, 54.0, 75.0, 84.0, 111.0, 116.0, 123.0, 102.0, 69.0, 70.0, 43.0, 26.0, 15.0, 10.0, 5.0, 4.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.87646484375, -0.8320388793945312, -0.7876129150390625, -0.7431869506835938, -0.698760986328125, -0.6543350219726562, -0.6099090576171875, -0.5654830932617188, -0.52105712890625, -0.47663116455078125, -0.4322052001953125, -0.38777923583984375, -0.343353271484375, -0.29892730712890625, -0.2545013427734375, -0.21007537841796875, -0.1656494140625, -0.12122344970703125, -0.0767974853515625, -0.03237152099609375, 0.012054443359375, 0.05648040771484375, 0.1009063720703125, 0.14533233642578125, 0.18975830078125, 0.23418426513671875, 0.2786102294921875, 0.32303619384765625, 0.367462158203125, 0.41188812255859375, 0.4563140869140625, 0.5007400512695312, 0.545166015625, 0.5895919799804688, 0.6340179443359375, 0.6784439086914062, 0.722869873046875, 0.7672958374023438, 0.8117218017578125, 0.8561477661132812, 0.90057373046875, 0.9449996948242188, 0.9894256591796875, 1.0338516235351562, 1.078277587890625, 1.1227035522460938, 1.1671295166015625, 1.2115554809570312, 1.2559814453125, 1.3004074096679688, 1.3448333740234375, 1.3892593383789062, 1.433685302734375, 1.4781112670898438, 1.5225372314453125, 1.5669631958007812, 1.61138916015625, 1.6558151245117188, 1.7002410888671875, 1.7446670532226562, 1.789093017578125, 1.8335189819335938, 1.8779449462890625, 1.9223709106445312, 1.966796875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 10.0, 21.0, 62.0, 289.0, 7023.0, 4185639.0, 942.0, 192.0, 71.0, 27.0, 11.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.890625, -17.995849609375, -15.10107421875, -12.206298828125, -9.3115234375, -6.416748046875, -3.52197265625, -0.627197265625, 2.267578125, 5.162353515625, 8.05712890625, 10.951904296875, 13.8466796875, 16.741455078125, 19.63623046875, 22.531005859375, 25.42578125, 28.320556640625, 31.21533203125, 34.110107421875, 37.0048828125, 39.899658203125, 42.79443359375, 45.689208984375, 48.583984375, 51.478759765625, 54.37353515625, 57.268310546875, 60.1630859375, 63.057861328125, 65.95263671875, 68.847412109375, 71.7421875, 74.636962890625, 77.53173828125, 80.426513671875, 83.3212890625, 86.216064453125, 89.11083984375, 92.005615234375, 94.900390625, 97.795166015625, 100.68994140625, 103.584716796875, 106.4794921875, 109.374267578125, 112.26904296875, 115.163818359375, 118.05859375, 120.953369140625, 123.84814453125, 126.742919921875, 129.6376953125, 132.532470703125, 135.42724609375, 138.322021484375, 141.216796875, 144.111572265625, 147.00634765625, 149.901123046875, 152.7958984375, 155.690673828125, 158.58544921875, 161.480224609375, 164.375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 8.0, 17.0, 65.0, 454.0, 3355.0, 157.0, 13.0, 7.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8740234375, -1.6173248291015625, -1.360626220703125, -1.1039276123046875, -0.84722900390625, -0.5905303955078125, -0.333831787109375, -0.0771331787109375, 0.1795654296875, 0.4362640380859375, 0.692962646484375, 0.9496612548828125, 1.20635986328125, 1.4630584716796875, 1.719757080078125, 1.9764556884765625, 2.233154296875, 2.4898529052734375, 2.746551513671875, 3.0032501220703125, 3.25994873046875, 3.5166473388671875, 3.773345947265625, 4.0300445556640625, 4.2867431640625, 4.5434417724609375, 4.800140380859375, 5.0568389892578125, 5.31353759765625, 5.5702362060546875, 5.826934814453125, 6.0836334228515625, 6.34033203125, 6.5970306396484375, 6.853729248046875, 7.1104278564453125, 7.36712646484375, 7.6238250732421875, 7.880523681640625, 8.137222290039062, 8.3939208984375, 8.650619506835938, 8.907318115234375, 9.164016723632812, 9.42071533203125, 9.677413940429688, 9.934112548828125, 10.190811157226562, 10.447509765625, 10.704208374023438, 10.960906982421875, 11.217605590820312, 11.47430419921875, 11.731002807617188, 11.987701416015625, 12.244400024414062, 12.5010986328125, 12.757797241210938, 13.014495849609375, 13.271194458007812, 13.52789306640625, 13.784591674804688, 14.041290283203125, 14.297988891601562, 14.5546875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 10.0, 110.0, 735.0, 124.0, 21.0, 9.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.00344848632812, -70.75090789794922, -68.49836730957031, -66.2458267211914, -63.993282318115234, -61.74074172973633, -59.488197326660156, -57.23565673828125, -54.983116149902344, -52.73057556152344, -50.47803497314453, -48.22549057006836, -45.97294998168945, -43.72040939331055, -41.467864990234375, -39.21532440185547, -36.96278381347656, -34.710243225097656, -32.45770263671875, -30.205158233642578, -27.952617645263672, -25.700077056884766, -23.447534561157227, -21.194992065429688, -18.94245147705078, -16.689910888671875, -14.437368392944336, -12.184826850891113, -9.93228530883789, -7.679743766784668, -5.427202224731445, -3.1746606826782227, -0.9221115112304688, 1.330430030822754, 3.5829715728759766, 5.835513114929199, 8.088054656982422, 10.340596199035645, 12.593137741088867, 14.84567928314209, 17.098220825195312, 19.35076141357422, 21.603303909301758, 23.855846405029297, 26.108386993408203, 28.36092758178711, 30.61347007751465, 32.86601257324219, 35.118553161621094, 37.37109375, 39.623634338378906, 41.87617874145508, 44.128719329833984, 46.38125991821289, 48.63380432128906, 50.88634490966797, 53.138885498046875, 55.39142608642578, 57.64396667480469, 59.89651107788086, 62.149051666259766, 64.40159606933594, 66.65413665771484, 68.90667724609375, 71.15921783447266]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 7.0, 4.0, 13.0, 15.0, 47.0, 51.0, 78.0, 89.0, 95.0, 112.0, 135.0, 112.0, 69.0, 56.0, 49.0, 27.0, 24.0, 6.0, 5.0, 2.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-26.984140396118164, -26.096216201782227, -25.208293914794922, -24.320369720458984, -23.432445526123047, -22.544523239135742, -21.656599044799805, -20.7686767578125, -19.880752563476562, -18.992828369140625, -18.10490608215332, -17.216981887817383, -16.329057693481445, -15.44113540649414, -14.553211212158203, -13.665287971496582, -12.777363777160645, -11.889440536499023, -11.001516342163086, -10.113593101501465, -9.225669860839844, -8.337745666503906, -7.449822425842285, -6.561899185180664, -5.673975467681885, -4.7860517501831055, -3.8981285095214844, -3.010204792022705, -2.122281312942505, -1.2343578338623047, -0.3464341163635254, 0.5414891242980957, 1.429412841796875, 2.317336320877075, 3.2052597999572754, 4.093183517456055, 4.981106758117676, 5.869030475616455, 6.756954193115234, 7.6448774337768555, 8.532800674438477, 9.420723915100098, 10.308648109436035, 11.196571350097656, 12.084494590759277, 12.972417831420898, 13.860342025756836, 14.748265266418457, 15.636189460754395, 16.524112701416016, 17.412036895751953, 18.29996109008789, 19.187883377075195, 20.075807571411133, 20.963729858398438, 21.851654052734375, 22.739578247070312, 23.62750244140625, 24.515424728393555, 25.403348922729492, 26.29127311706543, 27.179195404052734, 28.067119598388672, 28.95504379272461, 29.842966079711914]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 2.0, 6.0, 17.0, 14.0, 16.0, 27.0, 26.0, 28.0, 68.0, 89.0, 112.0, 197.0, 388.0, 627.0, 1526.0, 4525.0, 22407.0, 174594.0, 715180.0, 107114.0, 15467.0, 3455.0, 1252.0, 522.0, 308.0, 165.0, 131.0, 69.0, 56.0, 44.0, 38.0, 20.0, 14.0, 9.0, 14.0, 4.0, 10.0, 11.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.859375, -8.60906982421875, -8.3587646484375, -8.10845947265625, -7.858154296875, -7.60784912109375, -7.3575439453125, -7.10723876953125, -6.85693359375, -6.60662841796875, -6.3563232421875, -6.10601806640625, -5.855712890625, -5.60540771484375, -5.3551025390625, -5.10479736328125, -4.8544921875, -4.60418701171875, -4.3538818359375, -4.10357666015625, -3.853271484375, -3.60296630859375, -3.3526611328125, -3.10235595703125, -2.85205078125, -2.60174560546875, -2.3514404296875, -2.10113525390625, -1.850830078125, -1.60052490234375, -1.3502197265625, -1.09991455078125, -0.849609375, -0.59930419921875, -0.3489990234375, -0.09869384765625, 0.151611328125, 0.40191650390625, 0.6522216796875, 0.90252685546875, 1.15283203125, 1.40313720703125, 1.6534423828125, 1.90374755859375, 2.154052734375, 2.40435791015625, 2.6546630859375, 2.90496826171875, 3.1552734375, 3.40557861328125, 3.6558837890625, 3.90618896484375, 4.156494140625, 4.40679931640625, 4.6571044921875, 4.90740966796875, 5.15771484375, 5.40802001953125, 5.6583251953125, 5.90863037109375, 6.158935546875, 6.40924072265625, 6.6595458984375, 6.90985107421875, 7.16015625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 5.0, 7.0, 16.0, 20.0, 35.0, 54.0, 70.0, 75.0, 68.0, 109.0, 124.0, 91.0, 74.0, 71.0, 59.0, 49.0, 24.0, 19.0, 15.0, 6.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2734375, -1.210693359375, -1.14794921875, -1.085205078125, -1.0224609375, -0.959716796875, -0.89697265625, -0.834228515625, -0.771484375, -0.708740234375, -0.64599609375, -0.583251953125, -0.5205078125, -0.457763671875, -0.39501953125, -0.332275390625, -0.26953125, -0.206787109375, -0.14404296875, -0.081298828125, -0.0185546875, 0.044189453125, 0.10693359375, 0.169677734375, 0.232421875, 0.295166015625, 0.35791015625, 0.420654296875, 0.4833984375, 0.546142578125, 0.60888671875, 0.671630859375, 0.734375, 0.797119140625, 0.85986328125, 0.922607421875, 0.9853515625, 1.048095703125, 1.11083984375, 1.173583984375, 1.236328125, 1.299072265625, 1.36181640625, 1.424560546875, 1.4873046875, 1.550048828125, 1.61279296875, 1.675537109375, 1.73828125, 1.801025390625, 1.86376953125, 1.926513671875, 1.9892578125, 2.052001953125, 2.11474609375, 2.177490234375, 2.240234375, 2.302978515625, 2.36572265625, 2.428466796875, 2.4912109375, 2.553955078125, 2.61669921875, 2.679443359375, 2.7421875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 6.0, 1.0, 6.0, 11.0, 10.0, 11.0, 18.0, 19.0, 32.0, 60.0, 108.0, 157.0, 443.0, 1630.0, 8564.0, 92908.0, 827893.0, 104770.0, 9328.0, 1664.0, 494.0, 179.0, 71.0, 44.0, 29.0, 30.0, 19.0, 16.0, 7.0, 11.0, 5.0, 6.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-9.7578125, -9.48309326171875, -9.2083740234375, -8.93365478515625, -8.658935546875, -8.38421630859375, -8.1094970703125, -7.83477783203125, -7.56005859375, -7.28533935546875, -7.0106201171875, -6.73590087890625, -6.461181640625, -6.18646240234375, -5.9117431640625, -5.63702392578125, -5.3623046875, -5.08758544921875, -4.8128662109375, -4.53814697265625, -4.263427734375, -3.98870849609375, -3.7139892578125, -3.43927001953125, -3.16455078125, -2.88983154296875, -2.6151123046875, -2.34039306640625, -2.065673828125, -1.79095458984375, -1.5162353515625, -1.24151611328125, -0.966796875, -0.69207763671875, -0.4173583984375, -0.14263916015625, 0.132080078125, 0.40679931640625, 0.6815185546875, 0.95623779296875, 1.23095703125, 1.50567626953125, 1.7803955078125, 2.05511474609375, 2.329833984375, 2.60455322265625, 2.8792724609375, 3.15399169921875, 3.4287109375, 3.70343017578125, 3.9781494140625, 4.25286865234375, 4.527587890625, 4.80230712890625, 5.0770263671875, 5.35174560546875, 5.62646484375, 5.90118408203125, 6.1759033203125, 6.45062255859375, 6.725341796875, 7.00006103515625, 7.2747802734375, 7.54949951171875, 7.82421875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 6.0, 6.0, 5.0, 1.0, 13.0, 11.0, 16.0, 10.0, 18.0, 20.0, 45.0, 48.0, 43.0, 45.0, 47.0, 48.0, 63.0, 67.0, 55.0, 61.0, 59.0, 50.0, 46.0, 30.0, 37.0, 29.0, 20.0, 25.0, 16.0, 15.0, 18.0, 5.0, 3.0, 6.0, 5.0, 6.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-5.99609375, -5.829833984375, -5.66357421875, -5.497314453125, -5.3310546875, -5.164794921875, -4.99853515625, -4.832275390625, -4.666015625, -4.499755859375, -4.33349609375, -4.167236328125, -4.0009765625, -3.834716796875, -3.66845703125, -3.502197265625, -3.3359375, -3.169677734375, -3.00341796875, -2.837158203125, -2.6708984375, -2.504638671875, -2.33837890625, -2.172119140625, -2.005859375, -1.839599609375, -1.67333984375, -1.507080078125, -1.3408203125, -1.174560546875, -1.00830078125, -0.842041015625, -0.67578125, -0.509521484375, -0.34326171875, -0.177001953125, -0.0107421875, 0.155517578125, 0.32177734375, 0.488037109375, 0.654296875, 0.820556640625, 0.98681640625, 1.153076171875, 1.3193359375, 1.485595703125, 1.65185546875, 1.818115234375, 1.984375, 2.150634765625, 2.31689453125, 2.483154296875, 2.6494140625, 2.815673828125, 2.98193359375, 3.148193359375, 3.314453125, 3.480712890625, 3.64697265625, 3.813232421875, 3.9794921875, 4.145751953125, 4.31201171875, 4.478271484375, 4.64453125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 6.0, 3.0, 5.0, 4.0, 8.0, 11.0, 12.0, 24.0, 37.0, 55.0, 96.0, 126.0, 249.0, 476.0, 897.0, 1928.0, 4566.0, 12726.0, 45524.0, 206703.0, 508129.0, 201328.0, 44663.0, 12646.0, 4541.0, 1826.0, 875.0, 443.0, 235.0, 157.0, 93.0, 52.0, 34.0, 21.0, 16.0, 9.0, 10.0, 8.0, 4.0, 5.0, 3.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8857421875, -1.8310699462890625, -1.776397705078125, -1.7217254638671875, -1.66705322265625, -1.6123809814453125, -1.557708740234375, -1.5030364990234375, -1.4483642578125, -1.3936920166015625, -1.339019775390625, -1.2843475341796875, -1.22967529296875, -1.1750030517578125, -1.120330810546875, -1.0656585693359375, -1.010986328125, -0.9563140869140625, -0.901641845703125, -0.8469696044921875, -0.79229736328125, -0.7376251220703125, -0.682952880859375, -0.6282806396484375, -0.5736083984375, -0.5189361572265625, -0.464263916015625, -0.4095916748046875, -0.35491943359375, -0.3002471923828125, -0.245574951171875, -0.1909027099609375, -0.13623046875, -0.0815582275390625, -0.026885986328125, 0.0277862548828125, 0.08245849609375, 0.1371307373046875, 0.191802978515625, 0.2464752197265625, 0.3011474609375, 0.3558197021484375, 0.410491943359375, 0.4651641845703125, 0.51983642578125, 0.5745086669921875, 0.629180908203125, 0.6838531494140625, 0.738525390625, 0.7931976318359375, 0.847869873046875, 0.9025421142578125, 0.95721435546875, 1.0118865966796875, 1.066558837890625, 1.1212310791015625, 1.1759033203125, 1.2305755615234375, 1.285247802734375, 1.3399200439453125, 1.39459228515625, 1.4492645263671875, 1.503936767578125, 1.5586090087890625, 1.61328125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 10.0, 8.0, 8.0, 15.0, 17.0, 28.0, 39.0, 50.0, 79.0, 119.0, 133.0, 120.0, 109.0, 68.0, 59.0, 38.0, 31.0, 21.0, 20.0, 6.0, 7.0, 10.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00034117698669433594, -0.0003280453383922577, -0.00031491369009017944, -0.0003017820417881012, -0.00028865039348602295, -0.0002755187451839447, -0.00026238709688186646, -0.0002492554485797882, -0.00023612380027770996, -0.00022299215197563171, -0.00020986050367355347, -0.00019672885537147522, -0.00018359720706939697, -0.00017046555876731873, -0.00015733391046524048, -0.00014420226216316223, -0.00013107061386108398, -0.00011793896555900574, -0.00010480731725692749, -9.167566895484924e-05, -7.8544020652771e-05, -6.541237235069275e-05, -5.22807240486145e-05, -3.9149075746536255e-05, -2.6017427444458008e-05, -1.288577914237976e-05, 2.4586915969848633e-07, 1.3377517461776733e-05, 2.650916576385498e-05, 3.964081406593323e-05, 5.2772462368011475e-05, 6.590411067008972e-05, 7.903575897216797e-05, 9.216740727424622e-05, 0.00010529905557632446, 0.00011843070387840271, 0.00013156235218048096, 0.0001446940004825592, 0.00015782564878463745, 0.0001709572970867157, 0.00018408894538879395, 0.0001972205936908722, 0.00021035224199295044, 0.0002234838902950287, 0.00023661553859710693, 0.0002497471868991852, 0.00026287883520126343, 0.0002760104835033417, 0.0002891421318054199, 0.00030227378010749817, 0.0003154054284095764, 0.00032853707671165466, 0.0003416687250137329, 0.00035480037331581116, 0.0003679320216178894, 0.00038106366991996765, 0.0003941953182220459, 0.00040732696652412415, 0.0004204586148262024, 0.00043359026312828064, 0.0004467219114303589, 0.00045985355973243713, 0.0004729852080345154, 0.00048611685633659363, 0.0004992485046386719]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 4.0, 2.0, 2.0, 6.0, 4.0, 8.0, 8.0, 11.0, 17.0, 17.0, 26.0, 25.0, 51.0, 82.0, 128.0, 222.0, 368.0, 701.0, 1651.0, 4069.0, 11618.0, 40110.0, 163894.0, 482456.0, 253772.0, 62280.0, 17191.0, 5625.0, 2145.0, 973.0, 445.0, 264.0, 137.0, 68.0, 48.0, 42.0, 17.0, 18.0, 22.0, 10.0, 5.0, 7.0, 6.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4794921875, -1.4239959716796875, -1.368499755859375, -1.3130035400390625, -1.25750732421875, -1.2020111083984375, -1.146514892578125, -1.0910186767578125, -1.0355224609375, -0.9800262451171875, -0.924530029296875, -0.8690338134765625, -0.81353759765625, -0.7580413818359375, -0.702545166015625, -0.6470489501953125, -0.591552734375, -0.5360565185546875, -0.480560302734375, -0.4250640869140625, -0.36956787109375, -0.3140716552734375, -0.258575439453125, -0.2030792236328125, -0.1475830078125, -0.0920867919921875, -0.036590576171875, 0.0189056396484375, 0.07440185546875, 0.1298980712890625, 0.185394287109375, 0.2408905029296875, 0.29638671875, 0.3518829345703125, 0.407379150390625, 0.4628753662109375, 0.51837158203125, 0.5738677978515625, 0.629364013671875, 0.6848602294921875, 0.7403564453125, 0.7958526611328125, 0.851348876953125, 0.9068450927734375, 0.96234130859375, 1.0178375244140625, 1.073333740234375, 1.1288299560546875, 1.184326171875, 1.2398223876953125, 1.295318603515625, 1.3508148193359375, 1.40631103515625, 1.4618072509765625, 1.517303466796875, 1.5727996826171875, 1.6282958984375, 1.6837921142578125, 1.739288330078125, 1.7947845458984375, 1.85028076171875, 1.9057769775390625, 1.961273193359375, 2.0167694091796875, 2.072265625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 5.0, 12.0, 7.0, 11.0, 8.0, 9.0, 20.0, 24.0, 31.0, 28.0, 50.0, 43.0, 42.0, 50.0, 71.0, 58.0, 84.0, 67.0, 51.0, 47.0, 47.0, 36.0, 38.0, 27.0, 37.0, 17.0, 20.0, 11.0, 13.0, 8.0, 8.0, 5.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2939453125, -1.25146484375, -1.208984375, -1.16650390625, -1.1240234375, -1.08154296875, -1.0390625, -0.99658203125, -0.9541015625, -0.91162109375, -0.869140625, -0.82666015625, -0.7841796875, -0.74169921875, -0.69921875, -0.65673828125, -0.6142578125, -0.57177734375, -0.529296875, -0.48681640625, -0.4443359375, -0.40185546875, -0.359375, -0.31689453125, -0.2744140625, -0.23193359375, -0.189453125, -0.14697265625, -0.1044921875, -0.06201171875, -0.01953125, 0.02294921875, 0.0654296875, 0.10791015625, 0.150390625, 0.19287109375, 0.2353515625, 0.27783203125, 0.3203125, 0.36279296875, 0.4052734375, 0.44775390625, 0.490234375, 0.53271484375, 0.5751953125, 0.61767578125, 0.66015625, 0.70263671875, 0.7451171875, 0.78759765625, 0.830078125, 0.87255859375, 0.9150390625, 0.95751953125, 1.0, 1.04248046875, 1.0849609375, 1.12744140625, 1.169921875, 1.21240234375, 1.2548828125, 1.29736328125, 1.33984375, 1.38232421875, 1.4248046875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 12.0, 23.0, 27.0, 67.0, 160.0, 290.0, 233.0, 118.0, 44.0, 21.0, 8.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.26384353637695, -38.91786575317383, -37.5718879699707, -36.225914001464844, -34.87993621826172, -33.533958435058594, -32.18798065185547, -30.842002868652344, -29.49602699279785, -28.150049209594727, -26.804073333740234, -25.45809555053711, -24.112117767333984, -22.766141891479492, -21.420164108276367, -20.074188232421875, -18.72821044921875, -17.382232666015625, -16.036256790161133, -14.690279006958008, -13.3443021774292, -11.99832534790039, -10.652347564697266, -9.306370735168457, -7.960393905639648, -6.61441707611084, -5.268439769744873, -3.9224624633789062, -2.5764856338500977, -1.230508804321289, 0.11546897888183594, 1.4614458084106445, 2.8074188232421875, 4.153395652770996, 5.499372959136963, 6.84535026550293, 8.191327095031738, 9.537303924560547, 10.883281707763672, 12.22925853729248, 13.575235366821289, 14.921212196350098, 16.267189025878906, 17.61316680908203, 18.959144592285156, 20.30512046813965, 21.651098251342773, 22.997074127197266, 24.34305191040039, 25.689029693603516, 27.035005569458008, 28.380983352661133, 29.726959228515625, 31.07293701171875, 32.418914794921875, 33.764892578125, 35.110870361328125, 36.45684814453125, 37.802825927734375, 39.1488037109375, 40.49477767944336, 41.840755462646484, 43.18673324584961, 44.532711029052734, 45.878684997558594]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 4.0, 5.0, 7.0, 6.0, 17.0, 11.0, 10.0, 13.0, 22.0, 19.0, 29.0, 32.0, 31.0, 34.0, 40.0, 48.0, 59.0, 47.0, 38.0, 46.0, 41.0, 42.0, 58.0, 43.0, 40.0, 30.0, 29.0, 28.0, 24.0, 28.0, 19.0, 23.0, 24.0, 15.0, 9.0, 6.0, 6.0, 7.0, 3.0, 7.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-29.08823013305664, -28.28565216064453, -27.483074188232422, -26.680496215820312, -25.877920150756836, -25.075342178344727, -24.272764205932617, -23.470186233520508, -22.6676082611084, -21.86503028869629, -21.06245231628418, -20.259876251220703, -19.457298278808594, -18.654720306396484, -17.852142333984375, -17.049564361572266, -16.246986389160156, -15.444408416748047, -14.641831398010254, -13.839253425598145, -13.036675453186035, -12.234098434448242, -11.431520462036133, -10.628942489624023, -9.826366424560547, -9.023788452148438, -8.221211433410645, -7.418633460998535, -6.616055488586426, -5.813477993011475, -5.010900497436523, -4.208322525024414, -3.4057445526123047, -2.6031668186187744, -1.8005892038345337, -0.998011589050293, -0.1954338550567627, 0.6071438789367676, 1.4097213745117188, 2.212299346923828, 3.0148768424987793, 3.8174545764923096, 4.62003231048584, 5.422609806060791, 6.225187301635742, 7.027765274047852, 7.830342769622803, 8.63292121887207, 9.435498237609863, 10.238076210021973, 11.040653228759766, 11.843231201171875, 12.645809173583984, 13.448387145996094, 14.250964164733887, 15.053542137145996, 15.856119155883789, 16.6586971282959, 17.461275100708008, 18.263851165771484, 19.066429138183594, 19.869007110595703, 20.671585083007812, 21.474163055419922, 22.27674102783203]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 5.0, 5.0, 8.0, 8.0, 27.0, 56.0, 86.0, 170.0, 418.0, 1104.0, 3984.0, 28146.0, 3830764.0, 313114.0, 11711.0, 2659.0, 898.0, 475.0, 252.0, 123.0, 78.0, 49.0, 46.0, 23.0, 27.0, 13.0, 9.0, 6.0, 4.0, 3.0, 4.0, 4.0, 1.0, 4.0, 2.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.7109375, -7.2523193359375, -6.793701171875, -6.3350830078125, -5.87646484375, -5.4178466796875, -4.959228515625, -4.5006103515625, -4.0419921875, -3.5833740234375, -3.124755859375, -2.6661376953125, -2.20751953125, -1.7489013671875, -1.290283203125, -0.8316650390625, -0.373046875, 0.0855712890625, 0.544189453125, 1.0028076171875, 1.46142578125, 1.9200439453125, 2.378662109375, 2.8372802734375, 3.2958984375, 3.7545166015625, 4.213134765625, 4.6717529296875, 5.13037109375, 5.5889892578125, 6.047607421875, 6.5062255859375, 6.96484375, 7.4234619140625, 7.882080078125, 8.3406982421875, 8.79931640625, 9.2579345703125, 9.716552734375, 10.1751708984375, 10.6337890625, 11.0924072265625, 11.551025390625, 12.0096435546875, 12.46826171875, 12.9268798828125, 13.385498046875, 13.8441162109375, 14.302734375, 14.7613525390625, 15.219970703125, 15.6785888671875, 16.13720703125, 16.5958251953125, 17.054443359375, 17.5130615234375, 17.9716796875, 18.4302978515625, 18.888916015625, 19.3475341796875, 19.80615234375, 20.2647705078125, 20.723388671875, 21.1820068359375, 21.640625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 6.0, 8.0, 16.0, 19.0, 43.0, 54.0, 82.0, 100.0, 112.0, 113.0, 123.0, 97.0, 79.0, 58.0, 39.0, 24.0, 14.0, 5.0, 5.0, 0.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.353515625, -1.2762451171875, -1.198974609375, -1.1217041015625, -1.04443359375, -0.9671630859375, -0.889892578125, -0.8126220703125, -0.7353515625, -0.6580810546875, -0.580810546875, -0.5035400390625, -0.42626953125, -0.3489990234375, -0.271728515625, -0.1944580078125, -0.1171875, -0.0399169921875, 0.037353515625, 0.1146240234375, 0.19189453125, 0.2691650390625, 0.346435546875, 0.4237060546875, 0.5009765625, 0.5782470703125, 0.655517578125, 0.7327880859375, 0.81005859375, 0.8873291015625, 0.964599609375, 1.0418701171875, 1.119140625, 1.1964111328125, 1.273681640625, 1.3509521484375, 1.42822265625, 1.5054931640625, 1.582763671875, 1.6600341796875, 1.7373046875, 1.8145751953125, 1.891845703125, 1.9691162109375, 2.04638671875, 2.1236572265625, 2.200927734375, 2.2781982421875, 2.35546875, 2.4327392578125, 2.510009765625, 2.5872802734375, 2.66455078125, 2.7418212890625, 2.819091796875, 2.8963623046875, 2.9736328125, 3.0509033203125, 3.128173828125, 3.2054443359375, 3.28271484375, 3.3599853515625, 3.437255859375, 3.5145263671875, 3.591796875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 8.0, 17.0, 40.0, 65.0, 143.0, 273.0, 2660.0, 4189810.0, 915.0, 219.0, 86.0, 37.0, 14.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.625, -92.39111328125, -90.1572265625, -87.92333984375, -85.689453125, -83.45556640625, -81.2216796875, -78.98779296875, -76.75390625, -74.52001953125, -72.2861328125, -70.05224609375, -67.818359375, -65.58447265625, -63.3505859375, -61.11669921875, -58.8828125, -56.64892578125, -54.4150390625, -52.18115234375, -49.947265625, -47.71337890625, -45.4794921875, -43.24560546875, -41.01171875, -38.77783203125, -36.5439453125, -34.31005859375, -32.076171875, -29.84228515625, -27.6083984375, -25.37451171875, -23.140625, -20.90673828125, -18.6728515625, -16.43896484375, -14.205078125, -11.97119140625, -9.7373046875, -7.50341796875, -5.26953125, -3.03564453125, -0.8017578125, 1.43212890625, 3.666015625, 5.89990234375, 8.1337890625, 10.36767578125, 12.6015625, 14.83544921875, 17.0693359375, 19.30322265625, 21.537109375, 23.77099609375, 26.0048828125, 28.23876953125, 30.47265625, 32.70654296875, 34.9404296875, 37.17431640625, 39.408203125, 41.64208984375, 43.8759765625, 46.10986328125, 48.34375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 10.0, 34.0, 430.0, 3467.0, 126.0, 15.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.84375, -14.4844970703125, -14.125244140625, -13.7659912109375, -13.40673828125, -13.0474853515625, -12.688232421875, -12.3289794921875, -11.9697265625, -11.6104736328125, -11.251220703125, -10.8919677734375, -10.53271484375, -10.1734619140625, -9.814208984375, -9.4549560546875, -9.095703125, -8.7364501953125, -8.377197265625, -8.0179443359375, -7.65869140625, -7.2994384765625, -6.940185546875, -6.5809326171875, -6.2216796875, -5.8624267578125, -5.503173828125, -5.1439208984375, -4.78466796875, -4.4254150390625, -4.066162109375, -3.7069091796875, -3.34765625, -2.9884033203125, -2.629150390625, -2.2698974609375, -1.91064453125, -1.5513916015625, -1.192138671875, -0.8328857421875, -0.4736328125, -0.1143798828125, 0.244873046875, 0.6041259765625, 0.96337890625, 1.3226318359375, 1.681884765625, 2.0411376953125, 2.400390625, 2.7596435546875, 3.118896484375, 3.4781494140625, 3.83740234375, 4.1966552734375, 4.555908203125, 4.9151611328125, 5.2744140625, 5.6336669921875, 5.992919921875, 6.3521728515625, 6.71142578125, 7.0706787109375, 7.429931640625, 7.7891845703125, 8.1484375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 8.0, 516.0, 471.0, 16.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.27314758300781, -65.16852569580078, -62.063899993896484, -58.95927810668945, -55.854652404785156, -52.750030517578125, -49.645408630371094, -46.54078674316406, -43.436161041259766, -40.331539154052734, -37.22691345214844, -34.122291564941406, -31.017667770385742, -27.913043975830078, -24.808422088623047, -21.703798294067383, -18.59917449951172, -15.494550704956055, -12.389927864074707, -9.28530502319336, -6.180681228637695, -3.0760574340820312, 0.028564453125, 3.133188247680664, 6.237812042236328, 9.342435836791992, 12.44705867767334, 15.551681518554688, 18.65630531311035, 21.760929107666016, 24.865550994873047, 27.97017478942871, 31.074798583984375, 34.179420471191406, 37.2840461730957, 40.388668060302734, 43.49329376220703, 46.59791564941406, 49.702537536621094, 52.807159423828125, 55.91178512573242, 59.01640701293945, 62.12103271484375, 65.22565460205078, 68.33027648925781, 71.43490600585938, 74.53952026367188, 77.64414978027344, 80.74877166748047, 83.8533935546875, 86.95801544189453, 90.06263732910156, 93.16726684570312, 96.27188873291016, 99.37651062011719, 102.48113250732422, 105.58575439453125, 108.69037628173828, 111.79499816894531, 114.89962768554688, 118.0042495727539, 121.10887145996094, 124.21349334716797, 127.318115234375, 130.42274475097656]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 5.0, 4.0, 10.0, 27.0, 31.0, 44.0, 58.0, 94.0, 107.0, 104.0, 97.0, 101.0, 106.0, 61.0, 62.0, 38.0, 19.0, 14.0, 8.0, 4.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-11.749408721923828, -11.235383033752441, -10.721357345581055, -10.207331657409668, -9.693305969238281, -9.179280281066895, -8.665254592895508, -8.151227951049805, -7.637202739715576, -7.1231770515441895, -6.609151363372803, -6.095125198364258, -5.581099510192871, -5.067073822021484, -4.553048133850098, -4.039022445678711, -3.524996757507324, -3.0109710693359375, -2.496945381164551, -1.982919454574585, -1.4688937664031982, -0.9548680782318115, -0.4408421516418457, 0.07318353652954102, 0.5872092247009277, 1.1012349128723145, 1.6152607202529907, 2.129286527633667, 2.6433122158050537, 3.1573379039764404, 3.6713638305664062, 4.185389518737793, 4.69941520690918, 5.213440895080566, 5.727466583251953, 6.24149227142334, 6.755517959594727, 7.269543647766113, 7.783569812774658, 8.297595977783203, 8.811620712280273, 9.32564640045166, 9.839672088623047, 10.353697776794434, 10.86772346496582, 11.381749153137207, 11.895774841308594, 12.409801483154297, 12.923827171325684, 13.43785285949707, 13.951878547668457, 14.465904235839844, 14.97992992401123, 15.493955612182617, 16.00798225402832, 16.52200698852539, 17.036033630371094, 17.550060272216797, 18.064085006713867, 18.57811164855957, 19.09213638305664, 19.606163024902344, 20.120187759399414, 20.634214401245117, 21.148239135742188]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 8.0, 3.0, 5.0, 9.0, 9.0, 17.0, 20.0, 17.0, 31.0, 46.0, 58.0, 92.0, 128.0, 217.0, 325.0, 552.0, 1108.0, 2494.0, 6804.0, 23769.0, 107021.0, 509476.0, 313602.0, 59767.0, 14573.0, 4510.0, 1798.0, 844.0, 431.0, 254.0, 156.0, 117.0, 85.0, 53.0, 36.0, 30.0, 23.0, 19.0, 16.0, 14.0, 7.0, 4.0, 3.0, 2.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.98046875, -5.7982177734375, -5.615966796875, -5.4337158203125, -5.25146484375, -5.0692138671875, -4.886962890625, -4.7047119140625, -4.5224609375, -4.3402099609375, -4.157958984375, -3.9757080078125, -3.79345703125, -3.6112060546875, -3.428955078125, -3.2467041015625, -3.064453125, -2.8822021484375, -2.699951171875, -2.5177001953125, -2.33544921875, -2.1531982421875, -1.970947265625, -1.7886962890625, -1.6064453125, -1.4241943359375, -1.241943359375, -1.0596923828125, -0.87744140625, -0.6951904296875, -0.512939453125, -0.3306884765625, -0.1484375, 0.0338134765625, 0.216064453125, 0.3983154296875, 0.58056640625, 0.7628173828125, 0.945068359375, 1.1273193359375, 1.3095703125, 1.4918212890625, 1.674072265625, 1.8563232421875, 2.03857421875, 2.2208251953125, 2.403076171875, 2.5853271484375, 2.767578125, 2.9498291015625, 3.132080078125, 3.3143310546875, 3.49658203125, 3.6788330078125, 3.861083984375, 4.0433349609375, 4.2255859375, 4.4078369140625, 4.590087890625, 4.7723388671875, 4.95458984375, 5.1368408203125, 5.319091796875, 5.5013427734375, 5.68359375]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 5.0, 6.0, 7.0, 19.0, 14.0, 32.0, 38.0, 41.0, 56.0, 76.0, 70.0, 94.0, 91.0, 77.0, 79.0, 60.0, 64.0, 50.0, 45.0, 22.0, 19.0, 13.0, 7.0, 5.0, 4.0, 5.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.646484375, -1.588775634765625, -1.53106689453125, -1.473358154296875, -1.4156494140625, -1.357940673828125, -1.30023193359375, -1.242523193359375, -1.184814453125, -1.127105712890625, -1.06939697265625, -1.011688232421875, -0.9539794921875, -0.896270751953125, -0.83856201171875, -0.780853271484375, -0.72314453125, -0.665435791015625, -0.60772705078125, -0.550018310546875, -0.4923095703125, -0.434600830078125, -0.37689208984375, -0.319183349609375, -0.261474609375, -0.203765869140625, -0.14605712890625, -0.088348388671875, -0.0306396484375, 0.027069091796875, 0.08477783203125, 0.142486572265625, 0.2001953125, 0.257904052734375, 0.31561279296875, 0.373321533203125, 0.4310302734375, 0.488739013671875, 0.54644775390625, 0.604156494140625, 0.661865234375, 0.719573974609375, 0.77728271484375, 0.834991455078125, 0.8927001953125, 0.950408935546875, 1.00811767578125, 1.065826416015625, 1.12353515625, 1.181243896484375, 1.23895263671875, 1.296661376953125, 1.3543701171875, 1.412078857421875, 1.46978759765625, 1.527496337890625, 1.585205078125, 1.642913818359375, 1.70062255859375, 1.758331298828125, 1.8160400390625, 1.873748779296875, 1.93145751953125, 1.989166259765625, 2.046875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 2.0, 7.0, 8.0, 8.0, 12.0, 16.0, 23.0, 38.0, 57.0, 86.0, 214.0, 446.0, 1178.0, 4499.0, 26593.0, 386221.0, 582293.0, 38437.0, 5958.0, 1434.0, 476.0, 243.0, 123.0, 56.0, 38.0, 21.0, 14.0, 10.0, 15.0, 7.0, 6.0, 6.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.45703125, -6.17730712890625, -5.8975830078125, -5.61785888671875, -5.338134765625, -5.05841064453125, -4.7786865234375, -4.49896240234375, -4.21923828125, -3.93951416015625, -3.6597900390625, -3.38006591796875, -3.100341796875, -2.82061767578125, -2.5408935546875, -2.26116943359375, -1.9814453125, -1.70172119140625, -1.4219970703125, -1.14227294921875, -0.862548828125, -0.58282470703125, -0.3031005859375, -0.02337646484375, 0.25634765625, 0.53607177734375, 0.8157958984375, 1.09552001953125, 1.375244140625, 1.65496826171875, 1.9346923828125, 2.21441650390625, 2.494140625, 2.77386474609375, 3.0535888671875, 3.33331298828125, 3.613037109375, 3.89276123046875, 4.1724853515625, 4.45220947265625, 4.73193359375, 5.01165771484375, 5.2913818359375, 5.57110595703125, 5.850830078125, 6.13055419921875, 6.4102783203125, 6.69000244140625, 6.9697265625, 7.24945068359375, 7.5291748046875, 7.80889892578125, 8.088623046875, 8.36834716796875, 8.6480712890625, 8.92779541015625, 9.20751953125, 9.48724365234375, 9.7669677734375, 10.04669189453125, 10.326416015625, 10.60614013671875, 10.8858642578125, 11.16558837890625, 11.4453125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 1.0, 5.0, 3.0, 3.0, 6.0, 1.0, 13.0, 7.0, 14.0, 23.0, 23.0, 31.0, 37.0, 37.0, 54.0, 54.0, 66.0, 68.0, 77.0, 72.0, 64.0, 65.0, 59.0, 47.0, 44.0, 32.0, 24.0, 12.0, 13.0, 12.0, 16.0, 6.0, 5.0, 7.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.890625, -4.6749267578125, -4.459228515625, -4.2435302734375, -4.02783203125, -3.8121337890625, -3.596435546875, -3.3807373046875, -3.1650390625, -2.9493408203125, -2.733642578125, -2.5179443359375, -2.30224609375, -2.0865478515625, -1.870849609375, -1.6551513671875, -1.439453125, -1.2237548828125, -1.008056640625, -0.7923583984375, -0.57666015625, -0.3609619140625, -0.145263671875, 0.0704345703125, 0.2861328125, 0.5018310546875, 0.717529296875, 0.9332275390625, 1.14892578125, 1.3646240234375, 1.580322265625, 1.7960205078125, 2.01171875, 2.2274169921875, 2.443115234375, 2.6588134765625, 2.87451171875, 3.0902099609375, 3.305908203125, 3.5216064453125, 3.7373046875, 3.9530029296875, 4.168701171875, 4.3843994140625, 4.60009765625, 4.8157958984375, 5.031494140625, 5.2471923828125, 5.462890625, 5.6785888671875, 5.894287109375, 6.1099853515625, 6.32568359375, 6.5413818359375, 6.757080078125, 6.9727783203125, 7.1884765625, 7.4041748046875, 7.619873046875, 7.8355712890625, 8.05126953125, 8.2669677734375, 8.482666015625, 8.6983642578125, 8.9140625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 1.0, 2.0, 3.0, 6.0, 3.0, 13.0, 11.0, 19.0, 15.0, 33.0, 48.0, 85.0, 122.0, 299.0, 651.0, 1725.0, 6770.0, 52796.0, 664322.0, 294190.0, 21487.0, 3797.0, 1170.0, 477.0, 216.0, 118.0, 66.0, 44.0, 16.0, 16.0, 7.0, 2.0, 9.0, 3.0, 5.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.935546875, -2.829986572265625, -2.72442626953125, -2.618865966796875, -2.5133056640625, -2.407745361328125, -2.30218505859375, -2.196624755859375, -2.091064453125, -1.985504150390625, -1.87994384765625, -1.774383544921875, -1.6688232421875, -1.563262939453125, -1.45770263671875, -1.352142333984375, -1.24658203125, -1.141021728515625, -1.03546142578125, -0.929901123046875, -0.8243408203125, -0.718780517578125, -0.61322021484375, -0.507659912109375, -0.402099609375, -0.296539306640625, -0.19097900390625, -0.085418701171875, 0.0201416015625, 0.125701904296875, 0.23126220703125, 0.336822509765625, 0.4423828125, 0.547943115234375, 0.65350341796875, 0.759063720703125, 0.8646240234375, 0.970184326171875, 1.07574462890625, 1.181304931640625, 1.286865234375, 1.392425537109375, 1.49798583984375, 1.603546142578125, 1.7091064453125, 1.814666748046875, 1.92022705078125, 2.025787353515625, 2.13134765625, 2.236907958984375, 2.34246826171875, 2.448028564453125, 2.5535888671875, 2.659149169921875, 2.76470947265625, 2.870269775390625, 2.975830078125, 3.081390380859375, 3.18695068359375, 3.292510986328125, 3.3980712890625, 3.503631591796875, 3.60919189453125, 3.714752197265625, 3.8203125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 5.0, 5.0, 1.0, 3.0, 6.0, 8.0, 7.0, 15.0, 16.0, 26.0, 28.0, 43.0, 53.0, 51.0, 83.0, 96.0, 112.0, 82.0, 67.0, 52.0, 47.0, 46.0, 32.0, 31.0, 15.0, 8.0, 14.0, 10.0, 10.0, 3.0, 4.0, 4.0, 10.0, 6.0, 2.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00027871131896972656, -0.00027015432715415955, -0.00026159733533859253, -0.0002530403435230255, -0.0002444833517074585, -0.00023592635989189148, -0.00022736936807632446, -0.00021881237626075745, -0.00021025538444519043, -0.0002016983926296234, -0.0001931414008140564, -0.00018458440899848938, -0.00017602741718292236, -0.00016747042536735535, -0.00015891343355178833, -0.0001503564417362213, -0.0001417994499206543, -0.00013324245810508728, -0.00012468546628952026, -0.00011612847447395325, -0.00010757148265838623, -9.901449084281921e-05, -9.04574990272522e-05, -8.190050721168518e-05, -7.334351539611816e-05, -6.478652358055115e-05, -5.622953176498413e-05, -4.7672539949417114e-05, -3.91155481338501e-05, -3.055855631828308e-05, -2.2001564502716064e-05, -1.3444572687149048e-05, -4.887580871582031e-06, 3.6694109439849854e-06, 1.2226402759552002e-05, 2.078339457511902e-05, 2.9340386390686035e-05, 3.789737820625305e-05, 4.645437002182007e-05, 5.5011361837387085e-05, 6.35683536529541e-05, 7.212534546852112e-05, 8.068233728408813e-05, 8.923932909965515e-05, 9.779632091522217e-05, 0.00010635331273078918, 0.0001149103045463562, 0.00012346729636192322, 0.00013202428817749023, 0.00014058127999305725, 0.00014913827180862427, 0.00015769526362419128, 0.0001662522554397583, 0.00017480924725532532, 0.00018336623907089233, 0.00019192323088645935, 0.00020048022270202637, 0.00020903721451759338, 0.0002175942063331604, 0.00022615119814872742, 0.00023470818996429443, 0.00024326518177986145, 0.00025182217359542847, 0.0002603791654109955, 0.0002689361572265625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 4.0, 0.0, 9.0, 6.0, 7.0, 9.0, 18.0, 22.0, 37.0, 57.0, 112.0, 224.0, 469.0, 1154.0, 3191.0, 12462.0, 93765.0, 692161.0, 214477.0, 22596.0, 4897.0, 1545.0, 668.0, 298.0, 162.0, 80.0, 40.0, 25.0, 23.0, 5.0, 7.0, 8.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.87109375, -2.774322509765625, -2.67755126953125, -2.580780029296875, -2.4840087890625, -2.387237548828125, -2.29046630859375, -2.193695068359375, -2.096923828125, -2.000152587890625, -1.90338134765625, -1.806610107421875, -1.7098388671875, -1.613067626953125, -1.51629638671875, -1.419525146484375, -1.32275390625, -1.225982666015625, -1.12921142578125, -1.032440185546875, -0.9356689453125, -0.838897705078125, -0.74212646484375, -0.645355224609375, -0.548583984375, -0.451812744140625, -0.35504150390625, -0.258270263671875, -0.1614990234375, -0.064727783203125, 0.03204345703125, 0.128814697265625, 0.2255859375, 0.322357177734375, 0.41912841796875, 0.515899658203125, 0.6126708984375, 0.709442138671875, 0.80621337890625, 0.902984619140625, 0.999755859375, 1.096527099609375, 1.19329833984375, 1.290069580078125, 1.3868408203125, 1.483612060546875, 1.58038330078125, 1.677154541015625, 1.77392578125, 1.870697021484375, 1.96746826171875, 2.064239501953125, 2.1610107421875, 2.257781982421875, 2.35455322265625, 2.451324462890625, 2.548095703125, 2.644866943359375, 2.74163818359375, 2.838409423828125, 2.9351806640625, 3.031951904296875, 3.12872314453125, 3.225494384765625, 3.322265625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 5.0, 3.0, 6.0, 7.0, 11.0, 14.0, 20.0, 31.0, 36.0, 65.0, 81.0, 125.0, 119.0, 110.0, 93.0, 78.0, 52.0, 43.0, 33.0, 19.0, 9.0, 10.0, 12.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.291015625, -2.2142333984375, -2.137451171875, -2.0606689453125, -1.98388671875, -1.9071044921875, -1.830322265625, -1.7535400390625, -1.6767578125, -1.5999755859375, -1.523193359375, -1.4464111328125, -1.36962890625, -1.2928466796875, -1.216064453125, -1.1392822265625, -1.0625, -0.9857177734375, -0.908935546875, -0.8321533203125, -0.75537109375, -0.6785888671875, -0.601806640625, -0.5250244140625, -0.4482421875, -0.3714599609375, -0.294677734375, -0.2178955078125, -0.14111328125, -0.0643310546875, 0.012451171875, 0.0892333984375, 0.166015625, 0.2427978515625, 0.319580078125, 0.3963623046875, 0.47314453125, 0.5499267578125, 0.626708984375, 0.7034912109375, 0.7802734375, 0.8570556640625, 0.933837890625, 1.0106201171875, 1.08740234375, 1.1641845703125, 1.240966796875, 1.3177490234375, 1.39453125, 1.4713134765625, 1.548095703125, 1.6248779296875, 1.70166015625, 1.7784423828125, 1.855224609375, 1.9320068359375, 2.0087890625, 2.0855712890625, 2.162353515625, 2.2391357421875, 2.31591796875, 2.3927001953125, 2.469482421875, 2.5462646484375, 2.623046875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 7.0, 7.0, 15.0, 39.0, 111.0, 308.0, 307.0, 123.0, 57.0, 13.0, 7.0, 6.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-70.99281311035156, -69.01544952392578, -67.03807830810547, -65.06071472167969, -63.083351135253906, -61.10598373413086, -59.12861633300781, -57.15125274658203, -55.17388916015625, -53.1965217590332, -51.21915817260742, -49.241790771484375, -47.264427185058594, -45.28705978393555, -43.3096923828125, -41.33232879638672, -39.35496139526367, -37.377593994140625, -35.400230407714844, -33.4228630065918, -31.445499420166016, -29.46813201904297, -27.490766525268555, -25.51340103149414, -23.536035537719727, -21.558670043945312, -19.5813045501709, -17.603939056396484, -15.626572608947754, -13.64920711517334, -11.67184066772461, -9.694475173950195, -7.717113494873047, -5.739748001098633, -3.7623820304870605, -1.7850160598754883, 0.19234943389892578, 2.16971492767334, 4.14708137512207, 6.124446868896484, 8.101812362670898, 10.079177856445312, 12.056543350219727, 14.033909797668457, 16.011276245117188, 17.98863983154297, 19.966007232666016, 21.94337272644043, 23.920738220214844, 25.898103713989258, 27.875469207763672, 29.85283660888672, 31.8302001953125, 33.80756759643555, 35.784934997558594, 37.762298583984375, 39.739662170410156, 41.7170295715332, 43.694393157958984, 45.67176055908203, 47.64912414550781, 49.62649154663086, 51.603858947753906, 53.58122253417969, 55.558589935302734]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 6.0, 8.0, 10.0, 11.0, 21.0, 15.0, 25.0, 25.0, 31.0, 36.0, 53.0, 54.0, 60.0, 62.0, 72.0, 69.0, 56.0, 69.0, 61.0, 44.0, 40.0, 36.0, 34.0, 27.0, 16.0, 14.0, 16.0, 11.0, 7.0, 2.0, 5.0, 5.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-44.55316925048828, -43.291900634765625, -42.030635833740234, -40.76936721801758, -39.50809860229492, -38.24683380126953, -36.985565185546875, -35.72429656982422, -34.46302795410156, -33.201759338378906, -31.940492630004883, -30.67922592163086, -29.417957305908203, -28.15669059753418, -26.895423889160156, -25.6341552734375, -24.37289047241211, -23.111623764038086, -21.85035514831543, -20.589088439941406, -19.32781982421875, -18.066553115844727, -16.805286407470703, -15.544018745422363, -14.282751083374023, -13.021483421325684, -11.760215759277344, -10.49894905090332, -9.23768138885498, -7.976413726806641, -6.715146541595459, -5.453879356384277, -4.1926116943359375, -2.9313442707061768, -1.670076847076416, -0.4088094234466553, 0.8524580001831055, 2.1137256622314453, 3.374992847442627, 4.636260032653809, 5.897527694702148, 7.158795356750488, 8.420063018798828, 9.681329727172852, 10.942597389221191, 12.203865051269531, 13.465131759643555, 14.726399421691895, 15.987667083740234, 17.248933792114258, 18.510202407836914, 19.771469116210938, 21.032737731933594, 22.294004440307617, 23.55527114868164, 24.816539764404297, 26.07780647277832, 27.339073181152344, 28.600341796875, 29.861608505249023, 31.122875213623047, 32.3841438293457, 33.64541244506836, 34.90667724609375, 36.167945861816406]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 7.0, 1.0, 8.0, 10.0, 23.0, 28.0, 49.0, 83.0, 154.0, 254.0, 510.0, 1096.0, 2936.0, 10050.0, 57775.0, 3494350.0, 583693.0, 31355.0, 7114.0, 2436.0, 1046.0, 484.0, 305.0, 165.0, 99.0, 82.0, 56.0, 19.0, 25.0, 24.0, 22.0, 8.0, 9.0, 6.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.2734375, -7.926513671875, -7.57958984375, -7.232666015625, -6.8857421875, -6.538818359375, -6.19189453125, -5.844970703125, -5.498046875, -5.151123046875, -4.80419921875, -4.457275390625, -4.1103515625, -3.763427734375, -3.41650390625, -3.069580078125, -2.72265625, -2.375732421875, -2.02880859375, -1.681884765625, -1.3349609375, -0.988037109375, -0.64111328125, -0.294189453125, 0.052734375, 0.399658203125, 0.74658203125, 1.093505859375, 1.4404296875, 1.787353515625, 2.13427734375, 2.481201171875, 2.828125, 3.175048828125, 3.52197265625, 3.868896484375, 4.2158203125, 4.562744140625, 4.90966796875, 5.256591796875, 5.603515625, 5.950439453125, 6.29736328125, 6.644287109375, 6.9912109375, 7.338134765625, 7.68505859375, 8.031982421875, 8.37890625, 8.725830078125, 9.07275390625, 9.419677734375, 9.7666015625, 10.113525390625, 10.46044921875, 10.807373046875, 11.154296875, 11.501220703125, 11.84814453125, 12.195068359375, 12.5419921875, 12.888916015625, 13.23583984375, 13.582763671875, 13.9296875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 1.0, 10.0, 10.0, 17.0, 34.0, 24.0, 33.0, 49.0, 70.0, 75.0, 78.0, 80.0, 88.0, 71.0, 84.0, 58.0, 51.0, 50.0, 32.0, 28.0, 20.0, 14.0, 8.0, 10.0, 7.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.7607421875, -1.7005767822265625, -1.640411376953125, -1.5802459716796875, -1.52008056640625, -1.4599151611328125, -1.399749755859375, -1.3395843505859375, -1.2794189453125, -1.2192535400390625, -1.159088134765625, -1.0989227294921875, -1.03875732421875, -0.9785919189453125, -0.918426513671875, -0.8582611083984375, -0.798095703125, -0.7379302978515625, -0.677764892578125, -0.6175994873046875, -0.55743408203125, -0.4972686767578125, -0.437103271484375, -0.3769378662109375, -0.3167724609375, -0.2566070556640625, -0.196441650390625, -0.1362762451171875, -0.07611083984375, -0.0159454345703125, 0.044219970703125, 0.1043853759765625, 0.16455078125, 0.2247161865234375, 0.284881591796875, 0.3450469970703125, 0.40521240234375, 0.4653778076171875, 0.525543212890625, 0.5857086181640625, 0.6458740234375, 0.7060394287109375, 0.766204833984375, 0.8263702392578125, 0.88653564453125, 0.9467010498046875, 1.006866455078125, 1.0670318603515625, 1.127197265625, 1.1873626708984375, 1.247528076171875, 1.3076934814453125, 1.36785888671875, 1.4280242919921875, 1.488189697265625, 1.5483551025390625, 1.6085205078125, 1.6686859130859375, 1.728851318359375, 1.7890167236328125, 1.84918212890625, 1.9093475341796875, 1.969512939453125, 2.0296783447265625, 2.08984375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 6.0, 5.0, 6.0, 16.0, 28.0, 40.0, 49.0, 62.0, 118.0, 196.0, 396.0, 947.0, 2645.0, 10187.0, 229105.0, 3916403.0, 26730.0, 4670.0, 1456.0, 537.0, 254.0, 145.0, 89.0, 70.0, 36.0, 26.0, 20.0, 19.0, 8.0, 7.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.0390625, -14.5416259765625, -14.044189453125, -13.5467529296875, -13.04931640625, -12.5518798828125, -12.054443359375, -11.5570068359375, -11.0595703125, -10.5621337890625, -10.064697265625, -9.5672607421875, -9.06982421875, -8.5723876953125, -8.074951171875, -7.5775146484375, -7.080078125, -6.5826416015625, -6.085205078125, -5.5877685546875, -5.09033203125, -4.5928955078125, -4.095458984375, -3.5980224609375, -3.1005859375, -2.6031494140625, -2.105712890625, -1.6082763671875, -1.11083984375, -0.6134033203125, -0.115966796875, 0.3814697265625, 0.87890625, 1.3763427734375, 1.873779296875, 2.3712158203125, 2.86865234375, 3.3660888671875, 3.863525390625, 4.3609619140625, 4.8583984375, 5.3558349609375, 5.853271484375, 6.3507080078125, 6.84814453125, 7.3455810546875, 7.843017578125, 8.3404541015625, 8.837890625, 9.3353271484375, 9.832763671875, 10.3302001953125, 10.82763671875, 11.3250732421875, 11.822509765625, 12.3199462890625, 12.8173828125, 13.3148193359375, 13.812255859375, 14.3096923828125, 14.80712890625, 15.3045654296875, 15.802001953125, 16.2994384765625, 16.796875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 13.0, 16.0, 46.0, 97.0, 450.0, 2773.0, 510.0, 86.0, 41.0, 17.0, 7.0, 3.0, 7.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3125, -8.049072265625, -7.78564453125, -7.522216796875, -7.2587890625, -6.995361328125, -6.73193359375, -6.468505859375, -6.205078125, -5.941650390625, -5.67822265625, -5.414794921875, -5.1513671875, -4.887939453125, -4.62451171875, -4.361083984375, -4.09765625, -3.834228515625, -3.57080078125, -3.307373046875, -3.0439453125, -2.780517578125, -2.51708984375, -2.253662109375, -1.990234375, -1.726806640625, -1.46337890625, -1.199951171875, -0.9365234375, -0.673095703125, -0.40966796875, -0.146240234375, 0.1171875, 0.380615234375, 0.64404296875, 0.907470703125, 1.1708984375, 1.434326171875, 1.69775390625, 1.961181640625, 2.224609375, 2.488037109375, 2.75146484375, 3.014892578125, 3.2783203125, 3.541748046875, 3.80517578125, 4.068603515625, 4.33203125, 4.595458984375, 4.85888671875, 5.122314453125, 5.3857421875, 5.649169921875, 5.91259765625, 6.176025390625, 6.439453125, 6.702880859375, 6.96630859375, 7.229736328125, 7.4931640625, 7.756591796875, 8.02001953125, 8.283447265625, 8.546875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 11.0, 39.0, 78.0, 211.0, 319.0, 189.0, 102.0, 33.0, 8.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.20782470703125, -22.139741897583008, -21.071659088134766, -20.00357437133789, -18.93549156188965, -17.867408752441406, -16.79932403564453, -15.731241226196289, -14.663158416748047, -13.595075607299805, -12.526991844177246, -11.458908081054688, -10.390825271606445, -9.322742462158203, -8.254658699035645, -7.186575412750244, -6.118492126464844, -5.050408840179443, -3.982325553894043, -2.9142422676086426, -1.8461589813232422, -0.7780756950378418, 0.2900075912475586, 1.358090877532959, 2.4261741638183594, 3.4942574501037598, 4.56234073638916, 5.6304240226745605, 6.698507308959961, 7.766590595245361, 8.834673881530762, 9.90275764465332, 10.970840454101562, 12.038923263549805, 13.107007026672363, 14.175090789794922, 15.243173599243164, 16.311256408691406, 17.37934112548828, 18.447423934936523, 19.515506744384766, 20.583589553833008, 21.65167236328125, 22.719757080078125, 23.787839889526367, 24.85592269897461, 25.924007415771484, 26.992090225219727, 28.06017303466797, 29.12825584411621, 30.196338653564453, 31.264423370361328, 32.33250427246094, 33.40058898925781, 34.46867370605469, 35.5367546081543, 36.60483932495117, 37.67292404174805, 38.741004943847656, 39.80908966064453, 40.877174377441406, 41.945255279541016, 43.01333999633789, 44.0814208984375, 45.149505615234375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 2.0, 7.0, 14.0, 25.0, 19.0, 20.0, 29.0, 38.0, 39.0, 35.0, 55.0, 58.0, 72.0, 80.0, 66.0, 63.0, 72.0, 58.0, 54.0, 34.0, 29.0, 28.0, 32.0, 17.0, 18.0, 10.0, 9.0, 8.0, 8.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-19.771625518798828, -19.298376083374023, -18.82512664794922, -18.35187530517578, -17.878625869750977, -17.405376434326172, -16.932126998901367, -16.458877563476562, -15.985628128051758, -15.512378692626953, -15.039128303527832, -14.565878868103027, -14.092629432678223, -13.619379043579102, -13.146129608154297, -12.672880172729492, -12.199629783630371, -11.726380348205566, -11.253129959106445, -10.77988052368164, -10.306631088256836, -9.833381652832031, -9.36013126373291, -8.886881828308105, -8.413631439208984, -7.9403815269470215, -7.467132091522217, -6.993882179260254, -6.520632743835449, -6.047382831573486, -5.574132919311523, -5.100883483886719, -4.627634048461914, -4.154384136199951, -3.6811347007751465, -3.2078847885131836, -2.7346351146698, -2.261385440826416, -1.7881355285644531, -1.3148858547210693, -0.8416361808776855, -0.368386447429657, 0.10486328601837158, 0.5781130790710449, 1.0513627529144287, 1.5246124267578125, 1.9978623390197754, 2.471112012863159, 2.944361686706543, 3.4176113605499268, 3.8908610343933105, 4.364110946655273, 4.837360382080078, 5.310610294342041, 5.783860206604004, 6.257109642028809, 6.7303595542907715, 7.203609466552734, 7.676858901977539, 8.150108337402344, 8.623358726501465, 9.09660816192627, 9.56985855102539, 10.043107986450195, 10.516357421875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 3.0, 4.0, 4.0, 7.0, 11.0, 15.0, 15.0, 38.0, 54.0, 112.0, 152.0, 268.0, 543.0, 1215.0, 3142.0, 12384.0, 82274.0, 629027.0, 277814.0, 31618.0, 6111.0, 1997.0, 814.0, 403.0, 209.0, 128.0, 77.0, 44.0, 23.0, 26.0, 11.0, 4.0, 5.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.171875, -7.8973388671875, -7.622802734375, -7.3482666015625, -7.07373046875, -6.7991943359375, -6.524658203125, -6.2501220703125, -5.9755859375, -5.7010498046875, -5.426513671875, -5.1519775390625, -4.87744140625, -4.6029052734375, -4.328369140625, -4.0538330078125, -3.779296875, -3.5047607421875, -3.230224609375, -2.9556884765625, -2.68115234375, -2.4066162109375, -2.132080078125, -1.8575439453125, -1.5830078125, -1.3084716796875, -1.033935546875, -0.7593994140625, -0.48486328125, -0.2103271484375, 0.064208984375, 0.3387451171875, 0.61328125, 0.8878173828125, 1.162353515625, 1.4368896484375, 1.71142578125, 1.9859619140625, 2.260498046875, 2.5350341796875, 2.8095703125, 3.0841064453125, 3.358642578125, 3.6331787109375, 3.90771484375, 4.1822509765625, 4.456787109375, 4.7313232421875, 5.005859375, 5.2803955078125, 5.554931640625, 5.8294677734375, 6.10400390625, 6.3785400390625, 6.653076171875, 6.9276123046875, 7.2021484375, 7.4766845703125, 7.751220703125, 8.0257568359375, 8.30029296875, 8.5748291015625, 8.849365234375, 9.1239013671875, 9.3984375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 3.0, 2.0, 14.0, 23.0, 26.0, 48.0, 73.0, 65.0, 73.0, 107.0, 106.0, 101.0, 85.0, 81.0, 63.0, 45.0, 37.0, 15.0, 11.0, 10.0, 10.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.482421875, -2.41070556640625, -2.3389892578125, -2.26727294921875, -2.195556640625, -2.12384033203125, -2.0521240234375, -1.98040771484375, -1.90869140625, -1.83697509765625, -1.7652587890625, -1.69354248046875, -1.621826171875, -1.55010986328125, -1.4783935546875, -1.40667724609375, -1.3349609375, -1.26324462890625, -1.1915283203125, -1.11981201171875, -1.048095703125, -0.97637939453125, -0.9046630859375, -0.83294677734375, -0.76123046875, -0.68951416015625, -0.6177978515625, -0.54608154296875, -0.474365234375, -0.40264892578125, -0.3309326171875, -0.25921630859375, -0.1875, -0.11578369140625, -0.0440673828125, 0.02764892578125, 0.099365234375, 0.17108154296875, 0.2427978515625, 0.31451416015625, 0.38623046875, 0.45794677734375, 0.5296630859375, 0.60137939453125, 0.673095703125, 0.74481201171875, 0.8165283203125, 0.88824462890625, 0.9599609375, 1.03167724609375, 1.1033935546875, 1.17510986328125, 1.246826171875, 1.31854248046875, 1.3902587890625, 1.46197509765625, 1.53369140625, 1.60540771484375, 1.6771240234375, 1.74884033203125, 1.820556640625, 1.89227294921875, 1.9639892578125, 2.03570556640625, 2.107421875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 8.0, 4.0, 11.0, 15.0, 16.0, 33.0, 46.0, 70.0, 120.0, 177.0, 282.0, 524.0, 944.0, 1944.0, 3684.0, 8137.0, 18565.0, 48224.0, 140090.0, 360766.0, 297383.0, 103045.0, 36744.0, 14810.0, 6583.0, 2995.0, 1531.0, 733.0, 450.0, 225.0, 133.0, 80.0, 61.0, 32.0, 27.0, 23.0, 5.0, 17.0, 3.0, 6.0, 4.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0], "bins": [-3.771484375, -3.663299560546875, -3.55511474609375, -3.446929931640625, -3.3387451171875, -3.230560302734375, -3.12237548828125, -3.014190673828125, -2.906005859375, -2.797821044921875, -2.68963623046875, -2.581451416015625, -2.4732666015625, -2.365081787109375, -2.25689697265625, -2.148712158203125, -2.04052734375, -1.932342529296875, -1.82415771484375, -1.715972900390625, -1.6077880859375, -1.499603271484375, -1.39141845703125, -1.283233642578125, -1.175048828125, -1.066864013671875, -0.95867919921875, -0.850494384765625, -0.7423095703125, -0.634124755859375, -0.52593994140625, -0.417755126953125, -0.3095703125, -0.201385498046875, -0.09320068359375, 0.014984130859375, 0.1231689453125, 0.231353759765625, 0.33953857421875, 0.447723388671875, 0.555908203125, 0.664093017578125, 0.77227783203125, 0.880462646484375, 0.9886474609375, 1.096832275390625, 1.20501708984375, 1.313201904296875, 1.42138671875, 1.529571533203125, 1.63775634765625, 1.745941162109375, 1.8541259765625, 1.962310791015625, 2.07049560546875, 2.178680419921875, 2.286865234375, 2.395050048828125, 2.50323486328125, 2.611419677734375, 2.7196044921875, 2.827789306640625, 2.93597412109375, 3.044158935546875, 3.15234375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 1.0, 4.0, 12.0, 14.0, 7.0, 9.0, 9.0, 14.0, 17.0, 20.0, 21.0, 28.0, 37.0, 33.0, 39.0, 48.0, 37.0, 52.0, 47.0, 36.0, 56.0, 28.0, 33.0, 47.0, 43.0, 44.0, 30.0, 29.0, 31.0, 20.0, 23.0, 19.0, 21.0, 14.0, 17.0, 10.0, 9.0, 8.0, 12.0, 9.0, 4.0, 2.0, 5.0, 1.0, 1.0, 5.0, 0.0, 1.0, 0.0, 3.0, 1.0], "bins": [-4.765625, -4.6239013671875, -4.482177734375, -4.3404541015625, -4.19873046875, -4.0570068359375, -3.915283203125, -3.7735595703125, -3.6318359375, -3.4901123046875, -3.348388671875, -3.2066650390625, -3.06494140625, -2.9232177734375, -2.781494140625, -2.6397705078125, -2.498046875, -2.3563232421875, -2.214599609375, -2.0728759765625, -1.93115234375, -1.7894287109375, -1.647705078125, -1.5059814453125, -1.3642578125, -1.2225341796875, -1.080810546875, -0.9390869140625, -0.79736328125, -0.6556396484375, -0.513916015625, -0.3721923828125, -0.23046875, -0.0887451171875, 0.052978515625, 0.1947021484375, 0.33642578125, 0.4781494140625, 0.619873046875, 0.7615966796875, 0.9033203125, 1.0450439453125, 1.186767578125, 1.3284912109375, 1.47021484375, 1.6119384765625, 1.753662109375, 1.8953857421875, 2.037109375, 2.1788330078125, 2.320556640625, 2.4622802734375, 2.60400390625, 2.7457275390625, 2.887451171875, 3.0291748046875, 3.1708984375, 3.3126220703125, 3.454345703125, 3.5960693359375, 3.73779296875, 3.8795166015625, 4.021240234375, 4.1629638671875, 4.3046875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 6.0, 4.0, 2.0, 3.0, 6.0, 9.0, 14.0, 10.0, 24.0, 26.0, 61.0, 98.0, 187.0, 397.0, 1093.0, 3624.0, 15678.0, 91649.0, 539043.0, 333790.0, 49651.0, 9181.0, 2468.0, 839.0, 316.0, 157.0, 85.0, 42.0, 27.0, 19.0, 16.0, 11.0, 5.0, 2.0, 6.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.078125, -2.012847900390625, -1.94757080078125, -1.882293701171875, -1.8170166015625, -1.751739501953125, -1.68646240234375, -1.621185302734375, -1.555908203125, -1.490631103515625, -1.42535400390625, -1.360076904296875, -1.2947998046875, -1.229522705078125, -1.16424560546875, -1.098968505859375, -1.03369140625, -0.968414306640625, -0.90313720703125, -0.837860107421875, -0.7725830078125, -0.707305908203125, -0.64202880859375, -0.576751708984375, -0.511474609375, -0.446197509765625, -0.38092041015625, -0.315643310546875, -0.2503662109375, -0.185089111328125, -0.11981201171875, -0.054534912109375, 0.0107421875, 0.076019287109375, 0.14129638671875, 0.206573486328125, 0.2718505859375, 0.337127685546875, 0.40240478515625, 0.467681884765625, 0.532958984375, 0.598236083984375, 0.66351318359375, 0.728790283203125, 0.7940673828125, 0.859344482421875, 0.92462158203125, 0.989898681640625, 1.05517578125, 1.120452880859375, 1.18572998046875, 1.251007080078125, 1.3162841796875, 1.381561279296875, 1.44683837890625, 1.512115478515625, 1.577392578125, 1.642669677734375, 1.70794677734375, 1.773223876953125, 1.8385009765625, 1.903778076171875, 1.96905517578125, 2.034332275390625, 2.099609375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 5.0, 2.0, 3.0, 8.0, 9.0, 8.0, 7.0, 17.0, 15.0, 25.0, 33.0, 33.0, 41.0, 64.0, 101.0, 95.0, 124.0, 95.0, 74.0, 71.0, 50.0, 25.0, 23.0, 18.0, 9.0, 12.0, 7.0, 8.0, 7.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0003345012664794922, -0.0003255307674407959, -0.0003165602684020996, -0.0003075897693634033, -0.00029861927032470703, -0.00028964877128601074, -0.00028067827224731445, -0.00027170777320861816, -0.0002627372741699219, -0.0002537667751312256, -0.0002447962760925293, -0.000235825777053833, -0.00022685527801513672, -0.00021788477897644043, -0.00020891427993774414, -0.00019994378089904785, -0.00019097328186035156, -0.00018200278282165527, -0.00017303228378295898, -0.0001640617847442627, -0.0001550912857055664, -0.00014612078666687012, -0.00013715028762817383, -0.00012817978858947754, -0.00011920928955078125, -0.00011023879051208496, -0.00010126829147338867, -9.229779243469238e-05, -8.33272933959961e-05, -7.43567943572998e-05, -6.538629531860352e-05, -5.6415796279907227e-05, -4.744529724121094e-05, -3.847479820251465e-05, -2.950429916381836e-05, -2.053380012512207e-05, -1.1563301086425781e-05, -2.592802047729492e-06, 6.377696990966797e-06, 1.5348196029663086e-05, 2.4318695068359375e-05, 3.3289194107055664e-05, 4.225969314575195e-05, 5.123019218444824e-05, 6.020069122314453e-05, 6.917119026184082e-05, 7.814168930053711e-05, 8.71121883392334e-05, 9.608268737792969e-05, 0.00010505318641662598, 0.00011402368545532227, 0.00012299418449401855, 0.00013196468353271484, 0.00014093518257141113, 0.00014990568161010742, 0.0001588761806488037, 0.0001678466796875, 0.0001768171787261963, 0.00018578767776489258, 0.00019475817680358887, 0.00020372867584228516, 0.00021269917488098145, 0.00022166967391967773, 0.00023064017295837402, 0.0002396106719970703]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 7.0, 3.0, 5.0, 9.0, 12.0, 22.0, 25.0, 41.0, 70.0, 83.0, 129.0, 223.0, 329.0, 589.0, 1045.0, 2161.0, 4914.0, 12564.0, 36366.0, 113364.0, 373484.0, 345562.0, 103185.0, 33399.0, 11664.0, 4587.0, 2074.0, 1005.0, 607.0, 347.0, 230.0, 142.0, 106.0, 62.0, 41.0, 24.0, 24.0, 12.0, 18.0, 7.0, 5.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 3.0], "bins": [-1.5791015625, -1.535186767578125, -1.49127197265625, -1.447357177734375, -1.4034423828125, -1.359527587890625, -1.31561279296875, -1.271697998046875, -1.227783203125, -1.183868408203125, -1.13995361328125, -1.096038818359375, -1.0521240234375, -1.008209228515625, -0.96429443359375, -0.920379638671875, -0.87646484375, -0.832550048828125, -0.78863525390625, -0.744720458984375, -0.7008056640625, -0.656890869140625, -0.61297607421875, -0.569061279296875, -0.525146484375, -0.481231689453125, -0.43731689453125, -0.393402099609375, -0.3494873046875, -0.305572509765625, -0.26165771484375, -0.217742919921875, -0.173828125, -0.129913330078125, -0.08599853515625, -0.042083740234375, 0.0018310546875, 0.045745849609375, 0.08966064453125, 0.133575439453125, 0.177490234375, 0.221405029296875, 0.26531982421875, 0.309234619140625, 0.3531494140625, 0.397064208984375, 0.44097900390625, 0.484893798828125, 0.52880859375, 0.572723388671875, 0.61663818359375, 0.660552978515625, 0.7044677734375, 0.748382568359375, 0.79229736328125, 0.836212158203125, 0.880126953125, 0.924041748046875, 0.96795654296875, 1.011871337890625, 1.0557861328125, 1.099700927734375, 1.14361572265625, 1.187530517578125, 1.2314453125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 6.0, 9.0, 2.0, 8.0, 7.0, 14.0, 17.0, 22.0, 28.0, 30.0, 40.0, 49.0, 61.0, 80.0, 85.0, 96.0, 82.0, 66.0, 59.0, 49.0, 39.0, 36.0, 21.0, 25.0, 15.0, 16.0, 7.0, 6.0, 3.0, 8.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.482421875, -1.4353485107421875, -1.388275146484375, -1.3412017822265625, -1.29412841796875, -1.2470550537109375, -1.199981689453125, -1.1529083251953125, -1.1058349609375, -1.0587615966796875, -1.011688232421875, -0.9646148681640625, -0.91754150390625, -0.8704681396484375, -0.823394775390625, -0.7763214111328125, -0.729248046875, -0.6821746826171875, -0.635101318359375, -0.5880279541015625, -0.54095458984375, -0.4938812255859375, -0.446807861328125, -0.3997344970703125, -0.3526611328125, -0.3055877685546875, -0.258514404296875, -0.2114410400390625, -0.16436767578125, -0.1172943115234375, -0.070220947265625, -0.0231475830078125, 0.02392578125, 0.0709991455078125, 0.118072509765625, 0.1651458740234375, 0.21221923828125, 0.2592926025390625, 0.306365966796875, 0.3534393310546875, 0.4005126953125, 0.4475860595703125, 0.494659423828125, 0.5417327880859375, 0.58880615234375, 0.6358795166015625, 0.682952880859375, 0.7300262451171875, 0.777099609375, 0.8241729736328125, 0.871246337890625, 0.9183197021484375, 0.96539306640625, 1.0124664306640625, 1.059539794921875, 1.1066131591796875, 1.1536865234375, 1.2007598876953125, 1.247833251953125, 1.2949066162109375, 1.34197998046875, 1.3890533447265625, 1.436126708984375, 1.4832000732421875, 1.5302734375]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 2.0, 9.0, 18.0, 23.0, 49.0, 126.0, 168.0, 226.0, 181.0, 94.0, 44.0, 30.0, 12.0, 7.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.797157287597656, -20.552026748657227, -19.30689811706543, -18.061767578125, -16.81663703918457, -15.571507453918457, -14.326377868652344, -13.081247329711914, -11.8361177444458, -10.590988159179688, -9.345857620239258, -8.100728034973145, -6.855597972869873, -5.610467910766602, -4.365338325500488, -3.1202077865600586, -1.8750782012939453, -0.6299482583999634, 0.6151816844940186, 1.860311508178711, 3.1054415702819824, 4.350571632385254, 5.595701217651367, 6.840831756591797, 8.08596134185791, 9.331090927124023, 10.576221466064453, 11.821351051330566, 13.06648063659668, 14.31161117553711, 15.556740760803223, 16.80187225341797, 18.047000885009766, 19.292131423950195, 20.537260055541992, 21.782390594482422, 23.02752113342285, 24.27265167236328, 25.517780303955078, 26.762910842895508, 28.008041381835938, 29.253171920776367, 30.498300552368164, 31.743431091308594, 32.98855972290039, 34.23369216918945, 35.47882080078125, 36.72395324707031, 37.969078063964844, 39.21420669555664, 40.4593391418457, 41.7044677734375, 42.9495964050293, 44.19472885131836, 45.439857482910156, 46.68498992919922, 47.930118560791016, 49.17524719238281, 50.420379638671875, 51.66550827026367, 52.91063690185547, 54.15576934814453, 55.40089797973633, 56.646026611328125, 57.89115905761719]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 1.0, 6.0, 14.0, 9.0, 12.0, 13.0, 14.0, 17.0, 19.0, 27.0, 37.0, 30.0, 34.0, 53.0, 43.0, 39.0, 45.0, 51.0, 49.0, 43.0, 50.0, 59.0, 46.0, 43.0, 37.0, 26.0, 29.0, 22.0, 30.0, 23.0, 16.0, 14.0, 16.0, 11.0, 1.0, 9.0, 4.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-25.802770614624023, -24.875926971435547, -23.94908332824707, -23.022239685058594, -22.095394134521484, -21.16855239868164, -20.24170684814453, -19.314863204956055, -18.388019561767578, -17.4611759185791, -16.534332275390625, -15.607487678527832, -14.680644035339355, -13.753800392150879, -12.826955795288086, -11.90011215209961, -10.973268508911133, -10.046424865722656, -9.11958122253418, -8.192736625671387, -7.26589298248291, -6.339049339294434, -5.412205219268799, -4.485361099243164, -3.5585174560546875, -2.631673574447632, -1.7048296928405762, -0.7779858112335205, 0.14885807037353516, 1.0757017135620117, 2.0025458335876465, 2.9293899536132812, 3.856231689453125, 4.783075332641602, 5.709919452667236, 6.636763572692871, 7.563607215881348, 8.490450859069824, 9.417295455932617, 10.344139099121094, 11.27098274230957, 12.197826385498047, 13.124670028686523, 14.051514625549316, 14.978358268737793, 15.90520191192627, 16.832046508789062, 17.75889015197754, 18.685733795166016, 19.612577438354492, 20.53942108154297, 21.466264724731445, 22.393108367919922, 23.31995391845703, 24.246797561645508, 25.173641204833984, 26.10048484802246, 27.027328491210938, 27.954172134399414, 28.88101577758789, 29.807861328125, 30.734703063964844, 31.661548614501953, 32.58839416503906, 33.515235900878906]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 3.0, 1.0, 4.0, 10.0, 7.0, 14.0, 20.0, 19.0, 27.0, 35.0, 54.0, 89.0, 125.0, 239.0, 420.0, 783.0, 1585.0, 3856.0, 11317.0, 55469.0, 3283588.0, 783783.0, 37709.0, 8968.0, 3134.0, 1341.0, 665.0, 373.0, 228.0, 138.0, 96.0, 46.0, 38.0, 29.0, 18.0, 15.0, 12.0, 11.0, 5.0, 3.0, 2.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.76953125, -5.562744140625, -5.35595703125, -5.149169921875, -4.9423828125, -4.735595703125, -4.52880859375, -4.322021484375, -4.115234375, -3.908447265625, -3.70166015625, -3.494873046875, -3.2880859375, -3.081298828125, -2.87451171875, -2.667724609375, -2.4609375, -2.254150390625, -2.04736328125, -1.840576171875, -1.6337890625, -1.427001953125, -1.22021484375, -1.013427734375, -0.806640625, -0.599853515625, -0.39306640625, -0.186279296875, 0.0205078125, 0.227294921875, 0.43408203125, 0.640869140625, 0.84765625, 1.054443359375, 1.26123046875, 1.468017578125, 1.6748046875, 1.881591796875, 2.08837890625, 2.295166015625, 2.501953125, 2.708740234375, 2.91552734375, 3.122314453125, 3.3291015625, 3.535888671875, 3.74267578125, 3.949462890625, 4.15625, 4.363037109375, 4.56982421875, 4.776611328125, 4.9833984375, 5.190185546875, 5.39697265625, 5.603759765625, 5.810546875, 6.017333984375, 6.22412109375, 6.430908203125, 6.6376953125, 6.844482421875, 7.05126953125, 7.258056640625, 7.46484375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 8.0, 8.0, 10.0, 12.0, 30.0, 33.0, 41.0, 53.0, 55.0, 75.0, 79.0, 96.0, 79.0, 74.0, 77.0, 58.0, 61.0, 41.0, 34.0, 19.0, 15.0, 16.0, 13.0, 4.0, 2.0, 7.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1015625, -2.03985595703125, -1.9781494140625, -1.91644287109375, -1.854736328125, -1.79302978515625, -1.7313232421875, -1.66961669921875, -1.60791015625, -1.54620361328125, -1.4844970703125, -1.42279052734375, -1.361083984375, -1.29937744140625, -1.2376708984375, -1.17596435546875, -1.1142578125, -1.05255126953125, -0.9908447265625, -0.92913818359375, -0.867431640625, -0.80572509765625, -0.7440185546875, -0.68231201171875, -0.62060546875, -0.55889892578125, -0.4971923828125, -0.43548583984375, -0.373779296875, -0.31207275390625, -0.2503662109375, -0.18865966796875, -0.126953125, -0.06524658203125, -0.0035400390625, 0.05816650390625, 0.119873046875, 0.18157958984375, 0.2432861328125, 0.30499267578125, 0.36669921875, 0.42840576171875, 0.4901123046875, 0.55181884765625, 0.613525390625, 0.67523193359375, 0.7369384765625, 0.79864501953125, 0.8603515625, 0.92205810546875, 0.9837646484375, 1.04547119140625, 1.107177734375, 1.16888427734375, 1.2305908203125, 1.29229736328125, 1.35400390625, 1.41571044921875, 1.4774169921875, 1.53912353515625, 1.600830078125, 1.66253662109375, 1.7242431640625, 1.78594970703125, 1.84765625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 6.0, 7.0, 9.0, 9.0, 8.0, 20.0, 18.0, 24.0, 35.0, 61.0, 77.0, 115.0, 127.0, 221.0, 363.0, 583.0, 1064.0, 2943.0, 18163.0, 521911.0, 3598056.0, 42909.0, 4671.0, 1281.0, 602.0, 323.0, 221.0, 128.0, 91.0, 62.0, 37.0, 43.0, 17.0, 19.0, 15.0, 10.0, 13.0, 10.0, 7.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5390625, -8.2891845703125, -8.039306640625, -7.7894287109375, -7.53955078125, -7.2896728515625, -7.039794921875, -6.7899169921875, -6.5400390625, -6.2901611328125, -6.040283203125, -5.7904052734375, -5.54052734375, -5.2906494140625, -5.040771484375, -4.7908935546875, -4.541015625, -4.2911376953125, -4.041259765625, -3.7913818359375, -3.54150390625, -3.2916259765625, -3.041748046875, -2.7918701171875, -2.5419921875, -2.2921142578125, -2.042236328125, -1.7923583984375, -1.54248046875, -1.2926025390625, -1.042724609375, -0.7928466796875, -0.54296875, -0.2930908203125, -0.043212890625, 0.2066650390625, 0.45654296875, 0.7064208984375, 0.956298828125, 1.2061767578125, 1.4560546875, 1.7059326171875, 1.955810546875, 2.2056884765625, 2.45556640625, 2.7054443359375, 2.955322265625, 3.2052001953125, 3.455078125, 3.7049560546875, 3.954833984375, 4.2047119140625, 4.45458984375, 4.7044677734375, 4.954345703125, 5.2042236328125, 5.4541015625, 5.7039794921875, 5.953857421875, 6.2037353515625, 6.45361328125, 6.7034912109375, 6.953369140625, 7.2032470703125, 7.453125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 8.0, 6.0, 4.0, 18.0, 30.0, 63.0, 111.0, 263.0, 954.0, 1987.0, 361.0, 134.0, 58.0, 34.0, 16.0, 8.0, 8.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-4.2890625, -4.200164794921875, -4.11126708984375, -4.022369384765625, -3.9334716796875, -3.844573974609375, -3.75567626953125, -3.666778564453125, -3.577880859375, -3.488983154296875, -3.40008544921875, -3.311187744140625, -3.2222900390625, -3.133392333984375, -3.04449462890625, -2.955596923828125, -2.86669921875, -2.777801513671875, -2.68890380859375, -2.600006103515625, -2.5111083984375, -2.422210693359375, -2.33331298828125, -2.244415283203125, -2.155517578125, -2.066619873046875, -1.97772216796875, -1.888824462890625, -1.7999267578125, -1.711029052734375, -1.62213134765625, -1.533233642578125, -1.4443359375, -1.355438232421875, -1.26654052734375, -1.177642822265625, -1.0887451171875, -0.999847412109375, -0.91094970703125, -0.822052001953125, -0.733154296875, -0.644256591796875, -0.55535888671875, -0.466461181640625, -0.3775634765625, -0.288665771484375, -0.19976806640625, -0.110870361328125, -0.02197265625, 0.066925048828125, 0.15582275390625, 0.244720458984375, 0.3336181640625, 0.422515869140625, 0.51141357421875, 0.600311279296875, 0.689208984375, 0.778106689453125, 0.86700439453125, 0.955902099609375, 1.0447998046875, 1.133697509765625, 1.22259521484375, 1.311492919921875, 1.400390625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 6.0, 16.0, 36.0, 119.0, 339.0, 328.0, 118.0, 29.0, 10.0, 6.0, 1.0, 1.0], "bins": [-54.2608528137207, -53.31338882446289, -52.36592483520508, -51.418460845947266, -50.47099685668945, -49.52353286743164, -48.57606506347656, -47.62860107421875, -46.68113708496094, -45.733673095703125, -44.78620910644531, -43.8387451171875, -42.89128112792969, -41.943817138671875, -40.99635314941406, -40.04888916015625, -39.10142517089844, -38.153961181640625, -37.20649719238281, -36.259033203125, -35.31156921386719, -34.364105224609375, -33.41664123535156, -32.46917724609375, -31.521709442138672, -30.57424545288086, -29.626781463623047, -28.679317474365234, -27.73185157775879, -26.784387588500977, -25.836923599243164, -24.88945960998535, -23.94199562072754, -22.994531631469727, -22.047067642211914, -21.09960174560547, -20.152137756347656, -19.204673767089844, -18.25720977783203, -17.30974578857422, -16.362281799316406, -15.414817810058594, -14.467352867126465, -13.519888877868652, -12.57242488861084, -11.624959945678711, -10.677495956420898, -9.730031967163086, -8.78256607055664, -7.83510160446167, -6.887637615203857, -5.940173149108887, -4.992709159851074, -4.0452446937561035, -3.097780227661133, -2.1503162384033203, -1.2028522491455078, -0.25538796186447144, 0.6920763254165649, 1.639540672302246, 2.5870048999786377, 3.5344691276550293, 4.48193359375, 5.4293975830078125, 6.376862049102783]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 9.0, 11.0, 14.0, 18.0, 38.0, 48.0, 49.0, 67.0, 64.0, 77.0, 73.0, 76.0, 104.0, 70.0, 59.0, 66.0, 32.0, 38.0, 35.0, 19.0, 13.0, 6.0, 4.0, 6.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.274557113647461, -13.862266540527344, -13.449975967407227, -13.03768539428711, -12.625394821166992, -12.213104248046875, -11.800812721252441, -11.388522148132324, -10.976231575012207, -10.56394100189209, -10.151650428771973, -9.739359855651855, -9.327068328857422, -8.914777755737305, -8.502487182617188, -8.09019660949707, -7.677906036376953, -7.265615463256836, -6.853324890136719, -6.441033840179443, -6.028743267059326, -5.616452693939209, -5.204161643981934, -4.791871070861816, -4.379580497741699, -3.967289924621582, -3.5549991130828857, -3.1427083015441895, -2.7304177284240723, -2.318127155303955, -1.9058363437652588, -1.4935455322265625, -1.0812559127807617, -0.668965220451355, -0.25667452812194824, 0.1556161642074585, 0.5679068565368652, 0.9801974296569824, 1.3924882411956787, 1.804779052734375, 2.217069625854492, 2.6293601989746094, 3.0416510105133057, 3.453941822052002, 3.866232395172119, 4.278522968292236, 4.690814018249512, 5.103104591369629, 5.515395164489746, 5.927685737609863, 6.3399763107299805, 6.752267360687256, 7.164557933807373, 7.57684850692749, 7.989139556884766, 8.401430130004883, 8.813720703125, 9.226011276245117, 9.638301849365234, 10.050592422485352, 10.462882995605469, 10.875173568725586, 11.28746509552002, 11.699755668640137, 12.112046241760254]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 3.0, 7.0, 7.0, 8.0, 17.0, 26.0, 27.0, 34.0, 44.0, 83.0, 123.0, 184.0, 315.0, 537.0, 999.0, 2079.0, 4905.0, 13045.0, 39534.0, 153508.0, 489857.0, 251630.0, 60609.0, 18575.0, 6690.0, 2742.0, 1287.0, 600.0, 407.0, 207.0, 154.0, 94.0, 70.0, 31.0, 31.0, 21.0, 21.0, 13.0, 14.0, 4.0, 4.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.07421875, -4.897216796875, -4.72021484375, -4.543212890625, -4.3662109375, -4.189208984375, -4.01220703125, -3.835205078125, -3.658203125, -3.481201171875, -3.30419921875, -3.127197265625, -2.9501953125, -2.773193359375, -2.59619140625, -2.419189453125, -2.2421875, -2.065185546875, -1.88818359375, -1.711181640625, -1.5341796875, -1.357177734375, -1.18017578125, -1.003173828125, -0.826171875, -0.649169921875, -0.47216796875, -0.295166015625, -0.1181640625, 0.058837890625, 0.23583984375, 0.412841796875, 0.58984375, 0.766845703125, 0.94384765625, 1.120849609375, 1.2978515625, 1.474853515625, 1.65185546875, 1.828857421875, 2.005859375, 2.182861328125, 2.35986328125, 2.536865234375, 2.7138671875, 2.890869140625, 3.06787109375, 3.244873046875, 3.421875, 3.598876953125, 3.77587890625, 3.952880859375, 4.1298828125, 4.306884765625, 4.48388671875, 4.660888671875, 4.837890625, 5.014892578125, 5.19189453125, 5.368896484375, 5.5458984375, 5.722900390625, 5.89990234375, 6.076904296875, 6.25390625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 5.0, 5.0, 3.0, 3.0, 3.0, 18.0, 15.0, 23.0, 25.0, 42.0, 48.0, 68.0, 66.0, 67.0, 85.0, 78.0, 81.0, 62.0, 73.0, 59.0, 44.0, 33.0, 33.0, 18.0, 11.0, 12.0, 14.0, 6.0, 2.0, 3.0, 2.0, 5.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.68359375, -1.624359130859375, -1.56512451171875, -1.505889892578125, -1.4466552734375, -1.387420654296875, -1.32818603515625, -1.268951416015625, -1.209716796875, -1.150482177734375, -1.09124755859375, -1.032012939453125, -0.9727783203125, -0.913543701171875, -0.85430908203125, -0.795074462890625, -0.73583984375, -0.676605224609375, -0.61737060546875, -0.558135986328125, -0.4989013671875, -0.439666748046875, -0.38043212890625, -0.321197509765625, -0.261962890625, -0.202728271484375, -0.14349365234375, -0.084259033203125, -0.0250244140625, 0.034210205078125, 0.09344482421875, 0.152679443359375, 0.2119140625, 0.271148681640625, 0.33038330078125, 0.389617919921875, 0.4488525390625, 0.508087158203125, 0.56732177734375, 0.626556396484375, 0.685791015625, 0.745025634765625, 0.80426025390625, 0.863494873046875, 0.9227294921875, 0.981964111328125, 1.04119873046875, 1.100433349609375, 1.15966796875, 1.218902587890625, 1.27813720703125, 1.337371826171875, 1.3966064453125, 1.455841064453125, 1.51507568359375, 1.574310302734375, 1.633544921875, 1.692779541015625, 1.75201416015625, 1.811248779296875, 1.8704833984375, 1.929718017578125, 1.98895263671875, 2.048187255859375, 2.107421875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 2.0, 4.0, 11.0, 12.0, 21.0, 25.0, 36.0, 59.0, 98.0, 147.0, 220.0, 315.0, 484.0, 752.0, 1233.0, 2076.0, 3723.0, 6551.0, 12704.0, 26187.0, 57174.0, 137230.0, 291038.0, 277140.0, 126935.0, 53440.0, 24193.0, 11849.0, 6262.0, 3462.0, 1951.0, 1149.0, 748.0, 462.0, 275.0, 195.0, 143.0, 68.0, 55.0, 38.0, 32.0, 20.0, 17.0, 8.0, 9.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.626953125, -2.5472412109375, -2.467529296875, -2.3878173828125, -2.30810546875, -2.2283935546875, -2.148681640625, -2.0689697265625, -1.9892578125, -1.9095458984375, -1.829833984375, -1.7501220703125, -1.67041015625, -1.5906982421875, -1.510986328125, -1.4312744140625, -1.3515625, -1.2718505859375, -1.192138671875, -1.1124267578125, -1.03271484375, -0.9530029296875, -0.873291015625, -0.7935791015625, -0.7138671875, -0.6341552734375, -0.554443359375, -0.4747314453125, -0.39501953125, -0.3153076171875, -0.235595703125, -0.1558837890625, -0.076171875, 0.0035400390625, 0.083251953125, 0.1629638671875, 0.24267578125, 0.3223876953125, 0.402099609375, 0.4818115234375, 0.5615234375, 0.6412353515625, 0.720947265625, 0.8006591796875, 0.88037109375, 0.9600830078125, 1.039794921875, 1.1195068359375, 1.19921875, 1.2789306640625, 1.358642578125, 1.4383544921875, 1.51806640625, 1.5977783203125, 1.677490234375, 1.7572021484375, 1.8369140625, 1.9166259765625, 1.996337890625, 2.0760498046875, 2.15576171875, 2.2354736328125, 2.315185546875, 2.3948974609375, 2.474609375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 2.0, 5.0, 9.0, 3.0, 5.0, 9.0, 22.0, 15.0, 12.0, 21.0, 24.0, 25.0, 29.0, 32.0, 32.0, 38.0, 37.0, 38.0, 40.0, 41.0, 34.0, 49.0, 37.0, 47.0, 47.0, 30.0, 42.0, 43.0, 37.0, 25.0, 23.0, 21.0, 11.0, 26.0, 14.0, 18.0, 11.0, 9.0, 7.0, 9.0, 7.0, 4.0, 3.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.09765625, -3.95928955078125, -3.8209228515625, -3.68255615234375, -3.544189453125, -3.40582275390625, -3.2674560546875, -3.12908935546875, -2.99072265625, -2.85235595703125, -2.7139892578125, -2.57562255859375, -2.437255859375, -2.29888916015625, -2.1605224609375, -2.02215576171875, -1.8837890625, -1.74542236328125, -1.6070556640625, -1.46868896484375, -1.330322265625, -1.19195556640625, -1.0535888671875, -0.91522216796875, -0.77685546875, -0.63848876953125, -0.5001220703125, -0.36175537109375, -0.223388671875, -0.08502197265625, 0.0533447265625, 0.19171142578125, 0.330078125, 0.46844482421875, 0.6068115234375, 0.74517822265625, 0.883544921875, 1.02191162109375, 1.1602783203125, 1.29864501953125, 1.43701171875, 1.57537841796875, 1.7137451171875, 1.85211181640625, 1.990478515625, 2.12884521484375, 2.2672119140625, 2.40557861328125, 2.5439453125, 2.68231201171875, 2.8206787109375, 2.95904541015625, 3.097412109375, 3.23577880859375, 3.3741455078125, 3.51251220703125, 3.65087890625, 3.78924560546875, 3.9276123046875, 4.06597900390625, 4.204345703125, 4.34271240234375, 4.4810791015625, 4.61944580078125, 4.7578125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 2.0, 5.0, 0.0, 2.0, 1.0, 5.0, 3.0, 14.0, 10.0, 27.0, 29.0, 57.0, 108.0, 199.0, 403.0, 902.0, 2047.0, 5808.0, 19157.0, 85360.0, 476463.0, 371582.0, 63557.0, 14967.0, 4604.0, 1738.0, 725.0, 370.0, 173.0, 91.0, 73.0, 24.0, 22.0, 11.0, 11.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.619140625, -1.55413818359375, -1.4891357421875, -1.42413330078125, -1.359130859375, -1.29412841796875, -1.2291259765625, -1.16412353515625, -1.09912109375, -1.03411865234375, -0.9691162109375, -0.90411376953125, -0.839111328125, -0.77410888671875, -0.7091064453125, -0.64410400390625, -0.5791015625, -0.51409912109375, -0.4490966796875, -0.38409423828125, -0.319091796875, -0.25408935546875, -0.1890869140625, -0.12408447265625, -0.05908203125, 0.00592041015625, 0.0709228515625, 0.13592529296875, 0.200927734375, 0.26593017578125, 0.3309326171875, 0.39593505859375, 0.4609375, 0.52593994140625, 0.5909423828125, 0.65594482421875, 0.720947265625, 0.78594970703125, 0.8509521484375, 0.91595458984375, 0.98095703125, 1.04595947265625, 1.1109619140625, 1.17596435546875, 1.240966796875, 1.30596923828125, 1.3709716796875, 1.43597412109375, 1.5009765625, 1.56597900390625, 1.6309814453125, 1.69598388671875, 1.760986328125, 1.82598876953125, 1.8909912109375, 1.95599365234375, 2.02099609375, 2.08599853515625, 2.1510009765625, 2.21600341796875, 2.281005859375, 2.34600830078125, 2.4110107421875, 2.47601318359375, 2.541015625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 5.0, 11.0, 6.0, 8.0, 10.0, 15.0, 14.0, 15.0, 20.0, 24.0, 30.0, 34.0, 64.0, 88.0, 101.0, 99.0, 88.0, 78.0, 49.0, 36.0, 42.0, 28.0, 23.0, 22.0, 16.0, 11.0, 14.0, 12.0, 11.0, 5.0, 4.0, 5.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00029015541076660156, -0.000281263142824173, -0.0002723708748817444, -0.0002634786069393158, -0.0002545863389968872, -0.0002456940710544586, -0.00023680180311203003, -0.00022790953516960144, -0.00021901726722717285, -0.00021012499928474426, -0.00020123273134231567, -0.00019234046339988708, -0.0001834481954574585, -0.0001745559275150299, -0.00016566365957260132, -0.00015677139163017273, -0.00014787912368774414, -0.00013898685574531555, -0.00013009458780288696, -0.00012120231986045837, -0.00011231005191802979, -0.0001034177839756012, -9.452551603317261e-05, -8.563324809074402e-05, -7.674098014831543e-05, -6.784871220588684e-05, -5.895644426345825e-05, -5.006417632102966e-05, -4.1171908378601074e-05, -3.2279640436172485e-05, -2.3387372493743896e-05, -1.4495104551315308e-05, -5.602836608886719e-06, 3.28943133354187e-06, 1.2181699275970459e-05, 2.1073967218399048e-05, 2.9966235160827637e-05, 3.8858503103256226e-05, 4.7750771045684814e-05, 5.66430389881134e-05, 6.553530693054199e-05, 7.442757487297058e-05, 8.331984281539917e-05, 9.221211075782776e-05, 0.00010110437870025635, 0.00010999664664268494, 0.00011888891458511353, 0.00012778118252754211, 0.0001366734504699707, 0.0001455657184123993, 0.00015445798635482788, 0.00016335025429725647, 0.00017224252223968506, 0.00018113479018211365, 0.00019002705812454224, 0.00019891932606697083, 0.00020781159400939941, 0.000216703861951828, 0.0002255961298942566, 0.00023448839783668518, 0.00024338066577911377, 0.00025227293372154236, 0.00026116520166397095, 0.00027005746960639954, 0.0002789497375488281]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 5.0, 9.0, 15.0, 16.0, 31.0, 39.0, 61.0, 83.0, 109.0, 184.0, 321.0, 536.0, 979.0, 1835.0, 3818.0, 8687.0, 21300.0, 68558.0, 332414.0, 461374.0, 99731.0, 27974.0, 10774.0, 4746.0, 2278.0, 1168.0, 611.0, 325.0, 191.0, 128.0, 86.0, 43.0, 33.0, 34.0, 15.0, 12.0, 6.0, 8.0, 1.0, 5.0, 1.0, 1.0, 3.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.017578125, -1.9566802978515625, -1.895782470703125, -1.8348846435546875, -1.77398681640625, -1.7130889892578125, -1.652191162109375, -1.5912933349609375, -1.5303955078125, -1.4694976806640625, -1.408599853515625, -1.3477020263671875, -1.28680419921875, -1.2259063720703125, -1.165008544921875, -1.1041107177734375, -1.043212890625, -0.9823150634765625, -0.921417236328125, -0.8605194091796875, -0.79962158203125, -0.7387237548828125, -0.677825927734375, -0.6169281005859375, -0.5560302734375, -0.4951324462890625, -0.434234619140625, -0.3733367919921875, -0.31243896484375, -0.2515411376953125, -0.190643310546875, -0.1297454833984375, -0.06884765625, -0.0079498291015625, 0.052947998046875, 0.1138458251953125, 0.17474365234375, 0.2356414794921875, 0.296539306640625, 0.3574371337890625, 0.4183349609375, 0.4792327880859375, 0.540130615234375, 0.6010284423828125, 0.66192626953125, 0.7228240966796875, 0.783721923828125, 0.8446197509765625, 0.905517578125, 0.9664154052734375, 1.027313232421875, 1.0882110595703125, 1.14910888671875, 1.2100067138671875, 1.270904541015625, 1.3318023681640625, 1.3927001953125, 1.4535980224609375, 1.514495849609375, 1.5753936767578125, 1.63629150390625, 1.6971893310546875, 1.758087158203125, 1.8189849853515625, 1.8798828125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 6.0, 3.0, 3.0, 7.0, 8.0, 15.0, 13.0, 14.0, 30.0, 34.0, 39.0, 65.0, 77.0, 94.0, 84.0, 83.0, 104.0, 72.0, 57.0, 52.0, 36.0, 20.0, 21.0, 9.0, 12.0, 10.0, 9.0, 3.0, 4.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6865234375, -1.630096435546875, -1.57366943359375, -1.517242431640625, -1.4608154296875, -1.404388427734375, -1.34796142578125, -1.291534423828125, -1.235107421875, -1.178680419921875, -1.12225341796875, -1.065826416015625, -1.0093994140625, -0.952972412109375, -0.89654541015625, -0.840118408203125, -0.78369140625, -0.727264404296875, -0.67083740234375, -0.614410400390625, -0.5579833984375, -0.501556396484375, -0.44512939453125, -0.388702392578125, -0.332275390625, -0.275848388671875, -0.21942138671875, -0.162994384765625, -0.1065673828125, -0.050140380859375, 0.00628662109375, 0.062713623046875, 0.119140625, 0.175567626953125, 0.23199462890625, 0.288421630859375, 0.3448486328125, 0.401275634765625, 0.45770263671875, 0.514129638671875, 0.570556640625, 0.626983642578125, 0.68341064453125, 0.739837646484375, 0.7962646484375, 0.852691650390625, 0.90911865234375, 0.965545654296875, 1.02197265625, 1.078399658203125, 1.13482666015625, 1.191253662109375, 1.2476806640625, 1.304107666015625, 1.36053466796875, 1.416961669921875, 1.473388671875, 1.529815673828125, 1.58624267578125, 1.642669677734375, 1.6990966796875, 1.755523681640625, 1.81195068359375, 1.868377685546875, 1.9248046875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 8.0, 9.0, 12.0, 29.0, 38.0, 72.0, 105.0, 184.0, 177.0, 132.0, 90.0, 48.0, 42.0, 22.0, 15.0, 7.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.351150512695312, -26.21552276611328, -25.07989501953125, -23.94426918029785, -22.80864143371582, -21.67301368713379, -20.53738784790039, -19.40176010131836, -18.266132354736328, -17.130504608154297, -15.994877815246582, -14.859251022338867, -13.723623275756836, -12.587995529174805, -11.45236873626709, -10.316741943359375, -9.181114196777344, -8.045486450195312, -6.909859657287598, -5.774232387542725, -4.638605117797852, -3.5029778480529785, -2.3673505783081055, -1.2317233085632324, -0.09609603881835938, 1.0395312309265137, 2.1751585006713867, 3.3107857704162598, 4.446413040161133, 5.582040309906006, 6.717667579650879, 7.853294849395752, 8.988922119140625, 10.124549865722656, 11.260176658630371, 12.395803451538086, 13.531431198120117, 14.667058944702148, 15.802685737609863, 16.938312530517578, 18.07394027709961, 19.20956802368164, 20.345195770263672, 21.48082160949707, 22.6164493560791, 23.752077102661133, 24.88770294189453, 26.023330688476562, 27.158958435058594, 28.294586181640625, 29.430213928222656, 30.565839767456055, 31.701467514038086, 32.837093353271484, 33.972721099853516, 35.10834884643555, 36.24397659301758, 37.37960433959961, 38.51523208618164, 39.65085983276367, 40.78648376464844, 41.92211151123047, 43.0577392578125, 44.19336700439453, 45.32899475097656]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 1.0, 4.0, 3.0, 6.0, 8.0, 10.0, 8.0, 11.0, 14.0, 18.0, 22.0, 23.0, 17.0, 28.0, 27.0, 27.0, 36.0, 38.0, 30.0, 33.0, 34.0, 53.0, 43.0, 49.0, 37.0, 54.0, 41.0, 30.0, 41.0, 37.0, 28.0, 22.0, 18.0, 22.0, 19.0, 15.0, 18.0, 18.0, 16.0, 12.0, 17.0, 6.0, 5.0, 4.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.037307739257812, -26.202707290649414, -25.368104934692383, -24.533504486083984, -23.698904037475586, -22.864303588867188, -22.029701232910156, -21.195100784301758, -20.36050033569336, -19.52589988708496, -18.69129753112793, -17.85669708251953, -17.022096633911133, -16.187496185302734, -15.352893829345703, -14.518293380737305, -13.683691024780273, -12.849089622497559, -12.01448917388916, -11.179887771606445, -10.345287322998047, -9.510685920715332, -8.676084518432617, -7.8414835929870605, -7.006882667541504, -6.172281742095947, -5.337680816650391, -4.503079414367676, -3.668478488922119, -2.8338775634765625, -1.9992761611938477, -1.164675235748291, -0.33007240295410156, 0.5045286417007446, 1.3391296863555908, 2.1737308502197266, 3.008331775665283, 3.84293270111084, 4.677534103393555, 5.512135028839111, 6.346735954284668, 7.181336879730225, 8.015937805175781, 8.850539207458496, 9.685140609741211, 10.51974105834961, 11.354342460632324, 12.188943862915039, 13.023544311523438, 13.858145713806152, 14.69274616241455, 15.527347564697266, 16.361948013305664, 17.196548461914062, 18.031150817871094, 18.865751266479492, 19.70035171508789, 20.53495216369629, 21.36955451965332, 22.20415496826172, 23.038755416870117, 23.873355865478516, 24.707958221435547, 25.542558670043945, 26.377161026000977]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 8.0, 12.0, 10.0, 23.0, 47.0, 65.0, 107.0, 145.0, 280.0, 605.0, 1477.0, 4592.0, 21751.0, 391713.0, 3717046.0, 44627.0, 7534.0, 2410.0, 866.0, 405.0, 210.0, 123.0, 76.0, 46.0, 36.0, 24.0, 10.0, 7.0, 13.0, 2.0, 3.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6171875, -8.3218994140625, -8.026611328125, -7.7313232421875, -7.43603515625, -7.1407470703125, -6.845458984375, -6.5501708984375, -6.2548828125, -5.9595947265625, -5.664306640625, -5.3690185546875, -5.07373046875, -4.7784423828125, -4.483154296875, -4.1878662109375, -3.892578125, -3.5972900390625, -3.302001953125, -3.0067138671875, -2.71142578125, -2.4161376953125, -2.120849609375, -1.8255615234375, -1.5302734375, -1.2349853515625, -0.939697265625, -0.6444091796875, -0.34912109375, -0.0538330078125, 0.241455078125, 0.5367431640625, 0.83203125, 1.1273193359375, 1.422607421875, 1.7178955078125, 2.01318359375, 2.3084716796875, 2.603759765625, 2.8990478515625, 3.1943359375, 3.4896240234375, 3.784912109375, 4.0802001953125, 4.37548828125, 4.6707763671875, 4.966064453125, 5.2613525390625, 5.556640625, 5.8519287109375, 6.147216796875, 6.4425048828125, 6.73779296875, 7.0330810546875, 7.328369140625, 7.6236572265625, 7.9189453125, 8.2142333984375, 8.509521484375, 8.8048095703125, 9.10009765625, 9.3953857421875, 9.690673828125, 9.9859619140625, 10.28125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 3.0, 2.0, 5.0, 8.0, 14.0, 25.0, 18.0, 30.0, 59.0, 47.0, 46.0, 65.0, 72.0, 84.0, 76.0, 72.0, 82.0, 54.0, 54.0, 48.0, 29.0, 31.0, 18.0, 23.0, 13.0, 5.0, 11.0, 7.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.92578125, -1.8602294921875, -1.794677734375, -1.7291259765625, -1.66357421875, -1.5980224609375, -1.532470703125, -1.4669189453125, -1.4013671875, -1.3358154296875, -1.270263671875, -1.2047119140625, -1.13916015625, -1.0736083984375, -1.008056640625, -0.9425048828125, -0.876953125, -0.8114013671875, -0.745849609375, -0.6802978515625, -0.61474609375, -0.5491943359375, -0.483642578125, -0.4180908203125, -0.3525390625, -0.2869873046875, -0.221435546875, -0.1558837890625, -0.09033203125, -0.0247802734375, 0.040771484375, 0.1063232421875, 0.171875, 0.2374267578125, 0.302978515625, 0.3685302734375, 0.43408203125, 0.4996337890625, 0.565185546875, 0.6307373046875, 0.6962890625, 0.7618408203125, 0.827392578125, 0.8929443359375, 0.95849609375, 1.0240478515625, 1.089599609375, 1.1551513671875, 1.220703125, 1.2862548828125, 1.351806640625, 1.4173583984375, 1.48291015625, 1.5484619140625, 1.614013671875, 1.6795654296875, 1.7451171875, 1.8106689453125, 1.876220703125, 1.9417724609375, 2.00732421875, 2.0728759765625, 2.138427734375, 2.2039794921875, 2.26953125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 13.0, 10.0, 17.0, 33.0, 55.0, 93.0, 169.0, 335.0, 839.0, 2539.0, 10049.0, 86447.0, 3793204.0, 276186.0, 18497.0, 3768.0, 1153.0, 462.0, 185.0, 102.0, 64.0, 25.0, 15.0, 10.0, 11.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.71875, -6.4759521484375, -6.233154296875, -5.9903564453125, -5.74755859375, -5.5047607421875, -5.261962890625, -5.0191650390625, -4.7763671875, -4.5335693359375, -4.290771484375, -4.0479736328125, -3.80517578125, -3.5623779296875, -3.319580078125, -3.0767822265625, -2.833984375, -2.5911865234375, -2.348388671875, -2.1055908203125, -1.86279296875, -1.6199951171875, -1.377197265625, -1.1343994140625, -0.8916015625, -0.6488037109375, -0.406005859375, -0.1632080078125, 0.07958984375, 0.3223876953125, 0.565185546875, 0.8079833984375, 1.05078125, 1.2935791015625, 1.536376953125, 1.7791748046875, 2.02197265625, 2.2647705078125, 2.507568359375, 2.7503662109375, 2.9931640625, 3.2359619140625, 3.478759765625, 3.7215576171875, 3.96435546875, 4.2071533203125, 4.449951171875, 4.6927490234375, 4.935546875, 5.1783447265625, 5.421142578125, 5.6639404296875, 5.90673828125, 6.1495361328125, 6.392333984375, 6.6351318359375, 6.8779296875, 7.1207275390625, 7.363525390625, 7.6063232421875, 7.84912109375, 8.0919189453125, 8.334716796875, 8.5775146484375, 8.8203125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 3.0, 6.0, 2.0, 12.0, 14.0, 14.0, 24.0, 49.0, 66.0, 151.0, 416.0, 1835.0, 942.0, 266.0, 115.0, 57.0, 38.0, 19.0, 17.0, 6.0, 9.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-4.19921875, -4.098785400390625, -3.99835205078125, -3.897918701171875, -3.7974853515625, -3.697052001953125, -3.59661865234375, -3.496185302734375, -3.395751953125, -3.295318603515625, -3.19488525390625, -3.094451904296875, -2.9940185546875, -2.893585205078125, -2.79315185546875, -2.692718505859375, -2.59228515625, -2.491851806640625, -2.39141845703125, -2.290985107421875, -2.1905517578125, -2.090118408203125, -1.98968505859375, -1.889251708984375, -1.788818359375, -1.688385009765625, -1.58795166015625, -1.487518310546875, -1.3870849609375, -1.286651611328125, -1.18621826171875, -1.085784912109375, -0.9853515625, -0.884918212890625, -0.78448486328125, -0.684051513671875, -0.5836181640625, -0.483184814453125, -0.38275146484375, -0.282318115234375, -0.181884765625, -0.081451416015625, 0.01898193359375, 0.119415283203125, 0.2198486328125, 0.320281982421875, 0.42071533203125, 0.521148681640625, 0.62158203125, 0.722015380859375, 0.82244873046875, 0.922882080078125, 1.0233154296875, 1.123748779296875, 1.22418212890625, 1.324615478515625, 1.425048828125, 1.525482177734375, 1.62591552734375, 1.726348876953125, 1.8267822265625, 1.927215576171875, 2.02764892578125, 2.128082275390625, 2.228515625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 5.0, 2.0, 8.0, 13.0, 15.0, 29.0, 62.0, 87.0, 142.0, 167.0, 170.0, 138.0, 81.0, 44.0, 21.0, 6.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-20.0150089263916, -19.56905746459961, -19.12310791015625, -18.677156448364258, -18.2312068939209, -17.785255432128906, -17.339305877685547, -16.893354415893555, -16.447402954101562, -16.00145149230957, -15.555501937866211, -15.109550476074219, -14.663599967956543, -14.217649459838867, -13.771698951721191, -13.325748443603516, -12.87979793548584, -12.433847427368164, -11.987896919250488, -11.541946411132812, -11.09599494934082, -10.650044441223145, -10.204093933105469, -9.758143424987793, -9.312192916870117, -8.866242408752441, -8.420291900634766, -7.974340915679932, -7.528389930725098, -7.082439422607422, -6.636488914489746, -6.19053840637207, -5.744585990905762, -5.298635482788086, -4.852684497833252, -4.406733989715576, -3.9607832431793213, -3.5148324966430664, -3.0688819885253906, -2.6229312419891357, -2.176980495452881, -1.731029748916626, -1.2850791215896606, -0.8391284942626953, -0.39317774772644043, 0.05277299880981445, 0.49872350692749023, 0.9446742534637451, 1.390625, 1.8365757465362549, 2.2825264930725098, 2.7284770011901855, 3.1744277477264404, 3.6203784942626953, 4.066329002380371, 4.512279510498047, 4.958230495452881, 5.404181003570557, 5.850131988525391, 6.296082496643066, 6.742033004760742, 7.187983989715576, 7.633934497833252, 8.079885482788086, 8.525835990905762]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 1.0, 3.0, 5.0, 11.0, 18.0, 4.0, 9.0, 26.0, 23.0, 28.0, 27.0, 40.0, 36.0, 44.0, 32.0, 38.0, 41.0, 41.0, 54.0, 51.0, 57.0, 53.0, 39.0, 53.0, 40.0, 41.0, 30.0, 23.0, 18.0, 25.0, 22.0, 11.0, 15.0, 11.0, 16.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-9.026930809020996, -8.771805763244629, -8.516681671142578, -8.261556625366211, -8.00643253326416, -7.751307964324951, -7.496183395385742, -7.241058349609375, -6.985934257507324, -6.730809688568115, -6.475685119628906, -6.220560550689697, -5.965435981750488, -5.710311412811279, -5.45518684387207, -5.200061798095703, -4.944937229156494, -4.689812660217285, -4.434688091278076, -4.179563522338867, -3.924438953399658, -3.669314384460449, -3.414189577102661, -3.159065008163452, -2.903940439224243, -2.648815870285034, -2.393691301345825, -2.138566493988037, -1.8834420442581177, -1.6283174753189087, -1.3731927871704102, -1.1180682182312012, -0.8629441261291504, -0.6078195571899414, -0.35269492864608765, -0.09757030010223389, 0.1575542688369751, 0.4126788377761841, 0.6678035259246826, 0.9229280948638916, 1.1780526638031006, 1.4331772327423096, 1.6883018016815186, 1.943426489830017, 2.1985511779785156, 2.4536757469177246, 2.7088003158569336, 2.9639248847961426, 3.2190494537353516, 3.4741740226745605, 3.7292985916137695, 3.9844231605529785, 4.2395477294921875, 4.4946722984313965, 4.7497968673706055, 5.004921913146973, 5.260046005249023, 5.515170574188232, 5.770295143127441, 6.02541971206665, 6.280544281005859, 6.535668849945068, 6.790793418884277, 7.0459184646606445, 7.3010430335998535]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 15.0, 10.0, 16.0, 28.0, 32.0, 54.0, 100.0, 170.0, 277.0, 569.0, 1252.0, 3096.0, 8645.0, 28884.0, 124600.0, 566910.0, 243683.0, 48736.0, 13615.0, 4391.0, 1790.0, 764.0, 405.0, 210.0, 125.0, 67.0, 39.0, 28.0, 13.0, 12.0, 7.0, 5.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.66796875, -6.45758056640625, -6.2471923828125, -6.03680419921875, -5.826416015625, -5.61602783203125, -5.4056396484375, -5.19525146484375, -4.98486328125, -4.77447509765625, -4.5640869140625, -4.35369873046875, -4.143310546875, -3.93292236328125, -3.7225341796875, -3.51214599609375, -3.3017578125, -3.09136962890625, -2.8809814453125, -2.67059326171875, -2.460205078125, -2.24981689453125, -2.0394287109375, -1.82904052734375, -1.61865234375, -1.40826416015625, -1.1978759765625, -0.98748779296875, -0.777099609375, -0.56671142578125, -0.3563232421875, -0.14593505859375, 0.064453125, 0.27484130859375, 0.4852294921875, 0.69561767578125, 0.906005859375, 1.11639404296875, 1.3267822265625, 1.53717041015625, 1.74755859375, 1.95794677734375, 2.1683349609375, 2.37872314453125, 2.589111328125, 2.79949951171875, 3.0098876953125, 3.22027587890625, 3.4306640625, 3.64105224609375, 3.8514404296875, 4.06182861328125, 4.272216796875, 4.48260498046875, 4.6929931640625, 4.90338134765625, 5.11376953125, 5.32415771484375, 5.5345458984375, 5.74493408203125, 5.955322265625, 6.16571044921875, 6.3760986328125, 6.58648681640625, 6.796875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 4.0, 5.0, 8.0, 12.0, 18.0, 22.0, 17.0, 40.0, 26.0, 49.0, 57.0, 50.0, 85.0, 80.0, 71.0, 65.0, 66.0, 59.0, 61.0, 47.0, 41.0, 28.0, 18.0, 24.0, 13.0, 12.0, 11.0, 7.0, 4.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.83203125, -1.77001953125, -1.7080078125, -1.64599609375, -1.583984375, -1.52197265625, -1.4599609375, -1.39794921875, -1.3359375, -1.27392578125, -1.2119140625, -1.14990234375, -1.087890625, -1.02587890625, -0.9638671875, -0.90185546875, -0.83984375, -0.77783203125, -0.7158203125, -0.65380859375, -0.591796875, -0.52978515625, -0.4677734375, -0.40576171875, -0.34375, -0.28173828125, -0.2197265625, -0.15771484375, -0.095703125, -0.03369140625, 0.0283203125, 0.09033203125, 0.15234375, 0.21435546875, 0.2763671875, 0.33837890625, 0.400390625, 0.46240234375, 0.5244140625, 0.58642578125, 0.6484375, 0.71044921875, 0.7724609375, 0.83447265625, 0.896484375, 0.95849609375, 1.0205078125, 1.08251953125, 1.14453125, 1.20654296875, 1.2685546875, 1.33056640625, 1.392578125, 1.45458984375, 1.5166015625, 1.57861328125, 1.640625, 1.70263671875, 1.7646484375, 1.82666015625, 1.888671875, 1.95068359375, 2.0126953125, 2.07470703125, 2.13671875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 1.0, 6.0, 5.0, 17.0, 12.0, 33.0, 44.0, 61.0, 68.0, 120.0, 191.0, 335.0, 600.0, 1021.0, 2208.0, 4558.0, 11403.0, 32564.0, 109396.0, 399519.0, 347417.0, 92086.0, 28417.0, 10074.0, 4226.0, 1852.0, 983.0, 497.0, 293.0, 183.0, 105.0, 76.0, 57.0, 38.0, 27.0, 12.0, 11.0, 9.0, 5.0, 3.0, 5.0, 4.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.44921875, -4.318115234375, -4.18701171875, -4.055908203125, -3.9248046875, -3.793701171875, -3.66259765625, -3.531494140625, -3.400390625, -3.269287109375, -3.13818359375, -3.007080078125, -2.8759765625, -2.744873046875, -2.61376953125, -2.482666015625, -2.3515625, -2.220458984375, -2.08935546875, -1.958251953125, -1.8271484375, -1.696044921875, -1.56494140625, -1.433837890625, -1.302734375, -1.171630859375, -1.04052734375, -0.909423828125, -0.7783203125, -0.647216796875, -0.51611328125, -0.385009765625, -0.25390625, -0.122802734375, 0.00830078125, 0.139404296875, 0.2705078125, 0.401611328125, 0.53271484375, 0.663818359375, 0.794921875, 0.926025390625, 1.05712890625, 1.188232421875, 1.3193359375, 1.450439453125, 1.58154296875, 1.712646484375, 1.84375, 1.974853515625, 2.10595703125, 2.237060546875, 2.3681640625, 2.499267578125, 2.63037109375, 2.761474609375, 2.892578125, 3.023681640625, 3.15478515625, 3.285888671875, 3.4169921875, 3.548095703125, 3.67919921875, 3.810302734375, 3.94140625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 6.0, 4.0, 2.0, 3.0, 5.0, 8.0, 11.0, 13.0, 20.0, 16.0, 21.0, 24.0, 32.0, 34.0, 33.0, 49.0, 43.0, 50.0, 56.0, 58.0, 47.0, 48.0, 51.0, 54.0, 36.0, 49.0, 37.0, 28.0, 27.0, 26.0, 28.0, 25.0, 15.0, 6.0, 14.0, 11.0, 4.0, 6.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.35546875, -6.17218017578125, -5.9888916015625, -5.80560302734375, -5.622314453125, -5.43902587890625, -5.2557373046875, -5.07244873046875, -4.88916015625, -4.70587158203125, -4.5225830078125, -4.33929443359375, -4.156005859375, -3.97271728515625, -3.7894287109375, -3.60614013671875, -3.4228515625, -3.23956298828125, -3.0562744140625, -2.87298583984375, -2.689697265625, -2.50640869140625, -2.3231201171875, -2.13983154296875, -1.95654296875, -1.77325439453125, -1.5899658203125, -1.40667724609375, -1.223388671875, -1.04010009765625, -0.8568115234375, -0.67352294921875, -0.490234375, -0.30694580078125, -0.1236572265625, 0.05963134765625, 0.242919921875, 0.42620849609375, 0.6094970703125, 0.79278564453125, 0.97607421875, 1.15936279296875, 1.3426513671875, 1.52593994140625, 1.709228515625, 1.89251708984375, 2.0758056640625, 2.25909423828125, 2.4423828125, 2.62567138671875, 2.8089599609375, 2.99224853515625, 3.175537109375, 3.35882568359375, 3.5421142578125, 3.72540283203125, 3.90869140625, 4.09197998046875, 4.2752685546875, 4.45855712890625, 4.641845703125, 4.82513427734375, 5.0084228515625, 5.19171142578125, 5.375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 5.0, 3.0, 8.0, 10.0, 19.0, 39.0, 81.0, 196.0, 687.0, 4835.0, 752605.0, 285383.0, 3820.0, 549.0, 182.0, 72.0, 26.0, 16.0, 15.0, 7.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.453125, -10.1041259765625, -9.755126953125, -9.4061279296875, -9.05712890625, -8.7081298828125, -8.359130859375, -8.0101318359375, -7.6611328125, -7.3121337890625, -6.963134765625, -6.6141357421875, -6.26513671875, -5.9161376953125, -5.567138671875, -5.2181396484375, -4.869140625, -4.5201416015625, -4.171142578125, -3.8221435546875, -3.47314453125, -3.1241455078125, -2.775146484375, -2.4261474609375, -2.0771484375, -1.7281494140625, -1.379150390625, -1.0301513671875, -0.68115234375, -0.3321533203125, 0.016845703125, 0.3658447265625, 0.71484375, 1.0638427734375, 1.412841796875, 1.7618408203125, 2.11083984375, 2.4598388671875, 2.808837890625, 3.1578369140625, 3.5068359375, 3.8558349609375, 4.204833984375, 4.5538330078125, 4.90283203125, 5.2518310546875, 5.600830078125, 5.9498291015625, 6.298828125, 6.6478271484375, 6.996826171875, 7.3458251953125, 7.69482421875, 8.0438232421875, 8.392822265625, 8.7418212890625, 9.0908203125, 9.4398193359375, 9.788818359375, 10.1378173828125, 10.48681640625, 10.8358154296875, 11.184814453125, 11.5338134765625, 11.8828125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 7.0, 3.0, 5.0, 20.0, 22.0, 39.0, 82.0, 349.0, 289.0, 78.0, 37.0, 29.0, 20.0, 11.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011129379272460938, -0.0010819882154464722, -0.0010510385036468506, -0.001020088791847229, -0.0009891390800476074, -0.0009581893682479858, -0.0009272396564483643, -0.0008962899446487427, -0.0008653402328491211, -0.0008343905210494995, -0.0008034408092498779, -0.0007724910974502563, -0.0007415413856506348, -0.0007105916738510132, -0.0006796419620513916, -0.00064869225025177, -0.0006177425384521484, -0.0005867928266525269, -0.0005558431148529053, -0.0005248934030532837, -0.0004939436912536621, -0.00046299397945404053, -0.00043204426765441895, -0.00040109455585479736, -0.0003701448440551758, -0.0003391951322555542, -0.0003082454204559326, -0.00027729570865631104, -0.00024634599685668945, -0.00021539628505706787, -0.0001844465732574463, -0.0001534968614578247, -0.00012254714965820312, -9.159743785858154e-05, -6.064772605895996e-05, -2.969801425933838e-05, 1.2516975402832031e-06, 3.2201409339904785e-05, 6.315112113952637e-05, 9.410083293914795e-05, 0.00012505054473876953, 0.0001560002565383911, 0.0001869499683380127, 0.00021789968013763428, 0.00024884939193725586, 0.00027979910373687744, 0.000310748815536499, 0.0003416985273361206, 0.0003726482391357422, 0.00040359795093536377, 0.00043454766273498535, 0.00046549737453460693, 0.0004964470863342285, 0.0005273967981338501, 0.0005583465099334717, 0.0005892962217330933, 0.0006202459335327148, 0.0006511956453323364, 0.000682145357131958, 0.0007130950689315796, 0.0007440447807312012, 0.0007749944925308228, 0.0008059442043304443, 0.0008368939161300659, 0.0008678436279296875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 13.0, 25.0, 43.0, 95.0, 158.0, 305.0, 1222.0, 13529.0, 999419.0, 31186.0, 1790.0, 392.0, 183.0, 85.0, 47.0, 30.0, 18.0, 8.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.859375, -12.4649658203125, -12.070556640625, -11.6761474609375, -11.28173828125, -10.8873291015625, -10.492919921875, -10.0985107421875, -9.7041015625, -9.3096923828125, -8.915283203125, -8.5208740234375, -8.12646484375, -7.7320556640625, -7.337646484375, -6.9432373046875, -6.548828125, -6.1544189453125, -5.760009765625, -5.3656005859375, -4.97119140625, -4.5767822265625, -4.182373046875, -3.7879638671875, -3.3935546875, -2.9991455078125, -2.604736328125, -2.2103271484375, -1.81591796875, -1.4215087890625, -1.027099609375, -0.6326904296875, -0.23828125, 0.1561279296875, 0.550537109375, 0.9449462890625, 1.33935546875, 1.7337646484375, 2.128173828125, 2.5225830078125, 2.9169921875, 3.3114013671875, 3.705810546875, 4.1002197265625, 4.49462890625, 4.8890380859375, 5.283447265625, 5.6778564453125, 6.072265625, 6.4666748046875, 6.861083984375, 7.2554931640625, 7.64990234375, 8.0443115234375, 8.438720703125, 8.8331298828125, 9.2275390625, 9.6219482421875, 10.016357421875, 10.4107666015625, 10.80517578125, 11.1995849609375, 11.593994140625, 11.9884033203125, 12.3828125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 5.0, 13.0, 19.0, 40.0, 110.0, 360.0, 287.0, 89.0, 46.0, 17.0, 9.0, 11.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0234375, -7.779541015625, -7.53564453125, -7.291748046875, -7.0478515625, -6.803955078125, -6.56005859375, -6.316162109375, -6.072265625, -5.828369140625, -5.58447265625, -5.340576171875, -5.0966796875, -4.852783203125, -4.60888671875, -4.364990234375, -4.12109375, -3.877197265625, -3.63330078125, -3.389404296875, -3.1455078125, -2.901611328125, -2.65771484375, -2.413818359375, -2.169921875, -1.926025390625, -1.68212890625, -1.438232421875, -1.1943359375, -0.950439453125, -0.70654296875, -0.462646484375, -0.21875, 0.025146484375, 0.26904296875, 0.512939453125, 0.7568359375, 1.000732421875, 1.24462890625, 1.488525390625, 1.732421875, 1.976318359375, 2.22021484375, 2.464111328125, 2.7080078125, 2.951904296875, 3.19580078125, 3.439697265625, 3.68359375, 3.927490234375, 4.17138671875, 4.415283203125, 4.6591796875, 4.903076171875, 5.14697265625, 5.390869140625, 5.634765625, 5.878662109375, 6.12255859375, 6.366455078125, 6.6103515625, 6.854248046875, 7.09814453125, 7.342041015625, 7.5859375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 8.0, 19.0, 81.0, 343.0, 417.0, 119.0, 20.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.73838424682617, -48.73485565185547, -44.731327056884766, -40.72779846191406, -36.724273681640625, -32.720741271972656, -28.71721649169922, -24.713687896728516, -20.710159301757812, -16.70663070678711, -12.703103065490723, -8.699575424194336, -4.696046829223633, -0.6925182342529297, 3.3110084533691406, 7.314537048339844, 11.318065643310547, 15.32159423828125, 19.325122833251953, 23.328649520874023, 27.332178115844727, 31.33570671081543, 35.3392333984375, 39.3427619934082, 43.346290588378906, 47.34981918334961, 51.35334777832031, 55.35687255859375, 59.36040496826172, 63.363929748535156, 67.36746215820312, 71.37098693847656, 75.37452697753906, 79.3780517578125, 83.38158416748047, 87.3851089477539, 91.38864135742188, 95.39216613769531, 99.39569091796875, 103.39922332763672, 107.40275573730469, 111.40628051757812, 115.4098129272461, 119.41333770751953, 123.4168701171875, 127.42039489746094, 131.42391967773438, 135.42745971679688, 139.43096923828125, 143.4344940185547, 147.43801879882812, 151.44155883789062, 155.44508361816406, 159.4486083984375, 163.45213317871094, 167.45565795898438, 171.45919799804688, 175.4627227783203, 179.46624755859375, 183.46978759765625, 187.4733123779297, 191.47683715820312, 195.48036193847656, 199.48388671875, 203.4874267578125]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 6.0, 4.0, 4.0, 8.0, 4.0, 11.0, 15.0, 11.0, 13.0, 19.0, 18.0, 27.0, 19.0, 25.0, 30.0, 33.0, 42.0, 34.0, 52.0, 36.0, 38.0, 35.0, 52.0, 54.0, 42.0, 35.0, 47.0, 33.0, 36.0, 32.0, 31.0, 28.0, 22.0, 24.0, 22.0, 10.0, 10.0, 5.0, 4.0, 8.0, 3.0, 6.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-26.830242156982422, -26.00262451171875, -25.175006866455078, -24.34739112854004, -23.519773483276367, -22.692155838012695, -21.864540100097656, -21.036922454833984, -20.209304809570312, -19.38168716430664, -18.55406951904297, -17.72645378112793, -16.898836135864258, -16.071218490600586, -15.24360179901123, -14.415985107421875, -13.588367462158203, -12.760749816894531, -11.933133125305176, -11.10551643371582, -10.277898788452148, -9.450281143188477, -8.622664451599121, -7.795047283172607, -6.967430114746094, -6.13981294631958, -5.312195777893066, -4.484578609466553, -3.656961441040039, -2.8293442726135254, -2.0017271041870117, -1.174109935760498, -0.3464946746826172, 0.4811224937438965, 1.3087396621704102, 2.136356830596924, 2.9639739990234375, 3.791591167449951, 4.619208335876465, 5.4468255043029785, 6.274442672729492, 7.102059841156006, 7.9296770095825195, 8.757293701171875, 9.584911346435547, 10.412528991699219, 11.240145683288574, 12.06776237487793, 12.895380020141602, 13.722997665405273, 14.550614356994629, 15.378231048583984, 16.205848693847656, 17.033466339111328, 17.861083984375, 18.68869972229004, 19.51631736755371, 20.343935012817383, 21.171550750732422, 21.999168395996094, 22.826786041259766, 23.654403686523438, 24.48202133178711, 25.30963706970215, 26.13725471496582]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 6.0, 3.0, 12.0, 15.0, 22.0, 22.0, 51.0, 79.0, 129.0, 265.0, 458.0, 1014.0, 2800.0, 10925.0, 87006.0, 3980585.0, 94493.0, 11302.0, 2916.0, 1072.0, 493.0, 251.0, 126.0, 84.0, 63.0, 24.0, 18.0, 17.0, 7.0, 8.0, 12.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.9296875, -9.6334228515625, -9.337158203125, -9.0408935546875, -8.74462890625, -8.4483642578125, -8.152099609375, -7.8558349609375, -7.5595703125, -7.2633056640625, -6.967041015625, -6.6707763671875, -6.37451171875, -6.0782470703125, -5.781982421875, -5.4857177734375, -5.189453125, -4.8931884765625, -4.596923828125, -4.3006591796875, -4.00439453125, -3.7081298828125, -3.411865234375, -3.1156005859375, -2.8193359375, -2.5230712890625, -2.226806640625, -1.9305419921875, -1.63427734375, -1.3380126953125, -1.041748046875, -0.7454833984375, -0.44921875, -0.1529541015625, 0.143310546875, 0.4395751953125, 0.73583984375, 1.0321044921875, 1.328369140625, 1.6246337890625, 1.9208984375, 2.2171630859375, 2.513427734375, 2.8096923828125, 3.10595703125, 3.4022216796875, 3.698486328125, 3.9947509765625, 4.291015625, 4.5872802734375, 4.883544921875, 5.1798095703125, 5.47607421875, 5.7723388671875, 6.068603515625, 6.3648681640625, 6.6611328125, 6.9573974609375, 7.253662109375, 7.5499267578125, 7.84619140625, 8.1424560546875, 8.438720703125, 8.7349853515625, 9.03125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 7.0, 14.0, 12.0, 9.0, 17.0, 27.0, 30.0, 35.0, 36.0, 53.0, 57.0, 45.0, 54.0, 58.0, 54.0, 73.0, 66.0, 50.0, 57.0, 38.0, 45.0, 25.0, 24.0, 25.0, 18.0, 15.0, 15.0, 7.0, 10.0, 7.0, 3.0, 5.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8740234375, -1.816436767578125, -1.75885009765625, -1.701263427734375, -1.6436767578125, -1.586090087890625, -1.52850341796875, -1.470916748046875, -1.413330078125, -1.355743408203125, -1.29815673828125, -1.240570068359375, -1.1829833984375, -1.125396728515625, -1.06781005859375, -1.010223388671875, -0.95263671875, -0.895050048828125, -0.83746337890625, -0.779876708984375, -0.7222900390625, -0.664703369140625, -0.60711669921875, -0.549530029296875, -0.491943359375, -0.434356689453125, -0.37677001953125, -0.319183349609375, -0.2615966796875, -0.204010009765625, -0.14642333984375, -0.088836669921875, -0.03125, 0.026336669921875, 0.08392333984375, 0.141510009765625, 0.1990966796875, 0.256683349609375, 0.31427001953125, 0.371856689453125, 0.429443359375, 0.487030029296875, 0.54461669921875, 0.602203369140625, 0.6597900390625, 0.717376708984375, 0.77496337890625, 0.832550048828125, 0.89013671875, 0.947723388671875, 1.00531005859375, 1.062896728515625, 1.1204833984375, 1.178070068359375, 1.23565673828125, 1.293243408203125, 1.350830078125, 1.408416748046875, 1.46600341796875, 1.523590087890625, 1.5811767578125, 1.638763427734375, 1.69635009765625, 1.753936767578125, 1.8115234375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 6.0, 9.0, 9.0, 22.0, 26.0, 37.0, 55.0, 91.0, 117.0, 211.0, 321.0, 615.0, 1236.0, 3409.0, 15129.0, 160795.0, 3911641.0, 84588.0, 10750.0, 2753.0, 1046.0, 604.0, 313.0, 170.0, 128.0, 72.0, 37.0, 34.0, 23.0, 10.0, 9.0, 7.0, 3.0, 4.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0546875, -8.7835693359375, -8.512451171875, -8.2413330078125, -7.97021484375, -7.6990966796875, -7.427978515625, -7.1568603515625, -6.8857421875, -6.6146240234375, -6.343505859375, -6.0723876953125, -5.80126953125, -5.5301513671875, -5.259033203125, -4.9879150390625, -4.716796875, -4.4456787109375, -4.174560546875, -3.9034423828125, -3.63232421875, -3.3612060546875, -3.090087890625, -2.8189697265625, -2.5478515625, -2.2767333984375, -2.005615234375, -1.7344970703125, -1.46337890625, -1.1922607421875, -0.921142578125, -0.6500244140625, -0.37890625, -0.1077880859375, 0.163330078125, 0.4344482421875, 0.70556640625, 0.9766845703125, 1.247802734375, 1.5189208984375, 1.7900390625, 2.0611572265625, 2.332275390625, 2.6033935546875, 2.87451171875, 3.1456298828125, 3.416748046875, 3.6878662109375, 3.958984375, 4.2301025390625, 4.501220703125, 4.7723388671875, 5.04345703125, 5.3145751953125, 5.585693359375, 5.8568115234375, 6.1279296875, 6.3990478515625, 6.670166015625, 6.9412841796875, 7.21240234375, 7.4835205078125, 7.754638671875, 8.0257568359375, 8.296875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 7.0, 7.0, 8.0, 11.0, 19.0, 29.0, 44.0, 122.0, 427.0, 2423.0, 608.0, 179.0, 76.0, 39.0, 30.0, 21.0, 7.0, 8.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9375, -2.834869384765625, -2.73223876953125, -2.629608154296875, -2.5269775390625, -2.424346923828125, -2.32171630859375, -2.219085693359375, -2.116455078125, -2.013824462890625, -1.91119384765625, -1.808563232421875, -1.7059326171875, -1.603302001953125, -1.50067138671875, -1.398040771484375, -1.29541015625, -1.192779541015625, -1.09014892578125, -0.987518310546875, -0.8848876953125, -0.782257080078125, -0.67962646484375, -0.576995849609375, -0.474365234375, -0.371734619140625, -0.26910400390625, -0.166473388671875, -0.0638427734375, 0.038787841796875, 0.14141845703125, 0.244049072265625, 0.3466796875, 0.449310302734375, 0.55194091796875, 0.654571533203125, 0.7572021484375, 0.859832763671875, 0.96246337890625, 1.065093994140625, 1.167724609375, 1.270355224609375, 1.37298583984375, 1.475616455078125, 1.5782470703125, 1.680877685546875, 1.78350830078125, 1.886138916015625, 1.98876953125, 2.091400146484375, 2.19403076171875, 2.296661376953125, 2.3992919921875, 2.501922607421875, 2.60455322265625, 2.707183837890625, 2.809814453125, 2.912445068359375, 3.01507568359375, 3.117706298828125, 3.2203369140625, 3.322967529296875, 3.42559814453125, 3.528228759765625, 3.630859375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 7.0, 13.0, 32.0, 83.0, 140.0, 217.0, 174.0, 176.0, 97.0, 32.0, 7.0, 7.0, 3.0, 8.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-28.076038360595703, -27.499469757080078, -26.92289924621582, -26.346330642700195, -25.76976203918457, -25.193193435668945, -24.616622924804688, -24.040054321289062, -23.463485717773438, -22.886917114257812, -22.310346603393555, -21.73377799987793, -21.157209396362305, -20.58064079284668, -20.004070281982422, -19.427501678466797, -18.850933074951172, -18.274364471435547, -17.69779396057129, -17.121225357055664, -16.54465675354004, -15.968087196350098, -15.391517639160156, -14.814949035644531, -14.238378524780273, -13.661808967590332, -13.085240364074707, -12.508670806884766, -11.93210220336914, -11.3555326461792, -10.778963088989258, -10.202394485473633, -9.625824928283691, -9.04925537109375, -8.472686767578125, -7.896117210388184, -7.319548606872559, -6.742979049682617, -6.166409969329834, -5.589840888977051, -5.013271808624268, -4.436702728271484, -3.860133647918701, -3.283564329147339, -2.7069952487945557, -2.1304261684417725, -1.5538568496704102, -0.977287769317627, -0.40071868896484375, 0.17585045099258423, 0.7524195909500122, 1.328988790512085, 1.9055578708648682, 2.4821269512176514, 3.0586962699890137, 3.635265350341797, 4.21183443069458, 4.788403511047363, 5.3649725914001465, 5.94154167175293, 6.518111228942871, 7.094679832458496, 7.6712493896484375, 8.247817993164062, 8.824387550354004]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 5.0, 5.0, 11.0, 17.0, 19.0, 35.0, 35.0, 55.0, 61.0, 51.0, 43.0, 55.0, 78.0, 71.0, 65.0, 72.0, 62.0, 36.0, 59.0, 40.0, 28.0, 24.0, 15.0, 21.0, 12.0, 6.0, 5.0, 3.0, 2.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.687346458435059, -7.387083530426025, -7.086820602416992, -6.786557674407959, -6.486294746398926, -6.186032295227051, -5.885769367218018, -5.585506439208984, -5.285243511199951, -4.984980583190918, -4.684717655181885, -4.384454727172852, -4.084192276000977, -3.7839291095733643, -3.48366641998291, -3.183403491973877, -2.8831405639648438, -2.5828776359558105, -2.2826147079467773, -1.9823520183563232, -1.68208909034729, -1.3818261623382568, -1.0815633535385132, -0.7813005447387695, -0.48103761672973633, -0.1807747483253479, 0.11948812007904053, 0.41975098848342896, 0.7200138568878174, 1.0202767848968506, 1.3205395936965942, 1.620802402496338, 1.9210662841796875, 2.2213292121887207, 2.521592140197754, 2.821854829788208, 3.122117757797241, 3.4223806858062744, 3.7226433753967285, 4.022906303405762, 4.323169231414795, 4.623432159423828, 4.923695087432861, 5.2239580154418945, 5.5242204666137695, 5.824483871459961, 6.124746322631836, 6.425009250640869, 6.725272178649902, 7.0255351066589355, 7.325798034667969, 7.626060962677002, 7.926323890686035, 8.22658634185791, 8.526849746704102, 8.827112197875977, 9.127374649047852, 9.427637100219727, 9.727900505065918, 10.028162956237793, 10.328426361083984, 10.62868881225586, 10.92895221710205, 11.229214668273926, 11.529478073120117]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 6.0, 13.0, 8.0, 20.0, 29.0, 67.0, 111.0, 253.0, 594.0, 1931.0, 7601.0, 42432.0, 397450.0, 529280.0, 55896.0, 9363.0, 2225.0, 693.0, 261.0, 129.0, 76.0, 42.0, 22.0, 20.0, 13.0, 6.0, 7.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.90625, -9.58740234375, -9.2685546875, -8.94970703125, -8.630859375, -8.31201171875, -7.9931640625, -7.67431640625, -7.35546875, -7.03662109375, -6.7177734375, -6.39892578125, -6.080078125, -5.76123046875, -5.4423828125, -5.12353515625, -4.8046875, -4.48583984375, -4.1669921875, -3.84814453125, -3.529296875, -3.21044921875, -2.8916015625, -2.57275390625, -2.25390625, -1.93505859375, -1.6162109375, -1.29736328125, -0.978515625, -0.65966796875, -0.3408203125, -0.02197265625, 0.296875, 0.61572265625, 0.9345703125, 1.25341796875, 1.572265625, 1.89111328125, 2.2099609375, 2.52880859375, 2.84765625, 3.16650390625, 3.4853515625, 3.80419921875, 4.123046875, 4.44189453125, 4.7607421875, 5.07958984375, 5.3984375, 5.71728515625, 6.0361328125, 6.35498046875, 6.673828125, 6.99267578125, 7.3115234375, 7.63037109375, 7.94921875, 8.26806640625, 8.5869140625, 8.90576171875, 9.224609375, 9.54345703125, 9.8623046875, 10.18115234375, 10.5]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 4.0, 6.0, 6.0, 17.0, 13.0, 13.0, 20.0, 20.0, 34.0, 41.0, 40.0, 46.0, 40.0, 54.0, 54.0, 61.0, 57.0, 62.0, 53.0, 61.0, 56.0, 47.0, 35.0, 29.0, 28.0, 19.0, 19.0, 10.0, 13.0, 11.0, 9.0, 8.0, 7.0, 2.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.88671875, -1.830322265625, -1.77392578125, -1.717529296875, -1.6611328125, -1.604736328125, -1.54833984375, -1.491943359375, -1.435546875, -1.379150390625, -1.32275390625, -1.266357421875, -1.2099609375, -1.153564453125, -1.09716796875, -1.040771484375, -0.984375, -0.927978515625, -0.87158203125, -0.815185546875, -0.7587890625, -0.702392578125, -0.64599609375, -0.589599609375, -0.533203125, -0.476806640625, -0.42041015625, -0.364013671875, -0.3076171875, -0.251220703125, -0.19482421875, -0.138427734375, -0.08203125, -0.025634765625, 0.03076171875, 0.087158203125, 0.1435546875, 0.199951171875, 0.25634765625, 0.312744140625, 0.369140625, 0.425537109375, 0.48193359375, 0.538330078125, 0.5947265625, 0.651123046875, 0.70751953125, 0.763916015625, 0.8203125, 0.876708984375, 0.93310546875, 0.989501953125, 1.0458984375, 1.102294921875, 1.15869140625, 1.215087890625, 1.271484375, 1.327880859375, 1.38427734375, 1.440673828125, 1.4970703125, 1.553466796875, 1.60986328125, 1.666259765625, 1.72265625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 3.0, 5.0, 7.0, 9.0, 13.0, 13.0, 22.0, 40.0, 36.0, 47.0, 77.0, 117.0, 211.0, 334.0, 648.0, 1308.0, 3006.0, 6785.0, 18011.0, 50888.0, 160810.0, 462622.0, 232200.0, 70790.0, 24147.0, 8996.0, 3747.0, 1756.0, 769.0, 420.0, 266.0, 158.0, 87.0, 48.0, 36.0, 21.0, 25.0, 14.0, 17.0, 9.0, 12.0, 8.0, 3.0, 3.0, 4.0, 4.0, 0.0, 2.0, 3.0], "bins": [-5.08203125, -4.943359375, -4.8046875, -4.666015625, -4.52734375, -4.388671875, -4.25, -4.111328125, -3.97265625, -3.833984375, -3.6953125, -3.556640625, -3.41796875, -3.279296875, -3.140625, -3.001953125, -2.86328125, -2.724609375, -2.5859375, -2.447265625, -2.30859375, -2.169921875, -2.03125, -1.892578125, -1.75390625, -1.615234375, -1.4765625, -1.337890625, -1.19921875, -1.060546875, -0.921875, -0.783203125, -0.64453125, -0.505859375, -0.3671875, -0.228515625, -0.08984375, 0.048828125, 0.1875, 0.326171875, 0.46484375, 0.603515625, 0.7421875, 0.880859375, 1.01953125, 1.158203125, 1.296875, 1.435546875, 1.57421875, 1.712890625, 1.8515625, 1.990234375, 2.12890625, 2.267578125, 2.40625, 2.544921875, 2.68359375, 2.822265625, 2.9609375, 3.099609375, 3.23828125, 3.376953125, 3.515625, 3.654296875, 3.79296875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 8.0, 2.0, 5.0, 6.0, 3.0, 5.0, 7.0, 18.0, 18.0, 14.0, 19.0, 22.0, 31.0, 28.0, 26.0, 26.0, 44.0, 32.0, 33.0, 35.0, 44.0, 41.0, 53.0, 48.0, 43.0, 37.0, 49.0, 55.0, 32.0, 25.0, 30.0, 20.0, 24.0, 17.0, 17.0, 18.0, 14.0, 12.0, 6.0, 13.0, 4.0, 3.0, 4.0, 4.0, 5.0, 1.0, 3.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0], "bins": [-5.6015625, -5.43426513671875, -5.2669677734375, -5.09967041015625, -4.932373046875, -4.76507568359375, -4.5977783203125, -4.43048095703125, -4.26318359375, -4.09588623046875, -3.9285888671875, -3.76129150390625, -3.593994140625, -3.42669677734375, -3.2593994140625, -3.09210205078125, -2.9248046875, -2.75750732421875, -2.5902099609375, -2.42291259765625, -2.255615234375, -2.08831787109375, -1.9210205078125, -1.75372314453125, -1.58642578125, -1.41912841796875, -1.2518310546875, -1.08453369140625, -0.917236328125, -0.74993896484375, -0.5826416015625, -0.41534423828125, -0.248046875, -0.08074951171875, 0.0865478515625, 0.25384521484375, 0.421142578125, 0.58843994140625, 0.7557373046875, 0.92303466796875, 1.09033203125, 1.25762939453125, 1.4249267578125, 1.59222412109375, 1.759521484375, 1.92681884765625, 2.0941162109375, 2.26141357421875, 2.4287109375, 2.59600830078125, 2.7633056640625, 2.93060302734375, 3.097900390625, 3.26519775390625, 3.4324951171875, 3.59979248046875, 3.76708984375, 3.93438720703125, 4.1016845703125, 4.26898193359375, 4.436279296875, 4.60357666015625, 4.7708740234375, 4.93817138671875, 5.10546875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 10.0, 11.0, 17.0, 11.0, 36.0, 95.0, 142.0, 385.0, 1068.0, 3584.0, 18005.0, 180290.0, 786414.0, 47914.0, 7569.0, 1828.0, 688.0, 241.0, 113.0, 50.0, 32.0, 22.0, 10.0, 12.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.69921875, -3.58795166015625, -3.4766845703125, -3.36541748046875, -3.254150390625, -3.14288330078125, -3.0316162109375, -2.92034912109375, -2.80908203125, -2.69781494140625, -2.5865478515625, -2.47528076171875, -2.364013671875, -2.25274658203125, -2.1414794921875, -2.03021240234375, -1.9189453125, -1.80767822265625, -1.6964111328125, -1.58514404296875, -1.473876953125, -1.36260986328125, -1.2513427734375, -1.14007568359375, -1.02880859375, -0.91754150390625, -0.8062744140625, -0.69500732421875, -0.583740234375, -0.47247314453125, -0.3612060546875, -0.24993896484375, -0.138671875, -0.02740478515625, 0.0838623046875, 0.19512939453125, 0.306396484375, 0.41766357421875, 0.5289306640625, 0.64019775390625, 0.75146484375, 0.86273193359375, 0.9739990234375, 1.08526611328125, 1.196533203125, 1.30780029296875, 1.4190673828125, 1.53033447265625, 1.6416015625, 1.75286865234375, 1.8641357421875, 1.97540283203125, 2.086669921875, 2.19793701171875, 2.3092041015625, 2.42047119140625, 2.53173828125, 2.64300537109375, 2.7542724609375, 2.86553955078125, 2.976806640625, 3.08807373046875, 3.1993408203125, 3.31060791015625, 3.421875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 6.0, 5.0, 11.0, 6.0, 17.0, 13.0, 22.0, 44.0, 105.0, 286.0, 250.0, 114.0, 38.0, 33.0, 22.0, 9.0, 6.0, 10.0, 5.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007410049438476562, -0.0007203966379165649, -0.0006997883319854736, -0.0006791800260543823, -0.000658571720123291, -0.0006379634141921997, -0.0006173551082611084, -0.0005967468023300171, -0.0005761384963989258, -0.0005555301904678345, -0.0005349218845367432, -0.0005143135786056519, -0.0004937052726745605, -0.00047309696674346924, -0.00045248866081237793, -0.0004318803548812866, -0.0004112720489501953, -0.000390663743019104, -0.0003700554370880127, -0.0003494471311569214, -0.0003288388252258301, -0.00030823051929473877, -0.00028762221336364746, -0.00026701390743255615, -0.00024640560150146484, -0.00022579729557037354, -0.00020518898963928223, -0.00018458068370819092, -0.0001639723777770996, -0.0001433640718460083, -0.000122755765914917, -0.00010214745998382568, -8.153915405273438e-05, -6.0930848121643066e-05, -4.032254219055176e-05, -1.971423625946045e-05, 8.940696716308594e-07, 2.1502375602722168e-05, 4.2110681533813477e-05, 6.271898746490479e-05, 8.33272933959961e-05, 0.0001039355993270874, 0.0001245439052581787, 0.00014515221118927002, 0.00016576051712036133, 0.00018636882305145264, 0.00020697712898254395, 0.00022758543491363525, 0.00024819374084472656, 0.00026880204677581787, 0.0002894103527069092, 0.0003100186586380005, 0.0003306269645690918, 0.0003512352705001831, 0.0003718435764312744, 0.0003924518823623657, 0.00041306018829345703, 0.00043366849422454834, 0.00045427680015563965, 0.00047488510608673096, 0.0004954934120178223, 0.0005161017179489136, 0.0005367100238800049, 0.0005573183298110962, 0.0005779266357421875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 4.0, 7.0, 6.0, 14.0, 29.0, 35.0, 62.0, 98.0, 172.0, 312.0, 500.0, 958.0, 1878.0, 3994.0, 10297.0, 31672.0, 190155.0, 703110.0, 74033.0, 18657.0, 6725.0, 2883.0, 1312.0, 698.0, 367.0, 223.0, 117.0, 83.0, 41.0, 51.0, 22.0, 13.0, 2.0, 3.0, 5.0, 4.0, 1.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.79296875, -2.71380615234375, -2.6346435546875, -2.55548095703125, -2.476318359375, -2.39715576171875, -2.3179931640625, -2.23883056640625, -2.15966796875, -2.08050537109375, -2.0013427734375, -1.92218017578125, -1.843017578125, -1.76385498046875, -1.6846923828125, -1.60552978515625, -1.5263671875, -1.44720458984375, -1.3680419921875, -1.28887939453125, -1.209716796875, -1.13055419921875, -1.0513916015625, -0.97222900390625, -0.89306640625, -0.81390380859375, -0.7347412109375, -0.65557861328125, -0.576416015625, -0.49725341796875, -0.4180908203125, -0.33892822265625, -0.259765625, -0.18060302734375, -0.1014404296875, -0.02227783203125, 0.056884765625, 0.13604736328125, 0.2152099609375, 0.29437255859375, 0.37353515625, 0.45269775390625, 0.5318603515625, 0.61102294921875, 0.690185546875, 0.76934814453125, 0.8485107421875, 0.92767333984375, 1.0068359375, 1.08599853515625, 1.1651611328125, 1.24432373046875, 1.323486328125, 1.40264892578125, 1.4818115234375, 1.56097412109375, 1.64013671875, 1.71929931640625, 1.7984619140625, 1.87762451171875, 1.956787109375, 2.03594970703125, 2.1151123046875, 2.19427490234375, 2.2734375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 4.0, 1.0, 4.0, 2.0, 4.0, 5.0, 3.0, 6.0, 5.0, 8.0, 14.0, 17.0, 28.0, 34.0, 67.0, 78.0, 132.0, 150.0, 142.0, 77.0, 74.0, 46.0, 36.0, 19.0, 12.0, 10.0, 6.0, 7.0, 5.0, 5.0, 0.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.591796875, -2.5167236328125, -2.441650390625, -2.3665771484375, -2.29150390625, -2.2164306640625, -2.141357421875, -2.0662841796875, -1.9912109375, -1.9161376953125, -1.841064453125, -1.7659912109375, -1.69091796875, -1.6158447265625, -1.540771484375, -1.4656982421875, -1.390625, -1.3155517578125, -1.240478515625, -1.1654052734375, -1.09033203125, -1.0152587890625, -0.940185546875, -0.8651123046875, -0.7900390625, -0.7149658203125, -0.639892578125, -0.5648193359375, -0.48974609375, -0.4146728515625, -0.339599609375, -0.2645263671875, -0.189453125, -0.1143798828125, -0.039306640625, 0.0357666015625, 0.11083984375, 0.1859130859375, 0.260986328125, 0.3360595703125, 0.4111328125, 0.4862060546875, 0.561279296875, 0.6363525390625, 0.71142578125, 0.7864990234375, 0.861572265625, 0.9366455078125, 1.01171875, 1.0867919921875, 1.161865234375, 1.2369384765625, 1.31201171875, 1.3870849609375, 1.462158203125, 1.5372314453125, 1.6123046875, 1.6873779296875, 1.762451171875, 1.8375244140625, 1.91259765625, 1.9876708984375, 2.062744140625, 2.1378173828125, 2.212890625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 10.0, 21.0, 46.0, 91.0, 180.0, 260.0, 200.0, 113.0, 46.0, 22.0, 8.0, 6.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-101.71807861328125, -99.70803833007812, -97.69799041748047, -95.68795013427734, -93.67790985107422, -91.6678695678711, -89.65782165527344, -87.64778137207031, -85.63774108886719, -83.62770080566406, -81.6176528930664, -79.60761260986328, -77.59757232666016, -75.58753204345703, -73.57748413085938, -71.56744384765625, -69.55740356445312, -67.54736328125, -65.53731536865234, -63.52727508544922, -61.517234802246094, -59.5071907043457, -57.49714660644531, -55.48710632324219, -53.47705841064453, -51.46701431274414, -49.456974029541016, -47.446929931640625, -45.4368896484375, -43.42684555053711, -41.41680145263672, -39.406761169433594, -37.396728515625, -35.38668441772461, -33.376644134521484, -31.366600036621094, -29.35655975341797, -27.346515655517578, -25.33647346496582, -23.326431274414062, -21.316387176513672, -19.306344985961914, -17.296302795410156, -15.286259651184082, -13.276217460632324, -11.266175270080566, -9.256132125854492, -7.246089935302734, -5.236047744750977, -3.2260053157806396, -1.2159628868103027, 0.7940797805786133, 2.804121971130371, 4.814164161682129, 6.824207305908203, 8.834249496459961, 10.844291687011719, 12.854333877563477, 14.864376068115234, 16.874420166015625, 18.88446044921875, 20.89450454711914, 22.9045467376709, 24.914588928222656, 26.924631118774414]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 3.0, 2.0, 4.0, 3.0, 6.0, 4.0, 8.0, 7.0, 8.0, 17.0, 9.0, 12.0, 24.0, 28.0, 26.0, 28.0, 30.0, 34.0, 26.0, 29.0, 34.0, 27.0, 30.0, 42.0, 27.0, 44.0, 33.0, 34.0, 31.0, 36.0, 33.0, 31.0, 22.0, 26.0, 26.0, 24.0, 33.0, 24.0, 23.0, 21.0, 12.0, 18.0, 10.0, 10.0, 5.0, 6.0, 7.0, 11.0, 3.0, 7.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0], "bins": [-23.635513305664062, -22.937578201293945, -22.239643096923828, -21.541709899902344, -20.843774795532227, -20.14583969116211, -19.447904586791992, -18.749969482421875, -18.052034378051758, -17.35409927368164, -16.656164169311523, -15.958230018615723, -15.260294914245605, -14.562360763549805, -13.864425659179688, -13.16649055480957, -12.46855640411377, -11.770621299743652, -11.072687149047852, -10.374752044677734, -9.676816940307617, -8.9788818359375, -8.2809476852417, -7.583012580871582, -6.885077953338623, -6.187143325805664, -5.489208221435547, -4.791273593902588, -4.093338966369629, -3.3954038619995117, -2.6974692344665527, -1.9995341300964355, -1.3015995025634766, -0.6036646962165833, 0.09427011013031006, 0.7922048568725586, 1.4901397228240967, 2.1880745887756348, 2.8860092163085938, 3.583944320678711, 4.28187894821167, 4.979813575744629, 5.677748680114746, 6.375683307647705, 7.073617935180664, 7.771553039550781, 8.469488143920898, 9.167423248291016, 9.865357398986816, 10.563292503356934, 11.261226654052734, 11.959161758422852, 12.657096862792969, 13.355031967163086, 14.052966117858887, 14.750901222229004, 15.448835372924805, 16.146770477294922, 16.84470558166504, 17.542640686035156, 18.24057388305664, 18.938508987426758, 19.636444091796875, 20.334379196166992, 21.03231430053711]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 5.0, 9.0, 9.0, 8.0, 13.0, 17.0, 39.0, 48.0, 55.0, 98.0, 143.0, 227.0, 342.0, 667.0, 1273.0, 2733.0, 8548.0, 51196.0, 3993513.0, 114873.0, 13169.0, 3787.0, 1516.0, 770.0, 405.0, 284.0, 158.0, 126.0, 77.0, 49.0, 39.0, 25.0, 19.0, 14.0, 11.0, 6.0, 8.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-14.2421875, -13.7774658203125, -13.312744140625, -12.8480224609375, -12.38330078125, -11.9185791015625, -11.453857421875, -10.9891357421875, -10.5244140625, -10.0596923828125, -9.594970703125, -9.1302490234375, -8.66552734375, -8.2008056640625, -7.736083984375, -7.2713623046875, -6.806640625, -6.3419189453125, -5.877197265625, -5.4124755859375, -4.94775390625, -4.4830322265625, -4.018310546875, -3.5535888671875, -3.0888671875, -2.6241455078125, -2.159423828125, -1.6947021484375, -1.22998046875, -0.7652587890625, -0.300537109375, 0.1641845703125, 0.62890625, 1.0936279296875, 1.558349609375, 2.0230712890625, 2.48779296875, 2.9525146484375, 3.417236328125, 3.8819580078125, 4.3466796875, 4.8114013671875, 5.276123046875, 5.7408447265625, 6.20556640625, 6.6702880859375, 7.135009765625, 7.5997314453125, 8.064453125, 8.5291748046875, 8.993896484375, 9.4586181640625, 9.92333984375, 10.3880615234375, 10.852783203125, 11.3175048828125, 11.7822265625, 12.2469482421875, 12.711669921875, 13.1763916015625, 13.64111328125, 14.1058349609375, 14.570556640625, 15.0352783203125, 15.5]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 9.0, 9.0, 13.0, 11.0, 19.0, 20.0, 31.0, 38.0, 50.0, 42.0, 43.0, 42.0, 41.0, 70.0, 74.0, 55.0, 49.0, 47.0, 44.0, 46.0, 46.0, 36.0, 29.0, 31.0, 19.0, 16.0, 17.0, 15.0, 9.0, 9.0, 5.0, 5.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.25, -2.192291259765625, -2.13458251953125, -2.076873779296875, -2.0191650390625, -1.961456298828125, -1.90374755859375, -1.846038818359375, -1.788330078125, -1.730621337890625, -1.67291259765625, -1.615203857421875, -1.5574951171875, -1.499786376953125, -1.44207763671875, -1.384368896484375, -1.32666015625, -1.268951416015625, -1.21124267578125, -1.153533935546875, -1.0958251953125, -1.038116455078125, -0.98040771484375, -0.922698974609375, -0.864990234375, -0.807281494140625, -0.74957275390625, -0.691864013671875, -0.6341552734375, -0.576446533203125, -0.51873779296875, -0.461029052734375, -0.4033203125, -0.345611572265625, -0.28790283203125, -0.230194091796875, -0.1724853515625, -0.114776611328125, -0.05706787109375, 0.000640869140625, 0.058349609375, 0.116058349609375, 0.17376708984375, 0.231475830078125, 0.2891845703125, 0.346893310546875, 0.40460205078125, 0.462310791015625, 0.52001953125, 0.577728271484375, 0.63543701171875, 0.693145751953125, 0.7508544921875, 0.808563232421875, 0.86627197265625, 0.923980712890625, 0.981689453125, 1.039398193359375, 1.09710693359375, 1.154815673828125, 1.2125244140625, 1.270233154296875, 1.32794189453125, 1.385650634765625, 1.443359375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 9.0, 10.0, 16.0, 35.0, 38.0, 61.0, 118.0, 244.0, 367.0, 624.0, 1157.0, 2457.0, 5504.0, 14037.0, 49059.0, 602104.0, 3410937.0, 76364.0, 18394.0, 6706.0, 2830.0, 1478.0, 755.0, 434.0, 232.0, 129.0, 72.0, 43.0, 25.0, 19.0, 15.0, 6.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.58203125, -6.34808349609375, -6.1141357421875, -5.88018798828125, -5.646240234375, -5.41229248046875, -5.1783447265625, -4.94439697265625, -4.71044921875, -4.47650146484375, -4.2425537109375, -4.00860595703125, -3.774658203125, -3.54071044921875, -3.3067626953125, -3.07281494140625, -2.8388671875, -2.60491943359375, -2.3709716796875, -2.13702392578125, -1.903076171875, -1.66912841796875, -1.4351806640625, -1.20123291015625, -0.96728515625, -0.73333740234375, -0.4993896484375, -0.26544189453125, -0.031494140625, 0.20245361328125, 0.4364013671875, 0.67034912109375, 0.904296875, 1.13824462890625, 1.3721923828125, 1.60614013671875, 1.840087890625, 2.07403564453125, 2.3079833984375, 2.54193115234375, 2.77587890625, 3.00982666015625, 3.2437744140625, 3.47772216796875, 3.711669921875, 3.94561767578125, 4.1795654296875, 4.41351318359375, 4.6474609375, 4.88140869140625, 5.1153564453125, 5.34930419921875, 5.583251953125, 5.81719970703125, 6.0511474609375, 6.28509521484375, 6.51904296875, 6.75299072265625, 6.9869384765625, 7.22088623046875, 7.454833984375, 7.68878173828125, 7.9227294921875, 8.15667724609375, 8.390625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 5.0, 2.0, 4.0, 4.0, 9.0, 8.0, 15.0, 16.0, 23.0, 31.0, 59.0, 108.0, 254.0, 2047.0, 1078.0, 209.0, 71.0, 49.0, 23.0, 18.0, 9.0, 8.0, 5.0, 7.0, 5.0, 0.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5, -3.3968505859375, -3.293701171875, -3.1905517578125, -3.08740234375, -2.9842529296875, -2.881103515625, -2.7779541015625, -2.6748046875, -2.5716552734375, -2.468505859375, -2.3653564453125, -2.26220703125, -2.1590576171875, -2.055908203125, -1.9527587890625, -1.849609375, -1.7464599609375, -1.643310546875, -1.5401611328125, -1.43701171875, -1.3338623046875, -1.230712890625, -1.1275634765625, -1.0244140625, -0.9212646484375, -0.818115234375, -0.7149658203125, -0.61181640625, -0.5086669921875, -0.405517578125, -0.3023681640625, -0.19921875, -0.0960693359375, 0.007080078125, 0.1102294921875, 0.21337890625, 0.3165283203125, 0.419677734375, 0.5228271484375, 0.6259765625, 0.7291259765625, 0.832275390625, 0.9354248046875, 1.03857421875, 1.1417236328125, 1.244873046875, 1.3480224609375, 1.451171875, 1.5543212890625, 1.657470703125, 1.7606201171875, 1.86376953125, 1.9669189453125, 2.070068359375, 2.1732177734375, 2.2763671875, 2.3795166015625, 2.482666015625, 2.5858154296875, 2.68896484375, 2.7921142578125, 2.895263671875, 2.9984130859375, 3.1015625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 4.0, 13.0, 11.0, 32.0, 58.0, 116.0, 214.0, 239.0, 171.0, 87.0, 33.0, 12.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.76390075683594, -31.960107803344727, -31.156314849853516, -30.352521896362305, -29.548728942871094, -28.74493408203125, -27.94114112854004, -27.137348175048828, -26.333555221557617, -25.529762268066406, -24.725969314575195, -23.922176361083984, -23.11838150024414, -22.314590454101562, -21.51079559326172, -20.707002639770508, -19.903209686279297, -19.099416732788086, -18.295623779296875, -17.491830825805664, -16.688037872314453, -15.884243965148926, -15.080450057983398, -14.276657104492188, -13.472864151000977, -12.669071197509766, -11.865278244018555, -11.061484336853027, -10.257691383361816, -9.453898429870605, -8.650104522705078, -7.846311569213867, -7.042516708374023, -6.2387237548828125, -5.434930324554443, -4.631136894226074, -3.8273439407348633, -3.0235509872436523, -2.219757556915283, -1.415964126586914, -0.6121711730957031, 0.19162201881408691, 0.995415210723877, 1.799208402633667, 2.603001594543457, 3.406794548034668, 4.210587978363037, 5.014381408691406, 5.818174362182617, 6.621967315673828, 7.425760746002197, 8.229554176330566, 9.033347129821777, 9.837140083312988, 10.640933990478516, 11.444726943969727, 12.248519897460938, 13.052312850952148, 13.85610580444336, 14.659899711608887, 15.463692665100098, 16.267486572265625, 17.071279525756836, 17.875072479248047, 18.678865432739258]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 7.0, 2.0, 10.0, 7.0, 10.0, 15.0, 14.0, 18.0, 23.0, 26.0, 22.0, 16.0, 16.0, 24.0, 36.0, 36.0, 35.0, 28.0, 23.0, 37.0, 38.0, 46.0, 37.0, 37.0, 26.0, 48.0, 39.0, 27.0, 31.0, 37.0, 27.0, 29.0, 20.0, 21.0, 27.0, 17.0, 19.0, 12.0, 18.0, 6.0, 9.0, 6.0, 5.0, 8.0, 4.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-7.768549919128418, -7.523983955383301, -7.279418468475342, -7.034852504730225, -6.790286540985107, -6.545721054077148, -6.301155090332031, -6.056589126586914, -5.812023162841797, -5.56745719909668, -5.322891712188721, -5.0783257484436035, -4.833759784698486, -4.589194297790527, -4.34462833404541, -4.100062370300293, -3.855496883392334, -3.610931158065796, -3.3663651943206787, -3.1217994689941406, -2.8772335052490234, -2.6326677799224854, -2.3881020545959473, -2.14353609085083, -1.898970365524292, -1.6544045209884644, -1.4098386764526367, -1.1652729511260986, -0.920707106590271, -0.6761412620544434, -0.4315755367279053, -0.18700969219207764, 0.05755615234375, 0.30212196707725525, 0.5466877818107605, 0.7912535667419434, 1.035819411277771, 1.2803852558135986, 1.5249509811401367, 1.7695168256759644, 2.014082670211792, 2.25864839553833, 2.5032143592834473, 2.7477800846099854, 2.9923458099365234, 3.2369117736816406, 3.4814774990081787, 3.726043224334717, 3.970609188079834, 4.215175151824951, 4.45974063873291, 4.704306602478027, 4.9488725662231445, 5.193438529968262, 5.438004016876221, 5.682569980621338, 5.927135467529297, 6.171701431274414, 6.416266918182373, 6.66083288192749, 6.905398845672607, 7.149964332580566, 7.394530296325684, 7.639096260070801, 7.883662223815918]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 6.0, 6.0, 16.0, 22.0, 34.0, 50.0, 64.0, 104.0, 173.0, 286.0, 463.0, 945.0, 1736.0, 3683.0, 8535.0, 23269.0, 78233.0, 326714.0, 442365.0, 111117.0, 30635.0, 11017.0, 4489.0, 2094.0, 1043.0, 583.0, 353.0, 176.0, 110.0, 73.0, 46.0, 44.0, 27.0, 9.0, 15.0, 5.0, 3.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-7.80859375, -7.5728759765625, -7.337158203125, -7.1014404296875, -6.86572265625, -6.6300048828125, -6.394287109375, -6.1585693359375, -5.9228515625, -5.6871337890625, -5.451416015625, -5.2156982421875, -4.97998046875, -4.7442626953125, -4.508544921875, -4.2728271484375, -4.037109375, -3.8013916015625, -3.565673828125, -3.3299560546875, -3.09423828125, -2.8585205078125, -2.622802734375, -2.3870849609375, -2.1513671875, -1.9156494140625, -1.679931640625, -1.4442138671875, -1.20849609375, -0.9727783203125, -0.737060546875, -0.5013427734375, -0.265625, -0.0299072265625, 0.205810546875, 0.4415283203125, 0.67724609375, 0.9129638671875, 1.148681640625, 1.3843994140625, 1.6201171875, 1.8558349609375, 2.091552734375, 2.3272705078125, 2.56298828125, 2.7987060546875, 3.034423828125, 3.2701416015625, 3.505859375, 3.7415771484375, 3.977294921875, 4.2130126953125, 4.44873046875, 4.6844482421875, 4.920166015625, 5.1558837890625, 5.3916015625, 5.6273193359375, 5.863037109375, 6.0987548828125, 6.33447265625, 6.5701904296875, 6.805908203125, 7.0416259765625, 7.27734375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 3.0, 6.0, 4.0, 6.0, 7.0, 11.0, 13.0, 17.0, 20.0, 25.0, 24.0, 32.0, 46.0, 41.0, 51.0, 45.0, 52.0, 62.0, 58.0, 52.0, 46.0, 51.0, 46.0, 44.0, 45.0, 36.0, 35.0, 27.0, 16.0, 24.0, 19.0, 9.0, 10.0, 10.0, 6.0, 9.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.126953125, -2.067626953125, -2.00830078125, -1.948974609375, -1.8896484375, -1.830322265625, -1.77099609375, -1.711669921875, -1.65234375, -1.593017578125, -1.53369140625, -1.474365234375, -1.4150390625, -1.355712890625, -1.29638671875, -1.237060546875, -1.177734375, -1.118408203125, -1.05908203125, -0.999755859375, -0.9404296875, -0.881103515625, -0.82177734375, -0.762451171875, -0.703125, -0.643798828125, -0.58447265625, -0.525146484375, -0.4658203125, -0.406494140625, -0.34716796875, -0.287841796875, -0.228515625, -0.169189453125, -0.10986328125, -0.050537109375, 0.0087890625, 0.068115234375, 0.12744140625, 0.186767578125, 0.24609375, 0.305419921875, 0.36474609375, 0.424072265625, 0.4833984375, 0.542724609375, 0.60205078125, 0.661376953125, 0.720703125, 0.780029296875, 0.83935546875, 0.898681640625, 0.9580078125, 1.017333984375, 1.07666015625, 1.135986328125, 1.1953125, 1.254638671875, 1.31396484375, 1.373291015625, 1.4326171875, 1.491943359375, 1.55126953125, 1.610595703125, 1.669921875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 0.0, 4.0, 1.0, 6.0, 6.0, 8.0, 13.0, 12.0, 25.0, 47.0, 74.0, 115.0, 205.0, 391.0, 711.0, 1533.0, 3881.0, 12997.0, 62778.0, 432086.0, 447519.0, 65846.0, 13079.0, 4092.0, 1549.0, 738.0, 346.0, 179.0, 128.0, 62.0, 41.0, 25.0, 26.0, 8.0, 11.0, 7.0, 6.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.96875, -6.719970703125, -6.47119140625, -6.222412109375, -5.9736328125, -5.724853515625, -5.47607421875, -5.227294921875, -4.978515625, -4.729736328125, -4.48095703125, -4.232177734375, -3.9833984375, -3.734619140625, -3.48583984375, -3.237060546875, -2.98828125, -2.739501953125, -2.49072265625, -2.241943359375, -1.9931640625, -1.744384765625, -1.49560546875, -1.246826171875, -0.998046875, -0.749267578125, -0.50048828125, -0.251708984375, -0.0029296875, 0.245849609375, 0.49462890625, 0.743408203125, 0.9921875, 1.240966796875, 1.48974609375, 1.738525390625, 1.9873046875, 2.236083984375, 2.48486328125, 2.733642578125, 2.982421875, 3.231201171875, 3.47998046875, 3.728759765625, 3.9775390625, 4.226318359375, 4.47509765625, 4.723876953125, 4.97265625, 5.221435546875, 5.47021484375, 5.718994140625, 5.9677734375, 6.216552734375, 6.46533203125, 6.714111328125, 6.962890625, 7.211669921875, 7.46044921875, 7.709228515625, 7.9580078125, 8.206787109375, 8.45556640625, 8.704345703125, 8.953125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 5.0, 6.0, 8.0, 10.0, 8.0, 17.0, 29.0, 26.0, 30.0, 40.0, 39.0, 58.0, 65.0, 61.0, 76.0, 73.0, 59.0, 59.0, 49.0, 49.0, 52.0, 47.0, 42.0, 27.0, 21.0, 12.0, 13.0, 8.0, 9.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.6953125, -11.3673095703125, -11.039306640625, -10.7113037109375, -10.38330078125, -10.0552978515625, -9.727294921875, -9.3992919921875, -9.0712890625, -8.7432861328125, -8.415283203125, -8.0872802734375, -7.75927734375, -7.4312744140625, -7.103271484375, -6.7752685546875, -6.447265625, -6.1192626953125, -5.791259765625, -5.4632568359375, -5.13525390625, -4.8072509765625, -4.479248046875, -4.1512451171875, -3.8232421875, -3.4952392578125, -3.167236328125, -2.8392333984375, -2.51123046875, -2.1832275390625, -1.855224609375, -1.5272216796875, -1.19921875, -0.8712158203125, -0.543212890625, -0.2152099609375, 0.11279296875, 0.4407958984375, 0.768798828125, 1.0968017578125, 1.4248046875, 1.7528076171875, 2.080810546875, 2.4088134765625, 2.73681640625, 3.0648193359375, 3.392822265625, 3.7208251953125, 4.048828125, 4.3768310546875, 4.704833984375, 5.0328369140625, 5.36083984375, 5.6888427734375, 6.016845703125, 6.3448486328125, 6.6728515625, 7.0008544921875, 7.328857421875, 7.6568603515625, 7.98486328125, 8.3128662109375, 8.640869140625, 8.9688720703125, 9.296875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 1.0, 6.0, 8.0, 14.0, 11.0, 13.0, 26.0, 35.0, 49.0, 61.0, 110.0, 164.0, 304.0, 577.0, 1272.0, 3731.0, 13942.0, 128652.0, 841808.0, 45433.0, 7869.0, 2396.0, 978.0, 459.0, 213.0, 138.0, 81.0, 52.0, 37.0, 34.0, 19.0, 21.0, 10.0, 5.0, 5.0, 8.0, 7.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-9.5625, -9.29168701171875, -9.0208740234375, -8.75006103515625, -8.479248046875, -8.20843505859375, -7.9376220703125, -7.66680908203125, -7.39599609375, -7.12518310546875, -6.8543701171875, -6.58355712890625, -6.312744140625, -6.04193115234375, -5.7711181640625, -5.50030517578125, -5.2294921875, -4.95867919921875, -4.6878662109375, -4.41705322265625, -4.146240234375, -3.87542724609375, -3.6046142578125, -3.33380126953125, -3.06298828125, -2.79217529296875, -2.5213623046875, -2.25054931640625, -1.979736328125, -1.70892333984375, -1.4381103515625, -1.16729736328125, -0.896484375, -0.62567138671875, -0.3548583984375, -0.08404541015625, 0.186767578125, 0.45758056640625, 0.7283935546875, 0.99920654296875, 1.27001953125, 1.54083251953125, 1.8116455078125, 2.08245849609375, 2.353271484375, 2.62408447265625, 2.8948974609375, 3.16571044921875, 3.4365234375, 3.70733642578125, 3.9781494140625, 4.24896240234375, 4.519775390625, 4.79058837890625, 5.0614013671875, 5.33221435546875, 5.60302734375, 5.87384033203125, 6.1446533203125, 6.41546630859375, 6.686279296875, 6.95709228515625, 7.2279052734375, 7.49871826171875, 7.76953125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 4.0, 1.0, 1.0, 3.0, 15.0, 14.0, 12.0, 23.0, 27.0, 30.0, 51.0, 72.0, 102.0, 223.0, 125.0, 74.0, 51.0, 52.0, 34.0, 14.0, 13.0, 8.0, 17.0, 5.0, 5.0, 6.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009412765502929688, -0.0009168311953544617, -0.0008923858404159546, -0.0008679404854774475, -0.0008434951305389404, -0.0008190497756004333, -0.0007946044206619263, -0.0007701590657234192, -0.0007457137107849121, -0.000721268355846405, -0.000696823000907898, -0.0006723776459693909, -0.0006479322910308838, -0.0006234869360923767, -0.0005990415811538696, -0.0005745962262153625, -0.0005501508712768555, -0.0005257055163383484, -0.0005012601613998413, -0.00047681480646133423, -0.00045236945152282715, -0.00042792409658432007, -0.000403478741645813, -0.0003790333867073059, -0.00035458803176879883, -0.00033014267683029175, -0.00030569732189178467, -0.0002812519669532776, -0.0002568066120147705, -0.00023236125707626343, -0.00020791590213775635, -0.00018347054719924927, -0.0001590251922607422, -0.0001345798373222351, -0.00011013448238372803, -8.568912744522095e-05, -6.124377250671387e-05, -3.679841756820679e-05, -1.2353062629699707e-05, 1.2092292308807373e-05, 3.653764724731445e-05, 6.098300218582153e-05, 8.542835712432861e-05, 0.0001098737120628357, 0.00013431906700134277, 0.00015876442193984985, 0.00018320977687835693, 0.00020765513181686401, 0.0002321004867553711, 0.0002565458416938782, 0.00028099119663238525, 0.00030543655157089233, 0.0003298819065093994, 0.0003543272614479065, 0.0003787726163864136, 0.00040321797132492065, 0.00042766332626342773, 0.0004521086812019348, 0.0004765540361404419, 0.000500999391078949, 0.0005254447460174561, 0.0005498901009559631, 0.0005743354558944702, 0.0005987808108329773, 0.0006232261657714844]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 5.0, 6.0, 2.0, 8.0, 8.0, 9.0, 10.0, 23.0, 34.0, 52.0, 69.0, 169.0, 379.0, 622.0, 1539.0, 4229.0, 16813.0, 142488.0, 815066.0, 52646.0, 9375.0, 2787.0, 1105.0, 495.0, 273.0, 135.0, 74.0, 46.0, 28.0, 12.0, 15.0, 10.0, 11.0, 2.0, 5.0, 5.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.09375, -9.807861328125, -9.52197265625, -9.236083984375, -8.9501953125, -8.664306640625, -8.37841796875, -8.092529296875, -7.806640625, -7.520751953125, -7.23486328125, -6.948974609375, -6.6630859375, -6.377197265625, -6.09130859375, -5.805419921875, -5.51953125, -5.233642578125, -4.94775390625, -4.661865234375, -4.3759765625, -4.090087890625, -3.80419921875, -3.518310546875, -3.232421875, -2.946533203125, -2.66064453125, -2.374755859375, -2.0888671875, -1.802978515625, -1.51708984375, -1.231201171875, -0.9453125, -0.659423828125, -0.37353515625, -0.087646484375, 0.1982421875, 0.484130859375, 0.77001953125, 1.055908203125, 1.341796875, 1.627685546875, 1.91357421875, 2.199462890625, 2.4853515625, 2.771240234375, 3.05712890625, 3.343017578125, 3.62890625, 3.914794921875, 4.20068359375, 4.486572265625, 4.7724609375, 5.058349609375, 5.34423828125, 5.630126953125, 5.916015625, 6.201904296875, 6.48779296875, 6.773681640625, 7.0595703125, 7.345458984375, 7.63134765625, 7.917236328125, 8.203125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 9.0, 14.0, 18.0, 42.0, 63.0, 163.0, 369.0, 153.0, 65.0, 35.0, 23.0, 8.0, 11.0, 7.0, 1.0, 5.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.9375, -12.53955078125, -12.1416015625, -11.74365234375, -11.345703125, -10.94775390625, -10.5498046875, -10.15185546875, -9.75390625, -9.35595703125, -8.9580078125, -8.56005859375, -8.162109375, -7.76416015625, -7.3662109375, -6.96826171875, -6.5703125, -6.17236328125, -5.7744140625, -5.37646484375, -4.978515625, -4.58056640625, -4.1826171875, -3.78466796875, -3.38671875, -2.98876953125, -2.5908203125, -2.19287109375, -1.794921875, -1.39697265625, -0.9990234375, -0.60107421875, -0.203125, 0.19482421875, 0.5927734375, 0.99072265625, 1.388671875, 1.78662109375, 2.1845703125, 2.58251953125, 2.98046875, 3.37841796875, 3.7763671875, 4.17431640625, 4.572265625, 4.97021484375, 5.3681640625, 5.76611328125, 6.1640625, 6.56201171875, 6.9599609375, 7.35791015625, 7.755859375, 8.15380859375, 8.5517578125, 8.94970703125, 9.34765625, 9.74560546875, 10.1435546875, 10.54150390625, 10.939453125, 11.33740234375, 11.7353515625, 12.13330078125, 12.53125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 12.0, 20.0, 36.0, 45.0, 84.0, 133.0, 164.0, 143.0, 141.0, 87.0, 50.0, 37.0, 18.0, 7.0, 6.0, 3.0, 1.0, 1.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-98.37358093261719, -95.91415405273438, -93.4547348022461, -90.99530792236328, -88.53588104248047, -86.07646179199219, -83.61703491210938, -81.15760803222656, -78.69818115234375, -76.23875427246094, -73.77933502197266, -71.31990814208984, -68.86048126220703, -66.40106201171875, -63.94163513183594, -61.482208251953125, -59.022789001464844, -56.5633659362793, -54.103939056396484, -51.64451599121094, -49.185089111328125, -46.72566604614258, -44.26624298095703, -41.80681610107422, -39.34739303588867, -36.887969970703125, -34.42854309082031, -31.969120025634766, -29.509695053100586, -27.050270080566406, -24.59084701538086, -22.13142204284668, -19.67198944091797, -17.21256446838379, -14.753140449523926, -12.293716430664062, -9.834291458129883, -7.374866485595703, -4.91544246673584, -2.4560184478759766, 0.003406524658203125, 2.4628310203552246, 4.922255516052246, 7.381680011749268, 9.841104507446289, 12.300529479980469, 14.759953498840332, 17.219377517700195, 19.678802490234375, 22.138227462768555, 24.597652435302734, 27.05707550048828, 29.51650047302246, 31.97592544555664, 34.43534851074219, 36.894775390625, 39.35419845581055, 41.813621520996094, 44.273048400878906, 46.73247146606445, 49.19189453125, 51.65132141113281, 54.11074447631836, 56.570167541503906, 59.02959442138672]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 8.0, 5.0, 10.0, 12.0, 13.0, 27.0, 41.0, 26.0, 51.0, 51.0, 50.0, 72.0, 68.0, 88.0, 74.0, 78.0, 61.0, 52.0, 40.0, 37.0, 31.0, 28.0, 22.0, 12.0, 9.0, 15.0, 5.0, 9.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.62456512451172, -73.2418212890625, -70.85906982421875, -68.47632598876953, -66.09358215332031, -63.71083068847656, -61.328086853027344, -58.94533920288086, -56.562591552734375, -54.17984390258789, -51.797096252441406, -49.41435241699219, -47.0316047668457, -44.64885711669922, -42.26611328125, -39.883365631103516, -37.50061798095703, -35.11787033081055, -32.73512268066406, -30.352378845214844, -27.96963119506836, -25.586883544921875, -23.204137802124023, -20.821392059326172, -18.438644409179688, -16.055896759033203, -13.673151016235352, -11.290404319763184, -8.907657623291016, -6.524910926818848, -4.14216423034668, -1.7594184875488281, 0.6233367919921875, 3.0060834884643555, 5.388830184936523, 7.771576881408691, 10.15432357788086, 12.537070274353027, 14.919816970825195, 17.302562713623047, 19.68531036376953, 22.068058013916016, 24.450803756713867, 26.83354949951172, 29.216297149658203, 31.599044799804688, 33.981788635253906, 36.36453628540039, 38.747283935546875, 41.13003158569336, 43.512779235839844, 45.89552307128906, 48.27827072143555, 50.66101837158203, 53.04376220703125, 55.426509857177734, 57.80925750732422, 60.1920051574707, 62.57475280761719, 64.9574966430664, 67.34024047851562, 69.72299194335938, 72.1057357788086, 74.48847961425781, 76.87123107910156]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 4.0, 6.0, 5.0, 10.0, 12.0, 27.0, 31.0, 42.0, 59.0, 95.0, 158.0, 287.0, 563.0, 1397.0, 4719.0, 29558.0, 3899255.0, 240417.0, 12952.0, 2740.0, 955.0, 382.0, 227.0, 119.0, 93.0, 42.0, 35.0, 22.0, 20.0, 16.0, 10.0, 5.0, 7.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.234375, -12.654052734375, -12.07373046875, -11.493408203125, -10.9130859375, -10.332763671875, -9.75244140625, -9.172119140625, -8.591796875, -8.011474609375, -7.43115234375, -6.850830078125, -6.2705078125, -5.690185546875, -5.10986328125, -4.529541015625, -3.94921875, -3.368896484375, -2.78857421875, -2.208251953125, -1.6279296875, -1.047607421875, -0.46728515625, 0.113037109375, 0.693359375, 1.273681640625, 1.85400390625, 2.434326171875, 3.0146484375, 3.594970703125, 4.17529296875, 4.755615234375, 5.3359375, 5.916259765625, 6.49658203125, 7.076904296875, 7.6572265625, 8.237548828125, 8.81787109375, 9.398193359375, 9.978515625, 10.558837890625, 11.13916015625, 11.719482421875, 12.2998046875, 12.880126953125, 13.46044921875, 14.040771484375, 14.62109375, 15.201416015625, 15.78173828125, 16.362060546875, 16.9423828125, 17.522705078125, 18.10302734375, 18.683349609375, 19.263671875, 19.843994140625, 20.42431640625, 21.004638671875, 21.5849609375, 22.165283203125, 22.74560546875, 23.325927734375, 23.90625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 3.0, 7.0, 6.0, 9.0, 14.0, 20.0, 17.0, 27.0, 22.0, 36.0, 38.0, 42.0, 49.0, 60.0, 70.0, 74.0, 56.0, 55.0, 53.0, 51.0, 45.0, 50.0, 40.0, 42.0, 27.0, 21.0, 17.0, 13.0, 14.0, 6.0, 7.0, 6.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1796875, -2.096588134765625, -2.01348876953125, -1.930389404296875, -1.8472900390625, -1.764190673828125, -1.68109130859375, -1.597991943359375, -1.514892578125, -1.431793212890625, -1.34869384765625, -1.265594482421875, -1.1824951171875, -1.099395751953125, -1.01629638671875, -0.933197021484375, -0.85009765625, -0.766998291015625, -0.68389892578125, -0.600799560546875, -0.5177001953125, -0.434600830078125, -0.35150146484375, -0.268402099609375, -0.185302734375, -0.102203369140625, -0.01910400390625, 0.063995361328125, 0.1470947265625, 0.230194091796875, 0.31329345703125, 0.396392822265625, 0.4794921875, 0.562591552734375, 0.64569091796875, 0.728790283203125, 0.8118896484375, 0.894989013671875, 0.97808837890625, 1.061187744140625, 1.144287109375, 1.227386474609375, 1.31048583984375, 1.393585205078125, 1.4766845703125, 1.559783935546875, 1.64288330078125, 1.725982666015625, 1.80908203125, 1.892181396484375, 1.97528076171875, 2.058380126953125, 2.1414794921875, 2.224578857421875, 2.30767822265625, 2.390777587890625, 2.473876953125, 2.556976318359375, 2.64007568359375, 2.723175048828125, 2.8062744140625, 2.889373779296875, 2.97247314453125, 3.055572509765625, 3.138671875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 3.0, 9.0, 13.0, 14.0, 24.0, 29.0, 42.0, 74.0, 117.0, 239.0, 660.0, 2014.0, 8595.0, 84413.0, 3977323.0, 107642.0, 9565.0, 2240.0, 688.0, 238.0, 123.0, 84.0, 38.0, 27.0, 20.0, 21.0, 5.0, 8.0, 10.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.078125, -17.5048828125, -16.931640625, -16.3583984375, -15.78515625, -15.2119140625, -14.638671875, -14.0654296875, -13.4921875, -12.9189453125, -12.345703125, -11.7724609375, -11.19921875, -10.6259765625, -10.052734375, -9.4794921875, -8.90625, -8.3330078125, -7.759765625, -7.1865234375, -6.61328125, -6.0400390625, -5.466796875, -4.8935546875, -4.3203125, -3.7470703125, -3.173828125, -2.6005859375, -2.02734375, -1.4541015625, -0.880859375, -0.3076171875, 0.265625, 0.8388671875, 1.412109375, 1.9853515625, 2.55859375, 3.1318359375, 3.705078125, 4.2783203125, 4.8515625, 5.4248046875, 5.998046875, 6.5712890625, 7.14453125, 7.7177734375, 8.291015625, 8.8642578125, 9.4375, 10.0107421875, 10.583984375, 11.1572265625, 11.73046875, 12.3037109375, 12.876953125, 13.4501953125, 14.0234375, 14.5966796875, 15.169921875, 15.7431640625, 16.31640625, 16.8896484375, 17.462890625, 18.0361328125, 18.609375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 4.0, 3.0, 10.0, 15.0, 20.0, 47.0, 95.0, 249.0, 2606.0, 746.0, 164.0, 53.0, 23.0, 15.0, 11.0, 8.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-13.703125, -13.40362548828125, -13.1041259765625, -12.80462646484375, -12.505126953125, -12.20562744140625, -11.9061279296875, -11.60662841796875, -11.30712890625, -11.00762939453125, -10.7081298828125, -10.40863037109375, -10.109130859375, -9.80963134765625, -9.5101318359375, -9.21063232421875, -8.9111328125, -8.61163330078125, -8.3121337890625, -8.01263427734375, -7.713134765625, -7.41363525390625, -7.1141357421875, -6.81463623046875, -6.51513671875, -6.21563720703125, -5.9161376953125, -5.61663818359375, -5.317138671875, -5.01763916015625, -4.7181396484375, -4.41864013671875, -4.119140625, -3.81964111328125, -3.5201416015625, -3.22064208984375, -2.921142578125, -2.62164306640625, -2.3221435546875, -2.02264404296875, -1.72314453125, -1.42364501953125, -1.1241455078125, -0.82464599609375, -0.525146484375, -0.22564697265625, 0.0738525390625, 0.37335205078125, 0.6728515625, 0.97235107421875, 1.2718505859375, 1.57135009765625, 1.870849609375, 2.17034912109375, 2.4698486328125, 2.76934814453125, 3.06884765625, 3.36834716796875, 3.6678466796875, 3.96734619140625, 4.266845703125, 4.56634521484375, 4.8658447265625, 5.16534423828125, 5.46484375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 9.0, 25.0, 93.0, 234.0, 305.0, 202.0, 99.0, 20.0, 10.0, 11.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.431304931640625, -47.46857452392578, -45.50584030151367, -43.54310607910156, -41.58037567138672, -39.617645263671875, -37.654911041259766, -35.692176818847656, -33.72944641113281, -31.766714096069336, -29.80398178100586, -27.841249465942383, -25.878517150878906, -23.91578483581543, -21.953052520751953, -19.990320205688477, -18.027587890625, -16.064855575561523, -14.102123260498047, -12.13939094543457, -10.176658630371094, -8.213926315307617, -6.251194000244141, -4.288461685180664, -2.3257293701171875, -0.36299705505371094, 1.5997352600097656, 3.562467575073242, 5.525199890136719, 7.487932205200195, 9.450664520263672, 11.413396835327148, 13.376129150390625, 15.338861465454102, 17.301593780517578, 19.264326095581055, 21.22705841064453, 23.189790725708008, 25.152523040771484, 27.11525535583496, 29.077987670898438, 31.040719985961914, 33.00345230102539, 34.9661865234375, 36.928916931152344, 38.89164733886719, 40.8543815612793, 42.817115783691406, 44.77984619140625, 46.742576599121094, 48.7053108215332, 50.66804504394531, 52.630775451660156, 54.593505859375, 56.55624008178711, 58.51897430419922, 60.48170471191406, 62.444435119628906, 64.40716552734375, 66.36990356445312, 68.33263397216797, 70.29536437988281, 72.25810241699219, 74.22083282470703, 76.18356323242188]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 7.0, 10.0, 15.0, 9.0, 18.0, 20.0, 20.0, 16.0, 35.0, 32.0, 35.0, 47.0, 58.0, 47.0, 48.0, 44.0, 51.0, 58.0, 45.0, 48.0, 38.0, 45.0, 47.0, 31.0, 34.0, 25.0, 26.0, 20.0, 15.0, 12.0, 12.0, 8.0, 4.0, 6.0, 7.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.807159423828125, -16.178470611572266, -15.549779891967773, -14.921090126037598, -14.292400360107422, -13.663711547851562, -13.035021781921387, -12.406332015991211, -11.777642250061035, -11.14895248413086, -10.520262718200684, -9.891572952270508, -9.262884140014648, -8.634193420410156, -8.005504608154297, -7.376814842224121, -6.748125076293945, -6.1194353103637695, -5.490745544433594, -4.862056255340576, -4.2333664894104, -3.6046767234802246, -2.975987195968628, -2.3472976684570312, -1.7186079025268555, -1.0899182558059692, -0.461228609085083, 0.16746103763580322, 0.7961506843566895, 1.4248404502868652, 2.053529977798462, 2.6822195053100586, 3.3109092712402344, 3.93959903717041, 4.568288803100586, 5.1969780921936035, 5.825667858123779, 6.454357624053955, 7.083046913146973, 7.711736679077148, 8.340426445007324, 8.9691162109375, 9.597805976867676, 10.226495742797852, 10.855184555053711, 11.483875274658203, 12.112564086914062, 12.741253852844238, 13.369943618774414, 13.99863338470459, 14.627323150634766, 15.256012916564941, 15.884702682495117, 16.513391494750977, 17.14208221435547, 17.770771026611328, 18.399459838867188, 19.028148651123047, 19.65683937072754, 20.2855281829834, 20.91421890258789, 21.54290771484375, 22.171598434448242, 22.8002872467041, 23.428977966308594]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 6.0, 6.0, 10.0, 11.0, 14.0, 26.0, 33.0, 48.0, 52.0, 91.0, 142.0, 206.0, 345.0, 540.0, 808.0, 1243.0, 2084.0, 3539.0, 6382.0, 11588.0, 22468.0, 46735.0, 102524.0, 207235.0, 273550.0, 190378.0, 91835.0, 41560.0, 20427.0, 10458.0, 5619.0, 3248.0, 1949.0, 1264.0, 751.0, 467.0, 289.0, 186.0, 141.0, 90.0, 60.0, 40.0, 33.0, 20.0, 13.0, 15.0, 12.0, 4.0, 7.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.171875, -4.03912353515625, -3.9063720703125, -3.77362060546875, -3.640869140625, -3.50811767578125, -3.3753662109375, -3.24261474609375, -3.10986328125, -2.97711181640625, -2.8443603515625, -2.71160888671875, -2.578857421875, -2.44610595703125, -2.3133544921875, -2.18060302734375, -2.0478515625, -1.91510009765625, -1.7823486328125, -1.64959716796875, -1.516845703125, -1.38409423828125, -1.2513427734375, -1.11859130859375, -0.98583984375, -0.85308837890625, -0.7203369140625, -0.58758544921875, -0.454833984375, -0.32208251953125, -0.1893310546875, -0.05657958984375, 0.076171875, 0.20892333984375, 0.3416748046875, 0.47442626953125, 0.607177734375, 0.73992919921875, 0.8726806640625, 1.00543212890625, 1.13818359375, 1.27093505859375, 1.4036865234375, 1.53643798828125, 1.669189453125, 1.80194091796875, 1.9346923828125, 2.06744384765625, 2.2001953125, 2.33294677734375, 2.4656982421875, 2.59844970703125, 2.731201171875, 2.86395263671875, 2.9967041015625, 3.12945556640625, 3.26220703125, 3.39495849609375, 3.5277099609375, 3.66046142578125, 3.793212890625, 3.92596435546875, 4.0587158203125, 4.19146728515625, 4.32421875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 4.0, 6.0, 10.0, 11.0, 12.0, 17.0, 11.0, 13.0, 22.0, 22.0, 29.0, 27.0, 40.0, 44.0, 53.0, 45.0, 66.0, 54.0, 52.0, 48.0, 56.0, 52.0, 49.0, 28.0, 39.0, 33.0, 31.0, 31.0, 24.0, 13.0, 17.0, 9.0, 13.0, 7.0, 7.0, 3.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.43359375, -2.35589599609375, -2.2781982421875, -2.20050048828125, -2.122802734375, -2.04510498046875, -1.9674072265625, -1.88970947265625, -1.81201171875, -1.73431396484375, -1.6566162109375, -1.57891845703125, -1.501220703125, -1.42352294921875, -1.3458251953125, -1.26812744140625, -1.1904296875, -1.11273193359375, -1.0350341796875, -0.95733642578125, -0.879638671875, -0.80194091796875, -0.7242431640625, -0.64654541015625, -0.56884765625, -0.49114990234375, -0.4134521484375, -0.33575439453125, -0.258056640625, -0.18035888671875, -0.1026611328125, -0.02496337890625, 0.052734375, 0.13043212890625, 0.2081298828125, 0.28582763671875, 0.363525390625, 0.44122314453125, 0.5189208984375, 0.59661865234375, 0.67431640625, 0.75201416015625, 0.8297119140625, 0.90740966796875, 0.985107421875, 1.06280517578125, 1.1405029296875, 1.21820068359375, 1.2958984375, 1.37359619140625, 1.4512939453125, 1.52899169921875, 1.606689453125, 1.68438720703125, 1.7620849609375, 1.83978271484375, 1.91748046875, 1.99517822265625, 2.0728759765625, 2.15057373046875, 2.228271484375, 2.30596923828125, 2.3836669921875, 2.46136474609375, 2.5390625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 4.0, 6.0, 8.0, 5.0, 11.0, 17.0, 17.0, 37.0, 45.0, 78.0, 121.0, 192.0, 392.0, 894.0, 2109.0, 6402.0, 23298.0, 122211.0, 589259.0, 247245.0, 40712.0, 9884.0, 3160.0, 1154.0, 564.0, 265.0, 157.0, 113.0, 46.0, 45.0, 25.0, 25.0, 10.0, 13.0, 7.0, 3.0, 4.0, 6.0, 5.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.421875, -9.08154296875, -8.7412109375, -8.40087890625, -8.060546875, -7.72021484375, -7.3798828125, -7.03955078125, -6.69921875, -6.35888671875, -6.0185546875, -5.67822265625, -5.337890625, -4.99755859375, -4.6572265625, -4.31689453125, -3.9765625, -3.63623046875, -3.2958984375, -2.95556640625, -2.615234375, -2.27490234375, -1.9345703125, -1.59423828125, -1.25390625, -0.91357421875, -0.5732421875, -0.23291015625, 0.107421875, 0.44775390625, 0.7880859375, 1.12841796875, 1.46875, 1.80908203125, 2.1494140625, 2.48974609375, 2.830078125, 3.17041015625, 3.5107421875, 3.85107421875, 4.19140625, 4.53173828125, 4.8720703125, 5.21240234375, 5.552734375, 5.89306640625, 6.2333984375, 6.57373046875, 6.9140625, 7.25439453125, 7.5947265625, 7.93505859375, 8.275390625, 8.61572265625, 8.9560546875, 9.29638671875, 9.63671875, 9.97705078125, 10.3173828125, 10.65771484375, 10.998046875, 11.33837890625, 11.6787109375, 12.01904296875, 12.359375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 7.0, 2.0, 3.0, 6.0, 7.0, 3.0, 7.0, 15.0, 14.0, 21.0, 25.0, 28.0, 31.0, 33.0, 41.0, 43.0, 37.0, 52.0, 58.0, 54.0, 56.0, 49.0, 49.0, 45.0, 50.0, 49.0, 42.0, 30.0, 28.0, 26.0, 23.0, 20.0, 11.0, 13.0, 8.0, 6.0, 4.0, 7.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.4375, -13.95068359375, -13.4638671875, -12.97705078125, -12.490234375, -12.00341796875, -11.5166015625, -11.02978515625, -10.54296875, -10.05615234375, -9.5693359375, -9.08251953125, -8.595703125, -8.10888671875, -7.6220703125, -7.13525390625, -6.6484375, -6.16162109375, -5.6748046875, -5.18798828125, -4.701171875, -4.21435546875, -3.7275390625, -3.24072265625, -2.75390625, -2.26708984375, -1.7802734375, -1.29345703125, -0.806640625, -0.31982421875, 0.1669921875, 0.65380859375, 1.140625, 1.62744140625, 2.1142578125, 2.60107421875, 3.087890625, 3.57470703125, 4.0615234375, 4.54833984375, 5.03515625, 5.52197265625, 6.0087890625, 6.49560546875, 6.982421875, 7.46923828125, 7.9560546875, 8.44287109375, 8.9296875, 9.41650390625, 9.9033203125, 10.39013671875, 10.876953125, 11.36376953125, 11.8505859375, 12.33740234375, 12.82421875, 13.31103515625, 13.7978515625, 14.28466796875, 14.771484375, 15.25830078125, 15.7451171875, 16.23193359375, 16.71875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 9.0, 16.0, 11.0, 22.0, 41.0, 56.0, 89.0, 141.0, 259.0, 565.0, 1325.0, 4702.0, 29540.0, 524099.0, 454925.0, 25944.0, 4360.0, 1278.0, 530.0, 260.0, 166.0, 69.0, 41.0, 29.0, 19.0, 22.0, 9.0, 6.0, 2.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.140625, -7.8690185546875, -7.597412109375, -7.3258056640625, -7.05419921875, -6.7825927734375, -6.510986328125, -6.2393798828125, -5.9677734375, -5.6961669921875, -5.424560546875, -5.1529541015625, -4.88134765625, -4.6097412109375, -4.338134765625, -4.0665283203125, -3.794921875, -3.5233154296875, -3.251708984375, -2.9801025390625, -2.70849609375, -2.4368896484375, -2.165283203125, -1.8936767578125, -1.6220703125, -1.3504638671875, -1.078857421875, -0.8072509765625, -0.53564453125, -0.2640380859375, 0.007568359375, 0.2791748046875, 0.55078125, 0.8223876953125, 1.093994140625, 1.3656005859375, 1.63720703125, 1.9088134765625, 2.180419921875, 2.4520263671875, 2.7236328125, 2.9952392578125, 3.266845703125, 3.5384521484375, 3.81005859375, 4.0816650390625, 4.353271484375, 4.6248779296875, 4.896484375, 5.1680908203125, 5.439697265625, 5.7113037109375, 5.98291015625, 6.2545166015625, 6.526123046875, 6.7977294921875, 7.0693359375, 7.3409423828125, 7.612548828125, 7.8841552734375, 8.15576171875, 8.4273681640625, 8.698974609375, 8.9705810546875, 9.2421875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 7.0, 2.0, 13.0, 16.0, 17.0, 44.0, 53.0, 88.0, 113.0, 110.0, 137.0, 137.0, 99.0, 54.0, 46.0, 20.0, 13.0, 17.0, 3.0, 4.0, 6.0, 2.0, 4.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00133514404296875, -0.0012993142008781433, -0.0012634843587875366, -0.00122765451669693, -0.0011918246746063232, -0.0011559948325157166, -0.0011201649904251099, -0.0010843351483345032, -0.0010485053062438965, -0.0010126754641532898, -0.000976845622062683, -0.0009410157799720764, -0.0009051859378814697, -0.000869356095790863, -0.0008335262537002563, -0.0007976964116096497, -0.000761866569519043, -0.0007260367274284363, -0.0006902068853378296, -0.0006543770432472229, -0.0006185472011566162, -0.0005827173590660095, -0.0005468875169754028, -0.0005110576748847961, -0.00047522783279418945, -0.00043939799070358276, -0.0004035681486129761, -0.0003677383065223694, -0.0003319084644317627, -0.000296078622341156, -0.0002602487802505493, -0.00022441893815994263, -0.00018858909606933594, -0.00015275925397872925, -0.00011692941188812256, -8.109956979751587e-05, -4.526972770690918e-05, -9.43988561630249e-06, 2.63899564743042e-05, 6.221979856491089e-05, 9.804964065551758e-05, 0.00013387948274612427, 0.00016970932483673096, 0.00020553916692733765, 0.00024136900901794434, 0.000277198851108551, 0.0003130286931991577, 0.0003488585352897644, 0.0003846883773803711, 0.0004205182194709778, 0.00045634806156158447, 0.0004921779036521912, 0.0005280077457427979, 0.0005638375878334045, 0.0005996674299240112, 0.0006354972720146179, 0.0006713271141052246, 0.0007071569561958313, 0.000742986798286438, 0.0007788166403770447, 0.0008146464824676514, 0.0008504763245582581, 0.0008863061666488647, 0.0009221360087394714, 0.0009579658508300781]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 3.0, 7.0, 10.0, 16.0, 17.0, 30.0, 44.0, 61.0, 122.0, 243.0, 529.0, 1518.0, 5311.0, 28190.0, 302965.0, 627259.0, 68544.0, 9524.0, 2554.0, 861.0, 341.0, 188.0, 87.0, 50.0, 43.0, 16.0, 6.0, 7.0, 6.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.62890625, -6.39385986328125, -6.1588134765625, -5.92376708984375, -5.688720703125, -5.45367431640625, -5.2186279296875, -4.98358154296875, -4.74853515625, -4.51348876953125, -4.2784423828125, -4.04339599609375, -3.808349609375, -3.57330322265625, -3.3382568359375, -3.10321044921875, -2.8681640625, -2.63311767578125, -2.3980712890625, -2.16302490234375, -1.927978515625, -1.69293212890625, -1.4578857421875, -1.22283935546875, -0.98779296875, -0.75274658203125, -0.5177001953125, -0.28265380859375, -0.047607421875, 0.18743896484375, 0.4224853515625, 0.65753173828125, 0.892578125, 1.12762451171875, 1.3626708984375, 1.59771728515625, 1.832763671875, 2.06781005859375, 2.3028564453125, 2.53790283203125, 2.77294921875, 3.00799560546875, 3.2430419921875, 3.47808837890625, 3.713134765625, 3.94818115234375, 4.1832275390625, 4.41827392578125, 4.6533203125, 4.88836669921875, 5.1234130859375, 5.35845947265625, 5.593505859375, 5.82855224609375, 6.0635986328125, 6.29864501953125, 6.53369140625, 6.76873779296875, 7.0037841796875, 7.23883056640625, 7.473876953125, 7.70892333984375, 7.9439697265625, 8.17901611328125, 8.4140625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 7.0, 2.0, 9.0, 6.0, 11.0, 12.0, 28.0, 45.0, 54.0, 72.0, 76.0, 107.0, 108.0, 118.0, 104.0, 66.0, 64.0, 27.0, 31.0, 18.0, 9.0, 6.0, 6.0, 3.0, 2.0, 5.0, 1.0, 2.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 3.0], "bins": [-10.2890625, -10.03662109375, -9.7841796875, -9.53173828125, -9.279296875, -9.02685546875, -8.7744140625, -8.52197265625, -8.26953125, -8.01708984375, -7.7646484375, -7.51220703125, -7.259765625, -7.00732421875, -6.7548828125, -6.50244140625, -6.25, -5.99755859375, -5.7451171875, -5.49267578125, -5.240234375, -4.98779296875, -4.7353515625, -4.48291015625, -4.23046875, -3.97802734375, -3.7255859375, -3.47314453125, -3.220703125, -2.96826171875, -2.7158203125, -2.46337890625, -2.2109375, -1.95849609375, -1.7060546875, -1.45361328125, -1.201171875, -0.94873046875, -0.6962890625, -0.44384765625, -0.19140625, 0.06103515625, 0.3134765625, 0.56591796875, 0.818359375, 1.07080078125, 1.3232421875, 1.57568359375, 1.828125, 2.08056640625, 2.3330078125, 2.58544921875, 2.837890625, 3.09033203125, 3.3427734375, 3.59521484375, 3.84765625, 4.10009765625, 4.3525390625, 4.60498046875, 4.857421875, 5.10986328125, 5.3623046875, 5.61474609375, 5.8671875]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 32.0, 102.0, 358.0, 365.0, 105.0, 30.0, 9.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-381.563232421875, -374.3453674316406, -367.1274719238281, -359.90960693359375, -352.69171142578125, -345.4738464355469, -338.2559509277344, -331.0380859375, -323.8201904296875, -316.6023254394531, -309.3844299316406, -302.16656494140625, -294.94866943359375, -287.7308044433594, -280.5129089355469, -273.2950439453125, -266.0771789550781, -258.85931396484375, -251.64141845703125, -244.4235382080078, -237.20565795898438, -229.98779296875, -222.76991271972656, -215.55203247070312, -208.3341522216797, -201.11627197265625, -193.8983917236328, -186.68051147460938, -179.462646484375, -172.2447509765625, -165.02688598632812, -157.8090057373047, -150.5911102294922, -143.37322998046875, -136.1553497314453, -128.93746948242188, -121.71959686279297, -114.50171661376953, -107.28384399414062, -100.06596374511719, -92.84808349609375, -85.63020324707031, -78.41232299804688, -71.19445037841797, -63.97657012939453, -56.758689880371094, -49.54081344604492, -42.32293701171875, -35.10505676269531, -27.887178421020508, -20.669300079345703, -13.451421737670898, -6.233543395996094, 0.9843368530273438, 8.202213287353516, 15.420089721679688, 22.637969970703125, 29.85584831237793, 37.073726654052734, 44.291603088378906, 51.509483337402344, 58.72736358642578, 65.94523620605469, 73.16311645507812, 80.38099670410156]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 3.0, 7.0, 8.0, 11.0, 11.0, 12.0, 17.0, 18.0, 14.0, 26.0, 35.0, 45.0, 49.0, 44.0, 40.0, 50.0, 49.0, 52.0, 62.0, 52.0, 54.0, 51.0, 47.0, 37.0, 31.0, 31.0, 16.0, 20.0, 17.0, 13.0, 18.0, 7.0, 7.0, 12.0, 9.0, 6.0, 3.0, 5.0, 7.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-86.94235229492188, -84.39067077636719, -81.83899688720703, -79.28732299804688, -76.73564147949219, -74.1839599609375, -71.63228607177734, -69.08061218261719, -66.5289306640625, -63.97725296020508, -61.425575256347656, -58.873897552490234, -56.32221984863281, -53.77054214477539, -51.21886444091797, -48.66718673706055, -46.115509033203125, -43.5638313293457, -41.01215362548828, -38.46047592163086, -35.90879821777344, -33.357120513916016, -30.805442810058594, -28.253765106201172, -25.70208740234375, -23.150409698486328, -20.598731994628906, -18.047054290771484, -15.495376586914062, -12.94369888305664, -10.392021179199219, -7.840343475341797, -5.288665771484375, -2.736988067626953, -0.18531036376953125, 2.3663673400878906, 4.9180450439453125, 7.469722747802734, 10.021400451660156, 12.573078155517578, 15.124755859375, 17.676433563232422, 20.228111267089844, 22.779788970947266, 25.331466674804688, 27.88314437866211, 30.43482208251953, 32.98649978637695, 35.538177490234375, 38.0898551940918, 40.64153289794922, 43.19321060180664, 45.74488830566406, 48.296566009521484, 50.848243713378906, 53.39992141723633, 55.95159912109375, 58.50327682495117, 61.054954528808594, 63.606632232666016, 66.15830993652344, 68.70999145507812, 71.26166534423828, 73.81333923339844, 76.36502075195312]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 10.0, 12.0, 11.0, 30.0, 37.0, 87.0, 167.0, 353.0, 814.0, 2620.0, 12684.0, 4027777.0, 139608.0, 6990.0, 1823.0, 684.0, 294.0, 122.0, 58.0, 39.0, 19.0, 15.0, 6.0, 5.0, 4.0, 4.0, 4.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.9296875, -12.2781982421875, -11.626708984375, -10.9752197265625, -10.32373046875, -9.6722412109375, -9.020751953125, -8.3692626953125, -7.7177734375, -7.0662841796875, -6.414794921875, -5.7633056640625, -5.11181640625, -4.4603271484375, -3.808837890625, -3.1573486328125, -2.505859375, -1.8543701171875, -1.202880859375, -0.5513916015625, 0.10009765625, 0.7515869140625, 1.403076171875, 2.0545654296875, 2.7060546875, 3.3575439453125, 4.009033203125, 4.6605224609375, 5.31201171875, 5.9635009765625, 6.614990234375, 7.2664794921875, 7.91796875, 8.5694580078125, 9.220947265625, 9.8724365234375, 10.52392578125, 11.1754150390625, 11.826904296875, 12.4783935546875, 13.1298828125, 13.7813720703125, 14.432861328125, 15.0843505859375, 15.73583984375, 16.3873291015625, 17.038818359375, 17.6903076171875, 18.341796875, 18.9932861328125, 19.644775390625, 20.2962646484375, 20.94775390625, 21.5992431640625, 22.250732421875, 22.9022216796875, 23.5537109375, 24.2052001953125, 24.856689453125, 25.5081787109375, 26.15966796875, 26.8111572265625, 27.462646484375, 28.1141357421875, 28.765625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 0.0, 3.0, 1.0, 7.0, 7.0, 9.0, 16.0, 25.0, 17.0, 27.0, 39.0, 51.0, 50.0, 54.0, 72.0, 58.0, 66.0, 75.0, 78.0, 61.0, 61.0, 45.0, 40.0, 22.0, 28.0, 21.0, 29.0, 9.0, 15.0, 9.0, 5.0, 4.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5703125, -4.43585205078125, -4.3013916015625, -4.16693115234375, -4.032470703125, -3.89801025390625, -3.7635498046875, -3.62908935546875, -3.49462890625, -3.36016845703125, -3.2257080078125, -3.09124755859375, -2.956787109375, -2.82232666015625, -2.6878662109375, -2.55340576171875, -2.4189453125, -2.28448486328125, -2.1500244140625, -2.01556396484375, -1.881103515625, -1.74664306640625, -1.6121826171875, -1.47772216796875, -1.34326171875, -1.20880126953125, -1.0743408203125, -0.93988037109375, -0.805419921875, -0.67095947265625, -0.5364990234375, -0.40203857421875, -0.267578125, -0.13311767578125, 0.0013427734375, 0.13580322265625, 0.270263671875, 0.40472412109375, 0.5391845703125, 0.67364501953125, 0.80810546875, 0.94256591796875, 1.0770263671875, 1.21148681640625, 1.345947265625, 1.48040771484375, 1.6148681640625, 1.74932861328125, 1.8837890625, 2.01824951171875, 2.1527099609375, 2.28717041015625, 2.421630859375, 2.55609130859375, 2.6905517578125, 2.82501220703125, 2.95947265625, 3.09393310546875, 3.2283935546875, 3.36285400390625, 3.497314453125, 3.63177490234375, 3.7662353515625, 3.90069580078125, 4.03515625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 4.0, 5.0, 2.0, 6.0, 6.0, 8.0, 21.0, 30.0, 42.0, 67.0, 104.0, 114.0, 186.0, 267.0, 461.0, 893.0, 1780.0, 4454.0, 16115.0, 313246.0, 3820009.0, 25838.0, 5951.0, 2255.0, 1023.0, 514.0, 298.0, 185.0, 137.0, 85.0, 62.0, 36.0, 23.0, 17.0, 18.0, 9.0, 6.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.2265625, -14.6851806640625, -14.143798828125, -13.6024169921875, -13.06103515625, -12.5196533203125, -11.978271484375, -11.4368896484375, -10.8955078125, -10.3541259765625, -9.812744140625, -9.2713623046875, -8.72998046875, -8.1885986328125, -7.647216796875, -7.1058349609375, -6.564453125, -6.0230712890625, -5.481689453125, -4.9403076171875, -4.39892578125, -3.8575439453125, -3.316162109375, -2.7747802734375, -2.2333984375, -1.6920166015625, -1.150634765625, -0.6092529296875, -0.06787109375, 0.4735107421875, 1.014892578125, 1.5562744140625, 2.09765625, 2.6390380859375, 3.180419921875, 3.7218017578125, 4.26318359375, 4.8045654296875, 5.345947265625, 5.8873291015625, 6.4287109375, 6.9700927734375, 7.511474609375, 8.0528564453125, 8.59423828125, 9.1356201171875, 9.677001953125, 10.2183837890625, 10.759765625, 11.3011474609375, 11.842529296875, 12.3839111328125, 12.92529296875, 13.4666748046875, 14.008056640625, 14.5494384765625, 15.0908203125, 15.6322021484375, 16.173583984375, 16.7149658203125, 17.25634765625, 17.7977294921875, 18.339111328125, 18.8804931640625, 19.421875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 9.0, 11.0, 13.0, 35.0, 201.0, 3446.0, 244.0, 50.0, 31.0, 7.0, 7.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.2890625, -6.133819580078125, -5.97857666015625, -5.823333740234375, -5.6680908203125, -5.512847900390625, -5.35760498046875, -5.202362060546875, -5.047119140625, -4.891876220703125, -4.73663330078125, -4.581390380859375, -4.4261474609375, -4.270904541015625, -4.11566162109375, -3.960418701171875, -3.80517578125, -3.649932861328125, -3.49468994140625, -3.339447021484375, -3.1842041015625, -3.028961181640625, -2.87371826171875, -2.718475341796875, -2.563232421875, -2.407989501953125, -2.25274658203125, -2.097503662109375, -1.9422607421875, -1.787017822265625, -1.63177490234375, -1.476531982421875, -1.3212890625, -1.166046142578125, -1.01080322265625, -0.855560302734375, -0.7003173828125, -0.545074462890625, -0.38983154296875, -0.234588623046875, -0.079345703125, 0.075897216796875, 0.23114013671875, 0.386383056640625, 0.5416259765625, 0.696868896484375, 0.85211181640625, 1.007354736328125, 1.16259765625, 1.317840576171875, 1.47308349609375, 1.628326416015625, 1.7835693359375, 1.938812255859375, 2.09405517578125, 2.249298095703125, 2.404541015625, 2.559783935546875, 2.71502685546875, 2.870269775390625, 3.0255126953125, 3.180755615234375, 3.33599853515625, 3.491241455078125, 3.646484375]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 14.0, 58.0, 124.0, 283.0, 269.0, 137.0, 74.0, 24.0, 11.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.465678215026855, -10.735272407531738, -10.004866600036621, -9.27446174621582, -8.544055938720703, -7.813649654388428, -7.083244323730469, -6.352838516235352, -5.622432708740234, -4.892026901245117, -4.16162109375, -3.431215763092041, -2.700809955596924, -1.9704041481018066, -1.2399988174438477, -0.5095930099487305, 0.22081279754638672, 0.9512184858322144, 1.681624174118042, 2.41202974319458, 3.1424355506896973, 3.8728413581848145, 4.603246688842773, 5.333652496337891, 6.064058303833008, 6.794464111328125, 7.524869918823242, 8.25527572631836, 8.985681533813477, 9.716087341308594, 10.446492195129395, 11.176898002624512, 11.907302856445312, 12.63770866394043, 13.368114471435547, 14.098520278930664, 14.828926086425781, 15.559331893920898, 16.289737701416016, 17.0201416015625, 17.75054931640625, 18.480955123901367, 19.211360931396484, 19.9417667388916, 20.67217254638672, 21.402578353881836, 22.132984161376953, 22.863388061523438, 23.593793869018555, 24.324199676513672, 25.05460548400879, 25.785011291503906, 26.515417098999023, 27.24582290649414, 27.976226806640625, 28.706634521484375, 29.43703842163086, 30.167444229125977, 30.897850036621094, 31.62825584411621, 32.35866165161133, 33.08906555175781, 33.81947326660156, 34.54987716674805, 35.2802848815918]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 3.0, 4.0, 3.0, 6.0, 6.0, 8.0, 11.0, 6.0, 14.0, 16.0, 22.0, 28.0, 33.0, 26.0, 27.0, 30.0, 41.0, 37.0, 31.0, 36.0, 49.0, 36.0, 48.0, 37.0, 39.0, 41.0, 48.0, 33.0, 34.0, 33.0, 28.0, 23.0, 27.0, 17.0, 25.0, 21.0, 12.0, 11.0, 12.0, 11.0, 7.0, 3.0, 6.0, 3.0, 4.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-7.57032585144043, -7.336163520812988, -7.102000713348389, -6.867838382720947, -6.633675575256348, -6.399513244628906, -6.165350437164307, -5.931188106536865, -5.697025299072266, -5.462862968444824, -5.228700160980225, -4.994537830352783, -4.760375022888184, -4.526212692260742, -4.292049884796143, -4.057887554168701, -3.8237249851226807, -3.58956241607666, -3.3553998470306396, -3.121237277984619, -2.8870747089385986, -2.652912139892578, -2.4187498092651367, -2.184587001800537, -1.9504245519638062, -1.7162619829177856, -1.4820994138717651, -1.2479369640350342, -1.0137743949890137, -0.7796118259429932, -0.5454492568969727, -0.31128668785095215, -0.07712411880493164, 0.15703843533992767, 0.391200989484787, 0.6253635287284851, 0.8595260977745056, 1.0936886072158813, 1.3278511762619019, 1.5620137453079224, 1.7961763143539429, 2.030338764190674, 2.2645013332366943, 2.498663902282715, 2.7328264713287354, 2.966989040374756, 3.2011516094207764, 3.435314178466797, 3.6694767475128174, 3.903639316558838, 4.137801647186279, 4.371964454650879, 4.60612678527832, 4.84028959274292, 5.074451923370361, 5.308614730834961, 5.542777061462402, 5.776939392089844, 6.011102199554443, 6.245264530181885, 6.479427337646484, 6.713589668273926, 6.947752475738525, 7.181914806365967, 7.416077613830566]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 3.0, 3.0, 6.0, 6.0, 12.0, 19.0, 37.0, 55.0, 75.0, 126.0, 214.0, 409.0, 778.0, 1441.0, 3450.0, 8033.0, 21690.0, 65041.0, 201302.0, 392371.0, 234971.0, 76669.0, 25067.0, 9343.0, 3877.0, 1691.0, 833.0, 437.0, 231.0, 131.0, 86.0, 62.0, 29.0, 21.0, 12.0, 11.0, 9.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.28515625, -7.046875, -6.80859375, -6.5703125, -6.33203125, -6.09375, -5.85546875, -5.6171875, -5.37890625, -5.140625, -4.90234375, -4.6640625, -4.42578125, -4.1875, -3.94921875, -3.7109375, -3.47265625, -3.234375, -2.99609375, -2.7578125, -2.51953125, -2.28125, -2.04296875, -1.8046875, -1.56640625, -1.328125, -1.08984375, -0.8515625, -0.61328125, -0.375, -0.13671875, 0.1015625, 0.33984375, 0.578125, 0.81640625, 1.0546875, 1.29296875, 1.53125, 1.76953125, 2.0078125, 2.24609375, 2.484375, 2.72265625, 2.9609375, 3.19921875, 3.4375, 3.67578125, 3.9140625, 4.15234375, 4.390625, 4.62890625, 4.8671875, 5.10546875, 5.34375, 5.58203125, 5.8203125, 6.05859375, 6.296875, 6.53515625, 6.7734375, 7.01171875, 7.25, 7.48828125, 7.7265625, 7.96484375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 6.0, 7.0, 5.0, 9.0, 4.0, 13.0, 24.0, 17.0, 33.0, 30.0, 33.0, 46.0, 40.0, 42.0, 63.0, 48.0, 50.0, 40.0, 66.0, 53.0, 74.0, 53.0, 52.0, 33.0, 23.0, 30.0, 20.0, 31.0, 11.0, 16.0, 7.0, 11.0, 6.0, 5.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.576171875, -3.454986572265625, -3.33380126953125, -3.212615966796875, -3.0914306640625, -2.970245361328125, -2.84906005859375, -2.727874755859375, -2.606689453125, -2.485504150390625, -2.36431884765625, -2.243133544921875, -2.1219482421875, -2.000762939453125, -1.87957763671875, -1.758392333984375, -1.63720703125, -1.516021728515625, -1.39483642578125, -1.273651123046875, -1.1524658203125, -1.031280517578125, -0.91009521484375, -0.788909912109375, -0.667724609375, -0.546539306640625, -0.42535400390625, -0.304168701171875, -0.1829833984375, -0.061798095703125, 0.05938720703125, 0.180572509765625, 0.3017578125, 0.422943115234375, 0.54412841796875, 0.665313720703125, 0.7864990234375, 0.907684326171875, 1.02886962890625, 1.150054931640625, 1.271240234375, 1.392425537109375, 1.51361083984375, 1.634796142578125, 1.7559814453125, 1.877166748046875, 1.99835205078125, 2.119537353515625, 2.24072265625, 2.361907958984375, 2.48309326171875, 2.604278564453125, 2.7254638671875, 2.846649169921875, 2.96783447265625, 3.089019775390625, 3.210205078125, 3.331390380859375, 3.45257568359375, 3.573760986328125, 3.6949462890625, 3.816131591796875, 3.93731689453125, 4.058502197265625, 4.1796875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 4.0, 5.0, 9.0, 8.0, 8.0, 19.0, 35.0, 51.0, 46.0, 110.0, 166.0, 296.0, 659.0, 1687.0, 5620.0, 30385.0, 272254.0, 641137.0, 79300.0, 11807.0, 2903.0, 1025.0, 434.0, 215.0, 136.0, 88.0, 44.0, 39.0, 18.0, 12.0, 12.0, 8.0, 4.0, 6.0, 0.0, 1.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.5, -14.0357666015625, -13.571533203125, -13.1072998046875, -12.64306640625, -12.1788330078125, -11.714599609375, -11.2503662109375, -10.7861328125, -10.3218994140625, -9.857666015625, -9.3934326171875, -8.92919921875, -8.4649658203125, -8.000732421875, -7.5364990234375, -7.072265625, -6.6080322265625, -6.143798828125, -5.6795654296875, -5.21533203125, -4.7510986328125, -4.286865234375, -3.8226318359375, -3.3583984375, -2.8941650390625, -2.429931640625, -1.9656982421875, -1.50146484375, -1.0372314453125, -0.572998046875, -0.1087646484375, 0.35546875, 0.8197021484375, 1.283935546875, 1.7481689453125, 2.21240234375, 2.6766357421875, 3.140869140625, 3.6051025390625, 4.0693359375, 4.5335693359375, 4.997802734375, 5.4620361328125, 5.92626953125, 6.3905029296875, 6.854736328125, 7.3189697265625, 7.783203125, 8.2474365234375, 8.711669921875, 9.1759033203125, 9.64013671875, 10.1043701171875, 10.568603515625, 11.0328369140625, 11.4970703125, 11.9613037109375, 12.425537109375, 12.8897705078125, 13.35400390625, 13.8182373046875, 14.282470703125, 14.7467041015625, 15.2109375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 5.0, 5.0, 3.0, 5.0, 7.0, 9.0, 18.0, 20.0, 27.0, 24.0, 24.0, 35.0, 56.0, 48.0, 49.0, 43.0, 61.0, 62.0, 44.0, 55.0, 54.0, 49.0, 55.0, 36.0, 40.0, 28.0, 25.0, 29.0, 30.0, 7.0, 13.0, 10.0, 12.0, 6.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.796875, -20.130859375, -19.46484375, -18.798828125, -18.1328125, -17.466796875, -16.80078125, -16.134765625, -15.46875, -14.802734375, -14.13671875, -13.470703125, -12.8046875, -12.138671875, -11.47265625, -10.806640625, -10.140625, -9.474609375, -8.80859375, -8.142578125, -7.4765625, -6.810546875, -6.14453125, -5.478515625, -4.8125, -4.146484375, -3.48046875, -2.814453125, -2.1484375, -1.482421875, -0.81640625, -0.150390625, 0.515625, 1.181640625, 1.84765625, 2.513671875, 3.1796875, 3.845703125, 4.51171875, 5.177734375, 5.84375, 6.509765625, 7.17578125, 7.841796875, 8.5078125, 9.173828125, 9.83984375, 10.505859375, 11.171875, 11.837890625, 12.50390625, 13.169921875, 13.8359375, 14.501953125, 15.16796875, 15.833984375, 16.5, 17.166015625, 17.83203125, 18.498046875, 19.1640625, 19.830078125, 20.49609375, 21.162109375, 21.828125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 2.0, 6.0, 7.0, 9.0, 10.0, 27.0, 39.0, 65.0, 115.0, 264.0, 568.0, 1336.0, 4035.0, 20751.0, 221216.0, 709086.0, 76880.0, 9941.0, 2517.0, 893.0, 366.0, 197.0, 107.0, 45.0, 34.0, 16.0, 11.0, 7.0, 1.0, 2.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3125, -5.1104736328125, -4.908447265625, -4.7064208984375, -4.50439453125, -4.3023681640625, -4.100341796875, -3.8983154296875, -3.6962890625, -3.4942626953125, -3.292236328125, -3.0902099609375, -2.88818359375, -2.6861572265625, -2.484130859375, -2.2821044921875, -2.080078125, -1.8780517578125, -1.676025390625, -1.4739990234375, -1.27197265625, -1.0699462890625, -0.867919921875, -0.6658935546875, -0.4638671875, -0.2618408203125, -0.059814453125, 0.1422119140625, 0.34423828125, 0.5462646484375, 0.748291015625, 0.9503173828125, 1.15234375, 1.3543701171875, 1.556396484375, 1.7584228515625, 1.96044921875, 2.1624755859375, 2.364501953125, 2.5665283203125, 2.7685546875, 2.9705810546875, 3.172607421875, 3.3746337890625, 3.57666015625, 3.7786865234375, 3.980712890625, 4.1827392578125, 4.384765625, 4.5867919921875, 4.788818359375, 4.9908447265625, 5.19287109375, 5.3948974609375, 5.596923828125, 5.7989501953125, 6.0009765625, 6.2030029296875, 6.405029296875, 6.6070556640625, 6.80908203125, 7.0111083984375, 7.213134765625, 7.4151611328125, 7.6171875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 7.0, 8.0, 8.0, 5.0, 6.0, 8.0, 21.0, 36.0, 34.0, 37.0, 60.0, 74.0, 82.0, 94.0, 99.0, 84.0, 66.0, 65.0, 47.0, 37.0, 31.0, 19.0, 16.0, 18.0, 15.0, 13.0, 5.0, 4.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.000850677490234375, -0.0008278191089630127, -0.0008049607276916504, -0.0007821023464202881, -0.0007592439651489258, -0.0007363855838775635, -0.0007135272026062012, -0.0006906688213348389, -0.0006678104400634766, -0.0006449520587921143, -0.000622093677520752, -0.0005992352962493896, -0.0005763769149780273, -0.000553518533706665, -0.0005306601524353027, -0.0005078017711639404, -0.0004849433898925781, -0.0004620850086212158, -0.0004392266273498535, -0.0004163682460784912, -0.0003935098648071289, -0.0003706514835357666, -0.0003477931022644043, -0.000324934720993042, -0.0003020763397216797, -0.0002792179584503174, -0.0002563595771789551, -0.00023350119590759277, -0.00021064281463623047, -0.00018778443336486816, -0.00016492605209350586, -0.00014206767082214355, -0.00011920928955078125, -9.635090827941895e-05, -7.349252700805664e-05, -5.0634145736694336e-05, -2.777576446533203e-05, -4.9173831939697266e-06, 1.7940998077392578e-05, 4.079937934875488e-05, 6.365776062011719e-05, 8.651614189147949e-05, 0.0001093745231628418, 0.0001322329044342041, 0.0001550912857055664, 0.0001779496669769287, 0.00020080804824829102, 0.00022366642951965332, 0.0002465248107910156, 0.00026938319206237793, 0.00029224157333374023, 0.00031509995460510254, 0.00033795833587646484, 0.00036081671714782715, 0.00038367509841918945, 0.00040653347969055176, 0.00042939186096191406, 0.00045225024223327637, 0.00047510862350463867, 0.000497967004776001, 0.0005208253860473633, 0.0005436837673187256, 0.0005665421485900879, 0.0005894005298614502, 0.0006122589111328125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 4.0, 1.0, 8.0, 1.0, 3.0, 3.0, 7.0, 11.0, 32.0, 33.0, 72.0, 130.0, 259.0, 590.0, 1838.0, 8213.0, 79356.0, 756652.0, 182426.0, 14674.0, 2684.0, 845.0, 325.0, 172.0, 88.0, 34.0, 36.0, 22.0, 12.0, 7.0, 6.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.61328125, -6.37408447265625, -6.1348876953125, -5.89569091796875, -5.656494140625, -5.41729736328125, -5.1781005859375, -4.93890380859375, -4.69970703125, -4.46051025390625, -4.2213134765625, -3.98211669921875, -3.742919921875, -3.50372314453125, -3.2645263671875, -3.02532958984375, -2.7861328125, -2.54693603515625, -2.3077392578125, -2.06854248046875, -1.829345703125, -1.59014892578125, -1.3509521484375, -1.11175537109375, -0.87255859375, -0.63336181640625, -0.3941650390625, -0.15496826171875, 0.084228515625, 0.32342529296875, 0.5626220703125, 0.80181884765625, 1.041015625, 1.28021240234375, 1.5194091796875, 1.75860595703125, 1.997802734375, 2.23699951171875, 2.4761962890625, 2.71539306640625, 2.95458984375, 3.19378662109375, 3.4329833984375, 3.67218017578125, 3.911376953125, 4.15057373046875, 4.3897705078125, 4.62896728515625, 4.8681640625, 5.10736083984375, 5.3465576171875, 5.58575439453125, 5.824951171875, 6.06414794921875, 6.3033447265625, 6.54254150390625, 6.78173828125, 7.02093505859375, 7.2601318359375, 7.49932861328125, 7.738525390625, 7.97772216796875, 8.2169189453125, 8.45611572265625, 8.6953125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 8.0, 5.0, 15.0, 18.0, 25.0, 28.0, 43.0, 70.0, 116.0, 163.0, 150.0, 125.0, 78.0, 57.0, 29.0, 24.0, 22.0, 14.0, 7.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0234375, -11.692138671875, -11.36083984375, -11.029541015625, -10.6982421875, -10.366943359375, -10.03564453125, -9.704345703125, -9.373046875, -9.041748046875, -8.71044921875, -8.379150390625, -8.0478515625, -7.716552734375, -7.38525390625, -7.053955078125, -6.72265625, -6.391357421875, -6.06005859375, -5.728759765625, -5.3974609375, -5.066162109375, -4.73486328125, -4.403564453125, -4.072265625, -3.740966796875, -3.40966796875, -3.078369140625, -2.7470703125, -2.415771484375, -2.08447265625, -1.753173828125, -1.421875, -1.090576171875, -0.75927734375, -0.427978515625, -0.0966796875, 0.234619140625, 0.56591796875, 0.897216796875, 1.228515625, 1.559814453125, 1.89111328125, 2.222412109375, 2.5537109375, 2.885009765625, 3.21630859375, 3.547607421875, 3.87890625, 4.210205078125, 4.54150390625, 4.872802734375, 5.2041015625, 5.535400390625, 5.86669921875, 6.197998046875, 6.529296875, 6.860595703125, 7.19189453125, 7.523193359375, 7.8544921875, 8.185791015625, 8.51708984375, 8.848388671875, 9.1796875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 15.0, 15.0, 31.0, 81.0, 164.0, 236.0, 222.0, 120.0, 60.0, 27.0, 19.0, 6.0, 5.0, 4.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-194.8741455078125, -190.68942260742188, -186.50469970703125, -182.31997680664062, -178.13525390625, -173.95054626464844, -169.7658233642578, -165.5811004638672, -161.39637756347656, -157.21165466308594, -153.0269317626953, -148.8422088623047, -144.65750122070312, -140.4727783203125, -136.28805541992188, -132.10333251953125, -127.91860961914062, -123.73388671875, -119.54916381835938, -115.36444854736328, -111.17972564697266, -106.99500274658203, -102.81028747558594, -98.62556457519531, -94.44084167480469, -90.25611877441406, -86.07139587402344, -81.88668060302734, -77.70195770263672, -73.5172348022461, -69.33251953125, -65.14779663085938, -60.96308135986328, -56.778358459472656, -52.5936393737793, -48.40892028808594, -44.22419738769531, -40.03947448730469, -35.85475540161133, -31.670034408569336, -27.485313415527344, -23.30059242248535, -19.11587142944336, -14.931150436401367, -10.746429443359375, -6.561708450317383, -2.3769874572753906, 1.8077335357666016, 5.992454528808594, 10.177175521850586, 14.361896514892578, 18.54661750793457, 22.731338500976562, 26.916059494018555, 31.100780487060547, 35.285499572753906, 39.47022247314453, 43.654945373535156, 47.839664459228516, 52.024383544921875, 56.2091064453125, 60.393829345703125, 64.57855224609375, 68.76326751708984, 72.94799041748047]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 3.0, 6.0, 11.0, 7.0, 12.0, 12.0, 16.0, 13.0, 23.0, 27.0, 36.0, 28.0, 34.0, 37.0, 47.0, 47.0, 69.0, 69.0, 54.0, 60.0, 68.0, 45.0, 44.0, 42.0, 30.0, 26.0, 28.0, 19.0, 21.0, 18.0, 12.0, 13.0, 6.0, 5.0, 4.0, 5.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.84974670410156, -81.9218978881836, -78.99404907226562, -76.06619262695312, -73.13834381103516, -70.21049499511719, -67.28264617919922, -64.35479736328125, -61.426944732666016, -58.49909591674805, -55.57124328613281, -52.643394470214844, -49.715545654296875, -46.78769302368164, -43.85984420776367, -40.93199157714844, -38.00414276123047, -35.0762939453125, -32.148441314697266, -29.220592498779297, -26.292741775512695, -23.364891052246094, -20.437042236328125, -17.509191513061523, -14.581340789794922, -11.65349006652832, -8.725640296936035, -5.79779052734375, -2.8699398040771484, 0.057910919189453125, 2.985759735107422, 5.913610458374023, 8.841461181640625, 11.769311904907227, 14.697161674499512, 17.625011444091797, 20.5528621673584, 23.480712890625, 26.40856170654297, 29.33641242980957, 32.26426315307617, 35.19211196899414, 38.119964599609375, 41.047813415527344, 43.97566223144531, 46.90351486206055, 49.831363677978516, 52.75921630859375, 55.68706512451172, 58.61491394042969, 61.54276657104492, 64.47061157226562, 67.39846801757812, 70.3263168334961, 73.25416564941406, 76.18201446533203, 79.10986328125, 82.03771209716797, 84.96556091308594, 87.89341735839844, 90.8212661743164, 93.74911499023438, 96.67696380615234, 99.60481262207031, 102.53266906738281]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 6.0, 11.0, 6.0, 17.0, 27.0, 47.0, 85.0, 159.0, 231.0, 475.0, 865.0, 1792.0, 4257.0, 14868.0, 149728.0, 3962519.0, 45016.0, 8309.0, 3036.0, 1326.0, 673.0, 338.0, 198.0, 120.0, 64.0, 32.0, 25.0, 14.0, 17.0, 8.0, 4.0, 6.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.95703125, -7.64251708984375, -7.3280029296875, -7.01348876953125, -6.698974609375, -6.38446044921875, -6.0699462890625, -5.75543212890625, -5.44091796875, -5.12640380859375, -4.8118896484375, -4.49737548828125, -4.182861328125, -3.86834716796875, -3.5538330078125, -3.23931884765625, -2.9248046875, -2.61029052734375, -2.2957763671875, -1.98126220703125, -1.666748046875, -1.35223388671875, -1.0377197265625, -0.72320556640625, -0.40869140625, -0.09417724609375, 0.2203369140625, 0.53485107421875, 0.849365234375, 1.16387939453125, 1.4783935546875, 1.79290771484375, 2.107421875, 2.42193603515625, 2.7364501953125, 3.05096435546875, 3.365478515625, 3.67999267578125, 3.9945068359375, 4.30902099609375, 4.62353515625, 4.93804931640625, 5.2525634765625, 5.56707763671875, 5.881591796875, 6.19610595703125, 6.5106201171875, 6.82513427734375, 7.1396484375, 7.45416259765625, 7.7686767578125, 8.08319091796875, 8.397705078125, 8.71221923828125, 9.0267333984375, 9.34124755859375, 9.65576171875, 9.97027587890625, 10.2847900390625, 10.59930419921875, 10.913818359375, 11.22833251953125, 11.5428466796875, 11.85736083984375, 12.171875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 6.0, 5.0, 9.0, 8.0, 12.0, 31.0, 20.0, 28.0, 35.0, 39.0, 57.0, 61.0, 53.0, 52.0, 57.0, 72.0, 83.0, 80.0, 46.0, 43.0, 44.0, 34.0, 32.0, 28.0, 20.0, 16.0, 9.0, 10.0, 5.0, 8.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.0390625, -4.8951416015625, -4.751220703125, -4.6072998046875, -4.46337890625, -4.3194580078125, -4.175537109375, -4.0316162109375, -3.8876953125, -3.7437744140625, -3.599853515625, -3.4559326171875, -3.31201171875, -3.1680908203125, -3.024169921875, -2.8802490234375, -2.736328125, -2.5924072265625, -2.448486328125, -2.3045654296875, -2.16064453125, -2.0167236328125, -1.872802734375, -1.7288818359375, -1.5849609375, -1.4410400390625, -1.297119140625, -1.1531982421875, -1.00927734375, -0.8653564453125, -0.721435546875, -0.5775146484375, -0.43359375, -0.2896728515625, -0.145751953125, -0.0018310546875, 0.14208984375, 0.2860107421875, 0.429931640625, 0.5738525390625, 0.7177734375, 0.8616943359375, 1.005615234375, 1.1495361328125, 1.29345703125, 1.4373779296875, 1.581298828125, 1.7252197265625, 1.869140625, 2.0130615234375, 2.156982421875, 2.3009033203125, 2.44482421875, 2.5887451171875, 2.732666015625, 2.8765869140625, 3.0205078125, 3.1644287109375, 3.308349609375, 3.4522705078125, 3.59619140625, 3.7401123046875, 3.884033203125, 4.0279541015625, 4.171875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 4.0, 9.0, 3.0, 10.0, 18.0, 29.0, 31.0, 58.0, 79.0, 123.0, 199.0, 283.0, 478.0, 752.0, 1255.0, 2421.0, 5071.0, 12644.0, 45062.0, 492917.0, 3520472.0, 80274.0, 18330.0, 6729.0, 3066.0, 1591.0, 945.0, 493.0, 339.0, 206.0, 138.0, 86.0, 48.0, 32.0, 34.0, 24.0, 7.0, 6.0, 4.0, 2.0, 8.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.80078125, -7.55047607421875, -7.3001708984375, -7.04986572265625, -6.799560546875, -6.54925537109375, -6.2989501953125, -6.04864501953125, -5.79833984375, -5.54803466796875, -5.2977294921875, -5.04742431640625, -4.797119140625, -4.54681396484375, -4.2965087890625, -4.04620361328125, -3.7958984375, -3.54559326171875, -3.2952880859375, -3.04498291015625, -2.794677734375, -2.54437255859375, -2.2940673828125, -2.04376220703125, -1.79345703125, -1.54315185546875, -1.2928466796875, -1.04254150390625, -0.792236328125, -0.54193115234375, -0.2916259765625, -0.04132080078125, 0.208984375, 0.45928955078125, 0.7095947265625, 0.95989990234375, 1.210205078125, 1.46051025390625, 1.7108154296875, 1.96112060546875, 2.21142578125, 2.46173095703125, 2.7120361328125, 2.96234130859375, 3.212646484375, 3.46295166015625, 3.7132568359375, 3.96356201171875, 4.2138671875, 4.46417236328125, 4.7144775390625, 4.96478271484375, 5.215087890625, 5.46539306640625, 5.7156982421875, 5.96600341796875, 6.21630859375, 6.46661376953125, 6.7169189453125, 6.96722412109375, 7.217529296875, 7.46783447265625, 7.7181396484375, 7.96844482421875, 8.21875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 3.0, 1.0, 7.0, 2.0, 6.0, 11.0, 29.0, 46.0, 91.0, 318.0, 2920.0, 416.0, 110.0, 45.0, 29.0, 13.0, 10.0, 5.0, 6.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.431640625, -3.326416015625, -3.22119140625, -3.115966796875, -3.0107421875, -2.905517578125, -2.80029296875, -2.695068359375, -2.58984375, -2.484619140625, -2.37939453125, -2.274169921875, -2.1689453125, -2.063720703125, -1.95849609375, -1.853271484375, -1.748046875, -1.642822265625, -1.53759765625, -1.432373046875, -1.3271484375, -1.221923828125, -1.11669921875, -1.011474609375, -0.90625, -0.801025390625, -0.69580078125, -0.590576171875, -0.4853515625, -0.380126953125, -0.27490234375, -0.169677734375, -0.064453125, 0.040771484375, 0.14599609375, 0.251220703125, 0.3564453125, 0.461669921875, 0.56689453125, 0.672119140625, 0.77734375, 0.882568359375, 0.98779296875, 1.093017578125, 1.1982421875, 1.303466796875, 1.40869140625, 1.513916015625, 1.619140625, 1.724365234375, 1.82958984375, 1.934814453125, 2.0400390625, 2.145263671875, 2.25048828125, 2.355712890625, 2.4609375, 2.566162109375, 2.67138671875, 2.776611328125, 2.8818359375, 2.987060546875, 3.09228515625, 3.197509765625, 3.302734375]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 3.0, 3.0, 11.0, 16.0, 19.0, 52.0, 59.0, 113.0, 122.0, 130.0, 116.0, 126.0, 92.0, 67.0, 28.0, 18.0, 5.0, 10.0, 8.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.685128211975098, -11.318992614746094, -10.95285701751709, -10.586721420288086, -10.220586776733398, -9.854451179504395, -9.48831558227539, -9.122179985046387, -8.756044387817383, -8.389908790588379, -8.023773193359375, -7.657638072967529, -7.291502475738525, -6.9253668785095215, -6.559231758117676, -6.193096160888672, -5.826960563659668, -5.460824966430664, -5.09468936920166, -4.7285542488098145, -4.3624186515808105, -3.9962830543518066, -3.630147695541382, -3.264012336730957, -2.897876739501953, -2.531741142272949, -2.1656057834625244, -1.79947030544281, -1.4333348274230957, -1.0671993494033813, -0.701063871383667, -0.3349285125732422, 0.03120708465576172, 0.3973425626754761, 0.7634780406951904, 1.1296135187149048, 1.4957489967346191, 1.8618844747543335, 2.228019952774048, 2.5941553115844727, 2.9602909088134766, 3.3264265060424805, 3.6925618648529053, 4.05869722366333, 4.424832820892334, 4.790968418121338, 5.157103538513184, 5.5232391357421875, 5.889374732971191, 6.255510330200195, 6.621645927429199, 6.987781047821045, 7.353916645050049, 7.720052242279053, 8.086187362670898, 8.452322959899902, 8.818458557128906, 9.18459415435791, 9.550729751586914, 9.916865348815918, 10.283000946044922, 10.64913558959961, 11.015271186828613, 11.381406784057617, 11.747542381286621]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 3.0, 3.0, 5.0, 3.0, 4.0, 7.0, 2.0, 8.0, 11.0, 8.0, 7.0, 12.0, 17.0, 12.0, 20.0, 24.0, 22.0, 20.0, 27.0, 35.0, 35.0, 39.0, 48.0, 45.0, 40.0, 44.0, 47.0, 58.0, 40.0, 34.0, 32.0, 30.0, 40.0, 34.0, 29.0, 33.0, 14.0, 17.0, 17.0, 14.0, 10.0, 11.0, 4.0, 12.0, 7.0, 7.0, 2.0, 3.0, 4.0, 1.0, 1.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.698233604431152, -4.536670207977295, -4.375106334686279, -4.213542938232422, -4.051979064941406, -3.890415668487549, -3.7288520336151123, -3.567288398742676, -3.4057250022888184, -3.244161367416382, -3.0825977325439453, -2.921034336090088, -2.7594707012176514, -2.597907066345215, -2.4363434314727783, -2.274779796600342, -2.1132161617279053, -1.9516525268554688, -1.7900890111923218, -1.6285253763198853, -1.4669618606567383, -1.3053982257843018, -1.1438345909118652, -0.9822710752487183, -0.8207074403762817, -0.65914386510849, -0.49758026003837585, -0.3360166549682617, -0.17445307970046997, -0.012889504432678223, 0.1486741304397583, 0.3102376461029053, 0.4718012809753418, 0.6333648562431335, 0.7949284315109253, 0.9564920663833618, 1.1180555820465088, 1.2796192169189453, 1.4411828517913818, 1.6027463674545288, 1.7643100023269653, 1.9258736371994019, 2.087437152862549, 2.2490007877349854, 2.410564422607422, 2.5721278190612793, 2.733691692352295, 2.8952550888061523, 3.056818723678589, 3.2183823585510254, 3.379945993423462, 3.5415096282958984, 3.703073024749756, 3.8646366596221924, 4.026200294494629, 4.187763690948486, 4.349327564239502, 4.510890960693359, 4.672454833984375, 4.834018230438232, 4.995582103729248, 5.1571455001831055, 5.318709373474121, 5.4802727699279785, 5.641836166381836]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 8.0, 21.0, 19.0, 37.0, 55.0, 102.0, 174.0, 273.0, 598.0, 1138.0, 2467.0, 5746.0, 14423.0, 40051.0, 124097.0, 336015.0, 333638.0, 124455.0, 40121.0, 14484.0, 5737.0, 2481.0, 1093.0, 585.0, 301.0, 170.0, 110.0, 57.0, 36.0, 21.0, 13.0, 7.0, 7.0, 7.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.484375, -6.28173828125, -6.0791015625, -5.87646484375, -5.673828125, -5.47119140625, -5.2685546875, -5.06591796875, -4.86328125, -4.66064453125, -4.4580078125, -4.25537109375, -4.052734375, -3.85009765625, -3.6474609375, -3.44482421875, -3.2421875, -3.03955078125, -2.8369140625, -2.63427734375, -2.431640625, -2.22900390625, -2.0263671875, -1.82373046875, -1.62109375, -1.41845703125, -1.2158203125, -1.01318359375, -0.810546875, -0.60791015625, -0.4052734375, -0.20263671875, 0.0, 0.20263671875, 0.4052734375, 0.60791015625, 0.810546875, 1.01318359375, 1.2158203125, 1.41845703125, 1.62109375, 1.82373046875, 2.0263671875, 2.22900390625, 2.431640625, 2.63427734375, 2.8369140625, 3.03955078125, 3.2421875, 3.44482421875, 3.6474609375, 3.85009765625, 4.052734375, 4.25537109375, 4.4580078125, 4.66064453125, 4.86328125, 5.06591796875, 5.2685546875, 5.47119140625, 5.673828125, 5.87646484375, 6.0791015625, 6.28173828125, 6.484375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 5.0, 7.0, 7.0, 15.0, 8.0, 30.0, 17.0, 21.0, 31.0, 37.0, 38.0, 55.0, 44.0, 45.0, 73.0, 63.0, 57.0, 68.0, 70.0, 53.0, 48.0, 41.0, 37.0, 37.0, 22.0, 19.0, 11.0, 20.0, 12.0, 10.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.78515625, -4.648284912109375, -4.51141357421875, -4.374542236328125, -4.2376708984375, -4.100799560546875, -3.96392822265625, -3.827056884765625, -3.690185546875, -3.553314208984375, -3.41644287109375, -3.279571533203125, -3.1427001953125, -3.005828857421875, -2.86895751953125, -2.732086181640625, -2.59521484375, -2.458343505859375, -2.32147216796875, -2.184600830078125, -2.0477294921875, -1.910858154296875, -1.77398681640625, -1.637115478515625, -1.500244140625, -1.363372802734375, -1.22650146484375, -1.089630126953125, -0.9527587890625, -0.815887451171875, -0.67901611328125, -0.542144775390625, -0.4052734375, -0.268402099609375, -0.13153076171875, 0.005340576171875, 0.1422119140625, 0.279083251953125, 0.41595458984375, 0.552825927734375, 0.689697265625, 0.826568603515625, 0.96343994140625, 1.100311279296875, 1.2371826171875, 1.374053955078125, 1.51092529296875, 1.647796630859375, 1.78466796875, 1.921539306640625, 2.05841064453125, 2.195281982421875, 2.3321533203125, 2.469024658203125, 2.60589599609375, 2.742767333984375, 2.879638671875, 3.016510009765625, 3.15338134765625, 3.290252685546875, 3.4271240234375, 3.563995361328125, 3.70086669921875, 3.837738037109375, 3.974609375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 2.0, 6.0, 12.0, 11.0, 22.0, 13.0, 23.0, 28.0, 34.0, 42.0, 64.0, 119.0, 184.0, 342.0, 657.0, 1406.0, 3428.0, 10949.0, 49323.0, 331484.0, 539024.0, 86163.0, 16759.0, 4745.0, 1796.0, 862.0, 408.0, 221.0, 127.0, 92.0, 54.0, 46.0, 23.0, 26.0, 15.0, 9.0, 7.0, 9.0, 3.0, 3.0, 4.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-10.4296875, -10.1151123046875, -9.800537109375, -9.4859619140625, -9.17138671875, -8.8568115234375, -8.542236328125, -8.2276611328125, -7.9130859375, -7.5985107421875, -7.283935546875, -6.9693603515625, -6.65478515625, -6.3402099609375, -6.025634765625, -5.7110595703125, -5.396484375, -5.0819091796875, -4.767333984375, -4.4527587890625, -4.13818359375, -3.8236083984375, -3.509033203125, -3.1944580078125, -2.8798828125, -2.5653076171875, -2.250732421875, -1.9361572265625, -1.62158203125, -1.3070068359375, -0.992431640625, -0.6778564453125, -0.36328125, -0.0487060546875, 0.265869140625, 0.5804443359375, 0.89501953125, 1.2095947265625, 1.524169921875, 1.8387451171875, 2.1533203125, 2.4678955078125, 2.782470703125, 3.0970458984375, 3.41162109375, 3.7261962890625, 4.040771484375, 4.3553466796875, 4.669921875, 4.9844970703125, 5.299072265625, 5.6136474609375, 5.92822265625, 6.2427978515625, 6.557373046875, 6.8719482421875, 7.1865234375, 7.5010986328125, 7.815673828125, 8.1302490234375, 8.44482421875, 8.7593994140625, 9.073974609375, 9.3885498046875, 9.703125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 1.0, 5.0, 8.0, 15.0, 18.0, 19.0, 23.0, 37.0, 31.0, 34.0, 45.0, 54.0, 54.0, 55.0, 57.0, 60.0, 63.0, 70.0, 49.0, 43.0, 43.0, 36.0, 35.0, 37.0, 23.0, 13.0, 17.0, 12.0, 9.0, 8.0, 10.0, 5.0, 2.0, 5.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.78125, -21.154296875, -20.52734375, -19.900390625, -19.2734375, -18.646484375, -18.01953125, -17.392578125, -16.765625, -16.138671875, -15.51171875, -14.884765625, -14.2578125, -13.630859375, -13.00390625, -12.376953125, -11.75, -11.123046875, -10.49609375, -9.869140625, -9.2421875, -8.615234375, -7.98828125, -7.361328125, -6.734375, -6.107421875, -5.48046875, -4.853515625, -4.2265625, -3.599609375, -2.97265625, -2.345703125, -1.71875, -1.091796875, -0.46484375, 0.162109375, 0.7890625, 1.416015625, 2.04296875, 2.669921875, 3.296875, 3.923828125, 4.55078125, 5.177734375, 5.8046875, 6.431640625, 7.05859375, 7.685546875, 8.3125, 8.939453125, 9.56640625, 10.193359375, 10.8203125, 11.447265625, 12.07421875, 12.701171875, 13.328125, 13.955078125, 14.58203125, 15.208984375, 15.8359375, 16.462890625, 17.08984375, 17.716796875, 18.34375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 3.0, 2.0, 0.0, 8.0, 7.0, 8.0, 7.0, 10.0, 18.0, 23.0, 27.0, 67.0, 151.0, 280.0, 772.0, 3899.0, 57321.0, 909933.0, 70167.0, 4305.0, 878.0, 323.0, 137.0, 79.0, 47.0, 31.0, 13.0, 11.0, 14.0, 6.0, 8.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.5078125, -10.2120361328125, -9.916259765625, -9.6204833984375, -9.32470703125, -9.0289306640625, -8.733154296875, -8.4373779296875, -8.1416015625, -7.8458251953125, -7.550048828125, -7.2542724609375, -6.95849609375, -6.6627197265625, -6.366943359375, -6.0711669921875, -5.775390625, -5.4796142578125, -5.183837890625, -4.8880615234375, -4.59228515625, -4.2965087890625, -4.000732421875, -3.7049560546875, -3.4091796875, -3.1134033203125, -2.817626953125, -2.5218505859375, -2.22607421875, -1.9302978515625, -1.634521484375, -1.3387451171875, -1.04296875, -0.7471923828125, -0.451416015625, -0.1556396484375, 0.14013671875, 0.4359130859375, 0.731689453125, 1.0274658203125, 1.3232421875, 1.6190185546875, 1.914794921875, 2.2105712890625, 2.50634765625, 2.8021240234375, 3.097900390625, 3.3936767578125, 3.689453125, 3.9852294921875, 4.281005859375, 4.5767822265625, 4.87255859375, 5.1683349609375, 5.464111328125, 5.7598876953125, 6.0556640625, 6.3514404296875, 6.647216796875, 6.9429931640625, 7.23876953125, 7.5345458984375, 7.830322265625, 8.1260986328125, 8.421875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 6.0, 6.0, 10.0, 5.0, 15.0, 15.0, 30.0, 29.0, 48.0, 53.0, 54.0, 70.0, 77.0, 66.0, 70.0, 84.0, 68.0, 62.0, 40.0, 37.0, 37.0, 37.0, 18.0, 18.0, 10.0, 11.0, 6.0, 5.0, 3.0, 6.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.0007157325744628906, -0.0006964579224586487, -0.0006771832704544067, -0.0006579086184501648, -0.0006386339664459229, -0.0006193593144416809, -0.000600084662437439, -0.000580810010433197, -0.0005615353584289551, -0.0005422607064247131, -0.0005229860544204712, -0.0005037114024162292, -0.0004844367504119873, -0.00046516209840774536, -0.0004458874464035034, -0.0004266127943992615, -0.00040733814239501953, -0.0003880634903907776, -0.00036878883838653564, -0.0003495141863822937, -0.00033023953437805176, -0.0003109648823738098, -0.00029169023036956787, -0.00027241557836532593, -0.000253140926361084, -0.00023386627435684204, -0.0002145916223526001, -0.00019531697034835815, -0.0001760423183441162, -0.00015676766633987427, -0.00013749301433563232, -0.00011821836233139038, -9.894371032714844e-05, -7.96690583229065e-05, -6.039440631866455e-05, -4.111975431442261e-05, -2.1845102310180664e-05, -2.5704503059387207e-06, 1.6704201698303223e-05, 3.5978853702545166e-05, 5.525350570678711e-05, 7.452815771102905e-05, 9.3802809715271e-05, 0.00011307746171951294, 0.00013235211372375488, 0.00015162676572799683, 0.00017090141773223877, 0.0001901760697364807, 0.00020945072174072266, 0.0002287253737449646, 0.00024800002574920654, 0.0002672746777534485, 0.00028654932975769043, 0.0003058239817619324, 0.0003250986337661743, 0.00034437328577041626, 0.0003636479377746582, 0.00038292258977890015, 0.0004021972417831421, 0.00042147189378738403, 0.000440746545791626, 0.0004600211977958679, 0.00047929584980010986, 0.0004985705018043518, 0.0005178451538085938]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 7.0, 5.0, 11.0, 9.0, 24.0, 15.0, 35.0, 65.0, 118.0, 175.0, 422.0, 811.0, 1954.0, 7284.0, 58708.0, 727021.0, 229378.0, 16736.0, 3494.0, 1203.0, 495.0, 233.0, 131.0, 85.0, 50.0, 19.0, 19.0, 13.0, 8.0, 11.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.453125, -6.236083984375, -6.01904296875, -5.802001953125, -5.5849609375, -5.367919921875, -5.15087890625, -4.933837890625, -4.716796875, -4.499755859375, -4.28271484375, -4.065673828125, -3.8486328125, -3.631591796875, -3.41455078125, -3.197509765625, -2.98046875, -2.763427734375, -2.54638671875, -2.329345703125, -2.1123046875, -1.895263671875, -1.67822265625, -1.461181640625, -1.244140625, -1.027099609375, -0.81005859375, -0.593017578125, -0.3759765625, -0.158935546875, 0.05810546875, 0.275146484375, 0.4921875, 0.709228515625, 0.92626953125, 1.143310546875, 1.3603515625, 1.577392578125, 1.79443359375, 2.011474609375, 2.228515625, 2.445556640625, 2.66259765625, 2.879638671875, 3.0966796875, 3.313720703125, 3.53076171875, 3.747802734375, 3.96484375, 4.181884765625, 4.39892578125, 4.615966796875, 4.8330078125, 5.050048828125, 5.26708984375, 5.484130859375, 5.701171875, 5.918212890625, 6.13525390625, 6.352294921875, 6.5693359375, 6.786376953125, 7.00341796875, 7.220458984375, 7.4375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 6.0, 7.0, 20.0, 21.0, 15.0, 38.0, 45.0, 64.0, 97.0, 99.0, 108.0, 116.0, 99.0, 82.0, 63.0, 39.0, 26.0, 15.0, 11.0, 9.0, 7.0, 4.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.49609375, -7.290283203125, -7.08447265625, -6.878662109375, -6.6728515625, -6.467041015625, -6.26123046875, -6.055419921875, -5.849609375, -5.643798828125, -5.43798828125, -5.232177734375, -5.0263671875, -4.820556640625, -4.61474609375, -4.408935546875, -4.203125, -3.997314453125, -3.79150390625, -3.585693359375, -3.3798828125, -3.174072265625, -2.96826171875, -2.762451171875, -2.556640625, -2.350830078125, -2.14501953125, -1.939208984375, -1.7333984375, -1.527587890625, -1.32177734375, -1.115966796875, -0.91015625, -0.704345703125, -0.49853515625, -0.292724609375, -0.0869140625, 0.118896484375, 0.32470703125, 0.530517578125, 0.736328125, 0.942138671875, 1.14794921875, 1.353759765625, 1.5595703125, 1.765380859375, 1.97119140625, 2.177001953125, 2.3828125, 2.588623046875, 2.79443359375, 3.000244140625, 3.2060546875, 3.411865234375, 3.61767578125, 3.823486328125, 4.029296875, 4.235107421875, 4.44091796875, 4.646728515625, 4.8525390625, 5.058349609375, 5.26416015625, 5.469970703125, 5.67578125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 11.0, 14.0, 30.0, 64.0, 132.0, 211.0, 239.0, 143.0, 74.0, 30.0, 16.0, 18.0, 9.0, 8.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.56095886230469, -84.87007904052734, -81.17919921875, -77.48831939697266, -73.79743957519531, -70.10655975341797, -66.41567993164062, -62.724796295166016, -59.03391647338867, -55.34303665161133, -51.652156829833984, -47.961273193359375, -44.27039337158203, -40.57951354980469, -36.888633728027344, -33.19775390625, -29.506874084472656, -25.815994262695312, -22.12511444091797, -18.434232711791992, -14.743352890014648, -11.052473068237305, -7.361591339111328, -3.6707115173339844, 0.020168304443359375, 3.7110486030578613, 7.401928901672363, 11.092809677124023, 14.783689498901367, 18.47456932067871, 22.165451049804688, 25.85633087158203, 29.547210693359375, 33.23809051513672, 36.92897033691406, 40.619850158691406, 44.31072998046875, 48.001609802246094, 51.6924934387207, 55.38337326049805, 59.07425308227539, 62.765132904052734, 66.45601654052734, 70.14689636230469, 73.83777618408203, 77.52865600585938, 81.21953582763672, 84.91041564941406, 88.6012954711914, 92.29217529296875, 95.9830551147461, 99.67393493652344, 103.36481475830078, 107.05569458007812, 110.74658203125, 114.43745422363281, 118.12834167480469, 121.81922149658203, 125.51010131835938, 129.20098876953125, 132.89186096191406, 136.58274841308594, 140.27362060546875, 143.96450805664062, 147.65538024902344]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 2.0, 5.0, 9.0, 5.0, 13.0, 17.0, 18.0, 17.0, 26.0, 31.0, 28.0, 30.0, 27.0, 40.0, 48.0, 36.0, 45.0, 49.0, 51.0, 54.0, 62.0, 51.0, 42.0, 42.0, 37.0, 33.0, 28.0, 23.0, 15.0, 21.0, 21.0, 21.0, 11.0, 13.0, 4.0, 3.0, 9.0, 4.0, 5.0, 2.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-82.78804016113281, -80.41075134277344, -78.03346252441406, -75.65617370605469, -73.27888488769531, -70.90159606933594, -68.52430725097656, -66.14701843261719, -63.76972961425781, -61.39244079589844, -59.01515197753906, -56.63786315917969, -54.26057434082031, -51.88328552246094, -49.50599670410156, -47.12870788574219, -44.75141906738281, -42.37413024902344, -39.99684143066406, -37.61955261230469, -35.24226379394531, -32.86497497558594, -30.487686157226562, -28.110397338867188, -25.733108520507812, -23.355819702148438, -20.978530883789062, -18.601242065429688, -16.223953247070312, -13.846664428710938, -11.469375610351562, -9.092086791992188, -6.714805603027344, -4.337516784667969, -1.9602279663085938, 0.41706085205078125, 2.7943496704101562, 5.171638488769531, 7.548927307128906, 9.926216125488281, 12.303504943847656, 14.680793762207031, 17.058082580566406, 19.43537139892578, 21.812660217285156, 24.18994903564453, 26.567237854003906, 28.94452667236328, 31.321815490722656, 33.69910430908203, 36.076393127441406, 38.45368194580078, 40.830970764160156, 43.20825958251953, 45.585548400878906, 47.96283721923828, 50.340126037597656, 52.71741485595703, 55.094703674316406, 57.47199249267578, 59.849281311035156, 62.22657012939453, 64.6038589477539, 66.98114776611328, 69.35843658447266]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 8.0, 13.0, 17.0, 26.0, 33.0, 59.0, 70.0, 131.0, 184.0, 331.0, 535.0, 1026.0, 1973.0, 4596.0, 14555.0, 93138.0, 3992438.0, 65254.0, 12010.0, 3896.0, 1771.0, 902.0, 505.0, 298.0, 197.0, 106.0, 69.0, 45.0, 33.0, 20.0, 19.0, 10.0, 2.0, 7.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.56640625, -6.31793212890625, -6.0694580078125, -5.82098388671875, -5.572509765625, -5.32403564453125, -5.0755615234375, -4.82708740234375, -4.57861328125, -4.33013916015625, -4.0816650390625, -3.83319091796875, -3.584716796875, -3.33624267578125, -3.0877685546875, -2.83929443359375, -2.5908203125, -2.34234619140625, -2.0938720703125, -1.84539794921875, -1.596923828125, -1.34844970703125, -1.0999755859375, -0.85150146484375, -0.60302734375, -0.35455322265625, -0.1060791015625, 0.14239501953125, 0.390869140625, 0.63934326171875, 0.8878173828125, 1.13629150390625, 1.384765625, 1.63323974609375, 1.8817138671875, 2.13018798828125, 2.378662109375, 2.62713623046875, 2.8756103515625, 3.12408447265625, 3.37255859375, 3.62103271484375, 3.8695068359375, 4.11798095703125, 4.366455078125, 4.61492919921875, 4.8634033203125, 5.11187744140625, 5.3603515625, 5.60882568359375, 5.8572998046875, 6.10577392578125, 6.354248046875, 6.60272216796875, 6.8511962890625, 7.09967041015625, 7.34814453125, 7.59661865234375, 7.8450927734375, 8.09356689453125, 8.342041015625, 8.59051513671875, 8.8389892578125, 9.08746337890625, 9.3359375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 2.0, 7.0, 4.0, 6.0, 3.0, 9.0, 10.0, 9.0, 14.0, 21.0, 29.0, 24.0, 22.0, 42.0, 35.0, 41.0, 34.0, 44.0, 41.0, 51.0, 44.0, 45.0, 57.0, 49.0, 31.0, 57.0, 46.0, 31.0, 28.0, 35.0, 18.0, 19.0, 20.0, 15.0, 15.0, 8.0, 7.0, 9.0, 8.0, 3.0, 6.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.708984375, -3.60821533203125, -3.5074462890625, -3.40667724609375, -3.305908203125, -3.20513916015625, -3.1043701171875, -3.00360107421875, -2.90283203125, -2.80206298828125, -2.7012939453125, -2.60052490234375, -2.499755859375, -2.39898681640625, -2.2982177734375, -2.19744873046875, -2.0966796875, -1.99591064453125, -1.8951416015625, -1.79437255859375, -1.693603515625, -1.59283447265625, -1.4920654296875, -1.39129638671875, -1.29052734375, -1.18975830078125, -1.0889892578125, -0.98822021484375, -0.887451171875, -0.78668212890625, -0.6859130859375, -0.58514404296875, -0.484375, -0.38360595703125, -0.2828369140625, -0.18206787109375, -0.081298828125, 0.01947021484375, 0.1202392578125, 0.22100830078125, 0.32177734375, 0.42254638671875, 0.5233154296875, 0.62408447265625, 0.724853515625, 0.82562255859375, 0.9263916015625, 1.02716064453125, 1.1279296875, 1.22869873046875, 1.3294677734375, 1.43023681640625, 1.531005859375, 1.63177490234375, 1.7325439453125, 1.83331298828125, 1.93408203125, 2.03485107421875, 2.1356201171875, 2.23638916015625, 2.337158203125, 2.43792724609375, 2.5386962890625, 2.63946533203125, 2.740234375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 6.0, 6.0, 5.0, 13.0, 15.0, 27.0, 38.0, 44.0, 51.0, 70.0, 101.0, 154.0, 227.0, 349.0, 492.0, 805.0, 1376.0, 2769.0, 6123.0, 18437.0, 101080.0, 3875148.0, 149781.0, 22659.0, 7221.0, 3093.0, 1556.0, 901.0, 549.0, 367.0, 236.0, 178.0, 111.0, 87.0, 47.0, 56.0, 32.0, 24.0, 16.0, 10.0, 11.0, 8.0, 3.0, 6.0, 3.0, 1.0, 1.0, 2.0], "bins": [-8.921875, -8.6844482421875, -8.447021484375, -8.2095947265625, -7.97216796875, -7.7347412109375, -7.497314453125, -7.2598876953125, -7.0224609375, -6.7850341796875, -6.547607421875, -6.3101806640625, -6.07275390625, -5.8353271484375, -5.597900390625, -5.3604736328125, -5.123046875, -4.8856201171875, -4.648193359375, -4.4107666015625, -4.17333984375, -3.9359130859375, -3.698486328125, -3.4610595703125, -3.2236328125, -2.9862060546875, -2.748779296875, -2.5113525390625, -2.27392578125, -2.0364990234375, -1.799072265625, -1.5616455078125, -1.32421875, -1.0867919921875, -0.849365234375, -0.6119384765625, -0.37451171875, -0.1370849609375, 0.100341796875, 0.3377685546875, 0.5751953125, 0.8126220703125, 1.050048828125, 1.2874755859375, 1.52490234375, 1.7623291015625, 1.999755859375, 2.2371826171875, 2.474609375, 2.7120361328125, 2.949462890625, 3.1868896484375, 3.42431640625, 3.6617431640625, 3.899169921875, 4.1365966796875, 4.3740234375, 4.6114501953125, 4.848876953125, 5.0863037109375, 5.32373046875, 5.5611572265625, 5.798583984375, 6.0360107421875, 6.2734375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 4.0, 2.0, 7.0, 3.0, 6.0, 8.0, 24.0, 36.0, 75.0, 158.0, 856.0, 2534.0, 172.0, 83.0, 44.0, 16.0, 13.0, 11.0, 6.0, 4.0, 1.0, 3.0, 2.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.462890625, -2.396453857421875, -2.33001708984375, -2.263580322265625, -2.1971435546875, -2.130706787109375, -2.06427001953125, -1.997833251953125, -1.931396484375, -1.864959716796875, -1.79852294921875, -1.732086181640625, -1.6656494140625, -1.599212646484375, -1.53277587890625, -1.466339111328125, -1.39990234375, -1.333465576171875, -1.26702880859375, -1.200592041015625, -1.1341552734375, -1.067718505859375, -1.00128173828125, -0.934844970703125, -0.868408203125, -0.801971435546875, -0.73553466796875, -0.669097900390625, -0.6026611328125, -0.536224365234375, -0.46978759765625, -0.403350830078125, -0.3369140625, -0.270477294921875, -0.20404052734375, -0.137603759765625, -0.0711669921875, -0.004730224609375, 0.06170654296875, 0.128143310546875, 0.194580078125, 0.261016845703125, 0.32745361328125, 0.393890380859375, 0.4603271484375, 0.526763916015625, 0.59320068359375, 0.659637451171875, 0.72607421875, 0.792510986328125, 0.85894775390625, 0.925384521484375, 0.9918212890625, 1.058258056640625, 1.12469482421875, 1.191131591796875, 1.257568359375, 1.324005126953125, 1.39044189453125, 1.456878662109375, 1.5233154296875, 1.589752197265625, 1.65618896484375, 1.722625732421875, 1.7890625]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 8.0, 7.0, 16.0, 21.0, 30.0, 47.0, 61.0, 92.0, 110.0, 110.0, 85.0, 111.0, 87.0, 65.0, 42.0, 41.0, 23.0, 13.0, 6.0, 6.0, 3.0, 4.0, 1.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.9436798095703125, -6.709510803222656, -6.475341320037842, -6.2411723136901855, -6.007002830505371, -5.772833824157715, -5.538664817810059, -5.304495334625244, -5.070326328277588, -4.836157321929932, -4.601987838745117, -4.367818832397461, -4.1336493492126465, -3.8994803428649902, -3.665311098098755, -3.4311418533325195, -3.196972608566284, -2.962803363800049, -2.7286341190338135, -2.494464874267578, -2.260295867919922, -2.0261266231536865, -1.7919573783874512, -1.5577882528305054, -1.32361900806427, -1.0894497632980347, -0.8552806377410889, -0.6211113929748535, -0.38694220781326294, -0.15277302265167236, 0.08139622211456299, 0.3155653476715088, 0.5497345924377441, 0.7839037775993347, 1.0180729627609253, 1.2522422075271606, 1.4864113330841064, 1.7205805778503418, 1.9547498226165771, 2.1889190673828125, 2.4230880737304688, 2.657257318496704, 2.8914265632629395, 3.1255955696105957, 3.359764814376831, 3.5939340591430664, 3.8281033039093018, 4.062272548675537, 4.296442031860352, 4.530611038208008, 4.764780521392822, 4.9989495277404785, 5.233119010925293, 5.467288017272949, 5.7014570236206055, 5.93562650680542, 6.169795513153076, 6.403964519500732, 6.638134002685547, 6.872303009033203, 7.106472492218018, 7.340641498565674, 7.574810981750488, 7.8089799880981445, 8.0431489944458]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 8.0, 7.0, 3.0, 11.0, 7.0, 10.0, 14.0, 18.0, 21.0, 27.0, 23.0, 16.0, 36.0, 31.0, 38.0, 38.0, 43.0, 48.0, 41.0, 56.0, 38.0, 48.0, 47.0, 35.0, 47.0, 26.0, 39.0, 40.0, 24.0, 25.0, 22.0, 15.0, 21.0, 11.0, 16.0, 9.0, 7.0, 11.0, 5.0, 7.0, 4.0, 2.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8736374378204346, -3.743974208831787, -3.6143109798431396, -3.484647750854492, -3.3549842834472656, -3.2253212928771973, -3.0956578254699707, -2.9659945964813232, -2.836331367492676, -2.7066681385040283, -2.577004909515381, -2.4473416805267334, -2.317678451538086, -2.1880149841308594, -2.058351755142212, -1.9286885261535645, -1.799025297164917, -1.6693620681762695, -1.539698839187622, -1.410035490989685, -1.2803722620010376, -1.1507090330123901, -1.0210456848144531, -0.8913824558258057, -0.7617192268371582, -0.6320559978485107, -0.5023927092552185, -0.37272945046424866, -0.2430661916732788, -0.11340296268463135, 0.01626032590866089, 0.14592361450195312, 0.2755866050720215, 0.40524986386299133, 0.5349131226539612, 0.6645764112472534, 0.7942396402359009, 0.9239028692245483, 1.0535662174224854, 1.1832294464111328, 1.3128926753997803, 1.4425559043884277, 1.5722191333770752, 1.7018824815750122, 1.8315457105636597, 1.9612089395523071, 2.090872287750244, 2.2205355167388916, 2.350198745727539, 2.4798619747161865, 2.609525203704834, 2.7391884326934814, 2.868851661682129, 2.9985151290893555, 3.128178358078003, 3.2578415870666504, 3.387504816055298, 3.5171680450439453, 3.6468312740325928, 3.7764945030212402, 3.906157970428467, 4.035820960998535, 4.165484428405762, 4.295147895812988, 4.424810886383057]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 8.0, 7.0, 7.0, 8.0, 15.0, 22.0, 26.0, 31.0, 48.0, 73.0, 116.0, 162.0, 251.0, 365.0, 596.0, 968.0, 1650.0, 2956.0, 5666.0, 10903.0, 22284.0, 47528.0, 104965.0, 219127.0, 289837.0, 181455.0, 83511.0, 38117.0, 17942.0, 8953.0, 4628.0, 2511.0, 1467.0, 820.0, 498.0, 340.0, 234.0, 137.0, 100.0, 63.0, 55.0, 38.0, 19.0, 18.0, 8.0, 12.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0], "bins": [-4.15625, -4.031646728515625, -3.90704345703125, -3.782440185546875, -3.6578369140625, -3.533233642578125, -3.40863037109375, -3.284027099609375, -3.159423828125, -3.034820556640625, -2.91021728515625, -2.785614013671875, -2.6610107421875, -2.536407470703125, -2.41180419921875, -2.287200927734375, -2.16259765625, -2.037994384765625, -1.91339111328125, -1.788787841796875, -1.6641845703125, -1.539581298828125, -1.41497802734375, -1.290374755859375, -1.165771484375, -1.041168212890625, -0.91656494140625, -0.791961669921875, -0.6673583984375, -0.542755126953125, -0.41815185546875, -0.293548583984375, -0.1689453125, -0.044342041015625, 0.08026123046875, 0.204864501953125, 0.3294677734375, 0.454071044921875, 0.57867431640625, 0.703277587890625, 0.827880859375, 0.952484130859375, 1.07708740234375, 1.201690673828125, 1.3262939453125, 1.450897216796875, 1.57550048828125, 1.700103759765625, 1.82470703125, 1.949310302734375, 2.07391357421875, 2.198516845703125, 2.3231201171875, 2.447723388671875, 2.57232666015625, 2.696929931640625, 2.821533203125, 2.946136474609375, 3.07073974609375, 3.195343017578125, 3.3199462890625, 3.444549560546875, 3.56915283203125, 3.693756103515625, 3.818359375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 10.0, 6.0, 8.0, 7.0, 10.0, 12.0, 12.0, 17.0, 25.0, 16.0, 25.0, 37.0, 30.0, 34.0, 33.0, 38.0, 32.0, 41.0, 39.0, 42.0, 39.0, 51.0, 39.0, 36.0, 49.0, 40.0, 34.0, 36.0, 28.0, 23.0, 19.0, 23.0, 19.0, 15.0, 13.0, 16.0, 7.0, 10.0, 5.0, 7.0, 4.0, 2.0, 3.0, 2.0, 0.0, 5.0, 0.0, 0.0, 3.0, 1.0], "bins": [-3.173828125, -3.0811767578125, -2.988525390625, -2.8958740234375, -2.80322265625, -2.7105712890625, -2.617919921875, -2.5252685546875, -2.4326171875, -2.3399658203125, -2.247314453125, -2.1546630859375, -2.06201171875, -1.9693603515625, -1.876708984375, -1.7840576171875, -1.69140625, -1.5987548828125, -1.506103515625, -1.4134521484375, -1.32080078125, -1.2281494140625, -1.135498046875, -1.0428466796875, -0.9501953125, -0.8575439453125, -0.764892578125, -0.6722412109375, -0.57958984375, -0.4869384765625, -0.394287109375, -0.3016357421875, -0.208984375, -0.1163330078125, -0.023681640625, 0.0689697265625, 0.16162109375, 0.2542724609375, 0.346923828125, 0.4395751953125, 0.5322265625, 0.6248779296875, 0.717529296875, 0.8101806640625, 0.90283203125, 0.9954833984375, 1.088134765625, 1.1807861328125, 1.2734375, 1.3660888671875, 1.458740234375, 1.5513916015625, 1.64404296875, 1.7366943359375, 1.829345703125, 1.9219970703125, 2.0146484375, 2.1072998046875, 2.199951171875, 2.2926025390625, 2.38525390625, 2.4779052734375, 2.570556640625, 2.6632080078125, 2.755859375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 8.0, 8.0, 16.0, 13.0, 35.0, 53.0, 78.0, 83.0, 139.0, 249.0, 344.0, 764.0, 1578.0, 4092.0, 14826.0, 84589.0, 609362.0, 282312.0, 36770.0, 7973.0, 2689.0, 1125.0, 555.0, 337.0, 187.0, 115.0, 72.0, 45.0, 51.0, 19.0, 24.0, 15.0, 9.0, 8.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-10.9140625, -10.6173095703125, -10.320556640625, -10.0238037109375, -9.72705078125, -9.4302978515625, -9.133544921875, -8.8367919921875, -8.5400390625, -8.2432861328125, -7.946533203125, -7.6497802734375, -7.35302734375, -7.0562744140625, -6.759521484375, -6.4627685546875, -6.166015625, -5.8692626953125, -5.572509765625, -5.2757568359375, -4.97900390625, -4.6822509765625, -4.385498046875, -4.0887451171875, -3.7919921875, -3.4952392578125, -3.198486328125, -2.9017333984375, -2.60498046875, -2.3082275390625, -2.011474609375, -1.7147216796875, -1.41796875, -1.1212158203125, -0.824462890625, -0.5277099609375, -0.23095703125, 0.0657958984375, 0.362548828125, 0.6593017578125, 0.9560546875, 1.2528076171875, 1.549560546875, 1.8463134765625, 2.14306640625, 2.4398193359375, 2.736572265625, 3.0333251953125, 3.330078125, 3.6268310546875, 3.923583984375, 4.2203369140625, 4.51708984375, 4.8138427734375, 5.110595703125, 5.4073486328125, 5.7041015625, 6.0008544921875, 6.297607421875, 6.5943603515625, 6.89111328125, 7.1878662109375, 7.484619140625, 7.7813720703125, 8.078125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 4.0, 1.0, 8.0, 9.0, 6.0, 6.0, 13.0, 13.0, 12.0, 14.0, 18.0, 20.0, 29.0, 35.0, 35.0, 38.0, 45.0, 42.0, 33.0, 46.0, 56.0, 46.0, 47.0, 46.0, 45.0, 46.0, 46.0, 34.0, 22.0, 30.0, 20.0, 26.0, 9.0, 13.0, 16.0, 18.0, 15.0, 14.0, 9.0, 2.0, 4.0, 6.0, 1.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.234375, -14.7626953125, -14.291015625, -13.8193359375, -13.34765625, -12.8759765625, -12.404296875, -11.9326171875, -11.4609375, -10.9892578125, -10.517578125, -10.0458984375, -9.57421875, -9.1025390625, -8.630859375, -8.1591796875, -7.6875, -7.2158203125, -6.744140625, -6.2724609375, -5.80078125, -5.3291015625, -4.857421875, -4.3857421875, -3.9140625, -3.4423828125, -2.970703125, -2.4990234375, -2.02734375, -1.5556640625, -1.083984375, -0.6123046875, -0.140625, 0.3310546875, 0.802734375, 1.2744140625, 1.74609375, 2.2177734375, 2.689453125, 3.1611328125, 3.6328125, 4.1044921875, 4.576171875, 5.0478515625, 5.51953125, 5.9912109375, 6.462890625, 6.9345703125, 7.40625, 7.8779296875, 8.349609375, 8.8212890625, 9.29296875, 9.7646484375, 10.236328125, 10.7080078125, 11.1796875, 11.6513671875, 12.123046875, 12.5947265625, 13.06640625, 13.5380859375, 14.009765625, 14.4814453125, 14.953125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 4.0, 3.0, 12.0, 14.0, 15.0, 21.0, 28.0, 58.0, 94.0, 160.0, 333.0, 752.0, 1860.0, 7104.0, 64304.0, 851936.0, 108545.0, 9433.0, 2211.0, 846.0, 351.0, 181.0, 113.0, 61.0, 40.0, 31.0, 16.0, 7.0, 10.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.27734375, -6.07208251953125, -5.8668212890625, -5.66156005859375, -5.456298828125, -5.25103759765625, -5.0457763671875, -4.84051513671875, -4.63525390625, -4.42999267578125, -4.2247314453125, -4.01947021484375, -3.814208984375, -3.60894775390625, -3.4036865234375, -3.19842529296875, -2.9931640625, -2.78790283203125, -2.5826416015625, -2.37738037109375, -2.172119140625, -1.96685791015625, -1.7615966796875, -1.55633544921875, -1.35107421875, -1.14581298828125, -0.9405517578125, -0.73529052734375, -0.530029296875, -0.32476806640625, -0.1195068359375, 0.08575439453125, 0.291015625, 0.49627685546875, 0.7015380859375, 0.90679931640625, 1.112060546875, 1.31732177734375, 1.5225830078125, 1.72784423828125, 1.93310546875, 2.13836669921875, 2.3436279296875, 2.54888916015625, 2.754150390625, 2.95941162109375, 3.1646728515625, 3.36993408203125, 3.5751953125, 3.78045654296875, 3.9857177734375, 4.19097900390625, 4.396240234375, 4.60150146484375, 4.8067626953125, 5.01202392578125, 5.21728515625, 5.42254638671875, 5.6278076171875, 5.83306884765625, 6.038330078125, 6.24359130859375, 6.4488525390625, 6.65411376953125, 6.859375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 11.0, 5.0, 13.0, 30.0, 49.0, 76.0, 81.0, 136.0, 165.0, 141.0, 88.0, 81.0, 45.0, 32.0, 14.0, 17.0, 7.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00072479248046875, -0.0006909668445587158, -0.0006571412086486816, -0.0006233155727386475, -0.0005894899368286133, -0.0005556643009185791, -0.0005218386650085449, -0.00048801302909851074, -0.00045418739318847656, -0.0004203617572784424, -0.0003865361213684082, -0.000352710485458374, -0.00031888484954833984, -0.00028505921363830566, -0.0002512335777282715, -0.0002174079418182373, -0.00018358230590820312, -0.00014975666999816895, -0.00011593103408813477, -8.210539817810059e-05, -4.8279762268066406e-05, -1.4454126358032227e-05, 1.9371509552001953e-05, 5.319714546203613e-05, 8.702278137207031e-05, 0.00012084841728210449, 0.00015467405319213867, 0.00018849968910217285, 0.00022232532501220703, 0.0002561509609222412, 0.0002899765968322754, 0.00032380223274230957, 0.00035762786865234375, 0.00039145350456237793, 0.0004252791404724121, 0.0004591047763824463, 0.0004929304122924805, 0.0005267560482025146, 0.0005605816841125488, 0.000594407320022583, 0.0006282329559326172, 0.0006620585918426514, 0.0006958842277526855, 0.0007297098636627197, 0.0007635354995727539, 0.0007973611354827881, 0.0008311867713928223, 0.0008650124073028564, 0.0008988380432128906, 0.0009326636791229248, 0.000966489315032959, 0.0010003149509429932, 0.0010341405868530273, 0.0010679662227630615, 0.0011017918586730957, 0.0011356174945831299, 0.001169443130493164, 0.0012032687664031982, 0.0012370944023132324, 0.0012709200382232666, 0.0013047456741333008, 0.001338571310043335, 0.0013723969459533691, 0.0014062225818634033, 0.0014400482177734375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 8.0, 12.0, 18.0, 18.0, 34.0, 48.0, 73.0, 109.0, 225.0, 449.0, 881.0, 2137.0, 6736.0, 34496.0, 371707.0, 568461.0, 49797.0, 8659.0, 2601.0, 1018.0, 471.0, 246.0, 137.0, 84.0, 43.0, 33.0, 20.0, 7.0, 7.0, 2.0, 4.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.25, -4.08709716796875, -3.9241943359375, -3.76129150390625, -3.598388671875, -3.43548583984375, -3.2725830078125, -3.10968017578125, -2.94677734375, -2.78387451171875, -2.6209716796875, -2.45806884765625, -2.295166015625, -2.13226318359375, -1.9693603515625, -1.80645751953125, -1.6435546875, -1.48065185546875, -1.3177490234375, -1.15484619140625, -0.991943359375, -0.82904052734375, -0.6661376953125, -0.50323486328125, -0.34033203125, -0.17742919921875, -0.0145263671875, 0.14837646484375, 0.311279296875, 0.47418212890625, 0.6370849609375, 0.79998779296875, 0.962890625, 1.12579345703125, 1.2886962890625, 1.45159912109375, 1.614501953125, 1.77740478515625, 1.9403076171875, 2.10321044921875, 2.26611328125, 2.42901611328125, 2.5919189453125, 2.75482177734375, 2.917724609375, 3.08062744140625, 3.2435302734375, 3.40643310546875, 3.5693359375, 3.73223876953125, 3.8951416015625, 4.05804443359375, 4.220947265625, 4.38385009765625, 4.5467529296875, 4.70965576171875, 4.87255859375, 5.03546142578125, 5.1983642578125, 5.36126708984375, 5.524169921875, 5.68707275390625, 5.8499755859375, 6.01287841796875, 6.17578125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 5.0, 6.0, 12.0, 13.0, 12.0, 18.0, 30.0, 40.0, 47.0, 62.0, 93.0, 110.0, 106.0, 96.0, 95.0, 68.0, 50.0, 32.0, 28.0, 19.0, 15.0, 9.0, 10.0, 6.0, 4.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.75, -5.5833740234375, -5.416748046875, -5.2501220703125, -5.08349609375, -4.9168701171875, -4.750244140625, -4.5836181640625, -4.4169921875, -4.2503662109375, -4.083740234375, -3.9171142578125, -3.75048828125, -3.5838623046875, -3.417236328125, -3.2506103515625, -3.083984375, -2.9173583984375, -2.750732421875, -2.5841064453125, -2.41748046875, -2.2508544921875, -2.084228515625, -1.9176025390625, -1.7509765625, -1.5843505859375, -1.417724609375, -1.2510986328125, -1.08447265625, -0.9178466796875, -0.751220703125, -0.5845947265625, -0.41796875, -0.2513427734375, -0.084716796875, 0.0819091796875, 0.24853515625, 0.4151611328125, 0.581787109375, 0.7484130859375, 0.9150390625, 1.0816650390625, 1.248291015625, 1.4149169921875, 1.58154296875, 1.7481689453125, 1.914794921875, 2.0814208984375, 2.248046875, 2.4146728515625, 2.581298828125, 2.7479248046875, 2.91455078125, 3.0811767578125, 3.247802734375, 3.4144287109375, 3.5810546875, 3.7476806640625, 3.914306640625, 4.0809326171875, 4.24755859375, 4.4141845703125, 4.580810546875, 4.7474365234375, 4.9140625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 9.0, 11.0, 20.0, 19.0, 58.0, 108.0, 122.0, 168.0, 199.0, 112.0, 70.0, 47.0, 22.0, 13.0, 9.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-99.09539794921875, -96.62400817871094, -94.15262603759766, -91.68123626708984, -89.20984649658203, -86.73846435546875, -84.26707458496094, -81.79568481445312, -79.32430267333984, -76.85291290283203, -74.38153076171875, -71.91014099121094, -69.43875122070312, -66.96736907958984, -64.49597930908203, -62.024593353271484, -59.55320358276367, -57.081817626953125, -54.61042785644531, -52.139041900634766, -49.66765594482422, -47.196266174316406, -44.72488021850586, -42.25349426269531, -39.7821044921875, -37.31071853637695, -34.83932876586914, -32.367942810058594, -29.896556854248047, -27.425168991088867, -24.953781127929688, -22.48239517211914, -20.011009216308594, -17.539621353149414, -15.068235397338867, -12.596847534179688, -10.125460624694824, -7.654073715209961, -5.182685852050781, -2.7112998962402344, -0.2399120330810547, 2.2314751148223877, 4.70286226272583, 7.174249649047852, 9.645636558532715, 12.117023468017578, 14.588411331176758, 17.059797286987305, 19.531185150146484, 22.002573013305664, 24.47395896911621, 26.94534683227539, 29.416732788085938, 31.888120651245117, 34.3595085144043, 36.830894470214844, 39.302284240722656, 41.7736701965332, 44.245059967041016, 46.71644592285156, 49.18783187866211, 51.659217834472656, 54.13060760498047, 56.601993560791016, 59.07337951660156]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 6.0, 2.0, 5.0, 8.0, 8.0, 12.0, 10.0, 12.0, 18.0, 15.0, 20.0, 23.0, 31.0, 40.0, 43.0, 32.0, 34.0, 43.0, 48.0, 46.0, 63.0, 41.0, 54.0, 40.0, 40.0, 33.0, 39.0, 33.0, 27.0, 22.0, 35.0, 21.0, 18.0, 17.0, 14.0, 6.0, 10.0, 7.0, 9.0, 6.0, 6.0, 1.0, 3.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-65.31007385253906, -63.313865661621094, -61.31765365600586, -59.32144546508789, -57.32523727416992, -55.32902526855469, -53.33281707763672, -51.33660888671875, -49.34040069580078, -47.34419250488281, -45.34798049926758, -43.35177230834961, -41.35556411743164, -39.359352111816406, -37.36314392089844, -35.36693572998047, -33.370723724365234, -31.374513626098633, -29.378305435180664, -27.382095336914062, -25.385887145996094, -23.389677047729492, -21.39346694946289, -19.397258758544922, -17.40104866027832, -15.404839515686035, -13.40863037109375, -11.412420272827148, -9.416211128234863, -7.420001983642578, -5.423791885375977, -3.4275827407836914, -1.4313735961914062, 0.564835786819458, 2.5610451698303223, 4.557254791259766, 6.553463935852051, 8.549673080444336, 10.545883178710938, 12.542092323303223, 14.538301467895508, 16.53451156616211, 18.530719757080078, 20.52692985534668, 22.52313995361328, 24.51934814453125, 26.51555824279785, 28.511768341064453, 30.507976531982422, 32.50418472290039, 34.500396728515625, 36.496604919433594, 38.49281311035156, 40.48902130126953, 42.485233306884766, 44.481441497802734, 46.47765350341797, 48.47386169433594, 50.47007369995117, 52.46628189086914, 54.46249008178711, 56.458702087402344, 58.45491027832031, 60.45111846923828, 62.44732666015625]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 7.0, 7.0, 24.0, 29.0, 39.0, 65.0, 95.0, 211.0, 349.0, 701.0, 1645.0, 4105.0, 13059.0, 68639.0, 3906199.0, 168472.0, 20804.0, 5930.0, 2116.0, 893.0, 395.0, 224.0, 122.0, 57.0, 47.0, 24.0, 9.0, 4.0, 1.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.953125, -9.666015625, -9.37890625, -9.091796875, -8.8046875, -8.517578125, -8.23046875, -7.943359375, -7.65625, -7.369140625, -7.08203125, -6.794921875, -6.5078125, -6.220703125, -5.93359375, -5.646484375, -5.359375, -5.072265625, -4.78515625, -4.498046875, -4.2109375, -3.923828125, -3.63671875, -3.349609375, -3.0625, -2.775390625, -2.48828125, -2.201171875, -1.9140625, -1.626953125, -1.33984375, -1.052734375, -0.765625, -0.478515625, -0.19140625, 0.095703125, 0.3828125, 0.669921875, 0.95703125, 1.244140625, 1.53125, 1.818359375, 2.10546875, 2.392578125, 2.6796875, 2.966796875, 3.25390625, 3.541015625, 3.828125, 4.115234375, 4.40234375, 4.689453125, 4.9765625, 5.263671875, 5.55078125, 5.837890625, 6.125, 6.412109375, 6.69921875, 6.986328125, 7.2734375, 7.560546875, 7.84765625, 8.134765625, 8.421875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 5.0, 3.0, 7.0, 13.0, 6.0, 18.0, 25.0, 28.0, 47.0, 67.0, 81.0, 78.0, 75.0, 103.0, 89.0, 83.0, 62.0, 55.0, 45.0, 44.0, 19.0, 20.0, 12.0, 12.0, 10.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.046875, -7.861358642578125, -7.67584228515625, -7.490325927734375, -7.3048095703125, -7.119293212890625, -6.93377685546875, -6.748260498046875, -6.562744140625, -6.377227783203125, -6.19171142578125, -6.006195068359375, -5.8206787109375, -5.635162353515625, -5.44964599609375, -5.264129638671875, -5.07861328125, -4.893096923828125, -4.70758056640625, -4.522064208984375, -4.3365478515625, -4.151031494140625, -3.96551513671875, -3.779998779296875, -3.594482421875, -3.408966064453125, -3.22344970703125, -3.037933349609375, -2.8524169921875, -2.666900634765625, -2.48138427734375, -2.295867919921875, -2.1103515625, -1.924835205078125, -1.73931884765625, -1.553802490234375, -1.3682861328125, -1.182769775390625, -0.99725341796875, -0.811737060546875, -0.626220703125, -0.440704345703125, -0.25518798828125, -0.069671630859375, 0.1158447265625, 0.301361083984375, 0.48687744140625, 0.672393798828125, 0.85791015625, 1.043426513671875, 1.22894287109375, 1.414459228515625, 1.5999755859375, 1.785491943359375, 1.97100830078125, 2.156524658203125, 2.342041015625, 2.527557373046875, 2.71307373046875, 2.898590087890625, 3.0841064453125, 3.269622802734375, 3.45513916015625, 3.640655517578125, 3.826171875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 12.0, 7.0, 14.0, 20.0, 20.0, 46.0, 59.0, 52.0, 98.0, 134.0, 231.0, 308.0, 506.0, 995.0, 2025.0, 6090.0, 25508.0, 343521.0, 3740699.0, 57346.0, 10194.0, 3166.0, 1361.0, 658.0, 401.0, 247.0, 168.0, 97.0, 63.0, 56.0, 45.0, 34.0, 30.0, 16.0, 15.0, 16.0, 7.0, 5.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.734375, -10.390380859375, -10.04638671875, -9.702392578125, -9.3583984375, -9.014404296875, -8.67041015625, -8.326416015625, -7.982421875, -7.638427734375, -7.29443359375, -6.950439453125, -6.6064453125, -6.262451171875, -5.91845703125, -5.574462890625, -5.23046875, -4.886474609375, -4.54248046875, -4.198486328125, -3.8544921875, -3.510498046875, -3.16650390625, -2.822509765625, -2.478515625, -2.134521484375, -1.79052734375, -1.446533203125, -1.1025390625, -0.758544921875, -0.41455078125, -0.070556640625, 0.2734375, 0.617431640625, 0.96142578125, 1.305419921875, 1.6494140625, 1.993408203125, 2.33740234375, 2.681396484375, 3.025390625, 3.369384765625, 3.71337890625, 4.057373046875, 4.4013671875, 4.745361328125, 5.08935546875, 5.433349609375, 5.77734375, 6.121337890625, 6.46533203125, 6.809326171875, 7.1533203125, 7.497314453125, 7.84130859375, 8.185302734375, 8.529296875, 8.873291015625, 9.21728515625, 9.561279296875, 9.9052734375, 10.249267578125, 10.59326171875, 10.937255859375, 11.28125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 18.0, 15.0, 24.0, 63.0, 217.0, 2948.0, 576.0, 129.0, 45.0, 18.0, 6.0, 7.0, 3.0, 6.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.65625, -6.397705078125, -6.13916015625, -5.880615234375, -5.6220703125, -5.363525390625, -5.10498046875, -4.846435546875, -4.587890625, -4.329345703125, -4.07080078125, -3.812255859375, -3.5537109375, -3.295166015625, -3.03662109375, -2.778076171875, -2.51953125, -2.260986328125, -2.00244140625, -1.743896484375, -1.4853515625, -1.226806640625, -0.96826171875, -0.709716796875, -0.451171875, -0.192626953125, 0.06591796875, 0.324462890625, 0.5830078125, 0.841552734375, 1.10009765625, 1.358642578125, 1.6171875, 1.875732421875, 2.13427734375, 2.392822265625, 2.6513671875, 2.909912109375, 3.16845703125, 3.427001953125, 3.685546875, 3.944091796875, 4.20263671875, 4.461181640625, 4.7197265625, 4.978271484375, 5.23681640625, 5.495361328125, 5.75390625, 6.012451171875, 6.27099609375, 6.529541015625, 6.7880859375, 7.046630859375, 7.30517578125, 7.563720703125, 7.822265625, 8.080810546875, 8.33935546875, 8.597900390625, 8.8564453125, 9.114990234375, 9.37353515625, 9.632080078125, 9.890625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 4.0, 1.0, 6.0, 6.0, 10.0, 18.0, 24.0, 40.0, 65.0, 105.0, 106.0, 124.0, 145.0, 136.0, 77.0, 52.0, 32.0, 22.0, 7.0, 6.0, 8.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-16.251514434814453, -15.594195365905762, -14.93687629699707, -14.279558181762695, -13.622239112854004, -12.964920043945312, -12.307600975036621, -11.65028190612793, -10.992963790893555, -10.335644721984863, -9.678325653076172, -9.021007537841797, -8.363688468933105, -7.706369400024414, -7.049050331115723, -6.3917317390441895, -5.73441219329834, -5.077093124389648, -4.419774532318115, -3.762455463409424, -3.1051366329193115, -2.447817802429199, -1.7904987335205078, -1.1331801414489746, -0.4758610725402832, 0.18145781755447388, 0.838776707649231, 1.4960956573486328, 2.153414487838745, 2.8107333183288574, 3.468052387237549, 4.125370979309082, 4.782690048217773, 5.440009117126465, 6.097327709197998, 6.7546467781066895, 7.411965370178223, 8.069284439086914, 8.726603507995605, 9.383922576904297, 10.041240692138672, 10.698559761047363, 11.355878829956055, 12.01319694519043, 12.670516014099121, 13.327835083007812, 13.985154151916504, 14.642473220825195, 15.299792289733887, 15.957111358642578, 16.614429473876953, 17.27174949645996, 17.929067611694336, 18.586387634277344, 19.24370574951172, 19.901023864746094, 20.5583438873291, 21.215662002563477, 21.872982025146484, 22.53030014038086, 23.187620162963867, 23.844938278198242, 24.50225830078125, 25.159576416015625, 25.81689453125]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 9.0, 8.0, 9.0, 24.0, 17.0, 18.0, 32.0, 28.0, 36.0, 51.0, 52.0, 39.0, 58.0, 63.0, 73.0, 67.0, 60.0, 63.0, 50.0, 57.0, 37.0, 27.0, 30.0, 25.0, 23.0, 12.0, 13.0, 9.0, 1.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.553426742553711, -13.98253345489502, -13.411641120910645, -12.840747833251953, -12.269855499267578, -11.698962211608887, -11.128068923950195, -10.55717658996582, -9.986283302307129, -9.415390014648438, -8.844497680664062, -8.273604393005371, -7.702711582183838, -7.131818771362305, -6.560925483703613, -5.99003267288208, -5.419139862060547, -4.848247051239014, -4.2773542404174805, -3.706460952758789, -3.135568141937256, -2.5646753311157227, -1.9937822818756104, -1.422889232635498, -0.8519964218139648, -0.2811034917831421, 0.28978943824768066, 0.8606823682785034, 1.4315752983093262, 2.0024681091308594, 2.5733611583709717, 3.144254207611084, 3.71514892578125, 4.286041736602783, 4.856934547424316, 5.427827835083008, 5.998720645904541, 6.569613456726074, 7.140506744384766, 7.711399555206299, 8.282292366027832, 8.853185653686523, 9.424077987670898, 9.99497127532959, 10.565864562988281, 11.136756896972656, 11.707650184631348, 12.278543472290039, 12.849435806274414, 13.420329093933105, 13.99122142791748, 14.562114715576172, 15.133007049560547, 15.703900337219238, 16.27479362487793, 16.845685958862305, 17.416580200195312, 17.987472534179688, 18.558366775512695, 19.12925910949707, 19.700151443481445, 20.271045684814453, 20.841938018798828, 21.412830352783203, 21.983722686767578]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 6.0, 10.0, 15.0, 20.0, 36.0, 43.0, 91.0, 136.0, 264.0, 536.0, 1154.0, 3247.0, 10789.0, 49441.0, 271069.0, 536361.0, 138474.0, 26368.0, 6600.0, 2066.0, 850.0, 425.0, 245.0, 107.0, 77.0, 46.0, 32.0, 14.0, 15.0, 4.0, 6.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.0859375, -6.826416015625, -6.56689453125, -6.307373046875, -6.0478515625, -5.788330078125, -5.52880859375, -5.269287109375, -5.009765625, -4.750244140625, -4.49072265625, -4.231201171875, -3.9716796875, -3.712158203125, -3.45263671875, -3.193115234375, -2.93359375, -2.674072265625, -2.41455078125, -2.155029296875, -1.8955078125, -1.635986328125, -1.37646484375, -1.116943359375, -0.857421875, -0.597900390625, -0.33837890625, -0.078857421875, 0.1806640625, 0.440185546875, 0.69970703125, 0.959228515625, 1.21875, 1.478271484375, 1.73779296875, 1.997314453125, 2.2568359375, 2.516357421875, 2.77587890625, 3.035400390625, 3.294921875, 3.554443359375, 3.81396484375, 4.073486328125, 4.3330078125, 4.592529296875, 4.85205078125, 5.111572265625, 5.37109375, 5.630615234375, 5.89013671875, 6.149658203125, 6.4091796875, 6.668701171875, 6.92822265625, 7.187744140625, 7.447265625, 7.706787109375, 7.96630859375, 8.225830078125, 8.4853515625, 8.744873046875, 9.00439453125, 9.263916015625, 9.5234375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 3.0, 6.0, 17.0, 27.0, 27.0, 36.0, 40.0, 66.0, 68.0, 63.0, 87.0, 86.0, 94.0, 77.0, 67.0, 59.0, 45.0, 44.0, 21.0, 24.0, 9.0, 17.0, 8.0, 11.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.0625, -6.87451171875, -6.6865234375, -6.49853515625, -6.310546875, -6.12255859375, -5.9345703125, -5.74658203125, -5.55859375, -5.37060546875, -5.1826171875, -4.99462890625, -4.806640625, -4.61865234375, -4.4306640625, -4.24267578125, -4.0546875, -3.86669921875, -3.6787109375, -3.49072265625, -3.302734375, -3.11474609375, -2.9267578125, -2.73876953125, -2.55078125, -2.36279296875, -2.1748046875, -1.98681640625, -1.798828125, -1.61083984375, -1.4228515625, -1.23486328125, -1.046875, -0.85888671875, -0.6708984375, -0.48291015625, -0.294921875, -0.10693359375, 0.0810546875, 0.26904296875, 0.45703125, 0.64501953125, 0.8330078125, 1.02099609375, 1.208984375, 1.39697265625, 1.5849609375, 1.77294921875, 1.9609375, 2.14892578125, 2.3369140625, 2.52490234375, 2.712890625, 2.90087890625, 3.0888671875, 3.27685546875, 3.46484375, 3.65283203125, 3.8408203125, 4.02880859375, 4.216796875, 4.40478515625, 4.5927734375, 4.78076171875, 4.96875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 8.0, 13.0, 12.0, 23.0, 19.0, 58.0, 76.0, 127.0, 202.0, 402.0, 804.0, 2079.0, 7730.0, 70663.0, 798547.0, 150931.0, 11998.0, 2749.0, 949.0, 491.0, 275.0, 154.0, 75.0, 47.0, 33.0, 20.0, 18.0, 15.0, 12.0, 7.0, 5.0, 4.0, 5.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.640625, -16.1983642578125, -15.756103515625, -15.3138427734375, -14.87158203125, -14.4293212890625, -13.987060546875, -13.5447998046875, -13.1025390625, -12.6602783203125, -12.218017578125, -11.7757568359375, -11.33349609375, -10.8912353515625, -10.448974609375, -10.0067138671875, -9.564453125, -9.1221923828125, -8.679931640625, -8.2376708984375, -7.79541015625, -7.3531494140625, -6.910888671875, -6.4686279296875, -6.0263671875, -5.5841064453125, -5.141845703125, -4.6995849609375, -4.25732421875, -3.8150634765625, -3.372802734375, -2.9305419921875, -2.48828125, -2.0460205078125, -1.603759765625, -1.1614990234375, -0.71923828125, -0.2769775390625, 0.165283203125, 0.6075439453125, 1.0498046875, 1.4920654296875, 1.934326171875, 2.3765869140625, 2.81884765625, 3.2611083984375, 3.703369140625, 4.1456298828125, 4.587890625, 5.0301513671875, 5.472412109375, 5.9146728515625, 6.35693359375, 6.7991943359375, 7.241455078125, 7.6837158203125, 8.1259765625, 8.5682373046875, 9.010498046875, 9.4527587890625, 9.89501953125, 10.3372802734375, 10.779541015625, 11.2218017578125, 11.6640625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 1.0, 5.0, 6.0, 9.0, 20.0, 14.0, 20.0, 30.0, 34.0, 32.0, 44.0, 47.0, 48.0, 70.0, 58.0, 59.0, 67.0, 51.0, 63.0, 52.0, 46.0, 42.0, 30.0, 31.0, 21.0, 22.0, 22.0, 13.0, 12.0, 8.0, 8.0, 7.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.390625, -18.783203125, -18.17578125, -17.568359375, -16.9609375, -16.353515625, -15.74609375, -15.138671875, -14.53125, -13.923828125, -13.31640625, -12.708984375, -12.1015625, -11.494140625, -10.88671875, -10.279296875, -9.671875, -9.064453125, -8.45703125, -7.849609375, -7.2421875, -6.634765625, -6.02734375, -5.419921875, -4.8125, -4.205078125, -3.59765625, -2.990234375, -2.3828125, -1.775390625, -1.16796875, -0.560546875, 0.046875, 0.654296875, 1.26171875, 1.869140625, 2.4765625, 3.083984375, 3.69140625, 4.298828125, 4.90625, 5.513671875, 6.12109375, 6.728515625, 7.3359375, 7.943359375, 8.55078125, 9.158203125, 9.765625, 10.373046875, 10.98046875, 11.587890625, 12.1953125, 12.802734375, 13.41015625, 14.017578125, 14.625, 15.232421875, 15.83984375, 16.447265625, 17.0546875, 17.662109375, 18.26953125, 18.876953125, 19.484375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 0.0, 5.0, 10.0, 11.0, 10.0, 19.0, 23.0, 41.0, 86.0, 181.0, 426.0, 1185.0, 6110.0, 138020.0, 872239.0, 26263.0, 2679.0, 653.0, 288.0, 144.0, 66.0, 39.0, 25.0, 15.0, 4.0, 6.0, 7.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.9296875, -6.6929931640625, -6.456298828125, -6.2196044921875, -5.98291015625, -5.7462158203125, -5.509521484375, -5.2728271484375, -5.0361328125, -4.7994384765625, -4.562744140625, -4.3260498046875, -4.08935546875, -3.8526611328125, -3.615966796875, -3.3792724609375, -3.142578125, -2.9058837890625, -2.669189453125, -2.4324951171875, -2.19580078125, -1.9591064453125, -1.722412109375, -1.4857177734375, -1.2490234375, -1.0123291015625, -0.775634765625, -0.5389404296875, -0.30224609375, -0.0655517578125, 0.171142578125, 0.4078369140625, 0.64453125, 0.8812255859375, 1.117919921875, 1.3546142578125, 1.59130859375, 1.8280029296875, 2.064697265625, 2.3013916015625, 2.5380859375, 2.7747802734375, 3.011474609375, 3.2481689453125, 3.48486328125, 3.7215576171875, 3.958251953125, 4.1949462890625, 4.431640625, 4.6683349609375, 4.905029296875, 5.1417236328125, 5.37841796875, 5.6151123046875, 5.851806640625, 6.0885009765625, 6.3251953125, 6.5618896484375, 6.798583984375, 7.0352783203125, 7.27197265625, 7.5086669921875, 7.745361328125, 7.9820556640625, 8.21875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 2.0, 4.0, 9.0, 8.0, 12.0, 9.0, 11.0, 15.0, 18.0, 15.0, 28.0, 26.0, 40.0, 41.0, 64.0, 70.0, 129.0, 95.0, 93.0, 53.0, 40.0, 47.0, 33.0, 27.0, 23.0, 21.0, 12.0, 11.0, 14.0, 6.0, 4.0, 7.0, 4.0, 2.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006079673767089844, -0.0005870312452316284, -0.0005660951137542725, -0.0005451589822769165, -0.0005242228507995605, -0.0005032867193222046, -0.00048235058784484863, -0.0004614144563674927, -0.0004404783248901367, -0.00041954219341278076, -0.0003986060619354248, -0.00037766993045806885, -0.0003567337989807129, -0.00033579766750335693, -0.000314861536026001, -0.000293925404548645, -0.00027298927307128906, -0.0002520531415939331, -0.00023111701011657715, -0.0002101808786392212, -0.00018924474716186523, -0.00016830861568450928, -0.00014737248420715332, -0.00012643635272979736, -0.0001055002212524414, -8.456408977508545e-05, -6.362795829772949e-05, -4.2691826820373535e-05, -2.1755695343017578e-05, -8.195638656616211e-07, 2.0116567611694336e-05, 4.105269908905029e-05, 6.198883056640625e-05, 8.292496204376221e-05, 0.00010386109352111816, 0.00012479722499847412, 0.00014573335647583008, 0.00016666948795318604, 0.000187605619430542, 0.00020854175090789795, 0.0002294778823852539, 0.00025041401386260986, 0.0002713501453399658, 0.0002922862768173218, 0.00031322240829467773, 0.0003341585397720337, 0.00035509467124938965, 0.0003760308027267456, 0.00039696693420410156, 0.0004179030656814575, 0.0004388391971588135, 0.00045977532863616943, 0.0004807114601135254, 0.0005016475915908813, 0.0005225837230682373, 0.0005435198545455933, 0.0005644559860229492, 0.0005853921175003052, 0.0006063282489776611, 0.0006272643804550171, 0.000648200511932373, 0.000669136643409729, 0.000690072774887085, 0.0007110089063644409, 0.0007319450378417969]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 4.0, 8.0, 8.0, 12.0, 17.0, 31.0, 53.0, 105.0, 211.0, 477.0, 1113.0, 3396.0, 18832.0, 301730.0, 680317.0, 34584.0, 5018.0, 1506.0, 574.0, 257.0, 125.0, 67.0, 40.0, 21.0, 12.0, 8.0, 4.0, 9.0, 5.0, 2.0, 6.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.828125, -6.6337890625, -6.439453125, -6.2451171875, -6.05078125, -5.8564453125, -5.662109375, -5.4677734375, -5.2734375, -5.0791015625, -4.884765625, -4.6904296875, -4.49609375, -4.3017578125, -4.107421875, -3.9130859375, -3.71875, -3.5244140625, -3.330078125, -3.1357421875, -2.94140625, -2.7470703125, -2.552734375, -2.3583984375, -2.1640625, -1.9697265625, -1.775390625, -1.5810546875, -1.38671875, -1.1923828125, -0.998046875, -0.8037109375, -0.609375, -0.4150390625, -0.220703125, -0.0263671875, 0.16796875, 0.3623046875, 0.556640625, 0.7509765625, 0.9453125, 1.1396484375, 1.333984375, 1.5283203125, 1.72265625, 1.9169921875, 2.111328125, 2.3056640625, 2.5, 2.6943359375, 2.888671875, 3.0830078125, 3.27734375, 3.4716796875, 3.666015625, 3.8603515625, 4.0546875, 4.2490234375, 4.443359375, 4.6376953125, 4.83203125, 5.0263671875, 5.220703125, 5.4150390625, 5.609375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 5.0, 7.0, 8.0, 18.0, 16.0, 19.0, 36.0, 35.0, 49.0, 79.0, 95.0, 110.0, 103.0, 120.0, 72.0, 61.0, 52.0, 28.0, 29.0, 18.0, 17.0, 12.0, 2.0, 7.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.125, -5.96539306640625, -5.8057861328125, -5.64617919921875, -5.486572265625, -5.32696533203125, -5.1673583984375, -5.00775146484375, -4.84814453125, -4.68853759765625, -4.5289306640625, -4.36932373046875, -4.209716796875, -4.05010986328125, -3.8905029296875, -3.73089599609375, -3.5712890625, -3.41168212890625, -3.2520751953125, -3.09246826171875, -2.932861328125, -2.77325439453125, -2.6136474609375, -2.45404052734375, -2.29443359375, -2.13482666015625, -1.9752197265625, -1.81561279296875, -1.656005859375, -1.49639892578125, -1.3367919921875, -1.17718505859375, -1.017578125, -0.85797119140625, -0.6983642578125, -0.53875732421875, -0.379150390625, -0.21954345703125, -0.0599365234375, 0.09967041015625, 0.25927734375, 0.41888427734375, 0.5784912109375, 0.73809814453125, 0.897705078125, 1.05731201171875, 1.2169189453125, 1.37652587890625, 1.5361328125, 1.69573974609375, 1.8553466796875, 2.01495361328125, 2.174560546875, 2.33416748046875, 2.4937744140625, 2.65338134765625, 2.81298828125, 2.97259521484375, 3.1322021484375, 3.29180908203125, 3.451416015625, 3.61102294921875, 3.7706298828125, 3.93023681640625, 4.08984375]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 5.0, 5.0, 14.0, 25.0, 63.0, 140.0, 170.0, 202.0, 173.0, 90.0, 54.0, 22.0, 9.0, 4.0, 8.0, 8.0, 6.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-125.43487548828125, -122.29891204833984, -119.16295623779297, -116.02699279785156, -112.89102935791016, -109.75507354736328, -106.61911010742188, -103.483154296875, -100.3471908569336, -97.21122741699219, -94.07527160644531, -90.9393081665039, -87.8033447265625, -84.66738891601562, -81.53142547607422, -78.39546203613281, -75.25950622558594, -72.12354278564453, -68.98758697509766, -65.85162353515625, -62.71566390991211, -59.57970428466797, -56.44374084472656, -53.30778121948242, -50.17181396484375, -47.03585433959961, -43.8998908996582, -40.76393127441406, -37.62797164916992, -34.49201202392578, -31.356048583984375, -28.220088958740234, -25.084129333496094, -21.94816780090332, -18.81220817565918, -15.676246643066406, -12.54028606414795, -9.404325485229492, -6.268363952636719, -3.132404327392578, 0.0035572052001953125, 3.1395180225372314, 6.275478839874268, 9.411439895629883, 12.54740047454834, 15.683361053466797, 18.81932258605957, 21.95528221130371, 25.091243743896484, 28.227205276489258, 31.3631649017334, 34.49912643432617, 37.63508605957031, 40.77104949951172, 43.90700912475586, 47.04296875, 50.178932189941406, 53.31489181518555, 56.45085525512695, 59.586814880371094, 62.722774505615234, 65.85873413085938, 68.99469757080078, 72.13066101074219, 75.26661682128906]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 4.0, 11.0, 3.0, 3.0, 2.0, 7.0, 15.0, 18.0, 16.0, 26.0, 25.0, 23.0, 15.0, 19.0, 43.0, 37.0, 37.0, 35.0, 53.0, 53.0, 44.0, 46.0, 54.0, 52.0, 44.0, 36.0, 46.0, 35.0, 31.0, 29.0, 27.0, 20.0, 22.0, 15.0, 15.0, 8.0, 9.0, 6.0, 5.0, 3.0, 7.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-72.56350708007812, -70.47933197021484, -68.39515686035156, -66.31098937988281, -64.22681427001953, -62.14263916015625, -60.05846405029297, -57.97428894042969, -55.890113830566406, -53.805938720703125, -51.72176742553711, -49.63759231567383, -47.55341720581055, -45.46924591064453, -43.38507080078125, -41.30089569091797, -39.21672439575195, -37.13254928588867, -35.048377990722656, -32.964202880859375, -30.880027770996094, -28.795854568481445, -26.711681365966797, -24.627506256103516, -22.543333053588867, -20.45915985107422, -18.374984741210938, -16.29081153869629, -14.206637382507324, -12.12246322631836, -10.038290023803711, -7.954115867614746, -5.869945526123047, -3.785771608352661, -1.7015976905822754, 0.38257598876953125, 2.466750144958496, 4.550924301147461, 6.635097503662109, 8.719271659851074, 10.803445816040039, 12.887619972229004, 14.971794128417969, 17.055967330932617, 19.140140533447266, 21.224315643310547, 23.308488845825195, 25.392662048339844, 27.476837158203125, 29.561010360717773, 31.645185470581055, 33.7293586730957, 35.813533782958984, 37.897705078125, 39.98188018798828, 42.06605529785156, 44.150230407714844, 46.234405517578125, 48.31857681274414, 50.40275192260742, 52.4869270324707, 54.57109832763672, 56.6552734375, 58.73944854736328, 60.8236198425293]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 10.0, 11.0, 9.0, 20.0, 28.0, 33.0, 51.0, 79.0, 166.0, 257.0, 506.0, 935.0, 2124.0, 5446.0, 17966.0, 111379.0, 2667598.0, 1299682.0, 66438.0, 13622.0, 4473.0, 1729.0, 823.0, 379.0, 208.0, 112.0, 63.0, 52.0, 24.0, 10.0, 14.0, 8.0, 4.0, 7.0, 3.0, 1.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.72265625, -6.52423095703125, -6.3258056640625, -6.12738037109375, -5.928955078125, -5.73052978515625, -5.5321044921875, -5.33367919921875, -5.13525390625, -4.93682861328125, -4.7384033203125, -4.53997802734375, -4.341552734375, -4.14312744140625, -3.9447021484375, -3.74627685546875, -3.5478515625, -3.34942626953125, -3.1510009765625, -2.95257568359375, -2.754150390625, -2.55572509765625, -2.3572998046875, -2.15887451171875, -1.96044921875, -1.76202392578125, -1.5635986328125, -1.36517333984375, -1.166748046875, -0.96832275390625, -0.7698974609375, -0.57147216796875, -0.373046875, -0.17462158203125, 0.0238037109375, 0.22222900390625, 0.420654296875, 0.61907958984375, 0.8175048828125, 1.01593017578125, 1.21435546875, 1.41278076171875, 1.6112060546875, 1.80963134765625, 2.008056640625, 2.20648193359375, 2.4049072265625, 2.60333251953125, 2.8017578125, 3.00018310546875, 3.1986083984375, 3.39703369140625, 3.595458984375, 3.79388427734375, 3.9923095703125, 4.19073486328125, 4.38916015625, 4.58758544921875, 4.7860107421875, 4.98443603515625, 5.182861328125, 5.38128662109375, 5.5797119140625, 5.77813720703125, 5.9765625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 6.0, 8.0, 4.0, 7.0, 7.0, 11.0, 12.0, 23.0, 20.0, 33.0, 33.0, 41.0, 47.0, 57.0, 43.0, 50.0, 58.0, 60.0, 56.0, 61.0, 54.0, 46.0, 51.0, 29.0, 46.0, 25.0, 20.0, 24.0, 18.0, 17.0, 8.0, 8.0, 7.0, 5.0, 4.0, 6.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.796875, -3.676849365234375, -3.55682373046875, -3.436798095703125, -3.3167724609375, -3.196746826171875, -3.07672119140625, -2.956695556640625, -2.836669921875, -2.716644287109375, -2.59661865234375, -2.476593017578125, -2.3565673828125, -2.236541748046875, -2.11651611328125, -1.996490478515625, -1.87646484375, -1.756439208984375, -1.63641357421875, -1.516387939453125, -1.3963623046875, -1.276336669921875, -1.15631103515625, -1.036285400390625, -0.916259765625, -0.796234130859375, -0.67620849609375, -0.556182861328125, -0.4361572265625, -0.316131591796875, -0.19610595703125, -0.076080322265625, 0.0439453125, 0.163970947265625, 0.28399658203125, 0.404022216796875, 0.5240478515625, 0.644073486328125, 0.76409912109375, 0.884124755859375, 1.004150390625, 1.124176025390625, 1.24420166015625, 1.364227294921875, 1.4842529296875, 1.604278564453125, 1.72430419921875, 1.844329833984375, 1.96435546875, 2.084381103515625, 2.20440673828125, 2.324432373046875, 2.4444580078125, 2.564483642578125, 2.68450927734375, 2.804534912109375, 2.924560546875, 3.044586181640625, 3.16461181640625, 3.284637451171875, 3.4046630859375, 3.524688720703125, 3.64471435546875, 3.764739990234375, 3.884765625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 2.0, 4.0, 2.0, 8.0, 16.0, 27.0, 27.0, 41.0, 82.0, 106.0, 267.0, 625.0, 1626.0, 5389.0, 24889.0, 276876.0, 3706919.0, 153122.0, 17822.0, 4202.0, 1262.0, 488.0, 207.0, 111.0, 56.0, 30.0, 17.0, 14.0, 7.0, 16.0, 9.0, 5.0, 2.0, 5.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0546875, -7.7376708984375, -7.420654296875, -7.1036376953125, -6.78662109375, -6.4696044921875, -6.152587890625, -5.8355712890625, -5.5185546875, -5.2015380859375, -4.884521484375, -4.5675048828125, -4.25048828125, -3.9334716796875, -3.616455078125, -3.2994384765625, -2.982421875, -2.6654052734375, -2.348388671875, -2.0313720703125, -1.71435546875, -1.3973388671875, -1.080322265625, -0.7633056640625, -0.4462890625, -0.1292724609375, 0.187744140625, 0.5047607421875, 0.82177734375, 1.1387939453125, 1.455810546875, 1.7728271484375, 2.08984375, 2.4068603515625, 2.723876953125, 3.0408935546875, 3.35791015625, 3.6749267578125, 3.991943359375, 4.3089599609375, 4.6259765625, 4.9429931640625, 5.260009765625, 5.5770263671875, 5.89404296875, 6.2110595703125, 6.528076171875, 6.8450927734375, 7.162109375, 7.4791259765625, 7.796142578125, 8.1131591796875, 8.43017578125, 8.7471923828125, 9.064208984375, 9.3812255859375, 9.6982421875, 10.0152587890625, 10.332275390625, 10.6492919921875, 10.96630859375, 11.2833251953125, 11.600341796875, 11.9173583984375, 12.234375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 0.0, 4.0, 5.0, 6.0, 9.0, 11.0, 15.0, 19.0, 25.0, 37.0, 61.0, 90.0, 206.0, 474.0, 983.0, 1071.0, 506.0, 227.0, 131.0, 67.0, 38.0, 28.0, 11.0, 14.0, 11.0, 7.0, 3.0, 6.0, 2.0, 5.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.8359375, -9.5286865234375, -9.221435546875, -8.9141845703125, -8.60693359375, -8.2996826171875, -7.992431640625, -7.6851806640625, -7.3779296875, -7.0706787109375, -6.763427734375, -6.4561767578125, -6.14892578125, -5.8416748046875, -5.534423828125, -5.2271728515625, -4.919921875, -4.6126708984375, -4.305419921875, -3.9981689453125, -3.69091796875, -3.3836669921875, -3.076416015625, -2.7691650390625, -2.4619140625, -2.1546630859375, -1.847412109375, -1.5401611328125, -1.23291015625, -0.9256591796875, -0.618408203125, -0.3111572265625, -0.00390625, 0.3033447265625, 0.610595703125, 0.9178466796875, 1.22509765625, 1.5323486328125, 1.839599609375, 2.1468505859375, 2.4541015625, 2.7613525390625, 3.068603515625, 3.3758544921875, 3.68310546875, 3.9903564453125, 4.297607421875, 4.6048583984375, 4.912109375, 5.2193603515625, 5.526611328125, 5.8338623046875, 6.14111328125, 6.4483642578125, 6.755615234375, 7.0628662109375, 7.3701171875, 7.6773681640625, 7.984619140625, 8.2918701171875, 8.59912109375, 8.9063720703125, 9.213623046875, 9.5208740234375, 9.828125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 2.0, 11.0, 10.0, 16.0, 34.0, 59.0, 113.0, 167.0, 147.0, 163.0, 104.0, 64.0, 41.0, 22.0, 13.0, 10.0, 4.0, 1.0, 2.0, 1.0, 5.0, 0.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-51.25428009033203, -49.22071075439453, -47.18714141845703, -45.1535758972168, -43.1200065612793, -41.0864372253418, -39.05287170410156, -37.01930236816406, -34.98573303222656, -32.95216369628906, -30.918596267700195, -28.885028839111328, -26.851459503173828, -24.817890167236328, -22.78432273864746, -20.750755310058594, -18.717185974121094, -16.683616638183594, -14.650049209594727, -12.616480827331543, -10.58291244506836, -8.549344062805176, -6.515775680541992, -4.482207298278809, -2.448638916015625, -0.4150705337524414, 1.6184978485107422, 3.652066230773926, 5.685634613037109, 7.719202995300293, 9.752771377563477, 11.78633975982666, 13.819900512695312, 15.853468894958496, 17.88703727722168, 19.920604705810547, 21.954174041748047, 23.987743377685547, 26.021310806274414, 28.05487823486328, 30.08844757080078, 32.12201690673828, 34.15558624267578, 36.189151763916016, 38.222721099853516, 40.256290435791016, 42.28985595703125, 44.32342529296875, 46.35699462890625, 48.39056396484375, 50.42413330078125, 52.457698822021484, 54.491268157958984, 56.524837493896484, 58.55840301513672, 60.59197235107422, 62.62554168701172, 64.65911102294922, 66.69268035888672, 68.72624969482422, 70.75981140136719, 72.79338073730469, 74.82695007324219, 76.86051940917969, 78.89408874511719]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 5.0, 7.0, 9.0, 13.0, 16.0, 15.0, 25.0, 33.0, 32.0, 38.0, 44.0, 32.0, 51.0, 42.0, 59.0, 50.0, 65.0, 47.0, 44.0, 38.0, 47.0, 39.0, 42.0, 32.0, 26.0, 27.0, 24.0, 23.0, 19.0, 17.0, 8.0, 5.0, 9.0, 7.0, 4.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-46.69305419921875, -45.42817306518555, -44.16329574584961, -42.898414611816406, -41.63353729248047, -40.368656158447266, -39.10377502441406, -37.838897705078125, -36.57401657104492, -35.30913543701172, -34.04425811767578, -32.77937698364258, -31.514497756958008, -30.249618530273438, -28.984737396240234, -27.719858169555664, -26.454978942871094, -25.190099716186523, -23.925220489501953, -22.66033935546875, -21.39546012878418, -20.13058090209961, -18.865699768066406, -17.600820541381836, -16.335941314697266, -15.071062088012695, -13.806181907653809, -12.541301727294922, -11.276422500610352, -10.011543273925781, -8.746663093566895, -7.481782913208008, -6.216907501220703, -4.952027797698975, -3.687148094177246, -2.4222683906555176, -1.157388687133789, 0.10749101638793945, 1.372370719909668, 2.6372509002685547, 3.902130126953125, 5.1670098304748535, 6.431889533996582, 7.6967692375183105, 8.961648941040039, 10.22652816772461, 11.491408348083496, 12.756288528442383, 14.021167755126953, 15.286046981811523, 16.550926208496094, 17.815807342529297, 19.080686569213867, 20.345565795898438, 21.61044692993164, 22.87532615661621, 24.14020538330078, 25.40508460998535, 26.669963836669922, 27.934844970703125, 29.199724197387695, 30.464603424072266, 31.72948455810547, 32.994361877441406, 34.25924301147461]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 2.0, 2.0, 9.0, 4.0, 10.0, 15.0, 21.0, 34.0, 56.0, 84.0, 101.0, 164.0, 243.0, 354.0, 619.0, 915.0, 1577.0, 2604.0, 4471.0, 7903.0, 14019.0, 26372.0, 50693.0, 97250.0, 182971.0, 255718.0, 187599.0, 100678.0, 52316.0, 27921.0, 14454.0, 7969.0, 4525.0, 2621.0, 1565.0, 963.0, 620.0, 379.0, 238.0, 157.0, 112.0, 64.0, 50.0, 39.0, 28.0, 14.0, 17.0, 7.0, 4.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.62890625, -2.5367431640625, -2.444580078125, -2.3524169921875, -2.26025390625, -2.1680908203125, -2.075927734375, -1.9837646484375, -1.8916015625, -1.7994384765625, -1.707275390625, -1.6151123046875, -1.52294921875, -1.4307861328125, -1.338623046875, -1.2464599609375, -1.154296875, -1.0621337890625, -0.969970703125, -0.8778076171875, -0.78564453125, -0.6934814453125, -0.601318359375, -0.5091552734375, -0.4169921875, -0.3248291015625, -0.232666015625, -0.1405029296875, -0.04833984375, 0.0438232421875, 0.135986328125, 0.2281494140625, 0.3203125, 0.4124755859375, 0.504638671875, 0.5968017578125, 0.68896484375, 0.7811279296875, 0.873291015625, 0.9654541015625, 1.0576171875, 1.1497802734375, 1.241943359375, 1.3341064453125, 1.42626953125, 1.5184326171875, 1.610595703125, 1.7027587890625, 1.794921875, 1.8870849609375, 1.979248046875, 2.0714111328125, 2.16357421875, 2.2557373046875, 2.347900390625, 2.4400634765625, 2.5322265625, 2.6243896484375, 2.716552734375, 2.8087158203125, 2.90087890625, 2.9930419921875, 3.085205078125, 3.1773681640625, 3.26953125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 4.0, 5.0, 4.0, 14.0, 16.0, 7.0, 21.0, 16.0, 27.0, 25.0, 27.0, 43.0, 49.0, 41.0, 41.0, 43.0, 36.0, 64.0, 49.0, 51.0, 46.0, 47.0, 33.0, 38.0, 32.0, 36.0, 33.0, 29.0, 22.0, 22.0, 16.0, 13.0, 8.0, 15.0, 9.0, 6.0, 4.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 4.0], "bins": [-3.96875, -3.86480712890625, -3.7608642578125, -3.65692138671875, -3.552978515625, -3.44903564453125, -3.3450927734375, -3.24114990234375, -3.13720703125, -3.03326416015625, -2.9293212890625, -2.82537841796875, -2.721435546875, -2.61749267578125, -2.5135498046875, -2.40960693359375, -2.3056640625, -2.20172119140625, -2.0977783203125, -1.99383544921875, -1.889892578125, -1.78594970703125, -1.6820068359375, -1.57806396484375, -1.47412109375, -1.37017822265625, -1.2662353515625, -1.16229248046875, -1.058349609375, -0.95440673828125, -0.8504638671875, -0.74652099609375, -0.642578125, -0.53863525390625, -0.4346923828125, -0.33074951171875, -0.226806640625, -0.12286376953125, -0.0189208984375, 0.08502197265625, 0.18896484375, 0.29290771484375, 0.3968505859375, 0.50079345703125, 0.604736328125, 0.70867919921875, 0.8126220703125, 0.91656494140625, 1.0205078125, 1.12445068359375, 1.2283935546875, 1.33233642578125, 1.436279296875, 1.54022216796875, 1.6441650390625, 1.74810791015625, 1.85205078125, 1.95599365234375, 2.0599365234375, 2.16387939453125, 2.267822265625, 2.37176513671875, 2.4757080078125, 2.57965087890625, 2.68359375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 6.0, 6.0, 5.0, 5.0, 8.0, 11.0, 9.0, 11.0, 31.0, 33.0, 49.0, 56.0, 88.0, 158.0, 248.0, 429.0, 851.0, 1774.0, 4999.0, 28960.0, 463717.0, 507850.0, 30135.0, 5118.0, 1845.0, 856.0, 495.0, 283.0, 167.0, 120.0, 58.0, 51.0, 36.0, 29.0, 18.0, 12.0, 5.0, 7.0, 4.0, 3.0, 2.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.046875, -10.6524658203125, -10.258056640625, -9.8636474609375, -9.46923828125, -9.0748291015625, -8.680419921875, -8.2860107421875, -7.8916015625, -7.4971923828125, -7.102783203125, -6.7083740234375, -6.31396484375, -5.9195556640625, -5.525146484375, -5.1307373046875, -4.736328125, -4.3419189453125, -3.947509765625, -3.5531005859375, -3.15869140625, -2.7642822265625, -2.369873046875, -1.9754638671875, -1.5810546875, -1.1866455078125, -0.792236328125, -0.3978271484375, -0.00341796875, 0.3909912109375, 0.785400390625, 1.1798095703125, 1.57421875, 1.9686279296875, 2.363037109375, 2.7574462890625, 3.15185546875, 3.5462646484375, 3.940673828125, 4.3350830078125, 4.7294921875, 5.1239013671875, 5.518310546875, 5.9127197265625, 6.30712890625, 6.7015380859375, 7.095947265625, 7.4903564453125, 7.884765625, 8.2791748046875, 8.673583984375, 9.0679931640625, 9.46240234375, 9.8568115234375, 10.251220703125, 10.6456298828125, 11.0400390625, 11.4344482421875, 11.828857421875, 12.2232666015625, 12.61767578125, 13.0120849609375, 13.406494140625, 13.8009033203125, 14.1953125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 2.0, 1.0, 5.0, 5.0, 4.0, 9.0, 15.0, 7.0, 19.0, 14.0, 14.0, 23.0, 22.0, 35.0, 44.0, 28.0, 36.0, 52.0, 55.0, 54.0, 65.0, 51.0, 62.0, 35.0, 53.0, 52.0, 35.0, 30.0, 32.0, 32.0, 35.0, 17.0, 15.0, 12.0, 5.0, 7.0, 10.0, 3.0, 5.0, 8.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.2578125, -13.7596435546875, -13.261474609375, -12.7633056640625, -12.26513671875, -11.7669677734375, -11.268798828125, -10.7706298828125, -10.2724609375, -9.7742919921875, -9.276123046875, -8.7779541015625, -8.27978515625, -7.7816162109375, -7.283447265625, -6.7852783203125, -6.287109375, -5.7889404296875, -5.290771484375, -4.7926025390625, -4.29443359375, -3.7962646484375, -3.298095703125, -2.7999267578125, -2.3017578125, -1.8035888671875, -1.305419921875, -0.8072509765625, -0.30908203125, 0.1890869140625, 0.687255859375, 1.1854248046875, 1.68359375, 2.1817626953125, 2.679931640625, 3.1781005859375, 3.67626953125, 4.1744384765625, 4.672607421875, 5.1707763671875, 5.6689453125, 6.1671142578125, 6.665283203125, 7.1634521484375, 7.66162109375, 8.1597900390625, 8.657958984375, 9.1561279296875, 9.654296875, 10.1524658203125, 10.650634765625, 11.1488037109375, 11.64697265625, 12.1451416015625, 12.643310546875, 13.1414794921875, 13.6396484375, 14.1378173828125, 14.635986328125, 15.1341552734375, 15.63232421875, 16.1304931640625, 16.628662109375, 17.1268310546875, 17.625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 6.0, 5.0, 5.0, 7.0, 17.0, 25.0, 46.0, 58.0, 104.0, 179.0, 326.0, 714.0, 1950.0, 6777.0, 45098.0, 769729.0, 199910.0, 17728.0, 3600.0, 1198.0, 465.0, 262.0, 134.0, 68.0, 40.0, 33.0, 22.0, 14.0, 14.0, 7.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.13671875, -5.943603515625, -5.75048828125, -5.557373046875, -5.3642578125, -5.171142578125, -4.97802734375, -4.784912109375, -4.591796875, -4.398681640625, -4.20556640625, -4.012451171875, -3.8193359375, -3.626220703125, -3.43310546875, -3.239990234375, -3.046875, -2.853759765625, -2.66064453125, -2.467529296875, -2.2744140625, -2.081298828125, -1.88818359375, -1.695068359375, -1.501953125, -1.308837890625, -1.11572265625, -0.922607421875, -0.7294921875, -0.536376953125, -0.34326171875, -0.150146484375, 0.04296875, 0.236083984375, 0.42919921875, 0.622314453125, 0.8154296875, 1.008544921875, 1.20166015625, 1.394775390625, 1.587890625, 1.781005859375, 1.97412109375, 2.167236328125, 2.3603515625, 2.553466796875, 2.74658203125, 2.939697265625, 3.1328125, 3.325927734375, 3.51904296875, 3.712158203125, 3.9052734375, 4.098388671875, 4.29150390625, 4.484619140625, 4.677734375, 4.870849609375, 5.06396484375, 5.257080078125, 5.4501953125, 5.643310546875, 5.83642578125, 6.029541015625, 6.22265625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 7.0, 6.0, 10.0, 14.0, 12.0, 20.0, 22.0, 32.0, 39.0, 75.0, 114.0, 156.0, 145.0, 98.0, 60.0, 47.0, 40.0, 23.0, 11.0, 16.0, 7.0, 13.0, 12.0, 6.0, 4.0, 4.0, 0.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.0014009475708007812, -0.0013674795627593994, -0.0013340115547180176, -0.0013005435466766357, -0.001267075538635254, -0.001233607530593872, -0.0012001395225524902, -0.0011666715145111084, -0.0011332035064697266, -0.0010997354984283447, -0.0010662674903869629, -0.001032799482345581, -0.0009993314743041992, -0.0009658634662628174, -0.0009323954582214355, -0.0008989274501800537, -0.0008654594421386719, -0.00083199143409729, -0.0007985234260559082, -0.0007650554180145264, -0.0007315874099731445, -0.0006981194019317627, -0.0006646513938903809, -0.000631183385848999, -0.0005977153778076172, -0.0005642473697662354, -0.0005307793617248535, -0.0004973113536834717, -0.00046384334564208984, -0.000430375337600708, -0.00039690732955932617, -0.00036343932151794434, -0.0003299713134765625, -0.00029650330543518066, -0.00026303529739379883, -0.000229567289352417, -0.00019609928131103516, -0.00016263127326965332, -0.00012916326522827148, -9.569525718688965e-05, -6.222724914550781e-05, -2.8759241104125977e-05, 4.708766937255859e-06, 3.8176774978637695e-05, 7.164478302001953e-05, 0.00010511279106140137, 0.0001385807991027832, 0.00017204880714416504, 0.00020551681518554688, 0.0002389848232269287, 0.00027245283126831055, 0.0003059208393096924, 0.0003393888473510742, 0.00037285685539245605, 0.0004063248634338379, 0.0004397928714752197, 0.00047326087951660156, 0.0005067288875579834, 0.0005401968955993652, 0.0005736649036407471, 0.0006071329116821289, 0.0006406009197235107, 0.0006740689277648926, 0.0007075369358062744, 0.0007410049438476562]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 16.0, 11.0, 15.0, 25.0, 52.0, 59.0, 126.0, 208.0, 368.0, 674.0, 1399.0, 3474.0, 13306.0, 86020.0, 795038.0, 123156.0, 16882.0, 4505.0, 1558.0, 749.0, 361.0, 207.0, 148.0, 75.0, 43.0, 24.0, 20.0, 14.0, 5.0, 7.0, 4.0, 0.0, 2.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.625, -4.4288330078125, -4.232666015625, -4.0364990234375, -3.84033203125, -3.6441650390625, -3.447998046875, -3.2518310546875, -3.0556640625, -2.8594970703125, -2.663330078125, -2.4671630859375, -2.27099609375, -2.0748291015625, -1.878662109375, -1.6824951171875, -1.486328125, -1.2901611328125, -1.093994140625, -0.8978271484375, -0.70166015625, -0.5054931640625, -0.309326171875, -0.1131591796875, 0.0830078125, 0.2791748046875, 0.475341796875, 0.6715087890625, 0.86767578125, 1.0638427734375, 1.260009765625, 1.4561767578125, 1.65234375, 1.8485107421875, 2.044677734375, 2.2408447265625, 2.43701171875, 2.6331787109375, 2.829345703125, 3.0255126953125, 3.2216796875, 3.4178466796875, 3.614013671875, 3.8101806640625, 4.00634765625, 4.2025146484375, 4.398681640625, 4.5948486328125, 4.791015625, 4.9871826171875, 5.183349609375, 5.3795166015625, 5.57568359375, 5.7718505859375, 5.968017578125, 6.1641845703125, 6.3603515625, 6.5565185546875, 6.752685546875, 6.9488525390625, 7.14501953125, 7.3411865234375, 7.537353515625, 7.7335205078125, 7.9296875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 8.0, 5.0, 7.0, 9.0, 13.0, 18.0, 18.0, 20.0, 46.0, 59.0, 64.0, 84.0, 114.0, 132.0, 94.0, 78.0, 61.0, 53.0, 30.0, 29.0, 12.0, 15.0, 11.0, 5.0, 7.0, 7.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.90234375, -3.71917724609375, -3.5360107421875, -3.35284423828125, -3.169677734375, -2.98651123046875, -2.8033447265625, -2.62017822265625, -2.43701171875, -2.25384521484375, -2.0706787109375, -1.88751220703125, -1.704345703125, -1.52117919921875, -1.3380126953125, -1.15484619140625, -0.9716796875, -0.78851318359375, -0.6053466796875, -0.42218017578125, -0.239013671875, -0.05584716796875, 0.1273193359375, 0.31048583984375, 0.49365234375, 0.67681884765625, 0.8599853515625, 1.04315185546875, 1.226318359375, 1.40948486328125, 1.5926513671875, 1.77581787109375, 1.958984375, 2.14215087890625, 2.3253173828125, 2.50848388671875, 2.691650390625, 2.87481689453125, 3.0579833984375, 3.24114990234375, 3.42431640625, 3.60748291015625, 3.7906494140625, 3.97381591796875, 4.156982421875, 4.34014892578125, 4.5233154296875, 4.70648193359375, 4.8896484375, 5.07281494140625, 5.2559814453125, 5.43914794921875, 5.622314453125, 5.80548095703125, 5.9886474609375, 6.17181396484375, 6.35498046875, 6.53814697265625, 6.7213134765625, 6.90447998046875, 7.087646484375, 7.27081298828125, 7.4539794921875, 7.63714599609375, 7.8203125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 25.0, 66.0, 215.0, 371.0, 183.0, 71.0, 26.0, 17.0, 8.0, 4.0, 7.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-147.49900817871094, -143.09243774414062, -138.6858673095703, -134.279296875, -129.8727264404297, -125.46615600585938, -121.05958557128906, -116.65301513671875, -112.24644470214844, -107.83987426757812, -103.43330383300781, -99.0267333984375, -94.62016296386719, -90.21359252929688, -85.80702209472656, -81.40045166015625, -76.99388122558594, -72.58731079101562, -68.18074035644531, -63.774169921875, -59.36759948730469, -54.961029052734375, -50.55445861816406, -46.14788818359375, -41.74131774902344, -37.334747314453125, -32.92817687988281, -28.5216064453125, -24.115036010742188, -19.708465576171875, -15.301895141601562, -10.89532470703125, -6.48876953125, -2.0821990966796875, 2.324371337890625, 6.7309417724609375, 11.13751220703125, 15.544082641601562, 19.950653076171875, 24.357223510742188, 28.7637939453125, 33.17036437988281, 37.576934814453125, 41.98350524902344, 46.39007568359375, 50.79664611816406, 55.203216552734375, 59.60978698730469, 64.016357421875, 68.42292785644531, 72.82949829101562, 77.23606872558594, 81.64263916015625, 86.04920959472656, 90.45578002929688, 94.86235046386719, 99.2689208984375, 103.67549133300781, 108.08206176757812, 112.48863220214844, 116.89520263671875, 121.30177307128906, 125.70834350585938, 130.1149139404297, 134.521484375]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 5.0, 5.0, 2.0, 6.0, 7.0, 15.0, 23.0, 12.0, 14.0, 28.0, 25.0, 29.0, 30.0, 32.0, 33.0, 36.0, 51.0, 43.0, 64.0, 38.0, 63.0, 53.0, 45.0, 39.0, 48.0, 32.0, 30.0, 31.0, 17.0, 21.0, 21.0, 20.0, 10.0, 8.0, 10.0, 8.0, 10.0, 14.0, 7.0, 6.0, 4.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.07443618774414, -57.34138870239258, -55.608341217041016, -53.87529754638672, -52.142250061035156, -50.409202575683594, -48.67615509033203, -46.94310760498047, -45.210060119628906, -43.477012634277344, -41.74396514892578, -40.01091766357422, -38.27787399291992, -36.54482650756836, -34.8117790222168, -33.078731536865234, -31.345687866210938, -29.612640380859375, -27.879594802856445, -26.146547317504883, -24.413501739501953, -22.68045425415039, -20.947406768798828, -19.214359283447266, -17.481313705444336, -15.74826717376709, -14.015220642089844, -12.282173156738281, -10.549126625061035, -8.816080093383789, -7.083032608032227, -5.3499860763549805, -3.616943359375, -1.8838965892791748, -0.1508498191833496, 1.5821971893310547, 3.315243721008301, 5.048290252685547, 6.781337738037109, 8.514384269714355, 10.247430801391602, 11.980477333068848, 13.713523864746094, 15.446571350097656, 17.17961883544922, 18.91266441345215, 20.64571189880371, 22.37875747680664, 24.111804962158203, 25.844852447509766, 27.577898025512695, 29.310945510864258, 31.043991088867188, 32.77703857421875, 34.51008605957031, 36.243133544921875, 37.97618103027344, 39.709228515625, 41.44227600097656, 43.175323486328125, 44.90836715698242, 46.641414642333984, 48.37446212768555, 50.10750961303711, 51.840553283691406]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 4.0, 4.0, 14.0, 14.0, 22.0, 30.0, 50.0, 82.0, 137.0, 253.0, 1639.0, 1248495.0, 2941079.0, 1770.0, 317.0, 147.0, 81.0, 44.0, 39.0, 17.0, 14.0, 12.0, 5.0, 3.0, 4.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.890625, -22.972900390625, -22.05517578125, -21.137451171875, -20.2197265625, -19.302001953125, -18.38427734375, -17.466552734375, -16.548828125, -15.631103515625, -14.71337890625, -13.795654296875, -12.8779296875, -11.960205078125, -11.04248046875, -10.124755859375, -9.20703125, -8.289306640625, -7.37158203125, -6.453857421875, -5.5361328125, -4.618408203125, -3.70068359375, -2.782958984375, -1.865234375, -0.947509765625, -0.02978515625, 0.887939453125, 1.8056640625, 2.723388671875, 3.64111328125, 4.558837890625, 5.4765625, 6.394287109375, 7.31201171875, 8.229736328125, 9.1474609375, 10.065185546875, 10.98291015625, 11.900634765625, 12.818359375, 13.736083984375, 14.65380859375, 15.571533203125, 16.4892578125, 17.406982421875, 18.32470703125, 19.242431640625, 20.16015625, 21.077880859375, 21.99560546875, 22.913330078125, 23.8310546875, 24.748779296875, 25.66650390625, 26.584228515625, 27.501953125, 28.419677734375, 29.33740234375, 30.255126953125, 31.1728515625, 32.090576171875, 33.00830078125, 33.926025390625, 34.84375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 6.0, 5.0, 0.0, 1.0, 2.0, 8.0, 8.0, 6.0, 5.0, 16.0, 23.0, 25.0, 25.0, 42.0, 29.0, 29.0, 46.0, 46.0, 54.0, 57.0, 62.0, 53.0, 47.0, 59.0, 45.0, 44.0, 42.0, 52.0, 32.0, 29.0, 27.0, 20.0, 13.0, 21.0, 11.0, 9.0, 5.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.46875, -4.35498046875, -4.2412109375, -4.12744140625, -4.013671875, -3.89990234375, -3.7861328125, -3.67236328125, -3.55859375, -3.44482421875, -3.3310546875, -3.21728515625, -3.103515625, -2.98974609375, -2.8759765625, -2.76220703125, -2.6484375, -2.53466796875, -2.4208984375, -2.30712890625, -2.193359375, -2.07958984375, -1.9658203125, -1.85205078125, -1.73828125, -1.62451171875, -1.5107421875, -1.39697265625, -1.283203125, -1.16943359375, -1.0556640625, -0.94189453125, -0.828125, -0.71435546875, -0.6005859375, -0.48681640625, -0.373046875, -0.25927734375, -0.1455078125, -0.03173828125, 0.08203125, 0.19580078125, 0.3095703125, 0.42333984375, 0.537109375, 0.65087890625, 0.7646484375, 0.87841796875, 0.9921875, 1.10595703125, 1.2197265625, 1.33349609375, 1.447265625, 1.56103515625, 1.6748046875, 1.78857421875, 1.90234375, 2.01611328125, 2.1298828125, 2.24365234375, 2.357421875, 2.47119140625, 2.5849609375, 2.69873046875, 2.8125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 3.0, 9.0, 11.0, 15.0, 14.0, 42.0, 44.0, 81.0, 151.0, 222.0, 463.0, 878.0, 1666.0, 3966.0, 10174.0, 34389.0, 214353.0, 2951054.0, 873902.0, 74277.0, 17620.0, 5951.0, 2389.0, 1151.0, 622.0, 297.0, 188.0, 120.0, 89.0, 47.0, 28.0, 15.0, 16.0, 7.0, 7.0, 9.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.4765625, -5.2791748046875, -5.081787109375, -4.8843994140625, -4.68701171875, -4.4896240234375, -4.292236328125, -4.0948486328125, -3.8974609375, -3.7000732421875, -3.502685546875, -3.3052978515625, -3.10791015625, -2.9105224609375, -2.713134765625, -2.5157470703125, -2.318359375, -2.1209716796875, -1.923583984375, -1.7261962890625, -1.52880859375, -1.3314208984375, -1.134033203125, -0.9366455078125, -0.7392578125, -0.5418701171875, -0.344482421875, -0.1470947265625, 0.05029296875, 0.2476806640625, 0.445068359375, 0.6424560546875, 0.83984375, 1.0372314453125, 1.234619140625, 1.4320068359375, 1.62939453125, 1.8267822265625, 2.024169921875, 2.2215576171875, 2.4189453125, 2.6163330078125, 2.813720703125, 3.0111083984375, 3.20849609375, 3.4058837890625, 3.603271484375, 3.8006591796875, 3.998046875, 4.1954345703125, 4.392822265625, 4.5902099609375, 4.78759765625, 4.9849853515625, 5.182373046875, 5.3797607421875, 5.5771484375, 5.7745361328125, 5.971923828125, 6.1693115234375, 6.36669921875, 6.5640869140625, 6.761474609375, 6.9588623046875, 7.15625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 7.0, 7.0, 7.0, 7.0, 14.0, 12.0, 21.0, 38.0, 52.0, 87.0, 143.0, 269.0, 462.0, 705.0, 822.0, 580.0, 340.0, 186.0, 107.0, 53.0, 44.0, 38.0, 17.0, 8.0, 18.0, 6.0, 5.0, 4.0, 4.0, 0.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.5859375, -6.3753662109375, -6.164794921875, -5.9542236328125, -5.74365234375, -5.5330810546875, -5.322509765625, -5.1119384765625, -4.9013671875, -4.6907958984375, -4.480224609375, -4.2696533203125, -4.05908203125, -3.8485107421875, -3.637939453125, -3.4273681640625, -3.216796875, -3.0062255859375, -2.795654296875, -2.5850830078125, -2.37451171875, -2.1639404296875, -1.953369140625, -1.7427978515625, -1.5322265625, -1.3216552734375, -1.111083984375, -0.9005126953125, -0.68994140625, -0.4793701171875, -0.268798828125, -0.0582275390625, 0.15234375, 0.3629150390625, 0.573486328125, 0.7840576171875, 0.99462890625, 1.2052001953125, 1.415771484375, 1.6263427734375, 1.8369140625, 2.0474853515625, 2.258056640625, 2.4686279296875, 2.67919921875, 2.8897705078125, 3.100341796875, 3.3109130859375, 3.521484375, 3.7320556640625, 3.942626953125, 4.1531982421875, 4.36376953125, 4.5743408203125, 4.784912109375, 4.9954833984375, 5.2060546875, 5.4166259765625, 5.627197265625, 5.8377685546875, 6.04833984375, 6.2589111328125, 6.469482421875, 6.6800537109375, 6.890625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 7.0, 16.0, 27.0, 48.0, 85.0, 167.0, 207.0, 180.0, 146.0, 56.0, 24.0, 11.0, 10.0, 5.0, 6.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.01990509033203, -64.9867172241211, -62.95352554321289, -60.92033386230469, -58.88714599609375, -56.85395431518555, -54.820762634277344, -52.787574768066406, -50.75438690185547, -48.721195220947266, -46.68800735473633, -44.654815673828125, -42.62162780761719, -40.588436126708984, -38.55524444580078, -36.522056579589844, -34.48886489868164, -32.45567321777344, -30.4224853515625, -28.389293670654297, -26.35610580444336, -24.322914123535156, -22.289724349975586, -20.256534576416016, -18.223344802856445, -16.190155029296875, -14.156965255737305, -12.123774528503418, -10.090584754943848, -8.057394981384277, -6.024204254150391, -3.9910144805908203, -1.9578208923339844, 0.07536911964416504, 2.1085591316223145, 4.141749382019043, 6.174939155578613, 8.208128929138184, 10.24131965637207, 12.27450942993164, 14.307699203491211, 16.34088897705078, 18.37407875061035, 20.407268524169922, 22.440460205078125, 24.473648071289062, 26.506839752197266, 28.540029525756836, 30.573219299316406, 32.60641098022461, 34.63959884643555, 36.67279052734375, 38.70597839355469, 40.73917007446289, 42.772361755371094, 44.80554962158203, 46.83873748779297, 48.87192916870117, 50.90511703491211, 52.93830871582031, 54.97149658203125, 57.00468826293945, 59.037879943847656, 61.071067810058594, 63.1042594909668]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 6.0, 4.0, 4.0, 7.0, 12.0, 12.0, 12.0, 15.0, 21.0, 20.0, 19.0, 27.0, 31.0, 21.0, 34.0, 38.0, 47.0, 50.0, 42.0, 51.0, 52.0, 48.0, 38.0, 33.0, 46.0, 47.0, 41.0, 33.0, 29.0, 26.0, 27.0, 27.0, 12.0, 15.0, 10.0, 10.0, 6.0, 4.0, 5.0, 8.0, 2.0, 3.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.61740493774414, -22.8070068359375, -21.99660873413086, -21.18621063232422, -20.375810623168945, -19.565412521362305, -18.755014419555664, -17.944616317749023, -17.13421630859375, -16.32381820678711, -15.513419151306152, -14.703021049499512, -13.892621994018555, -13.082223892211914, -12.271825790405273, -11.461427688598633, -10.651029586791992, -9.840631484985352, -9.030232429504395, -8.219834327697754, -7.409435749053955, -6.599037170410156, -5.788639068603516, -4.978240489959717, -4.167841911315918, -3.357443332672119, -2.5470449924468994, -1.7366466522216797, -0.9262480735778809, -0.11584949493408203, 0.6945486068725586, 1.5049471855163574, 2.3153457641601562, 3.125744342803955, 3.936142683029175, 4.7465410232543945, 5.556939601898193, 6.367338180541992, 7.177736282348633, 7.988134860992432, 8.79853343963623, 9.608931541442871, 10.419330596923828, 11.229728698730469, 12.04012680053711, 12.850525856018066, 13.660923957824707, 14.471323013305664, 15.281721115112305, 16.092119216918945, 16.902517318725586, 17.71291732788086, 18.5233154296875, 19.33371353149414, 20.14411163330078, 20.954509735107422, 21.764907836914062, 22.575305938720703, 23.385704040527344, 24.196102142333984, 25.006502151489258, 25.8169002532959, 26.62729835510254, 27.43769645690918, 28.248096466064453]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 12.0, 5.0, 10.0, 18.0, 13.0, 39.0, 41.0, 81.0, 106.0, 175.0, 242.0, 396.0, 677.0, 1181.0, 1882.0, 3507.0, 6548.0, 12387.0, 24335.0, 51175.0, 116088.0, 260839.0, 299696.0, 144679.0, 63278.0, 29183.0, 14607.0, 7535.0, 4131.0, 2259.0, 1374.0, 757.0, 487.0, 268.0, 185.0, 129.0, 71.0, 45.0, 31.0, 22.0, 19.0, 16.0, 4.0, 14.0, 7.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-4.08984375, -3.973419189453125, -3.85699462890625, -3.740570068359375, -3.6241455078125, -3.507720947265625, -3.39129638671875, -3.274871826171875, -3.158447265625, -3.042022705078125, -2.92559814453125, -2.809173583984375, -2.6927490234375, -2.576324462890625, -2.45989990234375, -2.343475341796875, -2.22705078125, -2.110626220703125, -1.99420166015625, -1.877777099609375, -1.7613525390625, -1.644927978515625, -1.52850341796875, -1.412078857421875, -1.295654296875, -1.179229736328125, -1.06280517578125, -0.946380615234375, -0.8299560546875, -0.713531494140625, -0.59710693359375, -0.480682373046875, -0.3642578125, -0.247833251953125, -0.13140869140625, -0.014984130859375, 0.1014404296875, 0.217864990234375, 0.33428955078125, 0.450714111328125, 0.567138671875, 0.683563232421875, 0.79998779296875, 0.916412353515625, 1.0328369140625, 1.149261474609375, 1.26568603515625, 1.382110595703125, 1.49853515625, 1.614959716796875, 1.73138427734375, 1.847808837890625, 1.9642333984375, 2.080657958984375, 2.19708251953125, 2.313507080078125, 2.429931640625, 2.546356201171875, 2.66278076171875, 2.779205322265625, 2.8956298828125, 3.012054443359375, 3.12847900390625, 3.244903564453125, 3.361328125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 2.0, 3.0, 2.0, 3.0, 2.0, 5.0, 10.0, 7.0, 8.0, 14.0, 15.0, 15.0, 16.0, 25.0, 28.0, 25.0, 28.0, 29.0, 36.0, 47.0, 35.0, 42.0, 50.0, 47.0, 40.0, 48.0, 45.0, 44.0, 37.0, 28.0, 29.0, 29.0, 32.0, 25.0, 36.0, 19.0, 29.0, 15.0, 14.0, 9.0, 6.0, 7.0, 5.0, 3.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8671875, -2.775634765625, -2.68408203125, -2.592529296875, -2.5009765625, -2.409423828125, -2.31787109375, -2.226318359375, -2.134765625, -2.043212890625, -1.95166015625, -1.860107421875, -1.7685546875, -1.677001953125, -1.58544921875, -1.493896484375, -1.40234375, -1.310791015625, -1.21923828125, -1.127685546875, -1.0361328125, -0.944580078125, -0.85302734375, -0.761474609375, -0.669921875, -0.578369140625, -0.48681640625, -0.395263671875, -0.3037109375, -0.212158203125, -0.12060546875, -0.029052734375, 0.0625, 0.154052734375, 0.24560546875, 0.337158203125, 0.4287109375, 0.520263671875, 0.61181640625, 0.703369140625, 0.794921875, 0.886474609375, 0.97802734375, 1.069580078125, 1.1611328125, 1.252685546875, 1.34423828125, 1.435791015625, 1.52734375, 1.618896484375, 1.71044921875, 1.802001953125, 1.8935546875, 1.985107421875, 2.07666015625, 2.168212890625, 2.259765625, 2.351318359375, 2.44287109375, 2.534423828125, 2.6259765625, 2.717529296875, 2.80908203125, 2.900634765625, 2.9921875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 4.0, 4.0, 8.0, 11.0, 9.0, 20.0, 20.0, 43.0, 74.0, 114.0, 203.0, 363.0, 872.0, 2449.0, 9593.0, 66058.0, 772733.0, 171693.0, 18153.0, 3768.0, 1227.0, 517.0, 247.0, 155.0, 67.0, 47.0, 23.0, 30.0, 15.0, 16.0, 6.0, 1.0, 6.0, 2.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.0859375, -14.6632080078125, -14.240478515625, -13.8177490234375, -13.39501953125, -12.9722900390625, -12.549560546875, -12.1268310546875, -11.7041015625, -11.2813720703125, -10.858642578125, -10.4359130859375, -10.01318359375, -9.5904541015625, -9.167724609375, -8.7449951171875, -8.322265625, -7.8995361328125, -7.476806640625, -7.0540771484375, -6.63134765625, -6.2086181640625, -5.785888671875, -5.3631591796875, -4.9404296875, -4.5177001953125, -4.094970703125, -3.6722412109375, -3.24951171875, -2.8267822265625, -2.404052734375, -1.9813232421875, -1.55859375, -1.1358642578125, -0.713134765625, -0.2904052734375, 0.13232421875, 0.5550537109375, 0.977783203125, 1.4005126953125, 1.8232421875, 2.2459716796875, 2.668701171875, 3.0914306640625, 3.51416015625, 3.9368896484375, 4.359619140625, 4.7823486328125, 5.205078125, 5.6278076171875, 6.050537109375, 6.4732666015625, 6.89599609375, 7.3187255859375, 7.741455078125, 8.1641845703125, 8.5869140625, 9.0096435546875, 9.432373046875, 9.8551025390625, 10.27783203125, 10.7005615234375, 11.123291015625, 11.5460205078125, 11.96875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 2.0, 4.0, 3.0, 5.0, 8.0, 9.0, 10.0, 13.0, 14.0, 16.0, 18.0, 30.0, 19.0, 30.0, 29.0, 35.0, 57.0, 62.0, 54.0, 62.0, 74.0, 71.0, 51.0, 42.0, 37.0, 40.0, 31.0, 22.0, 37.0, 20.0, 19.0, 18.0, 15.0, 10.0, 13.0, 7.0, 5.0, 5.0, 4.0, 1.0, 2.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.5078125, -15.052978515625, -14.59814453125, -14.143310546875, -13.6884765625, -13.233642578125, -12.77880859375, -12.323974609375, -11.869140625, -11.414306640625, -10.95947265625, -10.504638671875, -10.0498046875, -9.594970703125, -9.14013671875, -8.685302734375, -8.23046875, -7.775634765625, -7.32080078125, -6.865966796875, -6.4111328125, -5.956298828125, -5.50146484375, -5.046630859375, -4.591796875, -4.136962890625, -3.68212890625, -3.227294921875, -2.7724609375, -2.317626953125, -1.86279296875, -1.407958984375, -0.953125, -0.498291015625, -0.04345703125, 0.411376953125, 0.8662109375, 1.321044921875, 1.77587890625, 2.230712890625, 2.685546875, 3.140380859375, 3.59521484375, 4.050048828125, 4.5048828125, 4.959716796875, 5.41455078125, 5.869384765625, 6.32421875, 6.779052734375, 7.23388671875, 7.688720703125, 8.1435546875, 8.598388671875, 9.05322265625, 9.508056640625, 9.962890625, 10.417724609375, 10.87255859375, 11.327392578125, 11.7822265625, 12.237060546875, 12.69189453125, 13.146728515625, 13.6015625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 6.0, 8.0, 18.0, 24.0, 62.0, 136.0, 417.0, 1534.0, 11937.0, 406207.0, 611973.0, 13860.0, 1693.0, 418.0, 137.0, 54.0, 26.0, 11.0, 13.0, 6.0, 0.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.75390625, -7.41717529296875, -7.0804443359375, -6.74371337890625, -6.406982421875, -6.07025146484375, -5.7335205078125, -5.39678955078125, -5.06005859375, -4.72332763671875, -4.3865966796875, -4.04986572265625, -3.713134765625, -3.37640380859375, -3.0396728515625, -2.70294189453125, -2.3662109375, -2.02947998046875, -1.6927490234375, -1.35601806640625, -1.019287109375, -0.68255615234375, -0.3458251953125, -0.00909423828125, 0.32763671875, 0.66436767578125, 1.0010986328125, 1.33782958984375, 1.674560546875, 2.01129150390625, 2.3480224609375, 2.68475341796875, 3.021484375, 3.35821533203125, 3.6949462890625, 4.03167724609375, 4.368408203125, 4.70513916015625, 5.0418701171875, 5.37860107421875, 5.71533203125, 6.05206298828125, 6.3887939453125, 6.72552490234375, 7.062255859375, 7.39898681640625, 7.7357177734375, 8.07244873046875, 8.4091796875, 8.74591064453125, 9.0826416015625, 9.41937255859375, 9.756103515625, 10.09283447265625, 10.4295654296875, 10.76629638671875, 11.10302734375, 11.43975830078125, 11.7764892578125, 12.11322021484375, 12.449951171875, 12.78668212890625, 13.1234130859375, 13.46014404296875, 13.796875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 4.0, 2.0, 4.0, 9.0, 4.0, 8.0, 12.0, 10.0, 20.0, 17.0, 41.0, 52.0, 66.0, 102.0, 146.0, 112.0, 128.0, 66.0, 37.0, 31.0, 26.0, 18.0, 21.0, 18.0, 7.0, 8.0, 7.0, 3.0, 4.0, 3.0, 6.0, 1.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010356903076171875, -0.0010033398866653442, -0.000970989465713501, -0.0009386390447616577, -0.0009062886238098145, -0.0008739382028579712, -0.0008415877819061279, -0.0008092373609542847, -0.0007768869400024414, -0.0007445365190505981, -0.0007121860980987549, -0.0006798356771469116, -0.0006474852561950684, -0.0006151348352432251, -0.0005827844142913818, -0.0005504339933395386, -0.0005180835723876953, -0.00048573315143585205, -0.0004533827304840088, -0.00042103230953216553, -0.00038868188858032227, -0.000356331467628479, -0.00032398104667663574, -0.0002916306257247925, -0.0002592802047729492, -0.00022692978382110596, -0.0001945793628692627, -0.00016222894191741943, -0.00012987852096557617, -9.752810001373291e-05, -6.517767906188965e-05, -3.282725811004639e-05, -4.76837158203125e-07, 3.187358379364014e-05, 6.42240047454834e-05, 9.657442569732666e-05, 0.00012892484664916992, 0.00016127526760101318, 0.00019362568855285645, 0.0002259761095046997, 0.00025832653045654297, 0.00029067695140838623, 0.0003230273723602295, 0.00035537779331207275, 0.000387728214263916, 0.0004200786352157593, 0.00045242905616760254, 0.0004847794771194458, 0.0005171298980712891, 0.0005494803190231323, 0.0005818307399749756, 0.0006141811609268188, 0.0006465315818786621, 0.0006788820028305054, 0.0007112324237823486, 0.0007435828447341919, 0.0007759332656860352, 0.0008082836866378784, 0.0008406341075897217, 0.0008729845285415649, 0.0009053349494934082, 0.0009376853704452515, 0.0009700357913970947, 0.001002386212348938, 0.0010347366333007812]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 7.0, 3.0, 11.0, 9.0, 22.0, 27.0, 35.0, 50.0, 80.0, 135.0, 173.0, 341.0, 582.0, 1146.0, 2604.0, 7201.0, 23943.0, 119765.0, 710470.0, 141890.0, 26643.0, 7809.0, 2737.0, 1265.0, 641.0, 337.0, 198.0, 138.0, 91.0, 59.0, 28.0, 34.0, 23.0, 21.0, 13.0, 11.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.41015625, -4.2608642578125, -4.111572265625, -3.9622802734375, -3.81298828125, -3.6636962890625, -3.514404296875, -3.3651123046875, -3.2158203125, -3.0665283203125, -2.917236328125, -2.7679443359375, -2.61865234375, -2.4693603515625, -2.320068359375, -2.1707763671875, -2.021484375, -1.8721923828125, -1.722900390625, -1.5736083984375, -1.42431640625, -1.2750244140625, -1.125732421875, -0.9764404296875, -0.8271484375, -0.6778564453125, -0.528564453125, -0.3792724609375, -0.22998046875, -0.0806884765625, 0.068603515625, 0.2178955078125, 0.3671875, 0.5164794921875, 0.665771484375, 0.8150634765625, 0.96435546875, 1.1136474609375, 1.262939453125, 1.4122314453125, 1.5615234375, 1.7108154296875, 1.860107421875, 2.0093994140625, 2.15869140625, 2.3079833984375, 2.457275390625, 2.6065673828125, 2.755859375, 2.9051513671875, 3.054443359375, 3.2037353515625, 3.35302734375, 3.5023193359375, 3.651611328125, 3.8009033203125, 3.9501953125, 4.0994873046875, 4.248779296875, 4.3980712890625, 4.54736328125, 4.6966552734375, 4.845947265625, 4.9952392578125, 5.14453125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 3.0, 2.0, 6.0, 3.0, 6.0, 4.0, 10.0, 5.0, 11.0, 13.0, 24.0, 27.0, 42.0, 49.0, 75.0, 82.0, 95.0, 91.0, 99.0, 66.0, 85.0, 51.0, 46.0, 25.0, 18.0, 23.0, 14.0, 4.0, 2.0, 7.0, 1.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.76953125, -4.62652587890625, -4.4835205078125, -4.34051513671875, -4.197509765625, -4.05450439453125, -3.9114990234375, -3.76849365234375, -3.62548828125, -3.48248291015625, -3.3394775390625, -3.19647216796875, -3.053466796875, -2.91046142578125, -2.7674560546875, -2.62445068359375, -2.4814453125, -2.33843994140625, -2.1954345703125, -2.05242919921875, -1.909423828125, -1.76641845703125, -1.6234130859375, -1.48040771484375, -1.33740234375, -1.19439697265625, -1.0513916015625, -0.90838623046875, -0.765380859375, -0.62237548828125, -0.4793701171875, -0.33636474609375, -0.193359375, -0.05035400390625, 0.0926513671875, 0.23565673828125, 0.378662109375, 0.52166748046875, 0.6646728515625, 0.80767822265625, 0.95068359375, 1.09368896484375, 1.2366943359375, 1.37969970703125, 1.522705078125, 1.66571044921875, 1.8087158203125, 1.95172119140625, 2.0947265625, 2.23773193359375, 2.3807373046875, 2.52374267578125, 2.666748046875, 2.80975341796875, 2.9527587890625, 3.09576416015625, 3.23876953125, 3.38177490234375, 3.5247802734375, 3.66778564453125, 3.810791015625, 3.95379638671875, 4.0968017578125, 4.23980712890625, 4.3828125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 8.0, 11.0, 26.0, 48.0, 142.0, 338.0, 224.0, 130.0, 44.0, 20.0, 9.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.65896606445312, -73.74069213867188, -69.8224105834961, -65.90413665771484, -61.98585510253906, -58.06758117675781, -54.1493034362793, -50.23102569580078, -46.312747955322266, -42.39447021484375, -38.476192474365234, -34.55791473388672, -30.639638900756836, -26.72136116027832, -22.803085327148438, -18.884807586669922, -14.966529846191406, -11.04825210571289, -7.129975318908691, -3.211698532104492, 0.7065792083740234, 4.624856948852539, 8.543132781982422, 12.461410522460938, 16.379688262939453, 20.29796600341797, 24.216243743896484, 28.134519577026367, 32.05279541015625, 35.97107696533203, 39.88935089111328, 43.8076286315918, 47.72590637207031, 51.64418411254883, 55.562461853027344, 59.480735778808594, 63.399017333984375, 67.31729125976562, 71.23556518554688, 75.15384674072266, 79.07212829589844, 82.99040222167969, 86.90868377685547, 90.82695770263672, 94.7452392578125, 98.66351318359375, 102.581787109375, 106.50006866455078, 110.41834259033203, 114.33661651611328, 118.25489807128906, 122.17317199707031, 126.0914535522461, 130.00973510742188, 133.92800903320312, 137.84628295898438, 141.76455688476562, 145.68283081054688, 149.60110473632812, 153.51939392089844, 157.4376678466797, 161.35594177246094, 165.2742156982422, 169.1925048828125, 173.11077880859375]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 7.0, 7.0, 5.0, 9.0, 11.0, 9.0, 15.0, 20.0, 18.0, 19.0, 28.0, 31.0, 32.0, 33.0, 25.0, 40.0, 41.0, 54.0, 46.0, 37.0, 65.0, 47.0, 58.0, 47.0, 33.0, 37.0, 36.0, 32.0, 25.0, 20.0, 27.0, 17.0, 15.0, 11.0, 11.0, 6.0, 9.0, 7.0, 7.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.30426025390625, -43.69240188598633, -42.080543518066406, -40.468685150146484, -38.85682678222656, -37.24496841430664, -35.63311004638672, -34.0212516784668, -32.409393310546875, -30.797534942626953, -29.18567657470703, -27.57381820678711, -25.961959838867188, -24.350101470947266, -22.738243103027344, -21.126384735107422, -19.514528274536133, -17.90266990661621, -16.29081153869629, -14.678953170776367, -13.067094802856445, -11.45523738861084, -9.843379020690918, -8.231520652770996, -6.619662284851074, -5.007803916931152, -3.3959457874298096, -1.7840876579284668, -0.17222929000854492, 1.4396286010742188, 3.0514869689941406, 4.6633453369140625, 6.275203704833984, 7.887062072753906, 9.498920440673828, 11.11077880859375, 12.722637176513672, 14.334494590759277, 15.9463529586792, 17.558212280273438, 19.17007064819336, 20.78192901611328, 22.393787384033203, 24.005645751953125, 25.617504119873047, 27.22936248779297, 28.84122085571289, 30.453079223632812, 32.06493377685547, 33.67679214477539, 35.28865051269531, 36.900508880615234, 38.512367248535156, 40.12422561645508, 41.736083984375, 43.34794235229492, 44.959800720214844, 46.571659088134766, 48.18351745605469, 49.79537582397461, 51.40723419189453, 53.01909255981445, 54.630950927734375, 56.2428092956543, 57.85466766357422]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 5.0, 3.0, 6.0, 6.0, 9.0, 10.0, 18.0, 23.0, 38.0, 56.0, 83.0, 131.0, 257.0, 362.0, 791.0, 1474.0, 2941.0, 6677.0, 17368.0, 56378.0, 294909.0, 1984249.0, 1545879.0, 212504.0, 44781.0, 14182.0, 5643.0, 2555.0, 1246.0, 664.0, 402.0, 220.0, 137.0, 87.0, 45.0, 50.0, 24.0, 25.0, 14.0, 7.0, 5.0, 7.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-4.28125, -4.15118408203125, -4.0211181640625, -3.89105224609375, -3.760986328125, -3.63092041015625, -3.5008544921875, -3.37078857421875, -3.24072265625, -3.11065673828125, -2.9805908203125, -2.85052490234375, -2.720458984375, -2.59039306640625, -2.4603271484375, -2.33026123046875, -2.2001953125, -2.07012939453125, -1.9400634765625, -1.80999755859375, -1.679931640625, -1.54986572265625, -1.4197998046875, -1.28973388671875, -1.15966796875, -1.02960205078125, -0.8995361328125, -0.76947021484375, -0.639404296875, -0.50933837890625, -0.3792724609375, -0.24920654296875, -0.119140625, 0.01092529296875, 0.1409912109375, 0.27105712890625, 0.401123046875, 0.53118896484375, 0.6612548828125, 0.79132080078125, 0.92138671875, 1.05145263671875, 1.1815185546875, 1.31158447265625, 1.441650390625, 1.57171630859375, 1.7017822265625, 1.83184814453125, 1.9619140625, 2.09197998046875, 2.2220458984375, 2.35211181640625, 2.482177734375, 2.61224365234375, 2.7423095703125, 2.87237548828125, 3.00244140625, 3.13250732421875, 3.2625732421875, 3.39263916015625, 3.522705078125, 3.65277099609375, 3.7828369140625, 3.91290283203125, 4.04296875]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 8.0, 9.0, 11.0, 21.0, 11.0, 19.0, 30.0, 32.0, 35.0, 35.0, 33.0, 33.0, 45.0, 46.0, 52.0, 46.0, 47.0, 48.0, 49.0, 31.0, 57.0, 45.0, 34.0, 33.0, 36.0, 34.0, 26.0, 17.0, 12.0, 20.0, 15.0, 10.0, 1.0, 5.0, 3.0, 3.0, 3.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.525390625, -3.426300048828125, -3.32720947265625, -3.228118896484375, -3.1290283203125, -3.029937744140625, -2.93084716796875, -2.831756591796875, -2.732666015625, -2.633575439453125, -2.53448486328125, -2.435394287109375, -2.3363037109375, -2.237213134765625, -2.13812255859375, -2.039031982421875, -1.93994140625, -1.840850830078125, -1.74176025390625, -1.642669677734375, -1.5435791015625, -1.444488525390625, -1.34539794921875, -1.246307373046875, -1.147216796875, -1.048126220703125, -0.94903564453125, -0.849945068359375, -0.7508544921875, -0.651763916015625, -0.55267333984375, -0.453582763671875, -0.3544921875, -0.255401611328125, -0.15631103515625, -0.057220458984375, 0.0418701171875, 0.140960693359375, 0.24005126953125, 0.339141845703125, 0.438232421875, 0.537322998046875, 0.63641357421875, 0.735504150390625, 0.8345947265625, 0.933685302734375, 1.03277587890625, 1.131866455078125, 1.23095703125, 1.330047607421875, 1.42913818359375, 1.528228759765625, 1.6273193359375, 1.726409912109375, 1.82550048828125, 1.924591064453125, 2.023681640625, 2.122772216796875, 2.22186279296875, 2.320953369140625, 2.4200439453125, 2.519134521484375, 2.61822509765625, 2.717315673828125, 2.81640625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 1.0, 4.0, 3.0, 7.0, 5.0, 13.0, 15.0, 19.0, 52.0, 106.0, 187.0, 489.0, 1769.0, 9368.0, 93839.0, 3547178.0, 512619.0, 23521.0, 3418.0, 924.0, 367.0, 205.0, 74.0, 48.0, 23.0, 10.0, 10.0, 3.0, 5.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.875, -8.466796875, -8.05859375, -7.650390625, -7.2421875, -6.833984375, -6.42578125, -6.017578125, -5.609375, -5.201171875, -4.79296875, -4.384765625, -3.9765625, -3.568359375, -3.16015625, -2.751953125, -2.34375, -1.935546875, -1.52734375, -1.119140625, -0.7109375, -0.302734375, 0.10546875, 0.513671875, 0.921875, 1.330078125, 1.73828125, 2.146484375, 2.5546875, 2.962890625, 3.37109375, 3.779296875, 4.1875, 4.595703125, 5.00390625, 5.412109375, 5.8203125, 6.228515625, 6.63671875, 7.044921875, 7.453125, 7.861328125, 8.26953125, 8.677734375, 9.0859375, 9.494140625, 9.90234375, 10.310546875, 10.71875, 11.126953125, 11.53515625, 11.943359375, 12.3515625, 12.759765625, 13.16796875, 13.576171875, 13.984375, 14.392578125, 14.80078125, 15.208984375, 15.6171875, 16.025390625, 16.43359375, 16.841796875, 17.25]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 3.0, 4.0, 3.0, 4.0, 2.0, 4.0, 3.0, 15.0, 14.0, 31.0, 38.0, 45.0, 60.0, 99.0, 152.0, 277.0, 476.0, 803.0, 759.0, 537.0, 295.0, 155.0, 105.0, 56.0, 39.0, 32.0, 22.0, 15.0, 9.0, 8.0, 3.0, 4.0, 3.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.10546875, -5.81658935546875, -5.5277099609375, -5.23883056640625, -4.949951171875, -4.66107177734375, -4.3721923828125, -4.08331298828125, -3.79443359375, -3.50555419921875, -3.2166748046875, -2.92779541015625, -2.638916015625, -2.35003662109375, -2.0611572265625, -1.77227783203125, -1.4833984375, -1.19451904296875, -0.9056396484375, -0.61676025390625, -0.327880859375, -0.03900146484375, 0.2498779296875, 0.53875732421875, 0.82763671875, 1.11651611328125, 1.4053955078125, 1.69427490234375, 1.983154296875, 2.27203369140625, 2.5609130859375, 2.84979248046875, 3.138671875, 3.42755126953125, 3.7164306640625, 4.00531005859375, 4.294189453125, 4.58306884765625, 4.8719482421875, 5.16082763671875, 5.44970703125, 5.73858642578125, 6.0274658203125, 6.31634521484375, 6.605224609375, 6.89410400390625, 7.1829833984375, 7.47186279296875, 7.7607421875, 8.04962158203125, 8.3385009765625, 8.62738037109375, 8.916259765625, 9.20513916015625, 9.4940185546875, 9.78289794921875, 10.07177734375, 10.36065673828125, 10.6495361328125, 10.93841552734375, 11.227294921875, 11.51617431640625, 11.8050537109375, 12.09393310546875, 12.3828125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 3.0, 3.0, 6.0, 7.0, 8.0, 23.0, 26.0, 47.0, 62.0, 111.0, 162.0, 130.0, 126.0, 102.0, 59.0, 46.0, 28.0, 13.0, 6.0, 8.0, 3.0, 4.0, 7.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.352508544921875, -57.27739715576172, -55.2022819519043, -53.127166748046875, -51.05205535888672, -48.97694396972656, -46.90182876586914, -44.82671356201172, -42.75160217285156, -40.676490783691406, -38.601375579833984, -36.52626037597656, -34.451148986816406, -32.37603759765625, -30.300922393798828, -28.22580909729004, -26.15069580078125, -24.07558250427246, -22.000469207763672, -19.925355911254883, -17.850242614746094, -15.775129318237305, -13.700016021728516, -11.624902725219727, -9.549789428710938, -7.474676132202148, -5.399562835693359, -3.3244495391845703, -1.2493362426757812, 0.8257770538330078, 2.900890350341797, 4.976003646850586, 7.051109313964844, 9.126222610473633, 11.201335906982422, 13.276449203491211, 15.3515625, 17.42667579650879, 19.501789093017578, 21.576902389526367, 23.652015686035156, 25.727128982543945, 27.802242279052734, 29.877355575561523, 31.952468872070312, 34.02758026123047, 36.10269546508789, 38.17781066894531, 40.25292205810547, 42.328033447265625, 44.40314865112305, 46.47826385498047, 48.553375244140625, 50.62848663330078, 52.7036018371582, 54.778717041015625, 56.85382843017578, 58.92893981933594, 61.00405502319336, 63.07917022705078, 65.15428161621094, 67.2293930053711, 69.30450439453125, 71.37962341308594, 73.4547348022461]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 4.0, 1.0, 7.0, 5.0, 8.0, 9.0, 10.0, 8.0, 18.0, 14.0, 29.0, 27.0, 25.0, 34.0, 26.0, 33.0, 36.0, 45.0, 32.0, 47.0, 40.0, 48.0, 35.0, 51.0, 42.0, 46.0, 42.0, 40.0, 39.0, 27.0, 23.0, 21.0, 20.0, 22.0, 20.0, 16.0, 7.0, 17.0, 14.0, 5.0, 7.0, 1.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-35.987953186035156, -34.789764404296875, -33.591575622558594, -32.39338302612305, -31.195194244384766, -29.997005462646484, -28.79881477355957, -27.600624084472656, -26.402435302734375, -25.204246520996094, -24.00605583190918, -22.807865142822266, -21.609676361083984, -20.411487579345703, -19.21329689025879, -18.015106201171875, -16.816917419433594, -15.618727684020996, -14.420537948608398, -13.2223482131958, -12.024158477783203, -10.825968742370605, -9.627779006958008, -8.42958927154541, -7.2313995361328125, -6.033209800720215, -4.835020065307617, -3.6368303298950195, -2.438640594482422, -1.2404508590698242, -0.04226112365722656, 1.155928611755371, 2.3541221618652344, 3.552311897277832, 4.75050163269043, 5.948691368103027, 7.146881103515625, 8.345070838928223, 9.54326057434082, 10.741450309753418, 11.939640045166016, 13.137829780578613, 14.336019515991211, 15.534209251403809, 16.732398986816406, 17.930587768554688, 19.1287784576416, 20.326969146728516, 21.525157928466797, 22.723346710205078, 23.921537399291992, 25.119728088378906, 26.317916870117188, 27.51610565185547, 28.714296340942383, 29.912487030029297, 31.110675811767578, 32.30886459350586, 33.507057189941406, 34.70524597167969, 35.90343475341797, 37.10162353515625, 38.29981231689453, 39.49800491333008, 40.69619369506836]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 0.0, 4.0, 0.0, 3.0, 8.0, 8.0, 17.0, 17.0, 18.0, 18.0, 39.0, 57.0, 119.0, 179.0, 289.0, 430.0, 750.0, 1337.0, 2370.0, 4686.0, 9465.0, 20552.0, 44445.0, 100904.0, 226102.0, 315433.0, 177058.0, 78156.0, 34412.0, 15901.0, 7519.0, 3646.0, 1985.0, 1051.0, 551.0, 389.0, 218.0, 141.0, 104.0, 58.0, 35.0, 29.0, 22.0, 10.0, 4.0, 6.0, 7.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8359375, -3.7052001953125, -3.574462890625, -3.4437255859375, -3.31298828125, -3.1822509765625, -3.051513671875, -2.9207763671875, -2.7900390625, -2.6593017578125, -2.528564453125, -2.3978271484375, -2.26708984375, -2.1363525390625, -2.005615234375, -1.8748779296875, -1.744140625, -1.6134033203125, -1.482666015625, -1.3519287109375, -1.22119140625, -1.0904541015625, -0.959716796875, -0.8289794921875, -0.6982421875, -0.5675048828125, -0.436767578125, -0.3060302734375, -0.17529296875, -0.0445556640625, 0.086181640625, 0.2169189453125, 0.34765625, 0.4783935546875, 0.609130859375, 0.7398681640625, 0.87060546875, 1.0013427734375, 1.132080078125, 1.2628173828125, 1.3935546875, 1.5242919921875, 1.655029296875, 1.7857666015625, 1.91650390625, 2.0472412109375, 2.177978515625, 2.3087158203125, 2.439453125, 2.5701904296875, 2.700927734375, 2.8316650390625, 2.96240234375, 3.0931396484375, 3.223876953125, 3.3546142578125, 3.4853515625, 3.6160888671875, 3.746826171875, 3.8775634765625, 4.00830078125, 4.1390380859375, 4.269775390625, 4.4005126953125, 4.53125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 5.0, 1.0, 3.0, 3.0, 4.0, 5.0, 8.0, 8.0, 17.0, 13.0, 7.0, 14.0, 20.0, 19.0, 22.0, 31.0, 35.0, 31.0, 38.0, 43.0, 39.0, 43.0, 38.0, 58.0, 34.0, 39.0, 42.0, 43.0, 35.0, 41.0, 32.0, 33.0, 28.0, 21.0, 35.0, 18.0, 17.0, 18.0, 10.0, 14.0, 12.0, 8.0, 3.0, 8.0, 3.0, 0.0, 2.0, 5.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.818359375, -2.73150634765625, -2.6446533203125, -2.55780029296875, -2.470947265625, -2.38409423828125, -2.2972412109375, -2.21038818359375, -2.12353515625, -2.03668212890625, -1.9498291015625, -1.86297607421875, -1.776123046875, -1.68927001953125, -1.6024169921875, -1.51556396484375, -1.4287109375, -1.34185791015625, -1.2550048828125, -1.16815185546875, -1.081298828125, -0.99444580078125, -0.9075927734375, -0.82073974609375, -0.73388671875, -0.64703369140625, -0.5601806640625, -0.47332763671875, -0.386474609375, -0.29962158203125, -0.2127685546875, -0.12591552734375, -0.0390625, 0.04779052734375, 0.1346435546875, 0.22149658203125, 0.308349609375, 0.39520263671875, 0.4820556640625, 0.56890869140625, 0.65576171875, 0.74261474609375, 0.8294677734375, 0.91632080078125, 1.003173828125, 1.09002685546875, 1.1768798828125, 1.26373291015625, 1.3505859375, 1.43743896484375, 1.5242919921875, 1.61114501953125, 1.697998046875, 1.78485107421875, 1.8717041015625, 1.95855712890625, 2.04541015625, 2.13226318359375, 2.2191162109375, 2.30596923828125, 2.392822265625, 2.47967529296875, 2.5665283203125, 2.65338134765625, 2.740234375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 10.0, 9.0, 13.0, 12.0, 14.0, 19.0, 35.0, 63.0, 81.0, 141.0, 192.0, 349.0, 565.0, 1082.0, 2426.0, 6518.0, 31169.0, 319643.0, 623961.0, 47800.0, 8546.0, 2961.0, 1266.0, 678.0, 371.0, 202.0, 145.0, 85.0, 66.0, 37.0, 33.0, 16.0, 10.0, 8.0, 7.0, 10.0, 6.0, 6.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.6015625, -12.1964111328125, -11.791259765625, -11.3861083984375, -10.98095703125, -10.5758056640625, -10.170654296875, -9.7655029296875, -9.3603515625, -8.9552001953125, -8.550048828125, -8.1448974609375, -7.73974609375, -7.3345947265625, -6.929443359375, -6.5242919921875, -6.119140625, -5.7139892578125, -5.308837890625, -4.9036865234375, -4.49853515625, -4.0933837890625, -3.688232421875, -3.2830810546875, -2.8779296875, -2.4727783203125, -2.067626953125, -1.6624755859375, -1.25732421875, -0.8521728515625, -0.447021484375, -0.0418701171875, 0.36328125, 0.7684326171875, 1.173583984375, 1.5787353515625, 1.98388671875, 2.3890380859375, 2.794189453125, 3.1993408203125, 3.6044921875, 4.0096435546875, 4.414794921875, 4.8199462890625, 5.22509765625, 5.6302490234375, 6.035400390625, 6.4405517578125, 6.845703125, 7.2508544921875, 7.656005859375, 8.0611572265625, 8.46630859375, 8.8714599609375, 9.276611328125, 9.6817626953125, 10.0869140625, 10.4920654296875, 10.897216796875, 11.3023681640625, 11.70751953125, 12.1126708984375, 12.517822265625, 12.9229736328125, 13.328125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 5.0, 0.0, 6.0, 2.0, 2.0, 7.0, 9.0, 10.0, 9.0, 19.0, 19.0, 31.0, 23.0, 41.0, 45.0, 49.0, 55.0, 50.0, 55.0, 42.0, 62.0, 52.0, 54.0, 48.0, 49.0, 40.0, 36.0, 34.0, 34.0, 24.0, 26.0, 20.0, 10.0, 17.0, 3.0, 4.0, 6.0, 8.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-16.15625, -15.6763916015625, -15.196533203125, -14.7166748046875, -14.23681640625, -13.7569580078125, -13.277099609375, -12.7972412109375, -12.3173828125, -11.8375244140625, -11.357666015625, -10.8778076171875, -10.39794921875, -9.9180908203125, -9.438232421875, -8.9583740234375, -8.478515625, -7.9986572265625, -7.518798828125, -7.0389404296875, -6.55908203125, -6.0792236328125, -5.599365234375, -5.1195068359375, -4.6396484375, -4.1597900390625, -3.679931640625, -3.2000732421875, -2.72021484375, -2.2403564453125, -1.760498046875, -1.2806396484375, -0.80078125, -0.3209228515625, 0.158935546875, 0.6387939453125, 1.11865234375, 1.5985107421875, 2.078369140625, 2.5582275390625, 3.0380859375, 3.5179443359375, 3.997802734375, 4.4776611328125, 4.95751953125, 5.4373779296875, 5.917236328125, 6.3970947265625, 6.876953125, 7.3568115234375, 7.836669921875, 8.3165283203125, 8.79638671875, 9.2762451171875, 9.756103515625, 10.2359619140625, 10.7158203125, 11.1956787109375, 11.675537109375, 12.1553955078125, 12.63525390625, 13.1151123046875, 13.594970703125, 14.0748291015625, 14.5546875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 8.0, 3.0, 6.0, 13.0, 17.0, 17.0, 39.0, 32.0, 55.0, 72.0, 97.0, 179.0, 241.0, 379.0, 626.0, 997.0, 1799.0, 3759.0, 8757.0, 25082.0, 85721.0, 541910.0, 279767.0, 64801.0, 19549.0, 7287.0, 3132.0, 1614.0, 931.0, 576.0, 344.0, 232.0, 170.0, 110.0, 73.0, 45.0, 36.0, 36.0, 15.0, 8.0, 7.0, 7.0, 7.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.73828125, -3.61322021484375, -3.4881591796875, -3.36309814453125, -3.238037109375, -3.11297607421875, -2.9879150390625, -2.86285400390625, -2.73779296875, -2.61273193359375, -2.4876708984375, -2.36260986328125, -2.237548828125, -2.11248779296875, -1.9874267578125, -1.86236572265625, -1.7373046875, -1.61224365234375, -1.4871826171875, -1.36212158203125, -1.237060546875, -1.11199951171875, -0.9869384765625, -0.86187744140625, -0.73681640625, -0.61175537109375, -0.4866943359375, -0.36163330078125, -0.236572265625, -0.11151123046875, 0.0135498046875, 0.13861083984375, 0.263671875, 0.38873291015625, 0.5137939453125, 0.63885498046875, 0.763916015625, 0.88897705078125, 1.0140380859375, 1.13909912109375, 1.26416015625, 1.38922119140625, 1.5142822265625, 1.63934326171875, 1.764404296875, 1.88946533203125, 2.0145263671875, 2.13958740234375, 2.2646484375, 2.38970947265625, 2.5147705078125, 2.63983154296875, 2.764892578125, 2.88995361328125, 3.0150146484375, 3.14007568359375, 3.26513671875, 3.39019775390625, 3.5152587890625, 3.64031982421875, 3.765380859375, 3.89044189453125, 4.0155029296875, 4.14056396484375, 4.265625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 4.0, 2.0, 7.0, 2.0, 6.0, 4.0, 9.0, 16.0, 12.0, 11.0, 24.0, 29.0, 40.0, 46.0, 54.0, 54.0, 111.0, 148.0, 108.0, 65.0, 39.0, 40.0, 20.0, 32.0, 26.0, 17.0, 12.0, 19.0, 8.0, 12.0, 5.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.0014753341674804688, -0.0014349520206451416, -0.0013945698738098145, -0.0013541877269744873, -0.0013138055801391602, -0.001273423433303833, -0.0012330412864685059, -0.0011926591396331787, -0.0011522769927978516, -0.0011118948459625244, -0.0010715126991271973, -0.0010311305522918701, -0.000990748405456543, -0.0009503662586212158, -0.0009099841117858887, -0.0008696019649505615, -0.0008292198181152344, -0.0007888376712799072, -0.0007484555244445801, -0.0007080733776092529, -0.0006676912307739258, -0.0006273090839385986, -0.0005869269371032715, -0.0005465447902679443, -0.0005061626434326172, -0.00046578049659729004, -0.0004253983497619629, -0.00038501620292663574, -0.0003446340560913086, -0.00030425190925598145, -0.0002638697624206543, -0.00022348761558532715, -0.00018310546875, -0.00014272332191467285, -0.0001023411750793457, -6.195902824401855e-05, -2.1576881408691406e-05, 1.8805265426635742e-05, 5.918741226196289e-05, 9.956955909729004e-05, 0.0001399517059326172, 0.00018033385276794434, 0.00022071599960327148, 0.00026109814643859863, 0.0003014802932739258, 0.00034186244010925293, 0.0003822445869445801, 0.0004226267337799072, 0.0004630088806152344, 0.0005033910274505615, 0.0005437731742858887, 0.0005841553211212158, 0.000624537467956543, 0.0006649196147918701, 0.0007053017616271973, 0.0007456839084625244, 0.0007860660552978516, 0.0008264482021331787, 0.0008668303489685059, 0.000907212495803833, 0.0009475946426391602, 0.0009879767894744873, 0.0010283589363098145, 0.0010687410831451416, 0.0011091232299804688]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 7.0, 11.0, 0.0, 5.0, 13.0, 18.0, 30.0, 39.0, 56.0, 88.0, 127.0, 163.0, 258.0, 392.0, 593.0, 1057.0, 1931.0, 4585.0, 12766.0, 46389.0, 238761.0, 622563.0, 85148.0, 20646.0, 6752.0, 2746.0, 1351.0, 743.0, 448.0, 286.0, 177.0, 116.0, 72.0, 68.0, 42.0, 30.0, 25.0, 15.0, 11.0, 11.0, 5.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.78515625, -4.626708984375, -4.46826171875, -4.309814453125, -4.1513671875, -3.992919921875, -3.83447265625, -3.676025390625, -3.517578125, -3.359130859375, -3.20068359375, -3.042236328125, -2.8837890625, -2.725341796875, -2.56689453125, -2.408447265625, -2.25, -2.091552734375, -1.93310546875, -1.774658203125, -1.6162109375, -1.457763671875, -1.29931640625, -1.140869140625, -0.982421875, -0.823974609375, -0.66552734375, -0.507080078125, -0.3486328125, -0.190185546875, -0.03173828125, 0.126708984375, 0.28515625, 0.443603515625, 0.60205078125, 0.760498046875, 0.9189453125, 1.077392578125, 1.23583984375, 1.394287109375, 1.552734375, 1.711181640625, 1.86962890625, 2.028076171875, 2.1865234375, 2.344970703125, 2.50341796875, 2.661865234375, 2.8203125, 2.978759765625, 3.13720703125, 3.295654296875, 3.4541015625, 3.612548828125, 3.77099609375, 3.929443359375, 4.087890625, 4.246337890625, 4.40478515625, 4.563232421875, 4.7216796875, 4.880126953125, 5.03857421875, 5.197021484375, 5.35546875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 6.0, 1.0, 4.0, 2.0, 4.0, 4.0, 6.0, 8.0, 7.0, 15.0, 17.0, 15.0, 21.0, 18.0, 27.0, 35.0, 29.0, 44.0, 60.0, 90.0, 93.0, 92.0, 75.0, 65.0, 51.0, 45.0, 36.0, 26.0, 23.0, 20.0, 18.0, 11.0, 6.0, 8.0, 7.0, 3.0, 4.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.69140625, -4.54937744140625, -4.4073486328125, -4.26531982421875, -4.123291015625, -3.98126220703125, -3.8392333984375, -3.69720458984375, -3.55517578125, -3.41314697265625, -3.2711181640625, -3.12908935546875, -2.987060546875, -2.84503173828125, -2.7030029296875, -2.56097412109375, -2.4189453125, -2.27691650390625, -2.1348876953125, -1.99285888671875, -1.850830078125, -1.70880126953125, -1.5667724609375, -1.42474365234375, -1.28271484375, -1.14068603515625, -0.9986572265625, -0.85662841796875, -0.714599609375, -0.57257080078125, -0.4305419921875, -0.28851318359375, -0.146484375, -0.00445556640625, 0.1375732421875, 0.27960205078125, 0.421630859375, 0.56365966796875, 0.7056884765625, 0.84771728515625, 0.98974609375, 1.13177490234375, 1.2738037109375, 1.41583251953125, 1.557861328125, 1.69989013671875, 1.8419189453125, 1.98394775390625, 2.1259765625, 2.26800537109375, 2.4100341796875, 2.55206298828125, 2.694091796875, 2.83612060546875, 2.9781494140625, 3.12017822265625, 3.26220703125, 3.40423583984375, 3.5462646484375, 3.68829345703125, 3.830322265625, 3.97235107421875, 4.1143798828125, 4.25640869140625, 4.3984375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 8.0, 4.0, 3.0, 7.0, 9.0, 11.0, 44.0, 92.0, 147.0, 259.0, 189.0, 100.0, 65.0, 18.0, 21.0, 6.0, 4.0, 6.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-118.05953979492188, -114.7703628540039, -111.48119354248047, -108.1920166015625, -104.90284729003906, -101.6136703491211, -98.32449340820312, -95.03532409667969, -91.74614715576172, -88.45697021484375, -85.16780090332031, -81.87862396240234, -78.58944702148438, -75.30027770996094, -72.01110076904297, -68.721923828125, -65.43275451660156, -62.14358139038086, -58.854408264160156, -55.56523132324219, -52.276058197021484, -48.98688507080078, -45.69770812988281, -42.40853500366211, -39.119361877441406, -35.8301887512207, -32.541015625, -29.25183868408203, -25.962665557861328, -22.673492431640625, -19.38431739807129, -16.095142364501953, -12.805961608886719, -9.5167875289917, -6.22761344909668, -2.93843936920166, 0.3507347106933594, 3.6399078369140625, 6.929082870483398, 10.218257904052734, 13.507431030273438, 16.79660415649414, 20.085779190063477, 23.374954223632812, 26.664127349853516, 29.95330047607422, 33.24247741699219, 36.53165054321289, 39.820823669433594, 43.1099967956543, 46.399169921875, 49.68834686279297, 52.97751998901367, 56.266693115234375, 59.555870056152344, 62.84504318237305, 66.13421630859375, 69.42339324951172, 72.71256256103516, 76.00173950195312, 79.29090881347656, 82.58008575439453, 85.8692626953125, 89.15843200683594, 92.4476089477539]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 5.0, 5.0, 4.0, 6.0, 10.0, 4.0, 11.0, 5.0, 7.0, 21.0, 15.0, 10.0, 18.0, 20.0, 32.0, 28.0, 33.0, 30.0, 30.0, 34.0, 36.0, 50.0, 48.0, 79.0, 57.0, 59.0, 33.0, 36.0, 32.0, 27.0, 29.0, 22.0, 24.0, 24.0, 26.0, 8.0, 14.0, 17.0, 13.0, 7.0, 7.0, 9.0, 6.0, 11.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-49.10178756713867, -47.68122100830078, -46.260650634765625, -44.84008026123047, -43.41951370239258, -41.99894714355469, -40.57837677001953, -39.157806396484375, -37.737239837646484, -36.316673278808594, -34.89610290527344, -33.47553253173828, -32.05496597290039, -30.634397506713867, -29.213829040527344, -27.79326057434082, -26.372692108154297, -24.952123641967773, -23.53155517578125, -22.110986709594727, -20.690418243408203, -19.26984977722168, -17.849281311035156, -16.428712844848633, -15.00814437866211, -13.587575912475586, -12.167007446289062, -10.746438980102539, -9.325870513916016, -7.905302047729492, -6.484733581542969, -5.064165115356445, -3.6436004638671875, -2.223031997680664, -0.8024635314941406, 0.6181049346923828, 2.0386734008789062, 3.4592418670654297, 4.879810333251953, 6.300378799438477, 7.720947265625, 9.141515731811523, 10.562084197998047, 11.98265266418457, 13.403221130371094, 14.823789596557617, 16.24435806274414, 17.664926528930664, 19.085494995117188, 20.50606346130371, 21.926631927490234, 23.347200393676758, 24.76776885986328, 26.188337326049805, 27.608905792236328, 29.02947425842285, 30.450042724609375, 31.8706111907959, 33.29117965698242, 34.71174621582031, 36.13231658935547, 37.552886962890625, 38.973453521728516, 40.394020080566406, 41.81459045410156]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 6.0, 1.0, 14.0, 10.0, 17.0, 16.0, 30.0, 35.0, 75.0, 108.0, 178.0, 309.0, 582.0, 1150.0, 2432.0, 6325.0, 20025.0, 98394.0, 1223594.0, 2539467.0, 249981.0, 36085.0, 9327.0, 3156.0, 1417.0, 671.0, 359.0, 190.0, 115.0, 69.0, 53.0, 26.0, 23.0, 15.0, 11.0, 5.0, 3.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-5.12890625, -4.9532470703125, -4.777587890625, -4.6019287109375, -4.42626953125, -4.2506103515625, -4.074951171875, -3.8992919921875, -3.7236328125, -3.5479736328125, -3.372314453125, -3.1966552734375, -3.02099609375, -2.8453369140625, -2.669677734375, -2.4940185546875, -2.318359375, -2.1427001953125, -1.967041015625, -1.7913818359375, -1.61572265625, -1.4400634765625, -1.264404296875, -1.0887451171875, -0.9130859375, -0.7374267578125, -0.561767578125, -0.3861083984375, -0.21044921875, -0.0347900390625, 0.140869140625, 0.3165283203125, 0.4921875, 0.6678466796875, 0.843505859375, 1.0191650390625, 1.19482421875, 1.3704833984375, 1.546142578125, 1.7218017578125, 1.8974609375, 2.0731201171875, 2.248779296875, 2.4244384765625, 2.60009765625, 2.7757568359375, 2.951416015625, 3.1270751953125, 3.302734375, 3.4783935546875, 3.654052734375, 3.8297119140625, 4.00537109375, 4.1810302734375, 4.356689453125, 4.5323486328125, 4.7080078125, 4.8836669921875, 5.059326171875, 5.2349853515625, 5.41064453125, 5.5863037109375, 5.761962890625, 5.9376220703125, 6.11328125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 5.0, 3.0, 3.0, 4.0, 8.0, 11.0, 11.0, 9.0, 12.0, 15.0, 32.0, 33.0, 38.0, 33.0, 53.0, 54.0, 42.0, 59.0, 71.0, 59.0, 57.0, 56.0, 61.0, 38.0, 45.0, 41.0, 41.0, 26.0, 21.0, 10.0, 19.0, 9.0, 6.0, 9.0, 5.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1171875, -3.00189208984375, -2.8865966796875, -2.77130126953125, -2.656005859375, -2.54071044921875, -2.4254150390625, -2.31011962890625, -2.19482421875, -2.07952880859375, -1.9642333984375, -1.84893798828125, -1.733642578125, -1.61834716796875, -1.5030517578125, -1.38775634765625, -1.2724609375, -1.15716552734375, -1.0418701171875, -0.92657470703125, -0.811279296875, -0.69598388671875, -0.5806884765625, -0.46539306640625, -0.35009765625, -0.23480224609375, -0.1195068359375, -0.00421142578125, 0.111083984375, 0.22637939453125, 0.3416748046875, 0.45697021484375, 0.572265625, 0.68756103515625, 0.8028564453125, 0.91815185546875, 1.033447265625, 1.14874267578125, 1.2640380859375, 1.37933349609375, 1.49462890625, 1.60992431640625, 1.7252197265625, 1.84051513671875, 1.955810546875, 2.07110595703125, 2.1864013671875, 2.30169677734375, 2.4169921875, 2.53228759765625, 2.6475830078125, 2.76287841796875, 2.878173828125, 2.99346923828125, 3.1087646484375, 3.22406005859375, 3.33935546875, 3.45465087890625, 3.5699462890625, 3.68524169921875, 3.800537109375, 3.91583251953125, 4.0311279296875, 4.14642333984375, 4.26171875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 11.0, 5.0, 14.0, 17.0, 32.0, 64.0, 66.0, 168.0, 276.0, 541.0, 1290.0, 3430.0, 12040.0, 59669.0, 812959.0, 3091720.0, 176051.0, 25616.0, 6178.0, 2060.0, 885.0, 448.0, 263.0, 165.0, 111.0, 59.0, 49.0, 37.0, 21.0, 12.0, 6.0, 9.0, 5.0, 1.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.1953125, -7.93310546875, -7.6708984375, -7.40869140625, -7.146484375, -6.88427734375, -6.6220703125, -6.35986328125, -6.09765625, -5.83544921875, -5.5732421875, -5.31103515625, -5.048828125, -4.78662109375, -4.5244140625, -4.26220703125, -4.0, -3.73779296875, -3.4755859375, -3.21337890625, -2.951171875, -2.68896484375, -2.4267578125, -2.16455078125, -1.90234375, -1.64013671875, -1.3779296875, -1.11572265625, -0.853515625, -0.59130859375, -0.3291015625, -0.06689453125, 0.1953125, 0.45751953125, 0.7197265625, 0.98193359375, 1.244140625, 1.50634765625, 1.7685546875, 2.03076171875, 2.29296875, 2.55517578125, 2.8173828125, 3.07958984375, 3.341796875, 3.60400390625, 3.8662109375, 4.12841796875, 4.390625, 4.65283203125, 4.9150390625, 5.17724609375, 5.439453125, 5.70166015625, 5.9638671875, 6.22607421875, 6.48828125, 6.75048828125, 7.0126953125, 7.27490234375, 7.537109375, 7.79931640625, 8.0615234375, 8.32373046875, 8.5859375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 8.0, 10.0, 12.0, 19.0, 25.0, 59.0, 113.0, 159.0, 290.0, 611.0, 958.0, 812.0, 487.0, 227.0, 117.0, 55.0, 42.0, 25.0, 13.0, 14.0, 8.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.9296875, -7.5963134765625, -7.262939453125, -6.9295654296875, -6.59619140625, -6.2628173828125, -5.929443359375, -5.5960693359375, -5.2626953125, -4.9293212890625, -4.595947265625, -4.2625732421875, -3.92919921875, -3.5958251953125, -3.262451171875, -2.9290771484375, -2.595703125, -2.2623291015625, -1.928955078125, -1.5955810546875, -1.26220703125, -0.9288330078125, -0.595458984375, -0.2620849609375, 0.0712890625, 0.4046630859375, 0.738037109375, 1.0714111328125, 1.40478515625, 1.7381591796875, 2.071533203125, 2.4049072265625, 2.73828125, 3.0716552734375, 3.405029296875, 3.7384033203125, 4.07177734375, 4.4051513671875, 4.738525390625, 5.0718994140625, 5.4052734375, 5.7386474609375, 6.072021484375, 6.4053955078125, 6.73876953125, 7.0721435546875, 7.405517578125, 7.7388916015625, 8.072265625, 8.4056396484375, 8.739013671875, 9.0723876953125, 9.40576171875, 9.7391357421875, 10.072509765625, 10.4058837890625, 10.7392578125, 11.0726318359375, 11.406005859375, 11.7393798828125, 12.07275390625, 12.4061279296875, 12.739501953125, 13.0728759765625, 13.40625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 6.0, 8.0, 21.0, 31.0, 81.0, 138.0, 230.0, 227.0, 152.0, 59.0, 22.0, 11.0, 6.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-141.0215301513672, -137.81118774414062, -134.600830078125, -131.39048767089844, -128.1801300048828, -124.96978759765625, -121.75943756103516, -118.54908752441406, -115.33873748779297, -112.12838745117188, -108.91803741455078, -105.70768737792969, -102.49734497070312, -99.28699493408203, -96.07664489746094, -92.86629486083984, -89.65594482421875, -86.44559478759766, -83.23524475097656, -80.02490234375, -76.8145523071289, -73.60420227050781, -70.39385223388672, -67.18350219726562, -63.97315979003906, -60.76280975341797, -57.55246353149414, -54.34211349487305, -51.13176345825195, -47.921417236328125, -44.71106719970703, -41.50071716308594, -38.290367126464844, -35.08001708984375, -31.86966896057129, -28.659320831298828, -25.448970794677734, -22.238622665405273, -19.028274536132812, -15.817924499511719, -12.607576370239258, -9.39722728729248, -6.186878681182861, -2.976530075073242, 0.23381900787353516, 3.4441680908203125, 6.654516220092773, 9.864866256713867, 13.075214385986328, 16.28556251525879, 19.495912551879883, 22.706260681152344, 25.916610717773438, 29.1269588470459, 32.33730697631836, 35.54765701293945, 38.75800323486328, 41.968353271484375, 45.1786994934082, 48.3890495300293, 51.59939956665039, 54.80974578857422, 58.02009582519531, 61.230445861816406, 64.4407958984375]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 8.0, 8.0, 9.0, 24.0, 25.0, 41.0, 46.0, 57.0, 76.0, 92.0, 81.0, 93.0, 97.0, 75.0, 75.0, 56.0, 54.0, 27.0, 29.0, 13.0, 12.0, 7.0, 4.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.31664276123047, -71.4379653930664, -69.55928039550781, -67.68060302734375, -65.80192565917969, -63.923240661621094, -62.04456329345703, -60.1658821105957, -58.287200927734375, -56.40851974487305, -54.529842376708984, -52.651161193847656, -50.77248001098633, -48.893798828125, -47.01512145996094, -45.13644027709961, -43.25775909423828, -41.37907791137695, -39.50040054321289, -37.62171936035156, -35.743038177490234, -33.864356994628906, -31.985679626464844, -30.106998443603516, -28.228321075439453, -26.349641799926758, -24.47096061706543, -22.592281341552734, -20.713600158691406, -18.83492088317871, -16.956241607666016, -15.077560424804688, -13.19887924194336, -11.320199012756348, -9.441518783569336, -7.562839031219482, -5.684158802032471, -3.805479049682617, -1.9267988204956055, -0.04811859130859375, 1.830561637878418, 3.7092418670654297, 5.587922096252441, 7.466601848602295, 9.345281600952148, 11.22396183013916, 13.102642059326172, 14.981322288513184, 16.860002517700195, 18.73868179321289, 20.61736297607422, 22.496042251586914, 24.374723434448242, 26.253402709960938, 28.132083892822266, 30.01076316833496, 31.889442443847656, 33.768123626708984, 35.64680099487305, 37.525482177734375, 39.4041633605957, 41.28284454345703, 43.161521911621094, 45.04020309448242, 46.91888427734375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 6.0, 5.0, 18.0, 4.0, 25.0, 21.0, 35.0, 41.0, 61.0, 96.0, 136.0, 210.0, 408.0, 705.0, 1406.0, 3004.0, 7098.0, 18265.0, 51425.0, 151955.0, 385561.0, 279027.0, 94863.0, 32555.0, 12178.0, 4918.0, 2152.0, 1015.0, 537.0, 290.0, 176.0, 117.0, 73.0, 41.0, 44.0, 21.0, 19.0, 13.0, 8.0, 11.0, 6.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.27734375, -5.08740234375, -4.8974609375, -4.70751953125, -4.517578125, -4.32763671875, -4.1376953125, -3.94775390625, -3.7578125, -3.56787109375, -3.3779296875, -3.18798828125, -2.998046875, -2.80810546875, -2.6181640625, -2.42822265625, -2.23828125, -2.04833984375, -1.8583984375, -1.66845703125, -1.478515625, -1.28857421875, -1.0986328125, -0.90869140625, -0.71875, -0.52880859375, -0.3388671875, -0.14892578125, 0.041015625, 0.23095703125, 0.4208984375, 0.61083984375, 0.80078125, 0.99072265625, 1.1806640625, 1.37060546875, 1.560546875, 1.75048828125, 1.9404296875, 2.13037109375, 2.3203125, 2.51025390625, 2.7001953125, 2.89013671875, 3.080078125, 3.27001953125, 3.4599609375, 3.64990234375, 3.83984375, 4.02978515625, 4.2197265625, 4.40966796875, 4.599609375, 4.78955078125, 4.9794921875, 5.16943359375, 5.359375, 5.54931640625, 5.7392578125, 5.92919921875, 6.119140625, 6.30908203125, 6.4990234375, 6.68896484375, 6.87890625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 4.0, 1.0, 3.0, 3.0, 6.0, 3.0, 7.0, 7.0, 8.0, 12.0, 14.0, 12.0, 18.0, 16.0, 24.0, 28.0, 25.0, 38.0, 33.0, 26.0, 42.0, 48.0, 44.0, 52.0, 46.0, 49.0, 43.0, 56.0, 44.0, 36.0, 25.0, 27.0, 31.0, 29.0, 24.0, 20.0, 26.0, 11.0, 14.0, 12.0, 9.0, 5.0, 9.0, 4.0, 3.0, 4.0, 1.0, 3.0, 0.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.765625, -2.677703857421875, -2.58978271484375, -2.501861572265625, -2.4139404296875, -2.326019287109375, -2.23809814453125, -2.150177001953125, -2.062255859375, -1.974334716796875, -1.88641357421875, -1.798492431640625, -1.7105712890625, -1.622650146484375, -1.53472900390625, -1.446807861328125, -1.35888671875, -1.270965576171875, -1.18304443359375, -1.095123291015625, -1.0072021484375, -0.919281005859375, -0.83135986328125, -0.743438720703125, -0.655517578125, -0.567596435546875, -0.47967529296875, -0.391754150390625, -0.3038330078125, -0.215911865234375, -0.12799072265625, -0.040069580078125, 0.0478515625, 0.135772705078125, 0.22369384765625, 0.311614990234375, 0.3995361328125, 0.487457275390625, 0.57537841796875, 0.663299560546875, 0.751220703125, 0.839141845703125, 0.92706298828125, 1.014984130859375, 1.1029052734375, 1.190826416015625, 1.27874755859375, 1.366668701171875, 1.45458984375, 1.542510986328125, 1.63043212890625, 1.718353271484375, 1.8062744140625, 1.894195556640625, 1.98211669921875, 2.070037841796875, 2.157958984375, 2.245880126953125, 2.33380126953125, 2.421722412109375, 2.5096435546875, 2.597564697265625, 2.68548583984375, 2.773406982421875, 2.861328125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 5.0, 6.0, 5.0, 5.0, 11.0, 18.0, 21.0, 41.0, 63.0, 78.0, 75.0, 143.0, 234.0, 400.0, 786.0, 1801.0, 5094.0, 22990.0, 262390.0, 699722.0, 42592.0, 7410.0, 2346.0, 1026.0, 478.0, 266.0, 166.0, 94.0, 79.0, 53.0, 40.0, 35.0, 20.0, 15.0, 12.0, 10.0, 5.0, 4.0, 3.0, 5.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-15.2265625, -14.7215576171875, -14.216552734375, -13.7115478515625, -13.20654296875, -12.7015380859375, -12.196533203125, -11.6915283203125, -11.1865234375, -10.6815185546875, -10.176513671875, -9.6715087890625, -9.16650390625, -8.6614990234375, -8.156494140625, -7.6514892578125, -7.146484375, -6.6414794921875, -6.136474609375, -5.6314697265625, -5.12646484375, -4.6214599609375, -4.116455078125, -3.6114501953125, -3.1064453125, -2.6014404296875, -2.096435546875, -1.5914306640625, -1.08642578125, -0.5814208984375, -0.076416015625, 0.4285888671875, 0.93359375, 1.4385986328125, 1.943603515625, 2.4486083984375, 2.95361328125, 3.4586181640625, 3.963623046875, 4.4686279296875, 4.9736328125, 5.4786376953125, 5.983642578125, 6.4886474609375, 6.99365234375, 7.4986572265625, 8.003662109375, 8.5086669921875, 9.013671875, 9.5186767578125, 10.023681640625, 10.5286865234375, 11.03369140625, 11.5386962890625, 12.043701171875, 12.5487060546875, 13.0537109375, 13.5587158203125, 14.063720703125, 14.5687255859375, 15.07373046875, 15.5787353515625, 16.083740234375, 16.5887451171875, 17.09375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 4.0, 0.0, 3.0, 3.0, 4.0, 5.0, 8.0, 5.0, 8.0, 12.0, 16.0, 15.0, 29.0, 15.0, 22.0, 30.0, 25.0, 34.0, 41.0, 45.0, 42.0, 55.0, 52.0, 47.0, 45.0, 46.0, 41.0, 39.0, 40.0, 44.0, 43.0, 23.0, 32.0, 24.0, 19.0, 15.0, 19.0, 13.0, 10.0, 8.0, 10.0, 7.0, 6.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.4453125, -10.0689697265625, -9.692626953125, -9.3162841796875, -8.93994140625, -8.5635986328125, -8.187255859375, -7.8109130859375, -7.4345703125, -7.0582275390625, -6.681884765625, -6.3055419921875, -5.92919921875, -5.5528564453125, -5.176513671875, -4.8001708984375, -4.423828125, -4.0474853515625, -3.671142578125, -3.2947998046875, -2.91845703125, -2.5421142578125, -2.165771484375, -1.7894287109375, -1.4130859375, -1.0367431640625, -0.660400390625, -0.2840576171875, 0.09228515625, 0.4686279296875, 0.844970703125, 1.2213134765625, 1.59765625, 1.9739990234375, 2.350341796875, 2.7266845703125, 3.10302734375, 3.4793701171875, 3.855712890625, 4.2320556640625, 4.6083984375, 4.9847412109375, 5.361083984375, 5.7374267578125, 6.11376953125, 6.4901123046875, 6.866455078125, 7.2427978515625, 7.619140625, 7.9954833984375, 8.371826171875, 8.7481689453125, 9.12451171875, 9.5008544921875, 9.877197265625, 10.2535400390625, 10.6298828125, 11.0062255859375, 11.382568359375, 11.7589111328125, 12.13525390625, 12.5115966796875, 12.887939453125, 13.2642822265625, 13.640625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 4.0, 4.0, 4.0, 11.0, 14.0, 9.0, 13.0, 28.0, 38.0, 54.0, 101.0, 127.0, 206.0, 331.0, 644.0, 1649.0, 5197.0, 21656.0, 125957.0, 778997.0, 89913.0, 16582.0, 4204.0, 1409.0, 599.0, 291.0, 180.0, 100.0, 75.0, 39.0, 35.0, 32.0, 17.0, 7.0, 6.0, 8.0, 4.0, 6.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4609375, -5.25421142578125, -5.0474853515625, -4.84075927734375, -4.634033203125, -4.42730712890625, -4.2205810546875, -4.01385498046875, -3.80712890625, -3.60040283203125, -3.3936767578125, -3.18695068359375, -2.980224609375, -2.77349853515625, -2.5667724609375, -2.36004638671875, -2.1533203125, -1.94659423828125, -1.7398681640625, -1.53314208984375, -1.326416015625, -1.11968994140625, -0.9129638671875, -0.70623779296875, -0.49951171875, -0.29278564453125, -0.0860595703125, 0.12066650390625, 0.327392578125, 0.53411865234375, 0.7408447265625, 0.94757080078125, 1.154296875, 1.36102294921875, 1.5677490234375, 1.77447509765625, 1.981201171875, 2.18792724609375, 2.3946533203125, 2.60137939453125, 2.80810546875, 3.01483154296875, 3.2215576171875, 3.42828369140625, 3.635009765625, 3.84173583984375, 4.0484619140625, 4.25518798828125, 4.4619140625, 4.66864013671875, 4.8753662109375, 5.08209228515625, 5.288818359375, 5.49554443359375, 5.7022705078125, 5.90899658203125, 6.11572265625, 6.32244873046875, 6.5291748046875, 6.73590087890625, 6.942626953125, 7.14935302734375, 7.3560791015625, 7.56280517578125, 7.76953125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 7.0, 5.0, 9.0, 6.0, 13.0, 18.0, 30.0, 30.0, 56.0, 82.0, 161.0, 234.0, 116.0, 64.0, 30.0, 39.0, 27.0, 17.0, 11.0, 8.0, 11.0, 7.0, 2.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020313262939453125, -0.001968294382095337, -0.0019052624702453613, -0.0018422305583953857, -0.0017791986465454102, -0.0017161667346954346, -0.001653134822845459, -0.0015901029109954834, -0.0015270709991455078, -0.0014640390872955322, -0.0014010071754455566, -0.001337975263595581, -0.0012749433517456055, -0.0012119114398956299, -0.0011488795280456543, -0.0010858476161956787, -0.0010228157043457031, -0.0009597837924957275, -0.000896751880645752, -0.0008337199687957764, -0.0007706880569458008, -0.0007076561450958252, -0.0006446242332458496, -0.000581592321395874, -0.0005185604095458984, -0.00045552849769592285, -0.00039249658584594727, -0.0003294646739959717, -0.0002664327621459961, -0.0002034008502960205, -0.00014036893844604492, -7.733702659606934e-05, -1.430511474609375e-05, 4.8726797103881836e-05, 0.00011175870895385742, 0.000174790620803833, 0.0002378225326538086, 0.0003008544445037842, 0.00036388635635375977, 0.00042691826820373535, 0.0004899501800537109, 0.0005529820919036865, 0.0006160140037536621, 0.0006790459156036377, 0.0007420778274536133, 0.0008051097393035889, 0.0008681416511535645, 0.00093117356300354, 0.0009942054748535156, 0.0010572373867034912, 0.0011202692985534668, 0.0011833012104034424, 0.001246333122253418, 0.0013093650341033936, 0.0013723969459533691, 0.0014354288578033447, 0.0014984607696533203, 0.001561492681503296, 0.0016245245933532715, 0.001687556505203247, 0.0017505884170532227, 0.0018136203289031982, 0.0018766522407531738, 0.0019396841526031494, 0.002002716064453125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 1.0, 7.0, 5.0, 8.0, 8.0, 12.0, 20.0, 33.0, 33.0, 62.0, 69.0, 99.0, 163.0, 238.0, 342.0, 516.0, 890.0, 1884.0, 4569.0, 13609.0, 46619.0, 249356.0, 622222.0, 75506.0, 20171.0, 6614.0, 2503.0, 1236.0, 588.0, 360.0, 250.0, 179.0, 111.0, 81.0, 66.0, 34.0, 23.0, 20.0, 16.0, 4.0, 10.0, 0.0, 2.0, 4.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.765625, -4.61273193359375, -4.4598388671875, -4.30694580078125, -4.154052734375, -4.00115966796875, -3.8482666015625, -3.69537353515625, -3.54248046875, -3.38958740234375, -3.2366943359375, -3.08380126953125, -2.930908203125, -2.77801513671875, -2.6251220703125, -2.47222900390625, -2.3193359375, -2.16644287109375, -2.0135498046875, -1.86065673828125, -1.707763671875, -1.55487060546875, -1.4019775390625, -1.24908447265625, -1.09619140625, -0.94329833984375, -0.7904052734375, -0.63751220703125, -0.484619140625, -0.33172607421875, -0.1788330078125, -0.02593994140625, 0.126953125, 0.27984619140625, 0.4327392578125, 0.58563232421875, 0.738525390625, 0.89141845703125, 1.0443115234375, 1.19720458984375, 1.35009765625, 1.50299072265625, 1.6558837890625, 1.80877685546875, 1.961669921875, 2.11456298828125, 2.2674560546875, 2.42034912109375, 2.5732421875, 2.72613525390625, 2.8790283203125, 3.03192138671875, 3.184814453125, 3.33770751953125, 3.4906005859375, 3.64349365234375, 3.79638671875, 3.94927978515625, 4.1021728515625, 4.25506591796875, 4.407958984375, 4.56085205078125, 4.7137451171875, 4.86663818359375, 5.01953125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 1.0, 3.0, 2.0, 6.0, 4.0, 4.0, 5.0, 11.0, 11.0, 20.0, 21.0, 16.0, 20.0, 30.0, 34.0, 49.0, 45.0, 49.0, 77.0, 95.0, 96.0, 79.0, 65.0, 50.0, 43.0, 28.0, 28.0, 19.0, 15.0, 5.0, 16.0, 9.0, 5.0, 7.0, 5.0, 7.0, 4.0, 3.0, 0.0, 0.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 3.0], "bins": [-3.47265625, -3.360565185546875, -3.24847412109375, -3.136383056640625, -3.0242919921875, -2.912200927734375, -2.80010986328125, -2.688018798828125, -2.575927734375, -2.463836669921875, -2.35174560546875, -2.239654541015625, -2.1275634765625, -2.015472412109375, -1.90338134765625, -1.791290283203125, -1.67919921875, -1.567108154296875, -1.45501708984375, -1.342926025390625, -1.2308349609375, -1.118743896484375, -1.00665283203125, -0.894561767578125, -0.782470703125, -0.670379638671875, -0.55828857421875, -0.446197509765625, -0.3341064453125, -0.222015380859375, -0.10992431640625, 0.002166748046875, 0.1142578125, 0.226348876953125, 0.33843994140625, 0.450531005859375, 0.5626220703125, 0.674713134765625, 0.78680419921875, 0.898895263671875, 1.010986328125, 1.123077392578125, 1.23516845703125, 1.347259521484375, 1.4593505859375, 1.571441650390625, 1.68353271484375, 1.795623779296875, 1.90771484375, 2.019805908203125, 2.13189697265625, 2.243988037109375, 2.3560791015625, 2.468170166015625, 2.58026123046875, 2.692352294921875, 2.804443359375, 2.916534423828125, 3.02862548828125, 3.140716552734375, 3.2528076171875, 3.364898681640625, 3.47698974609375, 3.589080810546875, 3.701171875]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 4.0, 6.0, 14.0, 17.0, 54.0, 126.0, 263.0, 263.0, 127.0, 59.0, 20.0, 18.0, 10.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-123.2546615600586, -119.6417236328125, -116.02877807617188, -112.41583251953125, -108.80289459228516, -105.18995666503906, -101.57701110839844, -97.96406555175781, -94.35112762451172, -90.73818969726562, -87.125244140625, -83.51229858398438, -79.89936065673828, -76.28642272949219, -72.67347717285156, -69.06053161621094, -65.44759368896484, -61.834651947021484, -58.221710205078125, -54.608768463134766, -50.995826721191406, -47.38288497924805, -43.76994323730469, -40.15700149536133, -36.54405975341797, -32.93111801147461, -29.31817626953125, -25.70523452758789, -22.09229278564453, -18.479351043701172, -14.866409301757812, -11.253467559814453, -7.640525817871094, -4.027584075927734, -0.414642333984375, 3.1982994079589844, 6.811241149902344, 10.424182891845703, 14.037124633789062, 17.650066375732422, 21.26300811767578, 24.87594985961914, 28.4888916015625, 32.10183334350586, 35.71477508544922, 39.32771682739258, 42.94065856933594, 46.5536003112793, 50.166542053222656, 53.779483795166016, 57.392425537109375, 61.005367279052734, 64.6183090209961, 68.23124694824219, 71.84419250488281, 75.45713806152344, 79.07007598876953, 82.68301391601562, 86.29595947265625, 89.90890502929688, 93.52184295654297, 97.13478088378906, 100.74772644042969, 104.36067199707031, 107.9736099243164]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 0.0, 3.0, 1.0, 8.0, 4.0, 2.0, 1.0, 8.0, 12.0, 13.0, 12.0, 10.0, 14.0, 19.0, 15.0, 18.0, 31.0, 31.0, 29.0, 42.0, 34.0, 45.0, 59.0, 63.0, 53.0, 64.0, 69.0, 42.0, 42.0, 32.0, 24.0, 23.0, 27.0, 21.0, 28.0, 15.0, 13.0, 18.0, 15.0, 11.0, 6.0, 9.0, 6.0, 2.0, 8.0, 5.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-43.525146484375, -42.01411819458008, -40.503089904785156, -38.992061614990234, -37.48103332519531, -35.970001220703125, -34.4589729309082, -32.94794464111328, -31.43691635131836, -29.925888061523438, -28.414859771728516, -26.90382957458496, -25.39280128479004, -23.881772994995117, -22.370742797851562, -20.85971450805664, -19.34868621826172, -17.837657928466797, -16.326629638671875, -14.81559944152832, -13.304571151733398, -11.793542861938477, -10.282513618469238, -8.771484375, -7.260456085205078, -5.749427318572998, -4.238398551940918, -2.727369785308838, -1.2163410186767578, 0.29468774795532227, 1.8057165145874023, 3.3167457580566406, 4.8277740478515625, 6.338802814483643, 7.849831581115723, 9.360860824584961, 10.871889114379883, 12.382917404174805, 13.893946647644043, 15.404975891113281, 16.916004180908203, 18.427032470703125, 19.938060760498047, 21.4490909576416, 22.960119247436523, 24.471147537231445, 25.982177734375, 27.493206024169922, 29.004234313964844, 30.515262603759766, 32.02629089355469, 33.53731918334961, 35.04834747314453, 36.55937957763672, 38.07040786743164, 39.58143615722656, 41.092464447021484, 42.603492736816406, 44.11452102661133, 45.62554931640625, 47.13658142089844, 48.64760971069336, 50.15863800048828, 51.6696662902832, 53.180694580078125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 7.0, 13.0, 16.0, 18.0, 31.0, 33.0, 67.0, 98.0, 161.0, 230.0, 477.0, 918.0, 1828.0, 4594.0, 13422.0, 59088.0, 698442.0, 3020474.0, 341547.0, 37277.0, 9252.0, 3221.0, 1374.0, 689.0, 323.0, 227.0, 159.0, 84.0, 62.0, 42.0, 32.0, 15.0, 14.0, 9.0, 11.0, 4.0, 5.0, 2.0, 2.0, 1.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0], "bins": [-6.58203125, -6.39056396484375, -6.1990966796875, -6.00762939453125, -5.816162109375, -5.62469482421875, -5.4332275390625, -5.24176025390625, -5.05029296875, -4.85882568359375, -4.6673583984375, -4.47589111328125, -4.284423828125, -4.09295654296875, -3.9014892578125, -3.71002197265625, -3.5185546875, -3.32708740234375, -3.1356201171875, -2.94415283203125, -2.752685546875, -2.56121826171875, -2.3697509765625, -2.17828369140625, -1.98681640625, -1.79534912109375, -1.6038818359375, -1.41241455078125, -1.220947265625, -1.02947998046875, -0.8380126953125, -0.64654541015625, -0.455078125, -0.26361083984375, -0.0721435546875, 0.11932373046875, 0.310791015625, 0.50225830078125, 0.6937255859375, 0.88519287109375, 1.07666015625, 1.26812744140625, 1.4595947265625, 1.65106201171875, 1.842529296875, 2.03399658203125, 2.2254638671875, 2.41693115234375, 2.6083984375, 2.79986572265625, 2.9913330078125, 3.18280029296875, 3.374267578125, 3.56573486328125, 3.7572021484375, 3.94866943359375, 4.14013671875, 4.33160400390625, 4.5230712890625, 4.71453857421875, 4.906005859375, 5.09747314453125, 5.2889404296875, 5.48040771484375, 5.671875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 6.0, 3.0, 4.0, 4.0, 11.0, 11.0, 30.0, 21.0, 28.0, 50.0, 56.0, 49.0, 57.0, 66.0, 64.0, 66.0, 74.0, 66.0, 68.0, 61.0, 49.0, 38.0, 29.0, 27.0, 21.0, 16.0, 14.0, 9.0, 7.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.498046875, -2.363677978515625, -2.22930908203125, -2.094940185546875, -1.9605712890625, -1.826202392578125, -1.69183349609375, -1.557464599609375, -1.423095703125, -1.288726806640625, -1.15435791015625, -1.019989013671875, -0.8856201171875, -0.751251220703125, -0.61688232421875, -0.482513427734375, -0.34814453125, -0.213775634765625, -0.07940673828125, 0.054962158203125, 0.1893310546875, 0.323699951171875, 0.45806884765625, 0.592437744140625, 0.726806640625, 0.861175537109375, 0.99554443359375, 1.129913330078125, 1.2642822265625, 1.398651123046875, 1.53302001953125, 1.667388916015625, 1.8017578125, 1.936126708984375, 2.07049560546875, 2.204864501953125, 2.3392333984375, 2.473602294921875, 2.60797119140625, 2.742340087890625, 2.876708984375, 3.011077880859375, 3.14544677734375, 3.279815673828125, 3.4141845703125, 3.548553466796875, 3.68292236328125, 3.817291259765625, 3.95166015625, 4.086029052734375, 4.22039794921875, 4.354766845703125, 4.4891357421875, 4.623504638671875, 4.75787353515625, 4.892242431640625, 5.026611328125, 5.160980224609375, 5.29534912109375, 5.429718017578125, 5.5640869140625, 5.698455810546875, 5.83282470703125, 5.967193603515625, 6.1015625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 5.0, 6.0, 8.0, 11.0, 15.0, 27.0, 47.0, 81.0, 133.0, 294.0, 610.0, 1349.0, 3511.0, 16487.0, 271368.0, 3771930.0, 112049.0, 10959.0, 2904.0, 1221.0, 587.0, 282.0, 191.0, 86.0, 42.0, 27.0, 16.0, 14.0, 6.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-14.8515625, -14.443359375, -14.03515625, -13.626953125, -13.21875, -12.810546875, -12.40234375, -11.994140625, -11.5859375, -11.177734375, -10.76953125, -10.361328125, -9.953125, -9.544921875, -9.13671875, -8.728515625, -8.3203125, -7.912109375, -7.50390625, -7.095703125, -6.6875, -6.279296875, -5.87109375, -5.462890625, -5.0546875, -4.646484375, -4.23828125, -3.830078125, -3.421875, -3.013671875, -2.60546875, -2.197265625, -1.7890625, -1.380859375, -0.97265625, -0.564453125, -0.15625, 0.251953125, 0.66015625, 1.068359375, 1.4765625, 1.884765625, 2.29296875, 2.701171875, 3.109375, 3.517578125, 3.92578125, 4.333984375, 4.7421875, 5.150390625, 5.55859375, 5.966796875, 6.375, 6.783203125, 7.19140625, 7.599609375, 8.0078125, 8.416015625, 8.82421875, 9.232421875, 9.640625, 10.048828125, 10.45703125, 10.865234375, 11.2734375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 8.0, 5.0, 8.0, 14.0, 15.0, 23.0, 40.0, 85.0, 155.0, 333.0, 639.0, 1066.0, 797.0, 402.0, 219.0, 104.0, 63.0, 31.0, 17.0, 19.0, 11.0, 9.0, 3.0, 0.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-9.765625, -9.436767578125, -9.10791015625, -8.779052734375, -8.4501953125, -8.121337890625, -7.79248046875, -7.463623046875, -7.134765625, -6.805908203125, -6.47705078125, -6.148193359375, -5.8193359375, -5.490478515625, -5.16162109375, -4.832763671875, -4.50390625, -4.175048828125, -3.84619140625, -3.517333984375, -3.1884765625, -2.859619140625, -2.53076171875, -2.201904296875, -1.873046875, -1.544189453125, -1.21533203125, -0.886474609375, -0.5576171875, -0.228759765625, 0.10009765625, 0.428955078125, 0.7578125, 1.086669921875, 1.41552734375, 1.744384765625, 2.0732421875, 2.402099609375, 2.73095703125, 3.059814453125, 3.388671875, 3.717529296875, 4.04638671875, 4.375244140625, 4.7041015625, 5.032958984375, 5.36181640625, 5.690673828125, 6.01953125, 6.348388671875, 6.67724609375, 7.006103515625, 7.3349609375, 7.663818359375, 7.99267578125, 8.321533203125, 8.650390625, 8.979248046875, 9.30810546875, 9.636962890625, 9.9658203125, 10.294677734375, 10.62353515625, 10.952392578125, 11.28125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 16.0, 41.0, 182.0, 343.0, 286.0, 86.0, 21.0, 9.0, 4.0, 3.0, 4.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-192.53707885742188, -187.4213409423828, -182.3055877685547, -177.18984985351562, -172.0740966796875, -166.95835876464844, -161.84262084960938, -156.72686767578125, -151.6111297607422, -146.49539184570312, -141.379638671875, -136.26390075683594, -131.14816284179688, -126.03240966796875, -120.91667175292969, -115.8009262084961, -110.6851806640625, -105.5694351196289, -100.45368957519531, -95.33795166015625, -90.22220611572266, -85.10646057128906, -79.99072265625, -74.8749771118164, -69.75923156738281, -64.64348602294922, -59.52774429321289, -54.41200256347656, -49.29625701904297, -44.180511474609375, -39.06476974487305, -33.94902801513672, -28.833267211914062, -23.7175235748291, -18.60177993774414, -13.48603630065918, -8.370292663574219, -3.254549026489258, 1.8611946105957031, 6.976936340332031, 12.092681884765625, 17.208425521850586, 22.324169158935547, 27.439912796020508, 32.55565643310547, 37.67140197753906, 42.78714370727539, 47.90288543701172, 53.01863098144531, 58.134376525878906, 63.250118255615234, 68.36585998535156, 73.48160552978516, 78.59735107421875, 83.71308898925781, 88.8288345336914, 93.944580078125, 99.0603256225586, 104.17607116699219, 109.29180908203125, 114.40755462646484, 119.52330017089844, 124.6390380859375, 129.75479125976562, 134.8705291748047]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 9.0, 10.0, 18.0, 20.0, 26.0, 33.0, 35.0, 38.0, 48.0, 65.0, 72.0, 78.0, 83.0, 69.0, 63.0, 71.0, 59.0, 52.0, 49.0, 34.0, 21.0, 16.0, 16.0, 7.0, 8.0, 4.0, 1.0, 5.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.65948486328125, -29.259729385375977, -27.859973907470703, -26.460220336914062, -25.06046485900879, -23.660709381103516, -22.260953903198242, -20.86119842529297, -19.461444854736328, -18.061689376831055, -16.66193389892578, -15.262179374694824, -13.862424850463867, -12.462669372558594, -11.06291389465332, -9.663159370422363, -8.263402938842773, -6.863647937774658, -5.463892936706543, -4.0641374588012695, -2.6643824577331543, -1.264627456665039, 0.13512802124023438, 1.5348825454711914, 2.934638023376465, 4.33439302444458, 5.734148025512695, 7.133903503417969, 8.533658981323242, 9.9334135055542, 11.333168983459473, 12.73292350769043, 14.132678985595703, 15.532434463500977, 16.93218994140625, 18.33194351196289, 19.731698989868164, 21.131454467773438, 22.53120994567871, 23.930965423583984, 25.330718994140625, 26.7304744720459, 28.130229949951172, 29.529983520507812, 30.929738998413086, 32.32949447631836, 33.729248046875, 35.129005432128906, 36.52876281738281, 37.92851638793945, 39.32827377319336, 40.72802734375, 42.127784729003906, 43.52753829956055, 44.92729187011719, 46.327049255371094, 47.726802825927734, 49.126556396484375, 50.52631378173828, 51.92606735229492, 53.32582473754883, 54.72557830810547, 56.125335693359375, 57.525089263916016, 58.924842834472656]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 7.0, 3.0, 9.0, 9.0, 24.0, 26.0, 54.0, 80.0, 135.0, 260.0, 663.0, 1928.0, 7149.0, 37819.0, 265645.0, 593287.0, 116801.0, 18444.0, 3920.0, 1275.0, 480.0, 234.0, 119.0, 73.0, 43.0, 28.0, 13.0, 11.0, 6.0, 6.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6640625, -10.3338623046875, -10.003662109375, -9.6734619140625, -9.34326171875, -9.0130615234375, -8.682861328125, -8.3526611328125, -8.0224609375, -7.6922607421875, -7.362060546875, -7.0318603515625, -6.70166015625, -6.3714599609375, -6.041259765625, -5.7110595703125, -5.380859375, -5.0506591796875, -4.720458984375, -4.3902587890625, -4.06005859375, -3.7298583984375, -3.399658203125, -3.0694580078125, -2.7392578125, -2.4090576171875, -2.078857421875, -1.7486572265625, -1.41845703125, -1.0882568359375, -0.758056640625, -0.4278564453125, -0.09765625, 0.2325439453125, 0.562744140625, 0.8929443359375, 1.22314453125, 1.5533447265625, 1.883544921875, 2.2137451171875, 2.5439453125, 2.8741455078125, 3.204345703125, 3.5345458984375, 3.86474609375, 4.1949462890625, 4.525146484375, 4.8553466796875, 5.185546875, 5.5157470703125, 5.845947265625, 6.1761474609375, 6.50634765625, 6.8365478515625, 7.166748046875, 7.4969482421875, 7.8271484375, 8.1573486328125, 8.487548828125, 8.8177490234375, 9.14794921875, 9.4781494140625, 9.808349609375, 10.1385498046875, 10.46875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 7.0, 5.0, 18.0, 17.0, 22.0, 36.0, 41.0, 53.0, 53.0, 69.0, 81.0, 81.0, 81.0, 74.0, 69.0, 68.0, 52.0, 43.0, 44.0, 27.0, 22.0, 16.0, 18.0, 6.0, 7.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.384765625, -3.217926025390625, -3.05108642578125, -2.884246826171875, -2.7174072265625, -2.550567626953125, -2.38372802734375, -2.216888427734375, -2.050048828125, -1.883209228515625, -1.71636962890625, -1.549530029296875, -1.3826904296875, -1.215850830078125, -1.04901123046875, -0.882171630859375, -0.71533203125, -0.548492431640625, -0.38165283203125, -0.214813232421875, -0.0479736328125, 0.118865966796875, 0.28570556640625, 0.452545166015625, 0.619384765625, 0.786224365234375, 0.95306396484375, 1.119903564453125, 1.2867431640625, 1.453582763671875, 1.62042236328125, 1.787261962890625, 1.9541015625, 2.120941162109375, 2.28778076171875, 2.454620361328125, 2.6214599609375, 2.788299560546875, 2.95513916015625, 3.121978759765625, 3.288818359375, 3.455657958984375, 3.62249755859375, 3.789337158203125, 3.9561767578125, 4.123016357421875, 4.28985595703125, 4.456695556640625, 4.62353515625, 4.790374755859375, 4.95721435546875, 5.124053955078125, 5.2908935546875, 5.457733154296875, 5.62457275390625, 5.791412353515625, 5.958251953125, 6.125091552734375, 6.29193115234375, 6.458770751953125, 6.6256103515625, 6.792449951171875, 6.95928955078125, 7.126129150390625, 7.29296875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 5.0, 3.0, 11.0, 16.0, 12.0, 19.0, 23.0, 47.0, 57.0, 83.0, 152.0, 230.0, 544.0, 1111.0, 2751.0, 7916.0, 29921.0, 171892.0, 672343.0, 126882.0, 23566.0, 6581.0, 2326.0, 984.0, 454.0, 238.0, 128.0, 84.0, 58.0, 37.0, 26.0, 15.0, 11.0, 9.0, 8.0, 3.0, 6.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.0703125, -8.7816162109375, -8.492919921875, -8.2042236328125, -7.91552734375, -7.6268310546875, -7.338134765625, -7.0494384765625, -6.7607421875, -6.4720458984375, -6.183349609375, -5.8946533203125, -5.60595703125, -5.3172607421875, -5.028564453125, -4.7398681640625, -4.451171875, -4.1624755859375, -3.873779296875, -3.5850830078125, -3.29638671875, -3.0076904296875, -2.718994140625, -2.4302978515625, -2.1416015625, -1.8529052734375, -1.564208984375, -1.2755126953125, -0.98681640625, -0.6981201171875, -0.409423828125, -0.1207275390625, 0.16796875, 0.4566650390625, 0.745361328125, 1.0340576171875, 1.32275390625, 1.6114501953125, 1.900146484375, 2.1888427734375, 2.4775390625, 2.7662353515625, 3.054931640625, 3.3436279296875, 3.63232421875, 3.9210205078125, 4.209716796875, 4.4984130859375, 4.787109375, 5.0758056640625, 5.364501953125, 5.6531982421875, 5.94189453125, 6.2305908203125, 6.519287109375, 6.8079833984375, 7.0966796875, 7.3853759765625, 7.674072265625, 7.9627685546875, 8.25146484375, 8.5401611328125, 8.828857421875, 9.1175537109375, 9.40625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 2.0, 2.0, 3.0, 6.0, 4.0, 10.0, 14.0, 15.0, 13.0, 22.0, 25.0, 28.0, 38.0, 31.0, 44.0, 43.0, 37.0, 42.0, 62.0, 55.0, 50.0, 58.0, 49.0, 42.0, 38.0, 29.0, 40.0, 34.0, 21.0, 27.0, 25.0, 24.0, 15.0, 8.0, 6.0, 9.0, 6.0, 4.0, 4.0, 4.0, 1.0, 6.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.96875, -12.5740966796875, -12.179443359375, -11.7847900390625, -11.39013671875, -10.9954833984375, -10.600830078125, -10.2061767578125, -9.8115234375, -9.4168701171875, -9.022216796875, -8.6275634765625, -8.23291015625, -7.8382568359375, -7.443603515625, -7.0489501953125, -6.654296875, -6.2596435546875, -5.864990234375, -5.4703369140625, -5.07568359375, -4.6810302734375, -4.286376953125, -3.8917236328125, -3.4970703125, -3.1024169921875, -2.707763671875, -2.3131103515625, -1.91845703125, -1.5238037109375, -1.129150390625, -0.7344970703125, -0.33984375, 0.0548095703125, 0.449462890625, 0.8441162109375, 1.23876953125, 1.6334228515625, 2.028076171875, 2.4227294921875, 2.8173828125, 3.2120361328125, 3.606689453125, 4.0013427734375, 4.39599609375, 4.7906494140625, 5.185302734375, 5.5799560546875, 5.974609375, 6.3692626953125, 6.763916015625, 7.1585693359375, 7.55322265625, 7.9478759765625, 8.342529296875, 8.7371826171875, 9.1318359375, 9.5264892578125, 9.921142578125, 10.3157958984375, 10.71044921875, 11.1051025390625, 11.499755859375, 11.8944091796875, 12.2890625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 7.0, 1.0, 10.0, 10.0, 19.0, 24.0, 37.0, 75.0, 137.0, 204.0, 409.0, 812.0, 1552.0, 3434.0, 8215.0, 27099.0, 144869.0, 683105.0, 137752.0, 26276.0, 7939.0, 3397.0, 1517.0, 778.0, 372.0, 207.0, 121.0, 71.0, 41.0, 20.0, 10.0, 12.0, 7.0, 6.0, 2.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.23046875, -3.1170654296875, -3.003662109375, -2.8902587890625, -2.77685546875, -2.6634521484375, -2.550048828125, -2.4366455078125, -2.3232421875, -2.2098388671875, -2.096435546875, -1.9830322265625, -1.86962890625, -1.7562255859375, -1.642822265625, -1.5294189453125, -1.416015625, -1.3026123046875, -1.189208984375, -1.0758056640625, -0.96240234375, -0.8489990234375, -0.735595703125, -0.6221923828125, -0.5087890625, -0.3953857421875, -0.281982421875, -0.1685791015625, -0.05517578125, 0.0582275390625, 0.171630859375, 0.2850341796875, 0.3984375, 0.5118408203125, 0.625244140625, 0.7386474609375, 0.85205078125, 0.9654541015625, 1.078857421875, 1.1922607421875, 1.3056640625, 1.4190673828125, 1.532470703125, 1.6458740234375, 1.75927734375, 1.8726806640625, 1.986083984375, 2.0994873046875, 2.212890625, 2.3262939453125, 2.439697265625, 2.5531005859375, 2.66650390625, 2.7799072265625, 2.893310546875, 3.0067138671875, 3.1201171875, 3.2335205078125, 3.346923828125, 3.4603271484375, 3.57373046875, 3.6871337890625, 3.800537109375, 3.9139404296875, 4.02734375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 6.0, 0.0, 2.0, 8.0, 5.0, 9.0, 15.0, 28.0, 34.0, 45.0, 76.0, 119.0, 150.0, 166.0, 111.0, 73.0, 54.0, 34.0, 18.0, 11.0, 10.0, 6.0, 9.0, 7.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014047622680664062, -0.0013645291328430176, -0.001324295997619629, -0.0012840628623962402, -0.0012438297271728516, -0.0012035965919494629, -0.0011633634567260742, -0.0011231303215026855, -0.0010828971862792969, -0.0010426640510559082, -0.0010024309158325195, -0.0009621977806091309, -0.0009219646453857422, -0.0008817315101623535, -0.0008414983749389648, -0.0008012652397155762, -0.0007610321044921875, -0.0007207989692687988, -0.0006805658340454102, -0.0006403326988220215, -0.0006000995635986328, -0.0005598664283752441, -0.0005196332931518555, -0.0004794001579284668, -0.0004391670227050781, -0.00039893388748168945, -0.0003587007522583008, -0.0003184676170349121, -0.00027823448181152344, -0.00023800134658813477, -0.0001977682113647461, -0.00015753507614135742, -0.00011730194091796875, -7.706880569458008e-05, -3.6835670471191406e-05, 3.3974647521972656e-06, 4.363059997558594e-05, 8.386373519897461e-05, 0.00012409687042236328, 0.00016433000564575195, 0.00020456314086914062, 0.0002447962760925293, 0.00028502941131591797, 0.00032526254653930664, 0.0003654956817626953, 0.000405728816986084, 0.00044596195220947266, 0.00048619508743286133, 0.00052642822265625, 0.0005666613578796387, 0.0006068944931030273, 0.000647127628326416, 0.0006873607635498047, 0.0007275938987731934, 0.000767827033996582, 0.0008080601692199707, 0.0008482933044433594, 0.000888526439666748, 0.0009287595748901367, 0.0009689927101135254, 0.001009225845336914, 0.0010494589805603027, 0.0010896921157836914, 0.00112992525100708, 0.0011701583862304688]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 4.0, 3.0, 6.0, 3.0, 9.0, 12.0, 16.0, 30.0, 29.0, 84.0, 117.0, 224.0, 417.0, 822.0, 1720.0, 4135.0, 10639.0, 36547.0, 178926.0, 636136.0, 134407.0, 28968.0, 8849.0, 3379.0, 1505.0, 735.0, 349.0, 183.0, 113.0, 64.0, 41.0, 24.0, 17.0, 10.0, 8.0, 7.0, 10.0, 4.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3125, -3.203582763671875, -3.09466552734375, -2.985748291015625, -2.8768310546875, -2.767913818359375, -2.65899658203125, -2.550079345703125, -2.441162109375, -2.332244873046875, -2.22332763671875, -2.114410400390625, -2.0054931640625, -1.896575927734375, -1.78765869140625, -1.678741455078125, -1.56982421875, -1.460906982421875, -1.35198974609375, -1.243072509765625, -1.1341552734375, -1.025238037109375, -0.91632080078125, -0.807403564453125, -0.698486328125, -0.589569091796875, -0.48065185546875, -0.371734619140625, -0.2628173828125, -0.153900146484375, -0.04498291015625, 0.063934326171875, 0.1728515625, 0.281768798828125, 0.39068603515625, 0.499603271484375, 0.6085205078125, 0.717437744140625, 0.82635498046875, 0.935272216796875, 1.044189453125, 1.153106689453125, 1.26202392578125, 1.370941162109375, 1.4798583984375, 1.588775634765625, 1.69769287109375, 1.806610107421875, 1.91552734375, 2.024444580078125, 2.13336181640625, 2.242279052734375, 2.3511962890625, 2.460113525390625, 2.56903076171875, 2.677947998046875, 2.786865234375, 2.895782470703125, 3.00469970703125, 3.113616943359375, 3.2225341796875, 3.331451416015625, 3.44036865234375, 3.549285888671875, 3.658203125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 6.0, 5.0, 3.0, 9.0, 9.0, 8.0, 14.0, 24.0, 23.0, 40.0, 32.0, 61.0, 78.0, 76.0, 81.0, 85.0, 76.0, 82.0, 62.0, 55.0, 40.0, 27.0, 34.0, 17.0, 12.0, 9.0, 8.0, 10.0, 4.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.177734375, -3.0760498046875, -2.974365234375, -2.8726806640625, -2.77099609375, -2.6693115234375, -2.567626953125, -2.4659423828125, -2.3642578125, -2.2625732421875, -2.160888671875, -2.0592041015625, -1.95751953125, -1.8558349609375, -1.754150390625, -1.6524658203125, -1.55078125, -1.4490966796875, -1.347412109375, -1.2457275390625, -1.14404296875, -1.0423583984375, -0.940673828125, -0.8389892578125, -0.7373046875, -0.6356201171875, -0.533935546875, -0.4322509765625, -0.33056640625, -0.2288818359375, -0.127197265625, -0.0255126953125, 0.076171875, 0.1778564453125, 0.279541015625, 0.3812255859375, 0.48291015625, 0.5845947265625, 0.686279296875, 0.7879638671875, 0.8896484375, 0.9913330078125, 1.093017578125, 1.1947021484375, 1.29638671875, 1.3980712890625, 1.499755859375, 1.6014404296875, 1.703125, 1.8048095703125, 1.906494140625, 2.0081787109375, 2.10986328125, 2.2115478515625, 2.313232421875, 2.4149169921875, 2.5166015625, 2.6182861328125, 2.719970703125, 2.8216552734375, 2.92333984375, 3.0250244140625, 3.126708984375, 3.2283935546875, 3.330078125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 4.0, 14.0, 27.0, 85.0, 219.0, 428.0, 147.0, 47.0, 18.0, 9.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-164.21112060546875, -159.68402099609375, -155.1569366455078, -150.6298370361328, -146.10275268554688, -141.57565307617188, -137.04856872558594, -132.52146911621094, -127.994384765625, -123.46729278564453, -118.94020080566406, -114.4131088256836, -109.88601684570312, -105.35892486572266, -100.83183288574219, -96.30473327636719, -91.77764129638672, -87.25054931640625, -82.72345733642578, -78.19636535644531, -73.66927337646484, -69.14218139648438, -64.61508178710938, -60.08799362182617, -55.5609016418457, -51.033809661865234, -46.506717681884766, -41.97962188720703, -37.45252990722656, -32.925437927246094, -28.398345947265625, -23.871253967285156, -19.344161987304688, -14.817070007324219, -10.289977073669434, -5.762884140014648, -1.2357921600341797, 3.291299819946289, 7.818393707275391, 12.34548568725586, 16.872577667236328, 21.399669647216797, 25.926761627197266, 30.453855514526367, 34.98094940185547, 39.50804138183594, 44.035133361816406, 48.562225341796875, 53.089317321777344, 57.61640930175781, 62.14350128173828, 66.67059326171875, 71.19768524169922, 75.72477722167969, 80.25187683105469, 84.77896118164062, 89.30606079101562, 93.8331527709961, 98.36024475097656, 102.88733673095703, 107.4144287109375, 111.94152069091797, 116.46861267089844, 120.99571228027344, 125.52279663085938]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 5.0, 6.0, 6.0, 7.0, 11.0, 17.0, 14.0, 34.0, 27.0, 34.0, 35.0, 42.0, 51.0, 66.0, 101.0, 119.0, 83.0, 52.0, 53.0, 43.0, 37.0, 29.0, 29.0, 17.0, 23.0, 20.0, 15.0, 9.0, 11.0, 6.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-84.99681091308594, -82.939697265625, -80.88258361816406, -78.82546997070312, -76.76835632324219, -74.71125030517578, -72.65413665771484, -70.5970230102539, -68.53990936279297, -66.48279571533203, -64.4256820678711, -62.36857223510742, -60.311458587646484, -58.25434494018555, -56.197235107421875, -54.14012145996094, -52.0830078125, -50.02589416503906, -47.968780517578125, -45.91167068481445, -43.854557037353516, -41.79744338989258, -39.740333557128906, -37.68321990966797, -35.62610626220703, -33.568992614746094, -31.51188087463379, -29.454769134521484, -27.397655487060547, -25.34054183959961, -23.283430099487305, -21.226318359375, -19.169200897216797, -17.11208724975586, -15.054975509643555, -12.997862815856934, -10.940750122070312, -8.883637428283691, -6.82652473449707, -4.769412040710449, -2.712299346923828, -0.655186653137207, 1.401926040649414, 3.459038734436035, 5.516151428222656, 7.573264122009277, 9.630376815795898, 11.68748950958252, 13.74460220336914, 15.801714897155762, 17.858827590942383, 19.915939331054688, 21.973052978515625, 24.030166625976562, 26.087278366088867, 28.144390106201172, 30.20150375366211, 32.25861740112305, 34.31572723388672, 36.372840881347656, 38.429954528808594, 40.48706817626953, 42.54418182373047, 44.60129165649414, 46.65840530395508]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 5.0, 13.0, 20.0, 26.0, 33.0, 45.0, 96.0, 165.0, 331.0, 804.0, 2006.0, 7290.0, 44841.0, 1067719.0, 2935887.0, 116864.0, 13012.0, 3117.0, 1095.0, 401.0, 208.0, 116.0, 72.0, 52.0, 24.0, 11.0, 9.0, 4.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.984375, -8.72900390625, -8.4736328125, -8.21826171875, -7.962890625, -7.70751953125, -7.4521484375, -7.19677734375, -6.94140625, -6.68603515625, -6.4306640625, -6.17529296875, -5.919921875, -5.66455078125, -5.4091796875, -5.15380859375, -4.8984375, -4.64306640625, -4.3876953125, -4.13232421875, -3.876953125, -3.62158203125, -3.3662109375, -3.11083984375, -2.85546875, -2.60009765625, -2.3447265625, -2.08935546875, -1.833984375, -1.57861328125, -1.3232421875, -1.06787109375, -0.8125, -0.55712890625, -0.3017578125, -0.04638671875, 0.208984375, 0.46435546875, 0.7197265625, 0.97509765625, 1.23046875, 1.48583984375, 1.7412109375, 1.99658203125, 2.251953125, 2.50732421875, 2.7626953125, 3.01806640625, 3.2734375, 3.52880859375, 3.7841796875, 4.03955078125, 4.294921875, 4.55029296875, 4.8056640625, 5.06103515625, 5.31640625, 5.57177734375, 5.8271484375, 6.08251953125, 6.337890625, 6.59326171875, 6.8486328125, 7.10400390625, 7.359375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 7.0, 1.0, 8.0, 10.0, 9.0, 6.0, 20.0, 27.0, 19.0, 25.0, 29.0, 32.0, 50.0, 55.0, 61.0, 53.0, 63.0, 54.0, 59.0, 55.0, 57.0, 58.0, 48.0, 33.0, 30.0, 27.0, 26.0, 30.0, 19.0, 9.0, 10.0, 8.0, 3.0, 5.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.478515625, -3.356475830078125, -3.23443603515625, -3.112396240234375, -2.9903564453125, -2.868316650390625, -2.74627685546875, -2.624237060546875, -2.502197265625, -2.380157470703125, -2.25811767578125, -2.136077880859375, -2.0140380859375, -1.891998291015625, -1.76995849609375, -1.647918701171875, -1.52587890625, -1.403839111328125, -1.28179931640625, -1.159759521484375, -1.0377197265625, -0.915679931640625, -0.79364013671875, -0.671600341796875, -0.549560546875, -0.427520751953125, -0.30548095703125, -0.183441162109375, -0.0614013671875, 0.060638427734375, 0.18267822265625, 0.304718017578125, 0.4267578125, 0.548797607421875, 0.67083740234375, 0.792877197265625, 0.9149169921875, 1.036956787109375, 1.15899658203125, 1.281036376953125, 1.403076171875, 1.525115966796875, 1.64715576171875, 1.769195556640625, 1.8912353515625, 2.013275146484375, 2.13531494140625, 2.257354736328125, 2.37939453125, 2.501434326171875, 2.62347412109375, 2.745513916015625, 2.8675537109375, 2.989593505859375, 3.11163330078125, 3.233673095703125, 3.355712890625, 3.477752685546875, 3.59979248046875, 3.721832275390625, 3.8438720703125, 3.965911865234375, 4.08795166015625, 4.209991455078125, 4.33203125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 6.0, 3.0, 4.0, 4.0, 8.0, 14.0, 22.0, 35.0, 76.0, 219.0, 640.0, 3555.0, 76061.0, 3985436.0, 122095.0, 4782.0, 842.0, 295.0, 109.0, 49.0, 18.0, 12.0, 6.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-22.5, -21.95849609375, -21.4169921875, -20.87548828125, -20.333984375, -19.79248046875, -19.2509765625, -18.70947265625, -18.16796875, -17.62646484375, -17.0849609375, -16.54345703125, -16.001953125, -15.46044921875, -14.9189453125, -14.37744140625, -13.8359375, -13.29443359375, -12.7529296875, -12.21142578125, -11.669921875, -11.12841796875, -10.5869140625, -10.04541015625, -9.50390625, -8.96240234375, -8.4208984375, -7.87939453125, -7.337890625, -6.79638671875, -6.2548828125, -5.71337890625, -5.171875, -4.63037109375, -4.0888671875, -3.54736328125, -3.005859375, -2.46435546875, -1.9228515625, -1.38134765625, -0.83984375, -0.29833984375, 0.2431640625, 0.78466796875, 1.326171875, 1.86767578125, 2.4091796875, 2.95068359375, 3.4921875, 4.03369140625, 4.5751953125, 5.11669921875, 5.658203125, 6.19970703125, 6.7412109375, 7.28271484375, 7.82421875, 8.36572265625, 8.9072265625, 9.44873046875, 9.990234375, 10.53173828125, 11.0732421875, 11.61474609375, 12.15625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 6.0, 5.0, 15.0, 19.0, 53.0, 53.0, 104.0, 169.0, 279.0, 469.0, 735.0, 823.0, 563.0, 308.0, 169.0, 104.0, 57.0, 40.0, 32.0, 16.0, 14.0, 16.0, 6.0, 7.0, 3.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.015625, -4.753173828125, -4.49072265625, -4.228271484375, -3.9658203125, -3.703369140625, -3.44091796875, -3.178466796875, -2.916015625, -2.653564453125, -2.39111328125, -2.128662109375, -1.8662109375, -1.603759765625, -1.34130859375, -1.078857421875, -0.81640625, -0.553955078125, -0.29150390625, -0.029052734375, 0.2333984375, 0.495849609375, 0.75830078125, 1.020751953125, 1.283203125, 1.545654296875, 1.80810546875, 2.070556640625, 2.3330078125, 2.595458984375, 2.85791015625, 3.120361328125, 3.3828125, 3.645263671875, 3.90771484375, 4.170166015625, 4.4326171875, 4.695068359375, 4.95751953125, 5.219970703125, 5.482421875, 5.744873046875, 6.00732421875, 6.269775390625, 6.5322265625, 6.794677734375, 7.05712890625, 7.319580078125, 7.58203125, 7.844482421875, 8.10693359375, 8.369384765625, 8.6318359375, 8.894287109375, 9.15673828125, 9.419189453125, 9.681640625, 9.944091796875, 10.20654296875, 10.468994140625, 10.7314453125, 10.993896484375, 11.25634765625, 11.518798828125, 11.78125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 41.0, 117.0, 237.0, 260.0, 181.0, 92.0, 39.0, 18.0, 9.0, 3.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-115.1497802734375, -111.68578338623047, -108.22178649902344, -104.75778198242188, -101.29378509521484, -97.82978820800781, -94.36578369140625, -90.90178680419922, -87.43778991699219, -83.97379302978516, -80.50979614257812, -77.04579162597656, -73.58179473876953, -70.1177978515625, -66.65379333496094, -63.189796447753906, -59.725799560546875, -56.261802673339844, -52.79780197143555, -49.33380126953125, -45.86980438232422, -42.40580749511719, -38.94180679321289, -35.477806091308594, -32.01380920410156, -28.5498104095459, -25.085811614990234, -21.62181282043457, -18.157814025878906, -14.693815231323242, -11.229816436767578, -7.765817642211914, -4.30181884765625, -0.8378200531005859, 2.626178741455078, 6.090177536010742, 9.554176330566406, 13.01817512512207, 16.482173919677734, 19.9461727142334, 23.410171508789062, 26.874170303344727, 30.33816909790039, 33.80216979980469, 37.26616668701172, 40.73016357421875, 44.19416427612305, 47.658164978027344, 51.122161865234375, 54.586158752441406, 58.0501594543457, 61.51416015625, 64.97815704345703, 68.44215393066406, 71.90615844726562, 75.37015533447266, 78.83415222167969, 82.29814910888672, 85.76214599609375, 89.22615051269531, 92.69014739990234, 96.15414428710938, 99.61814880371094, 103.08214569091797, 106.546142578125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 7.0, 9.0, 12.0, 8.0, 15.0, 18.0, 21.0, 20.0, 24.0, 35.0, 30.0, 29.0, 58.0, 44.0, 57.0, 61.0, 61.0, 38.0, 38.0, 45.0, 37.0, 47.0, 43.0, 42.0, 36.0, 29.0, 39.0, 17.0, 15.0, 12.0, 18.0, 12.0, 10.0, 4.0, 5.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-39.70735168457031, -38.657447814941406, -37.607540130615234, -36.55763626098633, -35.507728576660156, -34.45782470703125, -33.40791702270508, -32.35801315307617, -31.30810546875, -30.25819969177246, -29.208293914794922, -28.158388137817383, -27.108482360839844, -26.058576583862305, -25.008670806884766, -23.95876693725586, -22.90886116027832, -21.85895538330078, -20.809049606323242, -19.759143829345703, -18.709238052368164, -17.659332275390625, -16.60942840576172, -15.559521675109863, -14.509615898132324, -13.459710121154785, -12.409804344177246, -11.359899520874023, -10.309993743896484, -9.260087966918945, -8.210182189941406, -7.160276412963867, -6.110372543334961, -5.060466766357422, -4.010560989379883, -2.960655689239502, -1.910749912261963, -0.8608441352844238, 0.18906116485595703, 1.238966941833496, 2.288872718811035, 3.338778495788574, 4.388684272766113, 5.438589572906494, 6.488495349884033, 7.538401126861572, 8.588306427001953, 9.638212203979492, 10.688117980957031, 11.73802375793457, 12.78792953491211, 13.837835311889648, 14.887741088867188, 15.937646865844727, 16.987552642822266, 18.037456512451172, 19.087364196777344, 20.137269973754883, 21.187175750732422, 22.23708152770996, 23.2869873046875, 24.33689308166504, 25.386798858642578, 26.436702728271484, 27.486608505249023]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 4.0, 7.0, 8.0, 13.0, 30.0, 39.0, 54.0, 111.0, 215.0, 420.0, 879.0, 1985.0, 4688.0, 13104.0, 42365.0, 171197.0, 513677.0, 220865.0, 53178.0, 15947.0, 5654.0, 2170.0, 936.0, 437.0, 256.0, 127.0, 72.0, 44.0, 24.0, 11.0, 17.0, 7.0, 3.0, 5.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.34375, -6.121826171875, -5.89990234375, -5.677978515625, -5.4560546875, -5.234130859375, -5.01220703125, -4.790283203125, -4.568359375, -4.346435546875, -4.12451171875, -3.902587890625, -3.6806640625, -3.458740234375, -3.23681640625, -3.014892578125, -2.79296875, -2.571044921875, -2.34912109375, -2.127197265625, -1.9052734375, -1.683349609375, -1.46142578125, -1.239501953125, -1.017578125, -0.795654296875, -0.57373046875, -0.351806640625, -0.1298828125, 0.092041015625, 0.31396484375, 0.535888671875, 0.7578125, 0.979736328125, 1.20166015625, 1.423583984375, 1.6455078125, 1.867431640625, 2.08935546875, 2.311279296875, 2.533203125, 2.755126953125, 2.97705078125, 3.198974609375, 3.4208984375, 3.642822265625, 3.86474609375, 4.086669921875, 4.30859375, 4.530517578125, 4.75244140625, 4.974365234375, 5.1962890625, 5.418212890625, 5.64013671875, 5.862060546875, 6.083984375, 6.305908203125, 6.52783203125, 6.749755859375, 6.9716796875, 7.193603515625, 7.41552734375, 7.637451171875, 7.859375]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 11.0, 8.0, 11.0, 16.0, 12.0, 19.0, 27.0, 33.0, 46.0, 45.0, 46.0, 50.0, 53.0, 61.0, 64.0, 58.0, 57.0, 65.0, 50.0, 51.0, 39.0, 34.0, 27.0, 32.0, 26.0, 14.0, 11.0, 14.0, 5.0, 4.0, 6.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.296875, -4.170013427734375, -4.04315185546875, -3.916290283203125, -3.7894287109375, -3.662567138671875, -3.53570556640625, -3.408843994140625, -3.281982421875, -3.155120849609375, -3.02825927734375, -2.901397705078125, -2.7745361328125, -2.647674560546875, -2.52081298828125, -2.393951416015625, -2.26708984375, -2.140228271484375, -2.01336669921875, -1.886505126953125, -1.7596435546875, -1.632781982421875, -1.50592041015625, -1.379058837890625, -1.252197265625, -1.125335693359375, -0.99847412109375, -0.871612548828125, -0.7447509765625, -0.617889404296875, -0.49102783203125, -0.364166259765625, -0.2373046875, -0.110443115234375, 0.01641845703125, 0.143280029296875, 0.2701416015625, 0.397003173828125, 0.52386474609375, 0.650726318359375, 0.777587890625, 0.904449462890625, 1.03131103515625, 1.158172607421875, 1.2850341796875, 1.411895751953125, 1.53875732421875, 1.665618896484375, 1.79248046875, 1.919342041015625, 2.04620361328125, 2.173065185546875, 2.2999267578125, 2.426788330078125, 2.55364990234375, 2.680511474609375, 2.807373046875, 2.934234619140625, 3.06109619140625, 3.187957763671875, 3.3148193359375, 3.441680908203125, 3.56854248046875, 3.695404052734375, 3.822265625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 3.0, 2.0, 6.0, 8.0, 12.0, 7.0, 16.0, 19.0, 23.0, 28.0, 41.0, 62.0, 59.0, 100.0, 147.0, 244.0, 361.0, 537.0, 1072.0, 2354.0, 6036.0, 20216.0, 104308.0, 714054.0, 158114.0, 27090.0, 7603.0, 2807.0, 1313.0, 697.0, 381.0, 237.0, 158.0, 130.0, 80.0, 56.0, 49.0, 33.0, 23.0, 11.0, 17.0, 4.0, 7.0, 11.0, 7.0, 5.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.8515625, -8.580078125, -8.30859375, -8.037109375, -7.765625, -7.494140625, -7.22265625, -6.951171875, -6.6796875, -6.408203125, -6.13671875, -5.865234375, -5.59375, -5.322265625, -5.05078125, -4.779296875, -4.5078125, -4.236328125, -3.96484375, -3.693359375, -3.421875, -3.150390625, -2.87890625, -2.607421875, -2.3359375, -2.064453125, -1.79296875, -1.521484375, -1.25, -0.978515625, -0.70703125, -0.435546875, -0.1640625, 0.107421875, 0.37890625, 0.650390625, 0.921875, 1.193359375, 1.46484375, 1.736328125, 2.0078125, 2.279296875, 2.55078125, 2.822265625, 3.09375, 3.365234375, 3.63671875, 3.908203125, 4.1796875, 4.451171875, 4.72265625, 4.994140625, 5.265625, 5.537109375, 5.80859375, 6.080078125, 6.3515625, 6.623046875, 6.89453125, 7.166015625, 7.4375, 7.708984375, 7.98046875, 8.251953125, 8.5234375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 9.0, 6.0, 8.0, 11.0, 12.0, 14.0, 10.0, 18.0, 16.0, 18.0, 18.0, 30.0, 23.0, 39.0, 38.0, 44.0, 54.0, 41.0, 60.0, 52.0, 44.0, 51.0, 53.0, 42.0, 45.0, 32.0, 35.0, 33.0, 22.0, 22.0, 20.0, 9.0, 10.0, 12.0, 13.0, 6.0, 2.0, 7.0, 5.0, 2.0, 3.0, 3.0, 3.0, 0.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.4375, -10.069091796875, -9.70068359375, -9.332275390625, -8.9638671875, -8.595458984375, -8.22705078125, -7.858642578125, -7.490234375, -7.121826171875, -6.75341796875, -6.385009765625, -6.0166015625, -5.648193359375, -5.27978515625, -4.911376953125, -4.54296875, -4.174560546875, -3.80615234375, -3.437744140625, -3.0693359375, -2.700927734375, -2.33251953125, -1.964111328125, -1.595703125, -1.227294921875, -0.85888671875, -0.490478515625, -0.1220703125, 0.246337890625, 0.61474609375, 0.983154296875, 1.3515625, 1.719970703125, 2.08837890625, 2.456787109375, 2.8251953125, 3.193603515625, 3.56201171875, 3.930419921875, 4.298828125, 4.667236328125, 5.03564453125, 5.404052734375, 5.7724609375, 6.140869140625, 6.50927734375, 6.877685546875, 7.24609375, 7.614501953125, 7.98291015625, 8.351318359375, 8.7197265625, 9.088134765625, 9.45654296875, 9.824951171875, 10.193359375, 10.561767578125, 10.93017578125, 11.298583984375, 11.6669921875, 12.035400390625, 12.40380859375, 12.772216796875, 13.140625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 7.0, 5.0, 8.0, 6.0, 11.0, 11.0, 26.0, 40.0, 46.0, 65.0, 126.0, 187.0, 357.0, 638.0, 1297.0, 2634.0, 6145.0, 15337.0, 43755.0, 170960.0, 651824.0, 103945.0, 30622.0, 11412.0, 4668.0, 2144.0, 990.0, 520.0, 282.0, 178.0, 108.0, 59.0, 43.0, 27.0, 27.0, 14.0, 5.0, 5.0, 4.0, 2.0, 1.0, 5.0, 9.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.939453125, -2.851287841796875, -2.76312255859375, -2.674957275390625, -2.5867919921875, -2.498626708984375, -2.41046142578125, -2.322296142578125, -2.234130859375, -2.145965576171875, -2.05780029296875, -1.969635009765625, -1.8814697265625, -1.793304443359375, -1.70513916015625, -1.616973876953125, -1.52880859375, -1.440643310546875, -1.35247802734375, -1.264312744140625, -1.1761474609375, -1.087982177734375, -0.99981689453125, -0.911651611328125, -0.823486328125, -0.735321044921875, -0.64715576171875, -0.558990478515625, -0.4708251953125, -0.382659912109375, -0.29449462890625, -0.206329345703125, -0.1181640625, -0.029998779296875, 0.05816650390625, 0.146331787109375, 0.2344970703125, 0.322662353515625, 0.41082763671875, 0.498992919921875, 0.587158203125, 0.675323486328125, 0.76348876953125, 0.851654052734375, 0.9398193359375, 1.027984619140625, 1.11614990234375, 1.204315185546875, 1.29248046875, 1.380645751953125, 1.46881103515625, 1.556976318359375, 1.6451416015625, 1.733306884765625, 1.82147216796875, 1.909637451171875, 1.997802734375, 2.085968017578125, 2.17413330078125, 2.262298583984375, 2.3504638671875, 2.438629150390625, 2.52679443359375, 2.614959716796875, 2.703125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 1.0, 3.0, 5.0, 6.0, 6.0, 8.0, 10.0, 18.0, 23.0, 38.0, 35.0, 47.0, 77.0, 124.0, 107.0, 131.0, 92.0, 68.0, 44.0, 25.0, 30.0, 25.0, 15.0, 11.0, 5.0, 5.0, 8.0, 5.0, 5.0, 1.0, 8.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0008645057678222656, -0.0008373931050300598, -0.000810280442237854, -0.0007831677794456482, -0.0007560551166534424, -0.0007289424538612366, -0.0007018297910690308, -0.000674717128276825, -0.0006476044654846191, -0.0006204918026924133, -0.0005933791399002075, -0.0005662664771080017, -0.0005391538143157959, -0.0005120411515235901, -0.0004849284887313843, -0.00045781582593917847, -0.00043070316314697266, -0.00040359050035476685, -0.00037647783756256104, -0.0003493651747703552, -0.0003222525119781494, -0.0002951398491859436, -0.0002680271863937378, -0.00024091452360153198, -0.00021380186080932617, -0.00018668919801712036, -0.00015957653522491455, -0.00013246387243270874, -0.00010535120964050293, -7.823854684829712e-05, -5.112588405609131e-05, -2.4013221263885498e-05, 3.0994415283203125e-06, 3.0212104320526123e-05, 5.7324767112731934e-05, 8.443742990493774e-05, 0.00011155009269714355, 0.00013866275548934937, 0.00016577541828155518, 0.00019288808107376099, 0.0002200007438659668, 0.0002471134066581726, 0.0002742260694503784, 0.00030133873224258423, 0.00032845139503479004, 0.00035556405782699585, 0.00038267672061920166, 0.00040978938341140747, 0.0004369020462036133, 0.0004640147089958191, 0.0004911273717880249, 0.0005182400345802307, 0.0005453526973724365, 0.0005724653601646423, 0.0005995780229568481, 0.000626690685749054, 0.0006538033485412598, 0.0006809160113334656, 0.0007080286741256714, 0.0007351413369178772, 0.000762253999710083, 0.0007893666625022888, 0.0008164793252944946, 0.0008435919880867004, 0.0008707046508789062]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 3.0, 6.0, 17.0, 13.0, 13.0, 29.0, 32.0, 48.0, 98.0, 154.0, 290.0, 500.0, 947.0, 1965.0, 4770.0, 12714.0, 41747.0, 193268.0, 664169.0, 89964.0, 23685.0, 8070.0, 3112.0, 1368.0, 679.0, 346.0, 173.0, 135.0, 82.0, 51.0, 31.0, 19.0, 21.0, 15.0, 6.0, 3.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.451171875, -3.347442626953125, -3.24371337890625, -3.139984130859375, -3.0362548828125, -2.932525634765625, -2.82879638671875, -2.725067138671875, -2.621337890625, -2.517608642578125, -2.41387939453125, -2.310150146484375, -2.2064208984375, -2.102691650390625, -1.99896240234375, -1.895233154296875, -1.79150390625, -1.687774658203125, -1.58404541015625, -1.480316162109375, -1.3765869140625, -1.272857666015625, -1.16912841796875, -1.065399169921875, -0.961669921875, -0.857940673828125, -0.75421142578125, -0.650482177734375, -0.5467529296875, -0.443023681640625, -0.33929443359375, -0.235565185546875, -0.1318359375, -0.028106689453125, 0.07562255859375, 0.179351806640625, 0.2830810546875, 0.386810302734375, 0.49053955078125, 0.594268798828125, 0.697998046875, 0.801727294921875, 0.90545654296875, 1.009185791015625, 1.1129150390625, 1.216644287109375, 1.32037353515625, 1.424102783203125, 1.52783203125, 1.631561279296875, 1.73529052734375, 1.839019775390625, 1.9427490234375, 2.046478271484375, 2.15020751953125, 2.253936767578125, 2.357666015625, 2.461395263671875, 2.56512451171875, 2.668853759765625, 2.7725830078125, 2.876312255859375, 2.98004150390625, 3.083770751953125, 3.1875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 2.0, 4.0, 2.0, 4.0, 2.0, 7.0, 9.0, 15.0, 13.0, 9.0, 9.0, 27.0, 37.0, 40.0, 65.0, 93.0, 110.0, 114.0, 109.0, 69.0, 56.0, 48.0, 40.0, 24.0, 21.0, 14.0, 14.0, 5.0, 14.0, 6.0, 8.0, 2.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.072265625, -2.968109130859375, -2.86395263671875, -2.759796142578125, -2.6556396484375, -2.551483154296875, -2.44732666015625, -2.343170166015625, -2.239013671875, -2.134857177734375, -2.03070068359375, -1.926544189453125, -1.8223876953125, -1.718231201171875, -1.61407470703125, -1.509918212890625, -1.40576171875, -1.301605224609375, -1.19744873046875, -1.093292236328125, -0.9891357421875, -0.884979248046875, -0.78082275390625, -0.676666259765625, -0.572509765625, -0.468353271484375, -0.36419677734375, -0.260040283203125, -0.1558837890625, -0.051727294921875, 0.05242919921875, 0.156585693359375, 0.2607421875, 0.364898681640625, 0.46905517578125, 0.573211669921875, 0.6773681640625, 0.781524658203125, 0.88568115234375, 0.989837646484375, 1.093994140625, 1.198150634765625, 1.30230712890625, 1.406463623046875, 1.5106201171875, 1.614776611328125, 1.71893310546875, 1.823089599609375, 1.92724609375, 2.031402587890625, 2.13555908203125, 2.239715576171875, 2.3438720703125, 2.448028564453125, 2.55218505859375, 2.656341552734375, 2.760498046875, 2.864654541015625, 2.96881103515625, 3.072967529296875, 3.1771240234375, 3.281280517578125, 3.38543701171875, 3.489593505859375, 3.59375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 4.0, 7.0, 15.0, 21.0, 59.0, 96.0, 248.0, 261.0, 115.0, 70.0, 52.0, 25.0, 7.0, 6.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.06014633178711, -56.257965087890625, -53.45578384399414, -50.653602600097656, -47.85142135620117, -45.04924011230469, -42.2470588684082, -39.44487762451172, -36.642696380615234, -33.84051513671875, -31.038333892822266, -28.23615264892578, -25.433971405029297, -22.631790161132812, -19.829608917236328, -17.027427673339844, -14.22524642944336, -11.423065185546875, -8.62088394165039, -5.818702697753906, -3.016521453857422, -0.2143402099609375, 2.587841033935547, 5.390022277832031, 8.192203521728516, 10.994384765625, 13.796566009521484, 16.59874725341797, 19.400928497314453, 22.203109741210938, 25.005290985107422, 27.807472229003906, 30.609649658203125, 33.41183090209961, 36.214012145996094, 39.01619338989258, 41.81837463378906, 44.62055587768555, 47.42273712158203, 50.224918365478516, 53.027099609375, 55.829280853271484, 58.63146209716797, 61.43364334106445, 64.23582458496094, 67.03800964355469, 69.8401870727539, 72.64236450195312, 75.44454956054688, 78.24673461914062, 81.04891204833984, 83.85108947753906, 86.65327453613281, 89.45545959472656, 92.25763702392578, 95.059814453125, 97.86199951171875, 100.6641845703125, 103.46636199951172, 106.26853942871094, 109.07072448730469, 111.87290954589844, 114.67508697509766, 117.47726440429688, 120.27944946289062]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 7.0, 1.0, 4.0, 6.0, 10.0, 10.0, 13.0, 9.0, 18.0, 21.0, 30.0, 18.0, 26.0, 21.0, 28.0, 30.0, 35.0, 44.0, 78.0, 90.0, 104.0, 71.0, 38.0, 32.0, 29.0, 20.0, 26.0, 33.0, 24.0, 18.0, 19.0, 15.0, 11.0, 11.0, 9.0, 7.0, 13.0, 7.0, 5.0, 4.0, 1.0, 2.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-49.99598693847656, -48.56504821777344, -47.13410568237305, -45.70316696166992, -44.2722282409668, -42.84128952026367, -41.41034698486328, -39.979408264160156, -38.54846954345703, -37.117530822753906, -35.686588287353516, -34.25564956665039, -32.824710845947266, -31.393770217895508, -29.96282958984375, -28.531890869140625, -27.100950241088867, -25.67000961303711, -24.239070892333984, -22.808130264282227, -21.3771915435791, -19.946250915527344, -18.51531219482422, -17.08437156677246, -15.65343189239502, -14.222492218017578, -12.791552543640137, -11.360612869262695, -9.929672241210938, -8.498733520507812, -7.067792892456055, -5.636853218078613, -4.205913543701172, -2.7749738693237305, -1.34403395652771, 0.08690595626831055, 1.517845630645752, 2.9487853050231934, 4.379725456237793, 5.810665130615234, 7.241604804992676, 8.672544479370117, 10.103484153747559, 11.534423828125, 12.965364456176758, 14.396303176879883, 15.82724380493164, 17.258182525634766, 18.689123153686523, 20.12006378173828, 21.551002502441406, 22.981943130493164, 24.41288185119629, 25.843822479248047, 27.274761199951172, 28.70570182800293, 30.136642456054688, 31.567583084106445, 32.9985237121582, 34.42946243286133, 35.86040115356445, 37.29133987426758, 38.72228240966797, 40.153221130371094, 41.58415985107422]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 1.0, 6.0, 3.0, 9.0, 15.0, 18.0, 21.0, 30.0, 55.0, 79.0, 143.0, 261.0, 441.0, 954.0, 2224.0, 7361.0, 40800.0, 676812.0, 3137830.0, 292734.0, 25673.0, 5422.0, 1865.0, 644.0, 370.0, 183.0, 126.0, 66.0, 44.0, 26.0, 20.0, 17.0, 10.0, 11.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-10.125, -9.8677978515625, -9.610595703125, -9.3533935546875, -9.09619140625, -8.8389892578125, -8.581787109375, -8.3245849609375, -8.0673828125, -7.8101806640625, -7.552978515625, -7.2957763671875, -7.03857421875, -6.7813720703125, -6.524169921875, -6.2669677734375, -6.009765625, -5.7525634765625, -5.495361328125, -5.2381591796875, -4.98095703125, -4.7237548828125, -4.466552734375, -4.2093505859375, -3.9521484375, -3.6949462890625, -3.437744140625, -3.1805419921875, -2.92333984375, -2.6661376953125, -2.408935546875, -2.1517333984375, -1.89453125, -1.6373291015625, -1.380126953125, -1.1229248046875, -0.86572265625, -0.6085205078125, -0.351318359375, -0.0941162109375, 0.1630859375, 0.4202880859375, 0.677490234375, 0.9346923828125, 1.19189453125, 1.4490966796875, 1.706298828125, 1.9635009765625, 2.220703125, 2.4779052734375, 2.735107421875, 2.9923095703125, 3.24951171875, 3.5067138671875, 3.763916015625, 4.0211181640625, 4.2783203125, 4.5355224609375, 4.792724609375, 5.0499267578125, 5.30712890625, 5.5643310546875, 5.821533203125, 6.0787353515625, 6.3359375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 16.0, 12.0, 18.0, 16.0, 20.0, 18.0, 31.0, 29.0, 27.0, 37.0, 41.0, 35.0, 49.0, 50.0, 57.0, 65.0, 55.0, 48.0, 46.0, 47.0, 44.0, 44.0, 34.0, 41.0, 31.0, 24.0, 16.0, 15.0, 7.0, 7.0, 7.0, 6.0, 3.0, 2.0, 3.0, 2.0], "bins": [-4.953125, -4.838714599609375, -4.72430419921875, -4.609893798828125, -4.4954833984375, -4.381072998046875, -4.26666259765625, -4.152252197265625, -4.037841796875, -3.923431396484375, -3.80902099609375, -3.694610595703125, -3.5802001953125, -3.465789794921875, -3.35137939453125, -3.236968994140625, -3.12255859375, -3.008148193359375, -2.89373779296875, -2.779327392578125, -2.6649169921875, -2.550506591796875, -2.43609619140625, -2.321685791015625, -2.207275390625, -2.092864990234375, -1.97845458984375, -1.864044189453125, -1.7496337890625, -1.635223388671875, -1.52081298828125, -1.406402587890625, -1.2919921875, -1.177581787109375, -1.06317138671875, -0.948760986328125, -0.8343505859375, -0.719940185546875, -0.60552978515625, -0.491119384765625, -0.376708984375, -0.262298583984375, -0.14788818359375, -0.033477783203125, 0.0809326171875, 0.195343017578125, 0.30975341796875, 0.424163818359375, 0.53857421875, 0.652984619140625, 0.76739501953125, 0.881805419921875, 0.9962158203125, 1.110626220703125, 1.22503662109375, 1.339447021484375, 1.453857421875, 1.568267822265625, 1.68267822265625, 1.797088623046875, 1.9114990234375, 2.025909423828125, 2.14031982421875, 2.254730224609375, 2.369140625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 3.0, 10.0, 9.0, 14.0, 16.0, 26.0, 59.0, 73.0, 133.0, 294.0, 592.0, 1529.0, 5109.0, 33945.0, 1137549.0, 2937632.0, 66290.0, 7705.0, 1907.0, 702.0, 341.0, 142.0, 67.0, 46.0, 22.0, 14.0, 20.0, 6.0, 5.0, 5.0, 7.0, 7.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.7421875, -13.3720703125, -13.001953125, -12.6318359375, -12.26171875, -11.8916015625, -11.521484375, -11.1513671875, -10.78125, -10.4111328125, -10.041015625, -9.6708984375, -9.30078125, -8.9306640625, -8.560546875, -8.1904296875, -7.8203125, -7.4501953125, -7.080078125, -6.7099609375, -6.33984375, -5.9697265625, -5.599609375, -5.2294921875, -4.859375, -4.4892578125, -4.119140625, -3.7490234375, -3.37890625, -3.0087890625, -2.638671875, -2.2685546875, -1.8984375, -1.5283203125, -1.158203125, -0.7880859375, -0.41796875, -0.0478515625, 0.322265625, 0.6923828125, 1.0625, 1.4326171875, 1.802734375, 2.1728515625, 2.54296875, 2.9130859375, 3.283203125, 3.6533203125, 4.0234375, 4.3935546875, 4.763671875, 5.1337890625, 5.50390625, 5.8740234375, 6.244140625, 6.6142578125, 6.984375, 7.3544921875, 7.724609375, 8.0947265625, 8.46484375, 8.8349609375, 9.205078125, 9.5751953125, 9.9453125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 4.0, 4.0, 7.0, 12.0, 18.0, 10.0, 23.0, 16.0, 34.0, 55.0, 97.0, 147.0, 204.0, 313.0, 492.0, 588.0, 641.0, 476.0, 314.0, 198.0, 151.0, 82.0, 54.0, 43.0, 29.0, 22.0, 16.0, 10.0, 3.0, 0.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.703125, -8.44671630859375, -8.1903076171875, -7.93389892578125, -7.677490234375, -7.42108154296875, -7.1646728515625, -6.90826416015625, -6.65185546875, -6.39544677734375, -6.1390380859375, -5.88262939453125, -5.626220703125, -5.36981201171875, -5.1134033203125, -4.85699462890625, -4.6005859375, -4.34417724609375, -4.0877685546875, -3.83135986328125, -3.574951171875, -3.31854248046875, -3.0621337890625, -2.80572509765625, -2.54931640625, -2.29290771484375, -2.0364990234375, -1.78009033203125, -1.523681640625, -1.26727294921875, -1.0108642578125, -0.75445556640625, -0.498046875, -0.24163818359375, 0.0147705078125, 0.27117919921875, 0.527587890625, 0.78399658203125, 1.0404052734375, 1.29681396484375, 1.55322265625, 1.80963134765625, 2.0660400390625, 2.32244873046875, 2.578857421875, 2.83526611328125, 3.0916748046875, 3.34808349609375, 3.6044921875, 3.86090087890625, 4.1173095703125, 4.37371826171875, 4.630126953125, 4.88653564453125, 5.1429443359375, 5.39935302734375, 5.65576171875, 5.91217041015625, 6.1685791015625, 6.42498779296875, 6.681396484375, 6.93780517578125, 7.1942138671875, 7.45062255859375, 7.70703125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 3.0, 3.0, 4.0, 3.0, 6.0, 7.0, 7.0, 21.0, 32.0, 48.0, 62.0, 67.0, 98.0, 113.0, 104.0, 120.0, 91.0, 68.0, 39.0, 30.0, 27.0, 15.0, 12.0, 9.0, 2.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-64.77815246582031, -63.20740509033203, -61.63665771484375, -60.065914154052734, -58.49516677856445, -56.92441940307617, -55.353675842285156, -53.782928466796875, -52.212181091308594, -50.64143371582031, -49.07068634033203, -47.499942779541016, -45.929195404052734, -44.35844802856445, -42.78770446777344, -41.216957092285156, -39.646209716796875, -38.075462341308594, -36.50471496582031, -34.9339714050293, -33.363224029541016, -31.792476654052734, -30.221731185913086, -28.650985717773438, -27.080238342285156, -25.509490966796875, -23.938745498657227, -22.368000030517578, -20.797252655029297, -19.226505279541016, -17.655759811401367, -16.08501434326172, -14.514266967773438, -12.943520545959473, -11.372774124145508, -9.802027702331543, -8.231281280517578, -6.660534858703613, -5.089788436889648, -3.5190420150756836, -1.9482955932617188, -0.3775491714477539, 1.193197250366211, 2.763943672180176, 4.334690093994141, 5.9054365158081055, 7.47618293762207, 9.046929359436035, 10.61767578125, 12.188422203063965, 13.75916862487793, 15.329915046691895, 16.90066146850586, 18.47140884399414, 20.04215431213379, 21.612899780273438, 23.18364715576172, 24.75439453125, 26.32513999938965, 27.895885467529297, 29.466632843017578, 31.03738021850586, 32.608123779296875, 34.178871154785156, 35.74961853027344]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 6.0, 2.0, 3.0, 6.0, 7.0, 10.0, 5.0, 10.0, 10.0, 17.0, 11.0, 15.0, 19.0, 18.0, 24.0, 21.0, 35.0, 41.0, 42.0, 45.0, 54.0, 46.0, 45.0, 55.0, 59.0, 54.0, 39.0, 30.0, 27.0, 45.0, 24.0, 32.0, 23.0, 27.0, 15.0, 9.0, 14.0, 10.0, 12.0, 4.0, 9.0, 4.0, 7.0, 4.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 0.0, 0.0, 0.0, 4.0], "bins": [-34.2764892578125, -33.23725128173828, -32.19801712036133, -31.15877914428711, -30.11954116821289, -29.080305099487305, -28.04106903076172, -27.0018310546875, -25.96259307861328, -24.923357009887695, -23.884119033813477, -22.84488296508789, -21.805644989013672, -20.766408920288086, -19.7271728515625, -18.68793487548828, -17.648698806762695, -16.60946273803711, -15.57022476196289, -14.530988693237305, -13.491750717163086, -12.4525146484375, -11.413277626037598, -10.374040603637695, -9.334803581237793, -8.29556655883789, -7.256329536437988, -6.217092990875244, -5.177855968475342, -4.1386189460754395, -3.0993824005126953, -2.060145378112793, -1.0209083557128906, 0.018328547477722168, 1.057565450668335, 2.096802234649658, 3.1360392570495605, 4.175276279449463, 5.214512825012207, 6.253749847412109, 7.292986869812012, 8.332223892211914, 9.371460914611816, 10.410697937011719, 11.449934005737305, 12.489171981811523, 13.52840805053711, 14.567645072937012, 15.606882095336914, 16.6461181640625, 17.68535614013672, 18.724592208862305, 19.763830184936523, 20.80306625366211, 21.842304229736328, 22.881540298461914, 23.9207763671875, 24.960012435913086, 25.999250411987305, 27.03848648071289, 28.07772445678711, 29.116960525512695, 30.15619659423828, 31.1954345703125, 32.23467254638672]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 1.0, 3.0, 2.0, 3.0, 5.0, 9.0, 9.0, 14.0, 24.0, 42.0, 69.0, 112.0, 182.0, 317.0, 500.0, 888.0, 1615.0, 3063.0, 6142.0, 13162.0, 31156.0, 83115.0, 256549.0, 399892.0, 157401.0, 53599.0, 21477.0, 9498.0, 4442.0, 2337.0, 1185.0, 682.0, 432.0, 229.0, 132.0, 104.0, 53.0, 37.0, 22.0, 21.0, 12.0, 5.0, 9.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.80078125, -3.65618896484375, -3.5115966796875, -3.36700439453125, -3.222412109375, -3.07781982421875, -2.9332275390625, -2.78863525390625, -2.64404296875, -2.49945068359375, -2.3548583984375, -2.21026611328125, -2.065673828125, -1.92108154296875, -1.7764892578125, -1.63189697265625, -1.4873046875, -1.34271240234375, -1.1981201171875, -1.05352783203125, -0.908935546875, -0.76434326171875, -0.6197509765625, -0.47515869140625, -0.33056640625, -0.18597412109375, -0.0413818359375, 0.10321044921875, 0.247802734375, 0.39239501953125, 0.5369873046875, 0.68157958984375, 0.826171875, 0.97076416015625, 1.1153564453125, 1.25994873046875, 1.404541015625, 1.54913330078125, 1.6937255859375, 1.83831787109375, 1.98291015625, 2.12750244140625, 2.2720947265625, 2.41668701171875, 2.561279296875, 2.70587158203125, 2.8504638671875, 2.99505615234375, 3.1396484375, 3.28424072265625, 3.4288330078125, 3.57342529296875, 3.718017578125, 3.86260986328125, 4.0072021484375, 4.15179443359375, 4.29638671875, 4.44097900390625, 4.5855712890625, 4.73016357421875, 4.874755859375, 5.01934814453125, 5.1639404296875, 5.30853271484375, 5.453125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 5.0, 2.0, 4.0, 10.0, 7.0, 9.0, 13.0, 23.0, 12.0, 19.0, 34.0, 26.0, 43.0, 50.0, 45.0, 37.0, 52.0, 41.0, 57.0, 43.0, 52.0, 52.0, 48.0, 35.0, 31.0, 29.0, 34.0, 45.0, 24.0, 23.0, 20.0, 19.0, 19.0, 16.0, 4.0, 6.0, 6.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.3046875, -4.1925048828125, -4.080322265625, -3.9681396484375, -3.85595703125, -3.7437744140625, -3.631591796875, -3.5194091796875, -3.4072265625, -3.2950439453125, -3.182861328125, -3.0706787109375, -2.95849609375, -2.8463134765625, -2.734130859375, -2.6219482421875, -2.509765625, -2.3975830078125, -2.285400390625, -2.1732177734375, -2.06103515625, -1.9488525390625, -1.836669921875, -1.7244873046875, -1.6123046875, -1.5001220703125, -1.387939453125, -1.2757568359375, -1.16357421875, -1.0513916015625, -0.939208984375, -0.8270263671875, -0.71484375, -0.6026611328125, -0.490478515625, -0.3782958984375, -0.26611328125, -0.1539306640625, -0.041748046875, 0.0704345703125, 0.1826171875, 0.2947998046875, 0.406982421875, 0.5191650390625, 0.63134765625, 0.7435302734375, 0.855712890625, 0.9678955078125, 1.080078125, 1.1922607421875, 1.304443359375, 1.4166259765625, 1.52880859375, 1.6409912109375, 1.753173828125, 1.8653564453125, 1.9775390625, 2.0897216796875, 2.201904296875, 2.3140869140625, 2.42626953125, 2.5384521484375, 2.650634765625, 2.7628173828125, 2.875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 6.0, 10.0, 17.0, 16.0, 23.0, 36.0, 37.0, 63.0, 72.0, 96.0, 200.0, 263.0, 415.0, 710.0, 1403.0, 4067.0, 20331.0, 257431.0, 720710.0, 33111.0, 5644.0, 1688.0, 860.0, 477.0, 287.0, 182.0, 105.0, 80.0, 51.0, 58.0, 26.0, 22.0, 13.0, 15.0, 9.0, 9.0, 7.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.4453125, -12.1007080078125, -11.756103515625, -11.4114990234375, -11.06689453125, -10.7222900390625, -10.377685546875, -10.0330810546875, -9.6884765625, -9.3438720703125, -8.999267578125, -8.6546630859375, -8.31005859375, -7.9654541015625, -7.620849609375, -7.2762451171875, -6.931640625, -6.5870361328125, -6.242431640625, -5.8978271484375, -5.55322265625, -5.2086181640625, -4.864013671875, -4.5194091796875, -4.1748046875, -3.8302001953125, -3.485595703125, -3.1409912109375, -2.79638671875, -2.4517822265625, -2.107177734375, -1.7625732421875, -1.41796875, -1.0733642578125, -0.728759765625, -0.3841552734375, -0.03955078125, 0.3050537109375, 0.649658203125, 0.9942626953125, 1.3388671875, 1.6834716796875, 2.028076171875, 2.3726806640625, 2.71728515625, 3.0618896484375, 3.406494140625, 3.7510986328125, 4.095703125, 4.4403076171875, 4.784912109375, 5.1295166015625, 5.47412109375, 5.8187255859375, 6.163330078125, 6.5079345703125, 6.8525390625, 7.1971435546875, 7.541748046875, 7.8863525390625, 8.23095703125, 8.5755615234375, 8.920166015625, 9.2647705078125, 9.609375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 3.0, 5.0, 2.0, 4.0, 2.0, 4.0, 5.0, 8.0, 10.0, 10.0, 4.0, 17.0, 16.0, 20.0, 15.0, 25.0, 28.0, 33.0, 34.0, 29.0, 48.0, 48.0, 62.0, 46.0, 40.0, 49.0, 35.0, 52.0, 36.0, 45.0, 41.0, 24.0, 33.0, 26.0, 26.0, 20.0, 22.0, 11.0, 14.0, 11.0, 6.0, 9.0, 6.0, 4.0, 2.0, 6.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-12.1015625, -11.7421875, -11.3828125, -11.0234375, -10.6640625, -10.3046875, -9.9453125, -9.5859375, -9.2265625, -8.8671875, -8.5078125, -8.1484375, -7.7890625, -7.4296875, -7.0703125, -6.7109375, -6.3515625, -5.9921875, -5.6328125, -5.2734375, -4.9140625, -4.5546875, -4.1953125, -3.8359375, -3.4765625, -3.1171875, -2.7578125, -2.3984375, -2.0390625, -1.6796875, -1.3203125, -0.9609375, -0.6015625, -0.2421875, 0.1171875, 0.4765625, 0.8359375, 1.1953125, 1.5546875, 1.9140625, 2.2734375, 2.6328125, 2.9921875, 3.3515625, 3.7109375, 4.0703125, 4.4296875, 4.7890625, 5.1484375, 5.5078125, 5.8671875, 6.2265625, 6.5859375, 6.9453125, 7.3046875, 7.6640625, 8.0234375, 8.3828125, 8.7421875, 9.1015625, 9.4609375, 9.8203125, 10.1796875, 10.5390625, 10.8984375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 2.0, 2.0, 5.0, 5.0, 11.0, 21.0, 39.0, 46.0, 70.0, 133.0, 250.0, 782.0, 3105.0, 21680.0, 908550.0, 104336.0, 7211.0, 1402.0, 437.0, 184.0, 98.0, 55.0, 38.0, 30.0, 22.0, 15.0, 8.0, 2.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.3203125, -6.10784912109375, -5.8953857421875, -5.68292236328125, -5.470458984375, -5.25799560546875, -5.0455322265625, -4.83306884765625, -4.62060546875, -4.40814208984375, -4.1956787109375, -3.98321533203125, -3.770751953125, -3.55828857421875, -3.3458251953125, -3.13336181640625, -2.9208984375, -2.70843505859375, -2.4959716796875, -2.28350830078125, -2.071044921875, -1.85858154296875, -1.6461181640625, -1.43365478515625, -1.22119140625, -1.00872802734375, -0.7962646484375, -0.58380126953125, -0.371337890625, -0.15887451171875, 0.0535888671875, 0.26605224609375, 0.478515625, 0.69097900390625, 0.9034423828125, 1.11590576171875, 1.328369140625, 1.54083251953125, 1.7532958984375, 1.96575927734375, 2.17822265625, 2.39068603515625, 2.6031494140625, 2.81561279296875, 3.028076171875, 3.24053955078125, 3.4530029296875, 3.66546630859375, 3.8779296875, 4.09039306640625, 4.3028564453125, 4.51531982421875, 4.727783203125, 4.94024658203125, 5.1527099609375, 5.36517333984375, 5.57763671875, 5.79010009765625, 6.0025634765625, 6.21502685546875, 6.427490234375, 6.63995361328125, 6.8524169921875, 7.06488037109375, 7.27734375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 0.0, 4.0, 3.0, 2.0, 2.0, 8.0, 9.0, 10.0, 4.0, 18.0, 30.0, 36.0, 74.0, 88.0, 182.0, 183.0, 136.0, 72.0, 30.0, 28.0, 17.0, 17.0, 6.0, 7.0, 10.0, 6.0, 6.0, 4.0, 1.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009889602661132812, -0.0009551644325256348, -0.0009213685989379883, -0.0008875727653503418, -0.0008537769317626953, -0.0008199810981750488, -0.0007861852645874023, -0.0007523894309997559, -0.0007185935974121094, -0.0006847977638244629, -0.0006510019302368164, -0.0006172060966491699, -0.0005834102630615234, -0.000549614429473877, -0.0005158185958862305, -0.000482022762298584, -0.0004482269287109375, -0.000414431095123291, -0.00038063526153564453, -0.00034683942794799805, -0.00031304359436035156, -0.0002792477607727051, -0.0002454519271850586, -0.0002116560935974121, -0.00017786026000976562, -0.00014406442642211914, -0.00011026859283447266, -7.647275924682617e-05, -4.267692565917969e-05, -8.881092071533203e-06, 2.491474151611328e-05, 5.8710575103759766e-05, 9.250640869140625e-05, 0.00012630224227905273, 0.00016009807586669922, 0.0001938939094543457, 0.0002276897430419922, 0.00026148557662963867, 0.00029528141021728516, 0.00032907724380493164, 0.0003628730773925781, 0.0003966689109802246, 0.0004304647445678711, 0.0004642605781555176, 0.0004980564117431641, 0.0005318522453308105, 0.000565648078918457, 0.0005994439125061035, 0.00063323974609375, 0.0006670355796813965, 0.000700831413269043, 0.0007346272468566895, 0.0007684230804443359, 0.0008022189140319824, 0.0008360147476196289, 0.0008698105812072754, 0.0009036064147949219, 0.0009374022483825684, 0.0009711980819702148, 0.0010049939155578613, 0.0010387897491455078, 0.0010725855827331543, 0.0011063814163208008, 0.0011401772499084473, 0.0011739730834960938]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 5.0, 2.0, 7.0, 6.0, 9.0, 14.0, 10.0, 13.0, 25.0, 41.0, 49.0, 87.0, 125.0, 143.0, 302.0, 476.0, 979.0, 1942.0, 4578.0, 12866.0, 44461.0, 246592.0, 643617.0, 64204.0, 17024.0, 5836.0, 2424.0, 1138.0, 617.0, 343.0, 211.0, 120.0, 87.0, 60.0, 38.0, 28.0, 20.0, 14.0, 8.0, 10.0, 7.0, 9.0, 5.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.52734375, -2.44866943359375, -2.3699951171875, -2.29132080078125, -2.212646484375, -2.13397216796875, -2.0552978515625, -1.97662353515625, -1.89794921875, -1.81927490234375, -1.7406005859375, -1.66192626953125, -1.583251953125, -1.50457763671875, -1.4259033203125, -1.34722900390625, -1.2685546875, -1.18988037109375, -1.1112060546875, -1.03253173828125, -0.953857421875, -0.87518310546875, -0.7965087890625, -0.71783447265625, -0.63916015625, -0.56048583984375, -0.4818115234375, -0.40313720703125, -0.324462890625, -0.24578857421875, -0.1671142578125, -0.08843994140625, -0.009765625, 0.06890869140625, 0.1475830078125, 0.22625732421875, 0.304931640625, 0.38360595703125, 0.4622802734375, 0.54095458984375, 0.61962890625, 0.69830322265625, 0.7769775390625, 0.85565185546875, 0.934326171875, 1.01300048828125, 1.0916748046875, 1.17034912109375, 1.2490234375, 1.32769775390625, 1.4063720703125, 1.48504638671875, 1.563720703125, 1.64239501953125, 1.7210693359375, 1.79974365234375, 1.87841796875, 1.95709228515625, 2.0357666015625, 2.11444091796875, 2.193115234375, 2.27178955078125, 2.3504638671875, 2.42913818359375, 2.5078125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 3.0, 2.0, 7.0, 13.0, 11.0, 8.0, 22.0, 23.0, 36.0, 31.0, 47.0, 77.0, 78.0, 89.0, 92.0, 93.0, 86.0, 78.0, 44.0, 37.0, 23.0, 18.0, 19.0, 11.0, 8.0, 10.0, 9.0, 4.0, 7.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.37890625, -2.3006591796875, -2.222412109375, -2.1441650390625, -2.06591796875, -1.9876708984375, -1.909423828125, -1.8311767578125, -1.7529296875, -1.6746826171875, -1.596435546875, -1.5181884765625, -1.43994140625, -1.3616943359375, -1.283447265625, -1.2052001953125, -1.126953125, -1.0487060546875, -0.970458984375, -0.8922119140625, -0.81396484375, -0.7357177734375, -0.657470703125, -0.5792236328125, -0.5009765625, -0.4227294921875, -0.344482421875, -0.2662353515625, -0.18798828125, -0.1097412109375, -0.031494140625, 0.0467529296875, 0.125, 0.2032470703125, 0.281494140625, 0.3597412109375, 0.43798828125, 0.5162353515625, 0.594482421875, 0.6727294921875, 0.7509765625, 0.8292236328125, 0.907470703125, 0.9857177734375, 1.06396484375, 1.1422119140625, 1.220458984375, 1.2987060546875, 1.376953125, 1.4552001953125, 1.533447265625, 1.6116943359375, 1.68994140625, 1.7681884765625, 1.846435546875, 1.9246826171875, 2.0029296875, 2.0811767578125, 2.159423828125, 2.2376708984375, 2.31591796875, 2.3941650390625, 2.472412109375, 2.5506591796875, 2.62890625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 7.0, 12.0, 24.0, 146.0, 606.0, 163.0, 33.0, 12.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-206.89833068847656, -201.08966064453125, -195.28099060058594, -189.47232055664062, -183.66366577148438, -177.85499572753906, -172.04632568359375, -166.23765563964844, -160.42898559570312, -154.6203155517578, -148.8116455078125, -143.00299072265625, -137.19432067871094, -131.38565063476562, -125.57698059082031, -119.768310546875, -113.95965576171875, -108.15098571777344, -102.34232330322266, -96.53365325927734, -90.72499084472656, -84.91632080078125, -79.10765075683594, -73.29898071289062, -67.49031829833984, -61.6816520690918, -55.87298583984375, -50.06431579589844, -44.25564956665039, -38.446983337402344, -32.63831329345703, -26.829647064208984, -21.020965576171875, -15.212298393249512, -9.403631210327148, -3.5949630737304688, 2.213703155517578, 8.022369384765625, 13.831039428710938, 19.639705657958984, 25.44837188720703, 31.257038116455078, 37.065704345703125, 42.87437438964844, 48.683040618896484, 54.49170684814453, 60.300376892089844, 66.10903930664062, 71.91770935058594, 77.72637939453125, 83.53504180908203, 89.34371185302734, 95.15237426757812, 100.96104431152344, 106.76971435546875, 112.57838439941406, 118.38704681396484, 124.19571685791016, 130.00437927246094, 135.81304931640625, 141.62171936035156, 147.43038940429688, 153.23904418945312, 159.04771423339844, 164.85638427734375]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 1.0, 2.0, 8.0, 8.0, 5.0, 12.0, 14.0, 13.0, 14.0, 22.0, 20.0, 26.0, 28.0, 44.0, 25.0, 43.0, 42.0, 73.0, 165.0, 118.0, 50.0, 35.0, 46.0, 30.0, 21.0, 23.0, 24.0, 12.0, 16.0, 9.0, 14.0, 12.0, 4.0, 6.0, 12.0, 2.0, 3.0, 2.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.14698791503906, -44.415069580078125, -42.68315124511719, -40.95123291015625, -39.21931457519531, -37.487396240234375, -35.75547790527344, -34.0235595703125, -32.29164123535156, -30.559722900390625, -28.827804565429688, -27.09588623046875, -25.363967895507812, -23.632049560546875, -21.900131225585938, -20.168212890625, -18.436294555664062, -16.704376220703125, -14.972457885742188, -13.24053955078125, -11.508621215820312, -9.776702880859375, -8.044784545898438, -6.3128662109375, -4.5809478759765625, -2.849029541015625, -1.1171112060546875, 0.61480712890625, 2.3467254638671875, 4.078643798828125, 5.8105621337890625, 7.54248046875, 9.274398803710938, 11.006317138671875, 12.738235473632812, 14.47015380859375, 16.202072143554688, 17.933990478515625, 19.665908813476562, 21.3978271484375, 23.129745483398438, 24.861663818359375, 26.593582153320312, 28.32550048828125, 30.057418823242188, 31.789337158203125, 33.52125549316406, 35.253173828125, 36.98509216308594, 38.717010498046875, 40.44892883300781, 42.18084716796875, 43.91276550292969, 45.644683837890625, 47.37660217285156, 49.1085205078125, 50.84043884277344, 52.572357177734375, 54.30427551269531, 56.03619384765625, 57.76811218261719, 59.500030517578125, 61.23194885253906, 62.9638671875, 64.69578552246094]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 5.0, 3.0, 8.0, 22.0, 23.0, 44.0, 63.0, 104.0, 180.0, 271.0, 560.0, 1174.0, 2431.0, 5605.0, 16767.0, 75687.0, 502315.0, 2066373.0, 1264051.0, 206461.0, 35192.0, 9777.0, 3711.0, 1696.0, 747.0, 417.0, 221.0, 143.0, 85.0, 60.0, 26.0, 19.0, 12.0, 9.0, 7.0, 3.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-7.58984375, -7.37158203125, -7.1533203125, -6.93505859375, -6.716796875, -6.49853515625, -6.2802734375, -6.06201171875, -5.84375, -5.62548828125, -5.4072265625, -5.18896484375, -4.970703125, -4.75244140625, -4.5341796875, -4.31591796875, -4.09765625, -3.87939453125, -3.6611328125, -3.44287109375, -3.224609375, -3.00634765625, -2.7880859375, -2.56982421875, -2.3515625, -2.13330078125, -1.9150390625, -1.69677734375, -1.478515625, -1.26025390625, -1.0419921875, -0.82373046875, -0.60546875, -0.38720703125, -0.1689453125, 0.04931640625, 0.267578125, 0.48583984375, 0.7041015625, 0.92236328125, 1.140625, 1.35888671875, 1.5771484375, 1.79541015625, 2.013671875, 2.23193359375, 2.4501953125, 2.66845703125, 2.88671875, 3.10498046875, 3.3232421875, 3.54150390625, 3.759765625, 3.97802734375, 4.1962890625, 4.41455078125, 4.6328125, 4.85107421875, 5.0693359375, 5.28759765625, 5.505859375, 5.72412109375, 5.9423828125, 6.16064453125, 6.37890625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 1.0, 3.0, 9.0, 11.0, 4.0, 7.0, 12.0, 18.0, 20.0, 26.0, 14.0, 23.0, 21.0, 40.0, 29.0, 36.0, 35.0, 43.0, 26.0, 47.0, 51.0, 46.0, 36.0, 30.0, 40.0, 33.0, 45.0, 38.0, 32.0, 34.0, 27.0, 21.0, 19.0, 17.0, 13.0, 20.0, 11.0, 16.0, 10.0, 10.0, 9.0, 2.0, 3.0, 5.0, 3.0, 2.0, 6.0, 1.0, 1.0, 1.0, 2.0], "bins": [-3.232421875, -3.1390380859375, -3.045654296875, -2.9522705078125, -2.85888671875, -2.7655029296875, -2.672119140625, -2.5787353515625, -2.4853515625, -2.3919677734375, -2.298583984375, -2.2052001953125, -2.11181640625, -2.0184326171875, -1.925048828125, -1.8316650390625, -1.73828125, -1.6448974609375, -1.551513671875, -1.4581298828125, -1.36474609375, -1.2713623046875, -1.177978515625, -1.0845947265625, -0.9912109375, -0.8978271484375, -0.804443359375, -0.7110595703125, -0.61767578125, -0.5242919921875, -0.430908203125, -0.3375244140625, -0.244140625, -0.1507568359375, -0.057373046875, 0.0360107421875, 0.12939453125, 0.2227783203125, 0.316162109375, 0.4095458984375, 0.5029296875, 0.5963134765625, 0.689697265625, 0.7830810546875, 0.87646484375, 0.9698486328125, 1.063232421875, 1.1566162109375, 1.25, 1.3433837890625, 1.436767578125, 1.5301513671875, 1.62353515625, 1.7169189453125, 1.810302734375, 1.9036865234375, 1.9970703125, 2.0904541015625, 2.183837890625, 2.2772216796875, 2.37060546875, 2.4639892578125, 2.557373046875, 2.6507568359375, 2.744140625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 9.0, 7.0, 18.0, 29.0, 47.0, 96.0, 210.0, 656.0, 2032.0, 14262.0, 4073343.0, 98343.0, 3692.0, 903.0, 374.0, 140.0, 56.0, 24.0, 16.0, 4.0, 9.0, 2.0, 3.0, 2.0, 1.0, 2.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.3125, -34.12353515625, -32.9345703125, -31.74560546875, -30.556640625, -29.36767578125, -28.1787109375, -26.98974609375, -25.80078125, -24.61181640625, -23.4228515625, -22.23388671875, -21.044921875, -19.85595703125, -18.6669921875, -17.47802734375, -16.2890625, -15.10009765625, -13.9111328125, -12.72216796875, -11.533203125, -10.34423828125, -9.1552734375, -7.96630859375, -6.77734375, -5.58837890625, -4.3994140625, -3.21044921875, -2.021484375, -0.83251953125, 0.3564453125, 1.54541015625, 2.734375, 3.92333984375, 5.1123046875, 6.30126953125, 7.490234375, 8.67919921875, 9.8681640625, 11.05712890625, 12.24609375, 13.43505859375, 14.6240234375, 15.81298828125, 17.001953125, 18.19091796875, 19.3798828125, 20.56884765625, 21.7578125, 22.94677734375, 24.1357421875, 25.32470703125, 26.513671875, 27.70263671875, 28.8916015625, 30.08056640625, 31.26953125, 32.45849609375, 33.6474609375, 34.83642578125, 36.025390625, 37.21435546875, 38.4033203125, 39.59228515625, 40.78125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 13.0, 21.0, 58.0, 101.0, 261.0, 468.0, 870.0, 1000.0, 669.0, 340.0, 143.0, 67.0, 38.0, 17.0, 6.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.890625, -29.110595703125, -28.33056640625, -27.550537109375, -26.7705078125, -25.990478515625, -25.21044921875, -24.430419921875, -23.650390625, -22.870361328125, -22.09033203125, -21.310302734375, -20.5302734375, -19.750244140625, -18.97021484375, -18.190185546875, -17.41015625, -16.630126953125, -15.85009765625, -15.070068359375, -14.2900390625, -13.510009765625, -12.72998046875, -11.949951171875, -11.169921875, -10.389892578125, -9.60986328125, -8.829833984375, -8.0498046875, -7.269775390625, -6.48974609375, -5.709716796875, -4.9296875, -4.149658203125, -3.36962890625, -2.589599609375, -1.8095703125, -1.029541015625, -0.24951171875, 0.530517578125, 1.310546875, 2.090576171875, 2.87060546875, 3.650634765625, 4.4306640625, 5.210693359375, 5.99072265625, 6.770751953125, 7.55078125, 8.330810546875, 9.11083984375, 9.890869140625, 10.6708984375, 11.450927734375, 12.23095703125, 13.010986328125, 13.791015625, 14.571044921875, 15.35107421875, 16.131103515625, 16.9111328125, 17.691162109375, 18.47119140625, 19.251220703125, 20.03125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 4.0, 6.0, 10.0, 10.0, 22.0, 33.0, 66.0, 135.0, 240.0, 230.0, 137.0, 49.0, 26.0, 13.0, 10.0, 5.0, 8.0, 0.0, 0.0, 3.0, 1.0, 2.0], "bins": [-307.7391357421875, -301.7035217285156, -295.6678771972656, -289.63226318359375, -283.5966491699219, -277.5610046386719, -271.525390625, -265.4897766113281, -259.4541320800781, -253.4185028076172, -247.3828887939453, -241.34725952148438, -235.31163024902344, -229.2760009765625, -223.24038696289062, -217.2047576904297, -211.1691436767578, -205.13351440429688, -199.097900390625, -193.06227111816406, -187.02664184570312, -180.99102783203125, -174.9553985595703, -168.91976928710938, -162.8841552734375, -156.84852600097656, -150.8129119873047, -144.77728271484375, -138.7416534423828, -132.70602416992188, -126.67041015625, -120.63478088378906, -114.59915161132812, -108.56352996826172, -102.52790069580078, -96.49227905273438, -90.45664978027344, -84.42102813720703, -78.38540649414062, -72.34977722167969, -66.31415557861328, -60.27853012084961, -54.24290466308594, -48.20728302001953, -42.17165756225586, -36.13603210449219, -30.10041046142578, -24.06478500366211, -18.029159545898438, -11.993535041809082, -5.957910537719727, 0.0777130126953125, 6.113338470458984, 12.148963928222656, 18.184585571289062, 24.220211029052734, 30.255836486816406, 36.29146194458008, 42.32708740234375, 48.362709045410156, 54.39833450317383, 60.4339599609375, 66.4695816040039, 72.50520324707031, 78.54083251953125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 8.0, 4.0, 4.0, 3.0, 8.0, 24.0, 21.0, 21.0, 31.0, 37.0, 38.0, 34.0, 43.0, 44.0, 47.0, 69.0, 72.0, 74.0, 61.0, 45.0, 51.0, 43.0, 32.0, 32.0, 28.0, 29.0, 20.0, 8.0, 11.0, 16.0, 12.0, 11.0, 4.0, 8.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-75.11773681640625, -72.55535888671875, -69.99298095703125, -67.43060302734375, -64.86823272705078, -62.30585479736328, -59.74347686767578, -57.18109893798828, -54.61872100830078, -52.05634307861328, -49.49396896362305, -46.93159103393555, -44.36921310424805, -41.80683898925781, -39.24446105957031, -36.68208312988281, -34.11970901489258, -31.55733299255371, -28.99495506286621, -26.432579040527344, -23.870201110839844, -21.307825088500977, -18.74544906616211, -16.18307113647461, -13.620695114135742, -11.058318138122559, -8.495941162109375, -5.933565139770508, -3.371188163757324, -0.8088111877441406, 1.7535648345947266, 4.315942764282227, 6.878318786621094, 9.440695762634277, 12.003072738647461, 14.565448760986328, 17.127826690673828, 19.690202713012695, 22.252578735351562, 24.814956665039062, 27.37733268737793, 29.939708709716797, 32.5020866394043, 35.06446075439453, 37.62683868408203, 40.18921661376953, 42.75159454345703, 45.31397247314453, 47.876346588134766, 50.438724517822266, 53.0010986328125, 55.5634765625, 58.1258544921875, 60.688232421875, 63.250606536865234, 65.81298828125, 68.37535858154297, 70.93773651123047, 73.50011444091797, 76.06248474121094, 78.62486267089844, 81.18724060058594, 83.74961853027344, 86.31199645996094, 88.87437438964844]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 5.0, 6.0, 10.0, 8.0, 11.0, 19.0, 31.0, 32.0, 54.0, 81.0, 125.0, 170.0, 322.0, 469.0, 851.0, 1579.0, 3023.0, 6857.0, 17587.0, 52685.0, 207330.0, 568920.0, 128472.0, 36209.0, 12696.0, 5240.0, 2483.0, 1317.0, 738.0, 434.0, 275.0, 174.0, 87.0, 69.0, 58.0, 38.0, 35.0, 14.0, 14.0, 9.0, 3.0, 6.0, 4.0, 4.0, 4.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.22265625, -4.0560302734375, -3.889404296875, -3.7227783203125, -3.55615234375, -3.3895263671875, -3.222900390625, -3.0562744140625, -2.8896484375, -2.7230224609375, -2.556396484375, -2.3897705078125, -2.22314453125, -2.0565185546875, -1.889892578125, -1.7232666015625, -1.556640625, -1.3900146484375, -1.223388671875, -1.0567626953125, -0.89013671875, -0.7235107421875, -0.556884765625, -0.3902587890625, -0.2236328125, -0.0570068359375, 0.109619140625, 0.2762451171875, 0.44287109375, 0.6094970703125, 0.776123046875, 0.9427490234375, 1.109375, 1.2760009765625, 1.442626953125, 1.6092529296875, 1.77587890625, 1.9425048828125, 2.109130859375, 2.2757568359375, 2.4423828125, 2.6090087890625, 2.775634765625, 2.9422607421875, 3.10888671875, 3.2755126953125, 3.442138671875, 3.6087646484375, 3.775390625, 3.9420166015625, 4.108642578125, 4.2752685546875, 4.44189453125, 4.6085205078125, 4.775146484375, 4.9417724609375, 5.1083984375, 5.2750244140625, 5.441650390625, 5.6082763671875, 5.77490234375, 5.9415283203125, 6.108154296875, 6.2747802734375, 6.44140625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 4.0, 3.0, 3.0, 10.0, 13.0, 9.0, 13.0, 26.0, 27.0, 38.0, 44.0, 54.0, 69.0, 76.0, 68.0, 72.0, 80.0, 58.0, 52.0, 42.0, 48.0, 33.0, 31.0, 25.0, 24.0, 23.0, 15.0, 13.0, 10.0, 9.0, 7.0, 1.0, 1.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.10546875, -5.901611328125, -5.69775390625, -5.493896484375, -5.2900390625, -5.086181640625, -4.88232421875, -4.678466796875, -4.474609375, -4.270751953125, -4.06689453125, -3.863037109375, -3.6591796875, -3.455322265625, -3.25146484375, -3.047607421875, -2.84375, -2.639892578125, -2.43603515625, -2.232177734375, -2.0283203125, -1.824462890625, -1.62060546875, -1.416748046875, -1.212890625, -1.009033203125, -0.80517578125, -0.601318359375, -0.3974609375, -0.193603515625, 0.01025390625, 0.214111328125, 0.41796875, 0.621826171875, 0.82568359375, 1.029541015625, 1.2333984375, 1.437255859375, 1.64111328125, 1.844970703125, 2.048828125, 2.252685546875, 2.45654296875, 2.660400390625, 2.8642578125, 3.068115234375, 3.27197265625, 3.475830078125, 3.6796875, 3.883544921875, 4.08740234375, 4.291259765625, 4.4951171875, 4.698974609375, 4.90283203125, 5.106689453125, 5.310546875, 5.514404296875, 5.71826171875, 5.922119140625, 6.1259765625, 6.329833984375, 6.53369140625, 6.737548828125, 6.94140625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 8.0, 7.0, 14.0, 18.0, 29.0, 38.0, 46.0, 74.0, 108.0, 207.0, 310.0, 788.0, 2157.0, 12386.0, 342593.0, 672668.0, 13263.0, 2210.0, 758.0, 324.0, 179.0, 122.0, 85.0, 49.0, 33.0, 23.0, 20.0, 11.0, 12.0, 5.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.0859375, -9.7498779296875, -9.413818359375, -9.0777587890625, -8.74169921875, -8.4056396484375, -8.069580078125, -7.7335205078125, -7.3974609375, -7.0614013671875, -6.725341796875, -6.3892822265625, -6.05322265625, -5.7171630859375, -5.381103515625, -5.0450439453125, -4.708984375, -4.3729248046875, -4.036865234375, -3.7008056640625, -3.36474609375, -3.0286865234375, -2.692626953125, -2.3565673828125, -2.0205078125, -1.6844482421875, -1.348388671875, -1.0123291015625, -0.67626953125, -0.3402099609375, -0.004150390625, 0.3319091796875, 0.66796875, 1.0040283203125, 1.340087890625, 1.6761474609375, 2.01220703125, 2.3482666015625, 2.684326171875, 3.0203857421875, 3.3564453125, 3.6925048828125, 4.028564453125, 4.3646240234375, 4.70068359375, 5.0367431640625, 5.372802734375, 5.7088623046875, 6.044921875, 6.3809814453125, 6.717041015625, 7.0531005859375, 7.38916015625, 7.7252197265625, 8.061279296875, 8.3973388671875, 8.7333984375, 9.0694580078125, 9.405517578125, 9.7415771484375, 10.07763671875, 10.4136962890625, 10.749755859375, 11.0858154296875, 11.421875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 5.0, 5.0, 7.0, 3.0, 12.0, 13.0, 17.0, 24.0, 18.0, 31.0, 29.0, 38.0, 45.0, 52.0, 62.0, 80.0, 103.0, 83.0, 63.0, 64.0, 38.0, 36.0, 33.0, 23.0, 20.0, 12.0, 20.0, 20.0, 12.0, 10.0, 8.0, 3.0, 2.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.21875, -20.586181640625, -19.95361328125, -19.321044921875, -18.6884765625, -18.055908203125, -17.42333984375, -16.790771484375, -16.158203125, -15.525634765625, -14.89306640625, -14.260498046875, -13.6279296875, -12.995361328125, -12.36279296875, -11.730224609375, -11.09765625, -10.465087890625, -9.83251953125, -9.199951171875, -8.5673828125, -7.934814453125, -7.30224609375, -6.669677734375, -6.037109375, -5.404541015625, -4.77197265625, -4.139404296875, -3.5068359375, -2.874267578125, -2.24169921875, -1.609130859375, -0.9765625, -0.343994140625, 0.28857421875, 0.921142578125, 1.5537109375, 2.186279296875, 2.81884765625, 3.451416015625, 4.083984375, 4.716552734375, 5.34912109375, 5.981689453125, 6.6142578125, 7.246826171875, 7.87939453125, 8.511962890625, 9.14453125, 9.777099609375, 10.40966796875, 11.042236328125, 11.6748046875, 12.307373046875, 12.93994140625, 13.572509765625, 14.205078125, 14.837646484375, 15.47021484375, 16.102783203125, 16.7353515625, 17.367919921875, 18.00048828125, 18.633056640625, 19.265625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 5.0, 2.0, 6.0, 9.0, 10.0, 14.0, 29.0, 59.0, 105.0, 197.0, 472.0, 1288.0, 4854.0, 32320.0, 899592.0, 96278.0, 9924.0, 2113.0, 732.0, 262.0, 129.0, 57.0, 40.0, 25.0, 13.0, 7.0, 6.0, 6.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9892578125, -1.93194580078125, -1.8746337890625, -1.81732177734375, -1.760009765625, -1.70269775390625, -1.6453857421875, -1.58807373046875, -1.53076171875, -1.47344970703125, -1.4161376953125, -1.35882568359375, -1.301513671875, -1.24420166015625, -1.1868896484375, -1.12957763671875, -1.072265625, -1.01495361328125, -0.9576416015625, -0.90032958984375, -0.843017578125, -0.78570556640625, -0.7283935546875, -0.67108154296875, -0.61376953125, -0.55645751953125, -0.4991455078125, -0.44183349609375, -0.384521484375, -0.32720947265625, -0.2698974609375, -0.21258544921875, -0.1552734375, -0.09796142578125, -0.0406494140625, 0.01666259765625, 0.073974609375, 0.13128662109375, 0.1885986328125, 0.24591064453125, 0.30322265625, 0.36053466796875, 0.4178466796875, 0.47515869140625, 0.532470703125, 0.58978271484375, 0.6470947265625, 0.70440673828125, 0.76171875, 0.81903076171875, 0.8763427734375, 0.93365478515625, 0.990966796875, 1.04827880859375, 1.1055908203125, 1.16290283203125, 1.22021484375, 1.27752685546875, 1.3348388671875, 1.39215087890625, 1.449462890625, 1.50677490234375, 1.5640869140625, 1.62139892578125, 1.6787109375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 4.0, 3.0, 3.0, 5.0, 7.0, 2.0, 8.0, 4.0, 7.0, 13.0, 15.0, 17.0, 29.0, 30.0, 46.0, 39.0, 68.0, 77.0, 110.0, 115.0, 78.0, 83.0, 63.0, 32.0, 36.0, 30.0, 14.0, 19.0, 11.0, 8.0, 4.0, 3.0, 4.0, 3.0, 4.0, 3.0, 3.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0003216266632080078, -0.0003116726875305176, -0.00030171871185302734, -0.0002917647361755371, -0.0002818107604980469, -0.00027185678482055664, -0.0002619028091430664, -0.00025194883346557617, -0.00024199485778808594, -0.0002320408821105957, -0.00022208690643310547, -0.00021213293075561523, -0.000202178955078125, -0.00019222497940063477, -0.00018227100372314453, -0.0001723170280456543, -0.00016236305236816406, -0.00015240907669067383, -0.0001424551010131836, -0.00013250112533569336, -0.00012254714965820312, -0.00011259317398071289, -0.00010263919830322266, -9.268522262573242e-05, -8.273124694824219e-05, -7.277727127075195e-05, -6.282329559326172e-05, -5.2869319915771484e-05, -4.291534423828125e-05, -3.2961368560791016e-05, -2.300739288330078e-05, -1.3053417205810547e-05, -3.0994415283203125e-06, 6.854534149169922e-06, 1.6808509826660156e-05, 2.676248550415039e-05, 3.6716461181640625e-05, 4.667043685913086e-05, 5.6624412536621094e-05, 6.657838821411133e-05, 7.653236389160156e-05, 8.64863395690918e-05, 9.644031524658203e-05, 0.00010639429092407227, 0.0001163482666015625, 0.00012630224227905273, 0.00013625621795654297, 0.0001462101936340332, 0.00015616416931152344, 0.00016611814498901367, 0.0001760721206665039, 0.00018602609634399414, 0.00019598007202148438, 0.0002059340476989746, 0.00021588802337646484, 0.00022584199905395508, 0.0002357959747314453, 0.00024574995040893555, 0.0002557039260864258, 0.000265657901763916, 0.00027561187744140625, 0.0002855658531188965, 0.0002955198287963867, 0.00030547380447387695, 0.0003154277801513672]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 7.0, 9.0, 19.0, 25.0, 48.0, 74.0, 113.0, 197.0, 441.0, 913.0, 2499.0, 7410.0, 28366.0, 253530.0, 710558.0, 31667.0, 8055.0, 2621.0, 1037.0, 444.0, 230.0, 116.0, 66.0, 37.0, 26.0, 15.0, 12.0, 4.0, 4.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3798828125, -1.3339385986328125, -1.287994384765625, -1.2420501708984375, -1.19610595703125, -1.1501617431640625, -1.104217529296875, -1.0582733154296875, -1.0123291015625, -0.9663848876953125, -0.920440673828125, -0.8744964599609375, -0.82855224609375, -0.7826080322265625, -0.736663818359375, -0.6907196044921875, -0.644775390625, -0.5988311767578125, -0.552886962890625, -0.5069427490234375, -0.46099853515625, -0.4150543212890625, -0.369110107421875, -0.3231658935546875, -0.2772216796875, -0.2312774658203125, -0.185333251953125, -0.1393890380859375, -0.09344482421875, -0.0475006103515625, -0.001556396484375, 0.0443878173828125, 0.09033203125, 0.1362762451171875, 0.182220458984375, 0.2281646728515625, 0.27410888671875, 0.3200531005859375, 0.365997314453125, 0.4119415283203125, 0.4578857421875, 0.5038299560546875, 0.549774169921875, 0.5957183837890625, 0.64166259765625, 0.6876068115234375, 0.733551025390625, 0.7794952392578125, 0.825439453125, 0.8713836669921875, 0.917327880859375, 0.9632720947265625, 1.00921630859375, 1.0551605224609375, 1.101104736328125, 1.1470489501953125, 1.1929931640625, 1.2389373779296875, 1.284881591796875, 1.3308258056640625, 1.37677001953125, 1.4227142333984375, 1.468658447265625, 1.5146026611328125, 1.560546875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 5.0, 4.0, 10.0, 8.0, 10.0, 16.0, 18.0, 23.0, 38.0, 67.0, 113.0, 157.0, 174.0, 124.0, 85.0, 39.0, 28.0, 20.0, 21.0, 13.0, 4.0, 12.0, 3.0, 6.0, 0.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6083984375, -1.5393218994140625, -1.470245361328125, -1.4011688232421875, -1.33209228515625, -1.2630157470703125, -1.193939208984375, -1.1248626708984375, -1.0557861328125, -0.9867095947265625, -0.917633056640625, -0.8485565185546875, -0.77947998046875, -0.7104034423828125, -0.641326904296875, -0.5722503662109375, -0.503173828125, -0.4340972900390625, -0.365020751953125, -0.2959442138671875, -0.22686767578125, -0.1577911376953125, -0.088714599609375, -0.0196380615234375, 0.0494384765625, 0.1185150146484375, 0.187591552734375, 0.2566680908203125, 0.32574462890625, 0.3948211669921875, 0.463897705078125, 0.5329742431640625, 0.60205078125, 0.6711273193359375, 0.740203857421875, 0.8092803955078125, 0.87835693359375, 0.9474334716796875, 1.016510009765625, 1.0855865478515625, 1.1546630859375, 1.2237396240234375, 1.292816162109375, 1.3618927001953125, 1.43096923828125, 1.5000457763671875, 1.569122314453125, 1.6381988525390625, 1.707275390625, 1.7763519287109375, 1.845428466796875, 1.9145050048828125, 1.98358154296875, 2.0526580810546875, 2.121734619140625, 2.1908111572265625, 2.2598876953125, 2.3289642333984375, 2.398040771484375, 2.4671173095703125, 2.53619384765625, 2.6052703857421875, 2.674346923828125, 2.7434234619140625, 2.8125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 10.0, 32.0, 40.0, 76.0, 289.0, 405.0, 68.0, 40.0, 17.0, 10.0, 9.0, 2.0, 3.0, 0.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-114.4432373046875, -111.95817565917969, -109.47310638427734, -106.988037109375, -104.50297546386719, -102.01791381835938, -99.53284454345703, -97.04777526855469, -94.56271362304688, -92.07765197753906, -89.59258270263672, -87.10751342773438, -84.62245178222656, -82.13739013671875, -79.6523208618164, -77.16725158691406, -74.68218994140625, -72.19712829589844, -69.7120590209961, -67.22698974609375, -64.74192810058594, -62.25686264038086, -59.77179718017578, -57.2867317199707, -54.801666259765625, -52.31660079956055, -49.83153533935547, -47.34646987915039, -44.86140441894531, -42.376338958740234, -39.891273498535156, -37.40620803833008, -34.92115020751953, -32.43608474731445, -29.951019287109375, -27.465953826904297, -24.98088836669922, -22.49582290649414, -20.010757446289062, -17.525691986083984, -15.040626525878906, -12.555561065673828, -10.07049560546875, -7.585430145263672, -5.100364685058594, -2.6152992248535156, -0.1302337646484375, 2.3548316955566406, 4.839897155761719, 7.324962615966797, 9.810028076171875, 12.295093536376953, 14.780158996582031, 17.26522445678711, 19.750289916992188, 22.235355377197266, 24.720420837402344, 27.205486297607422, 29.6905517578125, 32.17561721801758, 34.660682678222656, 37.145748138427734, 39.63081359863281, 42.11587905883789, 44.60094451904297]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 5.0, 2.0, 4.0, 9.0, 7.0, 12.0, 11.0, 8.0, 11.0, 10.0, 25.0, 11.0, 11.0, 25.0, 19.0, 21.0, 33.0, 89.0, 170.0, 180.0, 87.0, 33.0, 26.0, 39.0, 27.0, 15.0, 12.0, 14.0, 12.0, 9.0, 14.0, 6.0, 10.0, 10.0, 6.0, 1.0, 9.0, 2.0, 2.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.523048400878906, -45.11537551879883, -43.70770263671875, -42.30002975463867, -40.892356872558594, -39.48468780517578, -38.07701110839844, -36.669342041015625, -35.26166915893555, -33.85399627685547, -32.44632339477539, -31.038650512695312, -29.630979537963867, -28.22330665588379, -26.81563377380371, -25.407962799072266, -24.000288009643555, -22.592615127563477, -21.1849422454834, -19.777271270751953, -18.369598388671875, -16.961925506591797, -15.554252624511719, -14.146580696105957, -12.738907814025879, -11.3312349319458, -9.923563003540039, -8.515890121459961, -7.108217716217041, -5.700545310974121, -4.292872428894043, -2.8852005004882812, -1.4775276184082031, -0.06985509395599365, 1.3378174304962158, 2.745490074157715, 4.153162479400635, 5.560834884643555, 6.968507766723633, 8.376179695129395, 9.783852577209473, 11.19152545928955, 12.599197387695312, 14.00687026977539, 15.414543151855469, 16.822216033935547, 18.229888916015625, 19.63755989074707, 21.04523277282715, 22.452905654907227, 23.860578536987305, 25.26824951171875, 26.675922393798828, 28.083595275878906, 29.491268157958984, 30.898941040039062, 32.30661392211914, 33.71428680419922, 35.1219596862793, 36.529632568359375, 37.93730545043945, 39.34497833251953, 40.752647399902344, 42.16032028198242, 43.5679931640625]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 3.0, 7.0, 2.0, 9.0, 11.0, 14.0, 12.0, 11.0, 7.0, 16.0, 21.0, 23.0, 39.0, 23.0, 30.0, 30.0, 47.0, 49.0, 162.0, 156.0, 61.0, 32.0, 32.0, 27.0, 27.0, 18.0, 26.0, 20.0, 15.0, 12.0, 8.0, 12.0, 3.0, 6.0, 7.0, 4.0, 1.0, 5.0, 6.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.7734375, -4.6328125, -4.4921875, -4.3515625, -4.2109375, -4.0703125, -3.9296875, -3.7890625, -3.6484375, -3.5078125, -3.3671875, -3.2265625, -3.0859375, -2.9453125, -2.8046875, -2.6640625, -2.5234375, -2.3828125, -2.2421875, -2.1015625, -1.9609375, -1.8203125, -1.6796875, -1.5390625, -1.3984375, -1.2578125, -1.1171875, -0.9765625, -0.8359375, -0.6953125, -0.5546875, -0.4140625, -0.2734375, -0.1328125, 0.0078125, 0.1484375, 0.2890625, 0.4296875, 0.5703125, 0.7109375, 0.8515625, 0.9921875, 1.1328125, 1.2734375, 1.4140625, 1.5546875, 1.6953125, 1.8359375, 1.9765625, 2.1171875, 2.2578125, 2.3984375, 2.5390625, 2.6796875, 2.8203125, 2.9609375, 3.1015625, 3.2421875, 3.3828125, 3.5234375, 3.6640625, 3.8046875, 3.9453125, 4.0859375, 4.2265625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 2.0, 11.0, 2.0, 3.0, 7.0, 19.0, 12.0, 28.0, 29.0, 60.0, 90.0, 188.0, 457.0, 1906.0, 14915.0, 8357494.0, 11014.0, 1579.0, 421.0, 142.0, 69.0, 39.0, 26.0, 21.0, 17.0, 17.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0], "bins": [-56.41648864746094, -54.67768859863281, -52.93889236450195, -51.200096130371094, -49.46129608154297, -47.722496032714844, -45.983699798583984, -44.244903564453125, -42.506103515625, -40.767303466796875, -39.028507232666016, -37.289710998535156, -35.55091094970703, -33.812110900878906, -32.07331466674805, -30.334516525268555, -28.595718383789062, -26.85692024230957, -25.118122100830078, -23.379323959350586, -21.640525817871094, -19.9017276763916, -18.16292953491211, -16.424131393432617, -14.685333251953125, -12.946535110473633, -11.20773696899414, -9.468938827514648, -7.730140686035156, -5.991342544555664, -4.252544403076172, -2.5137462615966797, -0.7749443054199219, 0.9638538360595703, 2.7026519775390625, 4.441450119018555, 6.180248260498047, 7.919046401977539, 9.657844543457031, 11.396642684936523, 13.135440826416016, 14.874238967895508, 16.613037109375, 18.351835250854492, 20.090633392333984, 21.829431533813477, 23.56822967529297, 25.30702781677246, 27.045825958251953, 28.784624099731445, 30.523422241210938, 32.26222229003906, 34.00101852416992, 35.73981475830078, 37.478614807128906, 39.21741485595703, 40.95621109008789, 42.69500732421875, 44.433807373046875, 46.172607421875, 47.91140365600586, 49.65019989013672, 51.388999938964844, 53.12779998779297, 54.86659622192383]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 3.0, 9.0, 5.0, 4.0, 2.0, 6.0, 7.0, 9.0, 5.0, 3.0, 3.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-104.98562622070312, -101.93575286865234, -98.88587951660156, -95.83599853515625, -92.78612518310547, -89.73625183105469, -86.6863784790039, -83.63650512695312, -80.58662414550781, -77.53675079345703, -74.48687744140625, -71.43699645996094, -68.38712310791016, -65.33724975585938, -62.287376403808594, -59.23749923706055, -56.187625885009766, -53.137752532958984, -50.08787536621094, -47.038002014160156, -43.98812484741211, -40.93825149536133, -37.88837432861328, -34.8385009765625, -31.788625717163086, -28.738750457763672, -25.688875198364258, -22.638999938964844, -19.589126586914062, -16.539249420166016, -13.489376068115234, -10.43950080871582, -7.389625549316406, -4.339750289916992, -1.2898755073547363, 1.7599992752075195, 4.809874534606934, 7.859749794006348, 10.909624099731445, 13.95949935913086, 17.009374618530273, 20.059249877929688, 23.1091251373291, 26.159000396728516, 29.208873748779297, 32.258750915527344, 35.308624267578125, 38.358497619628906, 41.40837478637695, 44.458248138427734, 47.50812530517578, 50.55799865722656, 53.60787582397461, 56.65774917602539, 59.70762634277344, 62.75749969482422, 65.807373046875, 68.85724639892578, 71.90711975097656, 74.95700073242188, 78.00687408447266, 81.05674743652344, 84.10662078857422, 87.156494140625, 90.20637512207031]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 1.0, 3.0, 7.0, 11.0, 14.0, 23.0, 20.0, 24.0, 32.0, 42.0, 43.0, 47.0, 59.0, 60.0, 62.0, 65.0, 57.0, 69.0, 61.0, 51.0, 41.0, 31.0, 29.0, 23.0, 26.0, 21.0, 23.0, 13.0, 9.0, 3.0, 5.0, 7.0, 5.0, 6.0, 3.0, 4.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.421875, -2.32037353515625, -2.2188720703125, -2.11737060546875, -2.015869140625, -1.91436767578125, -1.8128662109375, -1.71136474609375, -1.60986328125, -1.50836181640625, -1.4068603515625, -1.30535888671875, -1.203857421875, -1.10235595703125, -1.0008544921875, -0.89935302734375, -0.7978515625, -0.69635009765625, -0.5948486328125, -0.49334716796875, -0.391845703125, -0.29034423828125, -0.1888427734375, -0.08734130859375, 0.01416015625, 0.11566162109375, 0.2171630859375, 0.31866455078125, 0.420166015625, 0.52166748046875, 0.6231689453125, 0.72467041015625, 0.826171875, 0.92767333984375, 1.0291748046875, 1.13067626953125, 1.232177734375, 1.33367919921875, 1.4351806640625, 1.53668212890625, 1.63818359375, 1.73968505859375, 1.8411865234375, 1.94268798828125, 2.044189453125, 2.14569091796875, 2.2471923828125, 2.34869384765625, 2.4501953125, 2.55169677734375, 2.6531982421875, 2.75469970703125, 2.856201171875, 2.95770263671875, 3.0592041015625, 3.16070556640625, 3.26220703125, 3.36370849609375, 3.4652099609375, 3.56671142578125, 3.668212890625, 3.76971435546875, 3.8712158203125, 3.97271728515625, 4.07421875]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 2.0, 7.0, 13.0, 10.0, 14.0, 18.0, 34.0, 44.0, 50.0, 67.0, 99.0, 138.0, 243.0, 474.0, 861.0, 1871.0, 3982.0, 9090.0, 21861.0, 53430.0, 127267.0, 162883.0, 83381.0, 33403.0, 13733.0, 5812.0, 2608.0, 1251.0, 580.0, 346.0, 211.0, 142.0, 77.0, 73.0, 34.0, 44.0, 30.0, 22.0, 15.0, 11.0, 6.0, 7.0, 5.0, 4.0, 4.0, 3.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-22.953125, -22.167724609375, -21.38232421875, -20.596923828125, -19.8115234375, -19.026123046875, -18.24072265625, -17.455322265625, -16.669921875, -15.884521484375, -15.09912109375, -14.313720703125, -13.5283203125, -12.742919921875, -11.95751953125, -11.172119140625, -10.38671875, -9.601318359375, -8.81591796875, -8.030517578125, -7.2451171875, -6.459716796875, -5.67431640625, -4.888916015625, -4.103515625, -3.318115234375, -2.53271484375, -1.747314453125, -0.9619140625, -0.176513671875, 0.60888671875, 1.394287109375, 2.1796875, 2.965087890625, 3.75048828125, 4.535888671875, 5.3212890625, 6.106689453125, 6.89208984375, 7.677490234375, 8.462890625, 9.248291015625, 10.03369140625, 10.819091796875, 11.6044921875, 12.389892578125, 13.17529296875, 13.960693359375, 14.74609375, 15.531494140625, 16.31689453125, 17.102294921875, 17.8876953125, 18.673095703125, 19.45849609375, 20.243896484375, 21.029296875, 21.814697265625, 22.60009765625, 23.385498046875, 24.1708984375, 24.956298828125, 25.74169921875, 26.527099609375, 27.3125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 7.0, 8.0, 7.0, 8.0, 20.0, 20.0, 17.0, 27.0, 36.0, 43.0, 65.0, 63.0, 61.0, 62.0, 81.0, 60.0, 69.0, 66.0, 50.0, 38.0, 40.0, 37.0, 28.0, 21.0, 12.0, 10.0, 10.0, 7.0, 6.0, 5.0, 4.0, 2.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.26171875, -5.0933837890625, -4.925048828125, -4.7567138671875, -4.58837890625, -4.4200439453125, -4.251708984375, -4.0833740234375, -3.9150390625, -3.7467041015625, -3.578369140625, -3.4100341796875, -3.24169921875, -3.0733642578125, -2.905029296875, -2.7366943359375, -2.568359375, -2.4000244140625, -2.231689453125, -2.0633544921875, -1.89501953125, -1.7266845703125, -1.558349609375, -1.3900146484375, -1.2216796875, -1.0533447265625, -0.885009765625, -0.7166748046875, -0.54833984375, -0.3800048828125, -0.211669921875, -0.0433349609375, 0.125, 0.2933349609375, 0.461669921875, 0.6300048828125, 0.79833984375, 0.9666748046875, 1.135009765625, 1.3033447265625, 1.4716796875, 1.6400146484375, 1.808349609375, 1.9766845703125, 2.14501953125, 2.3133544921875, 2.481689453125, 2.6500244140625, 2.818359375, 2.9866943359375, 3.155029296875, 3.3233642578125, 3.49169921875, 3.6600341796875, 3.828369140625, 3.9967041015625, 4.1650390625, 4.3333740234375, 4.501708984375, 4.6700439453125, 4.83837890625, 5.0067138671875, 5.175048828125, 5.3433837890625, 5.51171875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 3.0, 3.0, 8.0, 3.0, 6.0, 20.0, 24.0, 44.0, 65.0, 83.0, 67.0, 51.0, 39.0, 27.0, 11.0, 5.0, 5.0, 10.0, 5.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-45.1645622253418, -44.09144973754883, -43.01833724975586, -41.94522476196289, -40.87211227416992, -39.79899597167969, -38.72588348388672, -37.65277099609375, -36.57965850830078, -35.50654602050781, -34.433433532714844, -33.360321044921875, -32.287208557128906, -31.214094161987305, -30.140981674194336, -29.067869186401367, -27.9947566986084, -26.92164421081543, -25.84853172302246, -24.77541732788086, -23.70230484008789, -22.629192352294922, -21.556079864501953, -20.482967376708984, -19.409854888916016, -18.336742401123047, -17.263629913330078, -16.19051742553711, -15.117403030395508, -14.044290542602539, -12.97117805480957, -11.898065567016602, -10.824951171875, -9.751838684082031, -8.678725242614746, -7.605612754821777, -6.53249979019165, -5.459386825561523, -4.386274337768555, -3.3131613731384277, -2.240048408508301, -1.1669355630874634, -0.09382271766662598, 0.9792900085449219, 2.052402973175049, 3.125515937805176, 4.1986284255981445, 5.2717413902282715, 6.344854354858398, 7.417967319488525, 8.491080284118652, 9.564192771911621, 10.637306213378906, 11.710418701171875, 12.783531188964844, 13.856643676757812, 14.929757118225098, 16.002870559692383, 17.07598304748535, 18.14909553527832, 19.22220802307129, 20.29532241821289, 21.36843490600586, 22.441547393798828, 23.514659881591797]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 4.0, 2.0, 0.0, 5.0, 3.0, 0.0, 6.0, 1.0, 6.0, 3.0, 5.0, 11.0, 15.0, 34.0, 49.0, 67.0, 71.0, 55.0, 49.0, 29.0, 16.0, 8.0, 6.0, 1.0, 7.0, 5.0, 3.0, 2.0, 2.0, 4.0, 2.0, 6.0, 2.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-23.482685089111328, -22.64385414123535, -21.805023193359375, -20.96619415283203, -20.127363204956055, -19.288532257080078, -18.449703216552734, -17.610872268676758, -16.77204132080078, -15.933210372924805, -15.094380378723145, -14.255550384521484, -13.416719436645508, -12.577888488769531, -11.739058494567871, -10.900228500366211, -10.061397552490234, -9.222566604614258, -8.383736610412598, -7.544906139373779, -6.706075668334961, -5.867245197296143, -5.028414726257324, -4.189584255218506, -3.3507537841796875, -2.511923313140869, -1.6730928421020508, -0.8342623710632324, 0.0045680999755859375, 0.8433985710144043, 1.6822290420532227, 2.521059513092041, 3.359891891479492, 4.1987223625183105, 5.037552833557129, 5.876383304595947, 6.715213775634766, 7.554044246673584, 8.392874717712402, 9.231704711914062, 10.070535659790039, 10.909366607666016, 11.748196601867676, 12.587026596069336, 13.425857543945312, 14.264688491821289, 15.10351848602295, 15.94234848022461, 16.781179428100586, 17.620010375976562, 18.458839416503906, 19.297670364379883, 20.13650131225586, 20.975332260131836, 21.814163208007812, 22.652992248535156, 23.491823196411133, 24.33065414428711, 25.169483184814453, 26.00831413269043, 26.847145080566406, 27.685976028442383, 28.52480697631836, 29.363636016845703, 30.20246696472168]}, "eval/loss": 6.056567668914795, "eval/wer": 1.275446251487505, "eval/runtime": 640.1555, "eval/samples_per_second": 4.127, "eval/steps_per_second": 0.517} \ No newline at end of file +{"train/loss": 5.4525, "train/learning_rate": 2.7185915492957747e-05, "train/epoch": 3.36, "train/global_step": 3000, "_runtime": 17953, "_timestamp": 1647962455, "_step": 3001, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 9.0, 9.0, 14.0, 12.0, 15.0, 16.0, 23.0, 17.0, 19.0, 32.0, 35.0, 36.0, 39.0, 33.0, 39.0, 48.0, 45.0, 42.0, 53.0, 52.0, 45.0, 35.0, 35.0, 33.0, 34.0, 37.0, 39.0, 28.0, 24.0, 14.0, 22.0, 12.0, 7.0, 8.0, 8.0, 9.0, 6.0, 4.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.77167510986328, -28.803977966308594, -27.836280822753906, -26.86858367919922, -25.90088653564453, -24.933189392089844, -23.965492248535156, -22.99779510498047, -22.03009796142578, -21.062400817871094, -20.094703674316406, -19.12700653076172, -18.15930938720703, -17.191612243652344, -16.223915100097656, -15.256217956542969, -14.288521766662598, -13.32082462310791, -12.353127479553223, -11.385430335998535, -10.417733192443848, -9.450037002563477, -8.482339859008789, -7.514642238616943, -6.546945095062256, -5.579247951507568, -4.611550807952881, -3.6438539028167725, -2.676156759262085, -1.7084598541259766, -0.7407627105712891, 0.22693443298339844, 1.194631576538086, 2.1623287200927734, 3.130025863647461, 4.097723007202148, 5.065420150756836, 6.033116817474365, 7.000813961029053, 7.96851110458374, 8.936208724975586, 9.903905868530273, 10.871603012084961, 11.839300155639648, 12.806997299194336, 13.774694442749023, 14.742391586303711, 15.710088729858398, 16.677783966064453, 17.64548110961914, 18.613178253173828, 19.580875396728516, 20.548572540283203, 21.51626968383789, 22.483966827392578, 23.451663970947266, 24.419361114501953, 25.38705825805664, 26.354755401611328, 27.322452545166016, 28.290149688720703, 29.25784683227539, 30.225543975830078, 31.193241119384766, 32.16093826293945]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 5.0, 9.0, 6.0, 9.0, 11.0, 14.0, 15.0, 18.0, 20.0, 23.0, 16.0, 29.0, 33.0, 37.0, 24.0, 32.0, 27.0, 35.0, 32.0, 44.0, 49.0, 45.0, 31.0, 35.0, 45.0, 37.0, 35.0, 40.0, 25.0, 29.0, 18.0, 19.0, 23.0, 23.0, 18.0, 14.0, 16.0, 12.0, 8.0, 9.0, 8.0, 10.0, 2.0, 3.0, 1.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.996685028076172, -25.12548828125, -24.254291534423828, -23.383094787597656, -22.511898040771484, -21.640701293945312, -20.76950454711914, -19.898305892944336, -19.027109146118164, -18.155912399291992, -17.28471565246582, -16.41351890563965, -15.54232120513916, -14.671124458312988, -13.799927711486816, -12.928730010986328, -12.057534217834473, -11.1863374710083, -10.315140724182129, -9.44394302368164, -8.572746276855469, -7.701549530029297, -6.830352783203125, -5.959155559539795, -5.087958812713623, -4.216762065887451, -3.345564842224121, -2.474368095397949, -1.6031711101531982, -0.7319741249084473, 0.1392226219177246, 1.0104198455810547, 1.8816165924072266, 2.7528135776519775, 3.6240105628967285, 4.4952073097229, 5.3664045333862305, 6.237601280212402, 7.108798027038574, 7.979995250701904, 8.851192474365234, 9.722389221191406, 10.593585968017578, 11.46478271484375, 12.335980415344238, 13.20717716217041, 14.078373908996582, 14.94957160949707, 15.820767402648926, 16.691965103149414, 17.563161849975586, 18.434358596801758, 19.30555534362793, 20.1767520904541, 21.047948837280273, 21.919145584106445, 22.790342330932617, 23.66153907775879, 24.53273582458496, 25.403932571411133, 26.275129318237305, 27.14632797241211, 28.01752471923828, 28.888721466064453, 29.759918212890625]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 5.0, 15.0, 11.0, 24.0, 32.0, 42.0, 69.0, 121.0, 236.0, 318.0, 556.0, 867.0, 1414.0, 2515.0, 4302.0, 7574.0, 13292.0, 24470.0, 44917.0, 83028.0, 154579.0, 276027.0, 451581.0, 633359.0, 718607.0, 644385.0, 470864.0, 295488.0, 166385.0, 90777.0, 49126.0, 26160.0, 14230.0, 8049.0, 4539.0, 2524.0, 1498.0, 882.0, 563.0, 312.0, 193.0, 134.0, 76.0, 52.0, 30.0, 20.0, 15.0, 13.0, 7.0, 5.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-22.21875, -21.556640625, -20.89453125, -20.232421875, -19.5703125, -18.908203125, -18.24609375, -17.583984375, -16.921875, -16.259765625, -15.59765625, -14.935546875, -14.2734375, -13.611328125, -12.94921875, -12.287109375, -11.625, -10.962890625, -10.30078125, -9.638671875, -8.9765625, -8.314453125, -7.65234375, -6.990234375, -6.328125, -5.666015625, -5.00390625, -4.341796875, -3.6796875, -3.017578125, -2.35546875, -1.693359375, -1.03125, -0.369140625, 0.29296875, 0.955078125, 1.6171875, 2.279296875, 2.94140625, 3.603515625, 4.265625, 4.927734375, 5.58984375, 6.251953125, 6.9140625, 7.576171875, 8.23828125, 8.900390625, 9.5625, 10.224609375, 10.88671875, 11.548828125, 12.2109375, 12.873046875, 13.53515625, 14.197265625, 14.859375, 15.521484375, 16.18359375, 16.845703125, 17.5078125, 18.169921875, 18.83203125, 19.494140625, 20.15625]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [4.0, 4.0, 1.0, 0.0, 4.0, 2.0, 2.0, 7.0, 6.0, 5.0, 9.0, 7.0, 17.0, 9.0, 14.0, 12.0, 17.0, 14.0, 15.0, 22.0, 31.0, 17.0, 23.0, 30.0, 39.0, 30.0, 39.0, 29.0, 42.0, 31.0, 37.0, 39.0, 24.0, 37.0, 35.0, 35.0, 21.0, 26.0, 31.0, 33.0, 24.0, 37.0, 21.0, 19.0, 20.0, 11.0, 14.0, 21.0, 10.0, 4.0, 7.0, 8.0, 8.0, 4.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0], "bins": [-19.640625, -19.005126953125, -18.36962890625, -17.734130859375, -17.0986328125, -16.463134765625, -15.82763671875, -15.192138671875, -14.556640625, -13.921142578125, -13.28564453125, -12.650146484375, -12.0146484375, -11.379150390625, -10.74365234375, -10.108154296875, -9.47265625, -8.837158203125, -8.20166015625, -7.566162109375, -6.9306640625, -6.295166015625, -5.65966796875, -5.024169921875, -4.388671875, -3.753173828125, -3.11767578125, -2.482177734375, -1.8466796875, -1.211181640625, -0.57568359375, 0.059814453125, 0.6953125, 1.330810546875, 1.96630859375, 2.601806640625, 3.2373046875, 3.872802734375, 4.50830078125, 5.143798828125, 5.779296875, 6.414794921875, 7.05029296875, 7.685791015625, 8.3212890625, 8.956787109375, 9.59228515625, 10.227783203125, 10.86328125, 11.498779296875, 12.13427734375, 12.769775390625, 13.4052734375, 14.040771484375, 14.67626953125, 15.311767578125, 15.947265625, 16.582763671875, 17.21826171875, 17.853759765625, 18.4892578125, 19.124755859375, 19.76025390625, 20.395751953125, 21.03125]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [2.0, 12.0, 10.0, 13.0, 15.0, 34.0, 48.0, 80.0, 120.0, 136.0, 261.0, 409.0, 593.0, 884.0, 1414.0, 2157.0, 3457.0, 5359.0, 8173.0, 12487.0, 19342.0, 29995.0, 45820.0, 69398.0, 103265.0, 151915.0, 218832.0, 303579.0, 404250.0, 499370.0, 534496.0, 481463.0, 383711.0, 287391.0, 203749.0, 141630.0, 96252.0, 63868.0, 42215.0, 27500.0, 17956.0, 11545.0, 7495.0, 4894.0, 3158.0, 1936.0, 1290.0, 795.0, 549.0, 338.0, 221.0, 142.0, 82.0, 63.0, 57.0, 26.0, 22.0, 7.0, 7.0, 6.0, 8.0, 1.0, 0.0, 1.0], "bins": [-16.65625, -16.1083984375, -15.560546875, -15.0126953125, -14.46484375, -13.9169921875, -13.369140625, -12.8212890625, -12.2734375, -11.7255859375, -11.177734375, -10.6298828125, -10.08203125, -9.5341796875, -8.986328125, -8.4384765625, -7.890625, -7.3427734375, -6.794921875, -6.2470703125, -5.69921875, -5.1513671875, -4.603515625, -4.0556640625, -3.5078125, -2.9599609375, -2.412109375, -1.8642578125, -1.31640625, -0.7685546875, -0.220703125, 0.3271484375, 0.875, 1.4228515625, 1.970703125, 2.5185546875, 3.06640625, 3.6142578125, 4.162109375, 4.7099609375, 5.2578125, 5.8056640625, 6.353515625, 6.9013671875, 7.44921875, 7.9970703125, 8.544921875, 9.0927734375, 9.640625, 10.1884765625, 10.736328125, 11.2841796875, 11.83203125, 12.3798828125, 12.927734375, 13.4755859375, 14.0234375, 14.5712890625, 15.119140625, 15.6669921875, 16.21484375, 16.7626953125, 17.310546875, 17.8583984375, 18.40625]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 4.0, 5.0, 8.0, 2.0, 8.0, 13.0, 17.0, 22.0, 28.0, 35.0, 57.0, 58.0, 70.0, 63.0, 91.0, 118.0, 127.0, 161.0, 184.0, 237.0, 211.0, 236.0, 248.0, 249.0, 250.0, 258.0, 201.0, 175.0, 138.0, 141.0, 129.0, 98.0, 81.0, 59.0, 63.0, 46.0, 41.0, 27.0, 29.0, 22.0, 12.0, 13.0, 11.0, 8.0, 5.0, 3.0, 3.0, 2.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.2890625, -8.00390625, -7.71875, -7.43359375, -7.1484375, -6.86328125, -6.578125, -6.29296875, -6.0078125, -5.72265625, -5.4375, -5.15234375, -4.8671875, -4.58203125, -4.296875, -4.01171875, -3.7265625, -3.44140625, -3.15625, -2.87109375, -2.5859375, -2.30078125, -2.015625, -1.73046875, -1.4453125, -1.16015625, -0.875, -0.58984375, -0.3046875, -0.01953125, 0.265625, 0.55078125, 0.8359375, 1.12109375, 1.40625, 1.69140625, 1.9765625, 2.26171875, 2.546875, 2.83203125, 3.1171875, 3.40234375, 3.6875, 3.97265625, 4.2578125, 4.54296875, 4.828125, 5.11328125, 5.3984375, 5.68359375, 5.96875, 6.25390625, 6.5390625, 6.82421875, 7.109375, 7.39453125, 7.6796875, 7.96484375, 8.25, 8.53515625, 8.8203125, 9.10546875, 9.390625, 9.67578125, 9.9609375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 5.0, 6.0, 8.0, 5.0, 6.0, 15.0, 13.0, 16.0, 14.0, 32.0, 26.0, 26.0, 20.0, 38.0, 25.0, 27.0, 38.0, 38.0, 43.0, 44.0, 39.0, 41.0, 47.0, 43.0, 42.0, 33.0, 34.0, 37.0, 25.0, 33.0, 29.0, 20.0, 15.0, 18.0, 14.0, 20.0, 15.0, 8.0, 5.0, 6.0, 4.0, 6.0, 10.0, 6.0, 5.0, 3.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.059850692749023, -20.349275588989258, -19.638700485229492, -18.928125381469727, -18.217548370361328, -17.506973266601562, -16.796398162841797, -16.08582305908203, -15.375247955322266, -14.6646728515625, -13.954097747802734, -13.243521690368652, -12.532946586608887, -11.822371482849121, -11.111795425415039, -10.401220321655273, -9.690645217895508, -8.980070114135742, -8.269495010375977, -7.5589189529418945, -6.848343849182129, -6.137768745422363, -5.4271931648254395, -4.716617584228516, -4.00604248046875, -3.2954671382904053, -2.5848917961120605, -1.8743164539337158, -1.163741111755371, -0.45316576957702637, 0.25740957260131836, 0.9679851531982422, 1.678558349609375, 2.3891336917877197, 3.0997090339660645, 3.810284376144409, 4.520859718322754, 5.2314348220825195, 5.942010402679443, 6.652585983276367, 7.363161087036133, 8.073736190795898, 8.784311294555664, 9.494887351989746, 10.205462455749512, 10.916037559509277, 11.62661361694336, 12.337188720703125, 13.04776382446289, 13.758338928222656, 14.468914031982422, 15.179490089416504, 15.89006519317627, 16.60064125061035, 17.311216354370117, 18.021791458129883, 18.73236656188965, 19.442941665649414, 20.15351676940918, 20.864091873168945, 21.574668884277344, 22.28524398803711, 22.995819091796875, 23.70639419555664, 24.416969299316406]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 5.0, 2.0, 3.0, 5.0, 2.0, 4.0, 3.0, 5.0, 4.0, 9.0, 4.0, 17.0, 13.0, 11.0, 16.0, 14.0, 9.0, 18.0, 36.0, 29.0, 22.0, 42.0, 21.0, 44.0, 30.0, 28.0, 38.0, 37.0, 42.0, 36.0, 34.0, 46.0, 38.0, 32.0, 27.0, 34.0, 29.0, 28.0, 29.0, 25.0, 25.0, 22.0, 12.0, 14.0, 11.0, 8.0, 9.0, 4.0, 9.0, 12.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-22.522737503051758, -21.81505584716797, -21.10737419128418, -20.39969253540039, -19.6920108795166, -18.984329223632812, -18.276649475097656, -17.568967819213867, -16.861286163330078, -16.15360450744629, -15.4459228515625, -14.738241195678711, -14.030560493469238, -13.32287883758545, -12.61519718170166, -11.907516479492188, -11.199833869934082, -10.492152214050293, -9.784470558166504, -9.076789855957031, -8.369108200073242, -7.661426544189453, -6.953744888305664, -6.246063709259033, -5.538382053375244, -4.830700397491455, -4.123019218444824, -3.415337562561035, -2.707656145095825, -1.9999747276306152, -1.2922930717468262, -0.5846118927001953, 0.12306976318359375, 0.8307512402534485, 1.5384327173233032, 2.2461142539978027, 2.9537956714630127, 3.6614770889282227, 4.369158744812012, 5.076839923858643, 5.784521579742432, 6.492203235626221, 7.199884414672852, 7.907566070556641, 8.61524772644043, 9.322929382324219, 10.030611038208008, 10.73829174041748, 11.44597339630127, 12.153655052185059, 12.861336708068848, 13.56901741027832, 14.27669906616211, 14.984380722045898, 15.692062377929688, 16.399744033813477, 17.107425689697266, 17.815107345581055, 18.522789001464844, 19.230470657348633, 19.938152313232422, 20.645832061767578, 21.353515625, 22.061195373535156, 22.768877029418945]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 4.0, 6.0, 6.0, 5.0, 16.0, 20.0, 28.0, 45.0, 48.0, 74.0, 95.0, 165.0, 214.0, 377.0, 547.0, 762.0, 1239.0, 1817.0, 3017.0, 4966.0, 8138.0, 13982.0, 23896.0, 41118.0, 71847.0, 121867.0, 182671.0, 200374.0, 150262.0, 92502.0, 53442.0, 30278.0, 17718.0, 10470.0, 6186.0, 3694.0, 2253.0, 1529.0, 960.0, 655.0, 402.0, 250.0, 192.0, 131.0, 98.0, 64.0, 43.0, 26.0, 18.0, 9.0, 15.0, 5.0, 7.0, 6.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-11.1953125, -10.8367919921875, -10.478271484375, -10.1197509765625, -9.76123046875, -9.4027099609375, -9.044189453125, -8.6856689453125, -8.3271484375, -7.9686279296875, -7.610107421875, -7.2515869140625, -6.89306640625, -6.5345458984375, -6.176025390625, -5.8175048828125, -5.458984375, -5.1004638671875, -4.741943359375, -4.3834228515625, -4.02490234375, -3.6663818359375, -3.307861328125, -2.9493408203125, -2.5908203125, -2.2322998046875, -1.873779296875, -1.5152587890625, -1.15673828125, -0.7982177734375, -0.439697265625, -0.0811767578125, 0.27734375, 0.6358642578125, 0.994384765625, 1.3529052734375, 1.71142578125, 2.0699462890625, 2.428466796875, 2.7869873046875, 3.1455078125, 3.5040283203125, 3.862548828125, 4.2210693359375, 4.57958984375, 4.9381103515625, 5.296630859375, 5.6551513671875, 6.013671875, 6.3721923828125, 6.730712890625, 7.0892333984375, 7.44775390625, 7.8062744140625, 8.164794921875, 8.5233154296875, 8.8818359375, 9.2403564453125, 9.598876953125, 9.9573974609375, 10.31591796875, 10.6744384765625, 11.032958984375, 11.3914794921875, 11.75]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 7.0, 1.0, 3.0, 2.0, 4.0, 3.0, 6.0, 3.0, 8.0, 12.0, 14.0, 12.0, 14.0, 20.0, 16.0, 14.0, 18.0, 25.0, 42.0, 30.0, 37.0, 37.0, 33.0, 49.0, 39.0, 22.0, 38.0, 44.0, 36.0, 42.0, 40.0, 33.0, 27.0, 30.0, 34.0, 27.0, 35.0, 15.0, 18.0, 17.0, 14.0, 16.0, 13.0, 8.0, 6.0, 10.0, 10.0, 5.0, 3.0, 4.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-23.65625, -22.94873046875, -22.2412109375, -21.53369140625, -20.826171875, -20.11865234375, -19.4111328125, -18.70361328125, -17.99609375, -17.28857421875, -16.5810546875, -15.87353515625, -15.166015625, -14.45849609375, -13.7509765625, -13.04345703125, -12.3359375, -11.62841796875, -10.9208984375, -10.21337890625, -9.505859375, -8.79833984375, -8.0908203125, -7.38330078125, -6.67578125, -5.96826171875, -5.2607421875, -4.55322265625, -3.845703125, -3.13818359375, -2.4306640625, -1.72314453125, -1.015625, -0.30810546875, 0.3994140625, 1.10693359375, 1.814453125, 2.52197265625, 3.2294921875, 3.93701171875, 4.64453125, 5.35205078125, 6.0595703125, 6.76708984375, 7.474609375, 8.18212890625, 8.8896484375, 9.59716796875, 10.3046875, 11.01220703125, 11.7197265625, 12.42724609375, 13.134765625, 13.84228515625, 14.5498046875, 15.25732421875, 15.96484375, 16.67236328125, 17.3798828125, 18.08740234375, 18.794921875, 19.50244140625, 20.2099609375, 20.91748046875, 21.625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 3.0, 9.0, 15.0, 25.0, 35.0, 55.0, 79.0, 127.0, 195.0, 293.0, 513.0, 856.0, 1405.0, 2497.0, 4565.0, 8636.0, 17420.0, 36332.0, 78040.0, 159764.0, 255419.0, 232008.0, 129801.0, 61420.0, 28865.0, 13921.0, 7116.0, 3805.0, 2095.0, 1234.0, 737.0, 466.0, 308.0, 161.0, 122.0, 58.0, 51.0, 31.0, 22.0, 17.0, 9.0, 7.0, 11.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.03125, -9.7161865234375, -9.401123046875, -9.0860595703125, -8.77099609375, -8.4559326171875, -8.140869140625, -7.8258056640625, -7.5107421875, -7.1956787109375, -6.880615234375, -6.5655517578125, -6.25048828125, -5.9354248046875, -5.620361328125, -5.3052978515625, -4.990234375, -4.6751708984375, -4.360107421875, -4.0450439453125, -3.72998046875, -3.4149169921875, -3.099853515625, -2.7847900390625, -2.4697265625, -2.1546630859375, -1.839599609375, -1.5245361328125, -1.20947265625, -0.8944091796875, -0.579345703125, -0.2642822265625, 0.05078125, 0.3658447265625, 0.680908203125, 0.9959716796875, 1.31103515625, 1.6260986328125, 1.941162109375, 2.2562255859375, 2.5712890625, 2.8863525390625, 3.201416015625, 3.5164794921875, 3.83154296875, 4.1466064453125, 4.461669921875, 4.7767333984375, 5.091796875, 5.4068603515625, 5.721923828125, 6.0369873046875, 6.35205078125, 6.6671142578125, 6.982177734375, 7.2972412109375, 7.6123046875, 7.9273681640625, 8.242431640625, 8.5574951171875, 8.87255859375, 9.1876220703125, 9.502685546875, 9.8177490234375, 10.1328125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 6.0, 5.0, 1.0, 6.0, 7.0, 10.0, 8.0, 14.0, 15.0, 17.0, 19.0, 32.0, 25.0, 20.0, 39.0, 34.0, 46.0, 28.0, 33.0, 37.0, 37.0, 42.0, 48.0, 54.0, 37.0, 44.0, 28.0, 37.0, 48.0, 32.0, 33.0, 26.0, 22.0, 14.0, 18.0, 20.0, 11.0, 15.0, 8.0, 10.0, 6.0, 4.0, 4.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.046875, -19.4267578125, -18.806640625, -18.1865234375, -17.56640625, -16.9462890625, -16.326171875, -15.7060546875, -15.0859375, -14.4658203125, -13.845703125, -13.2255859375, -12.60546875, -11.9853515625, -11.365234375, -10.7451171875, -10.125, -9.5048828125, -8.884765625, -8.2646484375, -7.64453125, -7.0244140625, -6.404296875, -5.7841796875, -5.1640625, -4.5439453125, -3.923828125, -3.3037109375, -2.68359375, -2.0634765625, -1.443359375, -0.8232421875, -0.203125, 0.4169921875, 1.037109375, 1.6572265625, 2.27734375, 2.8974609375, 3.517578125, 4.1376953125, 4.7578125, 5.3779296875, 5.998046875, 6.6181640625, 7.23828125, 7.8583984375, 8.478515625, 9.0986328125, 9.71875, 10.3388671875, 10.958984375, 11.5791015625, 12.19921875, 12.8193359375, 13.439453125, 14.0595703125, 14.6796875, 15.2998046875, 15.919921875, 16.5400390625, 17.16015625, 17.7802734375, 18.400390625, 19.0205078125, 19.640625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 2.0, 0.0, 6.0, 1.0, 4.0, 8.0, 12.0, 13.0, 34.0, 35.0, 61.0, 110.0, 135.0, 172.0, 286.0, 431.0, 578.0, 818.0, 1198.0, 1778.0, 2580.0, 3860.0, 6522.0, 11365.0, 21195.0, 46306.0, 132379.0, 411957.0, 259734.0, 76535.0, 31378.0, 15469.0, 8580.0, 5063.0, 3174.0, 2117.0, 1400.0, 989.0, 681.0, 456.0, 393.0, 245.0, 167.0, 114.0, 75.0, 56.0, 36.0, 22.0, 14.0, 7.0, 6.0, 3.0, 6.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.66796875, -4.52099609375, -4.3740234375, -4.22705078125, -4.080078125, -3.93310546875, -3.7861328125, -3.63916015625, -3.4921875, -3.34521484375, -3.1982421875, -3.05126953125, -2.904296875, -2.75732421875, -2.6103515625, -2.46337890625, -2.31640625, -2.16943359375, -2.0224609375, -1.87548828125, -1.728515625, -1.58154296875, -1.4345703125, -1.28759765625, -1.140625, -0.99365234375, -0.8466796875, -0.69970703125, -0.552734375, -0.40576171875, -0.2587890625, -0.11181640625, 0.03515625, 0.18212890625, 0.3291015625, 0.47607421875, 0.623046875, 0.77001953125, 0.9169921875, 1.06396484375, 1.2109375, 1.35791015625, 1.5048828125, 1.65185546875, 1.798828125, 1.94580078125, 2.0927734375, 2.23974609375, 2.38671875, 2.53369140625, 2.6806640625, 2.82763671875, 2.974609375, 3.12158203125, 3.2685546875, 3.41552734375, 3.5625, 3.70947265625, 3.8564453125, 4.00341796875, 4.150390625, 4.29736328125, 4.4443359375, 4.59130859375, 4.73828125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 7.0, 5.0, 9.0, 12.0, 16.0, 20.0, 26.0, 29.0, 51.0, 99.0, 119.0, 128.0, 128.0, 104.0, 69.0, 55.0, 32.0, 22.0, 17.0, 14.0, 10.0, 6.0, 4.0, 4.0, 3.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0008611679077148438, -0.000834144651889801, -0.0008071213960647583, -0.0007800981402397156, -0.0007530748844146729, -0.0007260516285896301, -0.0006990283727645874, -0.0006720051169395447, -0.000644981861114502, -0.0006179586052894592, -0.0005909353494644165, -0.0005639120936393738, -0.0005368888378143311, -0.0005098655819892883, -0.0004828423261642456, -0.0004558190703392029, -0.00042879581451416016, -0.00040177255868911743, -0.0003747493028640747, -0.000347726047039032, -0.00032070279121398926, -0.00029367953538894653, -0.0002666562795639038, -0.00023963302373886108, -0.00021260976791381836, -0.00018558651208877563, -0.0001585632562637329, -0.00013154000043869019, -0.00010451674461364746, -7.749348878860474e-05, -5.047023296356201e-05, -2.3446977138519287e-05, 3.5762786865234375e-06, 3.059953451156616e-05, 5.762279033660889e-05, 8.464604616165161e-05, 0.00011166930198669434, 0.00013869255781173706, 0.00016571581363677979, 0.0001927390694618225, 0.00021976232528686523, 0.00024678558111190796, 0.0002738088369369507, 0.0003008320927619934, 0.00032785534858703613, 0.00035487860441207886, 0.0003819018602371216, 0.0004089251160621643, 0.00043594837188720703, 0.00046297162771224976, 0.0004899948835372925, 0.0005170181393623352, 0.0005440413951873779, 0.0005710646510124207, 0.0005980879068374634, 0.0006251111626625061, 0.0006521344184875488, 0.0006791576743125916, 0.0007061809301376343, 0.000733204185962677, 0.0007602274417877197, 0.0007872506976127625, 0.0008142739534378052, 0.0008412972092628479, 0.0008683204650878906]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 1.0, 5.0, 12.0, 16.0, 14.0, 34.0, 43.0, 72.0, 81.0, 144.0, 192.0, 319.0, 418.0, 666.0, 998.0, 1497.0, 2489.0, 4024.0, 6641.0, 11711.0, 21656.0, 43078.0, 86395.0, 171776.0, 270644.0, 205776.0, 106411.0, 52093.0, 26702.0, 14208.0, 7847.0, 4597.0, 2814.0, 1783.0, 1099.0, 745.0, 499.0, 338.0, 232.0, 153.0, 115.0, 80.0, 49.0, 27.0, 20.0, 17.0, 13.0, 3.0, 4.0, 5.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1171875, -3.98284912109375, -3.8485107421875, -3.71417236328125, -3.579833984375, -3.44549560546875, -3.3111572265625, -3.17681884765625, -3.04248046875, -2.90814208984375, -2.7738037109375, -2.63946533203125, -2.505126953125, -2.37078857421875, -2.2364501953125, -2.10211181640625, -1.9677734375, -1.83343505859375, -1.6990966796875, -1.56475830078125, -1.430419921875, -1.29608154296875, -1.1617431640625, -1.02740478515625, -0.89306640625, -0.75872802734375, -0.6243896484375, -0.49005126953125, -0.355712890625, -0.22137451171875, -0.0870361328125, 0.04730224609375, 0.181640625, 0.31597900390625, 0.4503173828125, 0.58465576171875, 0.718994140625, 0.85333251953125, 0.9876708984375, 1.12200927734375, 1.25634765625, 1.39068603515625, 1.5250244140625, 1.65936279296875, 1.793701171875, 1.92803955078125, 2.0623779296875, 2.19671630859375, 2.3310546875, 2.46539306640625, 2.5997314453125, 2.73406982421875, 2.868408203125, 3.00274658203125, 3.1370849609375, 3.27142333984375, 3.40576171875, 3.54010009765625, 3.6744384765625, 3.80877685546875, 3.943115234375, 4.07745361328125, 4.2117919921875, 4.34613037109375, 4.48046875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 7.0, 4.0, 2.0, 4.0, 6.0, 14.0, 8.0, 6.0, 14.0, 23.0, 21.0, 29.0, 48.0, 42.0, 63.0, 84.0, 96.0, 88.0, 76.0, 79.0, 56.0, 64.0, 30.0, 29.0, 21.0, 16.0, 13.0, 11.0, 9.0, 8.0, 5.0, 6.0, 6.0, 3.0, 1.0, 3.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.8544921875, -1.8017730712890625, -1.749053955078125, -1.6963348388671875, -1.64361572265625, -1.5908966064453125, -1.538177490234375, -1.4854583740234375, -1.4327392578125, -1.3800201416015625, -1.327301025390625, -1.2745819091796875, -1.22186279296875, -1.1691436767578125, -1.116424560546875, -1.0637054443359375, -1.010986328125, -0.9582672119140625, -0.905548095703125, -0.8528289794921875, -0.80010986328125, -0.7473907470703125, -0.694671630859375, -0.6419525146484375, -0.5892333984375, -0.5365142822265625, -0.483795166015625, -0.4310760498046875, -0.37835693359375, -0.3256378173828125, -0.272918701171875, -0.2201995849609375, -0.16748046875, -0.1147613525390625, -0.062042236328125, -0.0093231201171875, 0.04339599609375, 0.0961151123046875, 0.148834228515625, 0.2015533447265625, 0.2542724609375, 0.3069915771484375, 0.359710693359375, 0.4124298095703125, 0.46514892578125, 0.5178680419921875, 0.570587158203125, 0.6233062744140625, 0.676025390625, 0.7287445068359375, 0.781463623046875, 0.8341827392578125, 0.88690185546875, 0.9396209716796875, 0.992340087890625, 1.0450592041015625, 1.0977783203125, 1.1504974365234375, 1.203216552734375, 1.2559356689453125, 1.30865478515625, 1.3613739013671875, 1.414093017578125, 1.4668121337890625, 1.51953125]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 4.0, 9.0, 13.0, 9.0, 12.0, 11.0, 26.0, 32.0, 25.0, 24.0, 34.0, 32.0, 29.0, 29.0, 38.0, 43.0, 42.0, 61.0, 34.0, 45.0, 37.0, 52.0, 36.0, 37.0, 37.0, 33.0, 33.0, 25.0, 22.0, 20.0, 19.0, 16.0, 14.0, 15.0, 6.0, 7.0, 8.0, 6.0, 7.0, 5.0, 4.0, 5.0, 0.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.369163513183594, -19.670391082763672, -18.971620559692383, -18.27284812927246, -17.574077606201172, -16.87530517578125, -16.176532745361328, -15.477762222290039, -14.778990745544434, -14.080219268798828, -13.381447792053223, -12.682676315307617, -11.983903884887695, -11.285133361816406, -10.586360931396484, -9.887589454650879, -9.188817977905273, -8.490046501159668, -7.7912750244140625, -7.092503070831299, -6.393731594085693, -5.694960117340088, -4.996188163757324, -4.297416687011719, -3.5986452102661133, -2.899873733520508, -2.2011020183563232, -1.5023303031921387, -0.8035588264465332, -0.10478734970092773, 0.5939846038818359, 1.2927560806274414, 1.991525650024414, 2.6902971267700195, 3.389068841934204, 4.087840557098389, 4.786612033843994, 5.4853835105896, 6.184155464172363, 6.882926940917969, 7.581698417663574, 8.28046989440918, 8.979241371154785, 9.67801284790039, 10.376785278320312, 11.075555801391602, 11.774328231811523, 12.473099708557129, 13.171871185302734, 13.87064266204834, 14.569414138793945, 15.268186569213867, 15.966957092285156, 16.665729522705078, 17.364501953125, 18.06327247619629, 18.762042999267578, 19.4608154296875, 20.15958595275879, 20.85835838317871, 21.55712890625, 22.255901336669922, 22.954673767089844, 23.653444290161133, 24.352216720581055]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 6.0, 4.0, 2.0, 3.0, 5.0, 1.0, 5.0, 3.0, 8.0, 5.0, 11.0, 8.0, 13.0, 10.0, 16.0, 14.0, 20.0, 15.0, 33.0, 29.0, 26.0, 26.0, 34.0, 33.0, 40.0, 31.0, 31.0, 32.0, 40.0, 44.0, 34.0, 36.0, 37.0, 35.0, 29.0, 34.0, 28.0, 30.0, 24.0, 28.0, 27.0, 20.0, 19.0, 10.0, 9.0, 8.0, 6.0, 9.0, 8.0, 10.0, 6.0, 8.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-20.63979721069336, -19.99089813232422, -19.341999053955078, -18.69310188293457, -18.04420280456543, -17.39530372619629, -16.74640464782715, -16.097505569458008, -15.448607444763184, -14.799708366394043, -14.150810241699219, -13.501911163330078, -12.853012084960938, -12.204113960266113, -11.555214881896973, -10.906316757202148, -10.257417678833008, -9.608518600463867, -8.959620475769043, -8.310721397399902, -7.66182279586792, -7.0129241943359375, -6.364025115966797, -5.7151265144348145, -5.066227912902832, -4.41732931137085, -3.768430471420288, -3.1195316314697266, -2.470633029937744, -1.8217344284057617, -1.1728355884552002, -0.5239367485046387, 0.12496376037597656, 0.7738624811172485, 1.4227612018585205, 2.071660041809082, 2.7205586433410645, 3.369457244873047, 4.0183563232421875, 4.66725492477417, 5.316153526306152, 5.965052127838135, 6.613950729370117, 7.262849807739258, 7.91174840927124, 8.560647010803223, 9.209546089172363, 9.858444213867188, 10.507343292236328, 11.156242370605469, 11.805140495300293, 12.454039573669434, 13.102937698364258, 13.751836776733398, 14.400735855102539, 15.04963493347168, 15.698533058166504, 16.347431182861328, 16.99633026123047, 17.64522933959961, 18.29412841796875, 18.94302749633789, 19.5919246673584, 20.24082374572754, 20.88972282409668]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 12.0, 16.0, 18.0, 32.0, 51.0, 77.0, 147.0, 210.0, 328.0, 591.0, 1044.0, 1664.0, 2795.0, 4839.0, 8296.0, 14311.0, 23361.0, 38083.0, 59542.0, 85895.0, 113654.0, 133382.0, 137721.0, 124883.0, 100596.0, 72545.0, 48857.0, 30631.0, 18537.0, 10942.0, 6348.0, 3674.0, 2200.0, 1322.0, 732.0, 473.0, 277.0, 184.0, 109.0, 75.0, 42.0, 27.0, 18.0, 8.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.96875, -19.308837890625, -18.64892578125, -17.989013671875, -17.3291015625, -16.669189453125, -16.00927734375, -15.349365234375, -14.689453125, -14.029541015625, -13.36962890625, -12.709716796875, -12.0498046875, -11.389892578125, -10.72998046875, -10.070068359375, -9.41015625, -8.750244140625, -8.09033203125, -7.430419921875, -6.7705078125, -6.110595703125, -5.45068359375, -4.790771484375, -4.130859375, -3.470947265625, -2.81103515625, -2.151123046875, -1.4912109375, -0.831298828125, -0.17138671875, 0.488525390625, 1.1484375, 1.808349609375, 2.46826171875, 3.128173828125, 3.7880859375, 4.447998046875, 5.10791015625, 5.767822265625, 6.427734375, 7.087646484375, 7.74755859375, 8.407470703125, 9.0673828125, 9.727294921875, 10.38720703125, 11.047119140625, 11.70703125, 12.366943359375, 13.02685546875, 13.686767578125, 14.3466796875, 15.006591796875, 15.66650390625, 16.326416015625, 16.986328125, 17.646240234375, 18.30615234375, 18.966064453125, 19.6259765625, 20.285888671875, 20.94580078125, 21.605712890625, 22.265625]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 1.0, 6.0, 4.0, 7.0, 8.0, 4.0, 9.0, 10.0, 9.0, 22.0, 19.0, 17.0, 25.0, 25.0, 29.0, 37.0, 34.0, 32.0, 44.0, 33.0, 36.0, 42.0, 34.0, 40.0, 35.0, 47.0, 32.0, 36.0, 35.0, 36.0, 36.0, 40.0, 21.0, 14.0, 21.0, 17.0, 17.0, 13.0, 12.0, 11.0, 12.0, 9.0, 5.0, 5.0, 7.0, 2.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 4.0], "bins": [-22.546875, -21.88330078125, -21.2197265625, -20.55615234375, -19.892578125, -19.22900390625, -18.5654296875, -17.90185546875, -17.23828125, -16.57470703125, -15.9111328125, -15.24755859375, -14.583984375, -13.92041015625, -13.2568359375, -12.59326171875, -11.9296875, -11.26611328125, -10.6025390625, -9.93896484375, -9.275390625, -8.61181640625, -7.9482421875, -7.28466796875, -6.62109375, -5.95751953125, -5.2939453125, -4.63037109375, -3.966796875, -3.30322265625, -2.6396484375, -1.97607421875, -1.3125, -0.64892578125, 0.0146484375, 0.67822265625, 1.341796875, 2.00537109375, 2.6689453125, 3.33251953125, 3.99609375, 4.65966796875, 5.3232421875, 5.98681640625, 6.650390625, 7.31396484375, 7.9775390625, 8.64111328125, 9.3046875, 9.96826171875, 10.6318359375, 11.29541015625, 11.958984375, 12.62255859375, 13.2861328125, 13.94970703125, 14.61328125, 15.27685546875, 15.9404296875, 16.60400390625, 17.267578125, 17.93115234375, 18.5947265625, 19.25830078125, 19.921875]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 14.0, 22.0, 39.0, 31.0, 56.0, 102.0, 148.0, 309.0, 461.0, 717.0, 1130.0, 1743.0, 2802.0, 4355.0, 6649.0, 10375.0, 15408.0, 22760.0, 32659.0, 45653.0, 61364.0, 78227.0, 93059.0, 104137.0, 107137.0, 102113.0, 90238.0, 74437.0, 57166.0, 42782.0, 30390.0, 20939.0, 14483.0, 9598.0, 6225.0, 4001.0, 2453.0, 1630.0, 1059.0, 650.0, 407.0, 246.0, 159.0, 87.0, 55.0, 28.0, 21.0, 9.0, 13.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-18.5, -17.891357421875, -17.28271484375, -16.674072265625, -16.0654296875, -15.456787109375, -14.84814453125, -14.239501953125, -13.630859375, -13.022216796875, -12.41357421875, -11.804931640625, -11.1962890625, -10.587646484375, -9.97900390625, -9.370361328125, -8.76171875, -8.153076171875, -7.54443359375, -6.935791015625, -6.3271484375, -5.718505859375, -5.10986328125, -4.501220703125, -3.892578125, -3.283935546875, -2.67529296875, -2.066650390625, -1.4580078125, -0.849365234375, -0.24072265625, 0.367919921875, 0.9765625, 1.585205078125, 2.19384765625, 2.802490234375, 3.4111328125, 4.019775390625, 4.62841796875, 5.237060546875, 5.845703125, 6.454345703125, 7.06298828125, 7.671630859375, 8.2802734375, 8.888916015625, 9.49755859375, 10.106201171875, 10.71484375, 11.323486328125, 11.93212890625, 12.540771484375, 13.1494140625, 13.758056640625, 14.36669921875, 14.975341796875, 15.583984375, 16.192626953125, 16.80126953125, 17.409912109375, 18.0185546875, 18.627197265625, 19.23583984375, 19.844482421875, 20.453125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 5.0, 8.0, 8.0, 10.0, 10.0, 18.0, 5.0, 14.0, 27.0, 19.0, 16.0, 18.0, 28.0, 36.0, 31.0, 25.0, 37.0, 42.0, 30.0, 43.0, 42.0, 39.0, 40.0, 38.0, 38.0, 32.0, 31.0, 37.0, 41.0, 27.0, 27.0, 26.0, 24.0, 23.0, 16.0, 19.0, 13.0, 6.0, 8.0, 10.0, 11.0, 5.0, 6.0, 3.0, 6.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0], "bins": [-13.9765625, -13.52734375, -13.078125, -12.62890625, -12.1796875, -11.73046875, -11.28125, -10.83203125, -10.3828125, -9.93359375, -9.484375, -9.03515625, -8.5859375, -8.13671875, -7.6875, -7.23828125, -6.7890625, -6.33984375, -5.890625, -5.44140625, -4.9921875, -4.54296875, -4.09375, -3.64453125, -3.1953125, -2.74609375, -2.296875, -1.84765625, -1.3984375, -0.94921875, -0.5, -0.05078125, 0.3984375, 0.84765625, 1.296875, 1.74609375, 2.1953125, 2.64453125, 3.09375, 3.54296875, 3.9921875, 4.44140625, 4.890625, 5.33984375, 5.7890625, 6.23828125, 6.6875, 7.13671875, 7.5859375, 8.03515625, 8.484375, 8.93359375, 9.3828125, 9.83203125, 10.28125, 10.73046875, 11.1796875, 11.62890625, 12.078125, 12.52734375, 12.9765625, 13.42578125, 13.875, 14.32421875, 14.7734375]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 5.0, 4.0, 2.0, 9.0, 7.0, 11.0, 21.0, 28.0, 48.0, 74.0, 127.0, 151.0, 262.0, 377.0, 633.0, 1034.0, 1738.0, 2727.0, 4662.0, 8005.0, 13841.0, 24036.0, 40053.0, 64442.0, 96362.0, 129017.0, 149970.0, 147479.0, 124033.0, 90094.0, 59827.0, 36882.0, 21777.0, 12620.0, 7377.0, 4172.0, 2597.0, 1521.0, 912.0, 578.0, 364.0, 235.0, 164.0, 102.0, 61.0, 34.0, 25.0, 20.0, 11.0, 8.0, 7.0, 6.0, 8.0, 4.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.01171875, -4.83837890625, -4.6650390625, -4.49169921875, -4.318359375, -4.14501953125, -3.9716796875, -3.79833984375, -3.625, -3.45166015625, -3.2783203125, -3.10498046875, -2.931640625, -2.75830078125, -2.5849609375, -2.41162109375, -2.23828125, -2.06494140625, -1.8916015625, -1.71826171875, -1.544921875, -1.37158203125, -1.1982421875, -1.02490234375, -0.8515625, -0.67822265625, -0.5048828125, -0.33154296875, -0.158203125, 0.01513671875, 0.1884765625, 0.36181640625, 0.53515625, 0.70849609375, 0.8818359375, 1.05517578125, 1.228515625, 1.40185546875, 1.5751953125, 1.74853515625, 1.921875, 2.09521484375, 2.2685546875, 2.44189453125, 2.615234375, 2.78857421875, 2.9619140625, 3.13525390625, 3.30859375, 3.48193359375, 3.6552734375, 3.82861328125, 4.001953125, 4.17529296875, 4.3486328125, 4.52197265625, 4.6953125, 4.86865234375, 5.0419921875, 5.21533203125, 5.388671875, 5.56201171875, 5.7353515625, 5.90869140625, 6.08203125]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 4.0, 8.0, 3.0, 5.0, 11.0, 10.0, 8.0, 9.0, 20.0, 26.0, 21.0, 28.0, 21.0, 28.0, 39.0, 48.0, 31.0, 55.0, 48.0, 46.0, 48.0, 53.0, 55.0, 46.0, 51.0, 37.0, 41.0, 36.0, 33.0, 27.0, 18.0, 14.0, 19.0, 10.0, 12.0, 12.0, 5.0, 4.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0005631446838378906, -0.0005464404821395874, -0.0005297362804412842, -0.000513032078742981, -0.0004963278770446777, -0.0004796236753463745, -0.0004629194736480713, -0.00044621527194976807, -0.00042951107025146484, -0.0004128068685531616, -0.0003961026668548584, -0.0003793984651565552, -0.00036269426345825195, -0.00034599006175994873, -0.0003292858600616455, -0.0003125816583633423, -0.00029587745666503906, -0.00027917325496673584, -0.0002624690532684326, -0.0002457648515701294, -0.00022906064987182617, -0.00021235644817352295, -0.00019565224647521973, -0.0001789480447769165, -0.00016224384307861328, -0.00014553964138031006, -0.00012883543968200684, -0.00011213123798370361, -9.542703628540039e-05, -7.872283458709717e-05, -6.201863288879395e-05, -4.531443119049072e-05, -2.86102294921875e-05, -1.1906027793884277e-05, 4.798173904418945e-06, 2.1502375602722168e-05, 3.820657730102539e-05, 5.491077899932861e-05, 7.161498069763184e-05, 8.831918239593506e-05, 0.00010502338409423828, 0.0001217275857925415, 0.00013843178749084473, 0.00015513598918914795, 0.00017184019088745117, 0.0001885443925857544, 0.00020524859428405762, 0.00022195279598236084, 0.00023865699768066406, 0.0002553611993789673, 0.0002720654010772705, 0.00028876960277557373, 0.00030547380447387695, 0.0003221780061721802, 0.0003388822078704834, 0.0003555864095687866, 0.00037229061126708984, 0.00038899481296539307, 0.0004056990146636963, 0.0004224032163619995, 0.00043910741806030273, 0.00045581161975860596, 0.0004725158214569092, 0.0004892200231552124, 0.0005059242248535156]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 3.0, 10.0, 11.0, 12.0, 20.0, 34.0, 74.0, 90.0, 152.0, 267.0, 420.0, 688.0, 1136.0, 1791.0, 2802.0, 4755.0, 7436.0, 12010.0, 19527.0, 30149.0, 44807.0, 64915.0, 86927.0, 107605.0, 121824.0, 124203.0, 112713.0, 92432.0, 70103.0, 49952.0, 33754.0, 21928.0, 13757.0, 8420.0, 5410.0, 3205.0, 1923.0, 1278.0, 758.0, 501.0, 281.0, 184.0, 99.0, 66.0, 50.0, 23.0, 24.0, 16.0, 7.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.74609375, -4.60284423828125, -4.4595947265625, -4.31634521484375, -4.173095703125, -4.02984619140625, -3.8865966796875, -3.74334716796875, -3.60009765625, -3.45684814453125, -3.3135986328125, -3.17034912109375, -3.027099609375, -2.88385009765625, -2.7406005859375, -2.59735107421875, -2.4541015625, -2.31085205078125, -2.1676025390625, -2.02435302734375, -1.881103515625, -1.73785400390625, -1.5946044921875, -1.45135498046875, -1.30810546875, -1.16485595703125, -1.0216064453125, -0.87835693359375, -0.735107421875, -0.59185791015625, -0.4486083984375, -0.30535888671875, -0.162109375, -0.01885986328125, 0.1243896484375, 0.26763916015625, 0.410888671875, 0.55413818359375, 0.6973876953125, 0.84063720703125, 0.98388671875, 1.12713623046875, 1.2703857421875, 1.41363525390625, 1.556884765625, 1.70013427734375, 1.8433837890625, 1.98663330078125, 2.1298828125, 2.27313232421875, 2.4163818359375, 2.55963134765625, 2.702880859375, 2.84613037109375, 2.9893798828125, 3.13262939453125, 3.27587890625, 3.41912841796875, 3.5623779296875, 3.70562744140625, 3.848876953125, 3.99212646484375, 4.1353759765625, 4.27862548828125, 4.421875]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 5.0, 5.0, 10.0, 13.0, 18.0, 14.0, 30.0, 29.0, 25.0, 40.0, 39.0, 50.0, 54.0, 52.0, 73.0, 54.0, 68.0, 67.0, 46.0, 55.0, 39.0, 32.0, 30.0, 34.0, 27.0, 22.0, 20.0, 11.0, 8.0, 9.0, 9.0, 3.0, 6.0, 3.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-2.9765625, -2.9020843505859375, -2.827606201171875, -2.7531280517578125, -2.67864990234375, -2.6041717529296875, -2.529693603515625, -2.4552154541015625, -2.3807373046875, -2.3062591552734375, -2.231781005859375, -2.1573028564453125, -2.08282470703125, -2.0083465576171875, -1.933868408203125, -1.8593902587890625, -1.784912109375, -1.7104339599609375, -1.635955810546875, -1.5614776611328125, -1.48699951171875, -1.4125213623046875, -1.338043212890625, -1.2635650634765625, -1.1890869140625, -1.1146087646484375, -1.040130615234375, -0.9656524658203125, -0.89117431640625, -0.8166961669921875, -0.742218017578125, -0.6677398681640625, -0.59326171875, -0.5187835693359375, -0.444305419921875, -0.3698272705078125, -0.29534912109375, -0.2208709716796875, -0.146392822265625, -0.0719146728515625, 0.0025634765625, 0.0770416259765625, 0.151519775390625, 0.2259979248046875, 0.30047607421875, 0.3749542236328125, 0.449432373046875, 0.5239105224609375, 0.598388671875, 0.6728668212890625, 0.747344970703125, 0.8218231201171875, 0.89630126953125, 0.9707794189453125, 1.045257568359375, 1.1197357177734375, 1.1942138671875, 1.2686920166015625, 1.343170166015625, 1.4176483154296875, 1.49212646484375, 1.5666046142578125, 1.641082763671875, 1.7155609130859375, 1.7900390625]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 3.0, 6.0, 3.0, 12.0, 8.0, 17.0, 17.0, 19.0, 13.0, 19.0, 19.0, 19.0, 38.0, 24.0, 38.0, 37.0, 34.0, 48.0, 45.0, 42.0, 50.0, 46.0, 43.0, 40.0, 39.0, 39.0, 43.0, 33.0, 40.0, 27.0, 16.0, 19.0, 22.0, 17.0, 8.0, 8.0, 11.0, 14.0, 6.0, 4.0, 4.0, 5.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-21.251632690429688, -20.585906982421875, -19.920183181762695, -19.254457473754883, -18.588733673095703, -17.92300796508789, -17.25728416442871, -16.5915584564209, -15.925833702087402, -15.260108947753906, -14.59438419342041, -13.928659439086914, -13.262933731079102, -12.597209930419922, -11.93148422241211, -11.265759468078613, -10.600034713745117, -9.934309959411621, -9.268585205078125, -8.602860450744629, -7.937135219573975, -7.2714104652404785, -6.605685234069824, -5.939960479736328, -5.274235725402832, -4.608510971069336, -3.9427859783172607, -3.2770609855651855, -2.6113362312316895, -1.9456114768981934, -1.2798864841461182, -0.614161491394043, 0.05156517028808594, 0.7172900438308716, 1.3830149173736572, 2.0487399101257324, 2.7144646644592285, 3.3801894187927246, 4.045914649963379, 4.711639404296875, 5.377364158630371, 6.043088912963867, 6.708813667297363, 7.374538898468018, 8.040264129638672, 8.705987930297852, 9.371713638305664, 10.03743839263916, 10.703163146972656, 11.368887901306152, 12.034612655639648, 12.700337409973145, 13.36606216430664, 14.031787872314453, 14.69751262664795, 15.363237380981445, 16.028961181640625, 16.694686889648438, 17.360410690307617, 18.02613639831543, 18.69186019897461, 19.357585906982422, 20.0233097076416, 20.689035415649414, 21.354761123657227]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 3.0, 3.0, 4.0, 7.0, 6.0, 5.0, 9.0, 10.0, 10.0, 14.0, 10.0, 23.0, 24.0, 26.0, 19.0, 28.0, 36.0, 32.0, 40.0, 42.0, 40.0, 40.0, 31.0, 39.0, 36.0, 34.0, 42.0, 37.0, 41.0, 38.0, 41.0, 32.0, 25.0, 30.0, 18.0, 21.0, 14.0, 24.0, 10.0, 12.0, 11.0, 6.0, 10.0, 8.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-24.7653751373291, -24.02655601501465, -23.287736892700195, -22.548917770385742, -21.810096740722656, -21.071277618408203, -20.33245849609375, -19.593639373779297, -18.854820251464844, -18.11600112915039, -17.377182006835938, -16.638362884521484, -15.899542808532715, -15.160723686218262, -14.421903610229492, -13.683084487915039, -12.944265365600586, -12.205446243286133, -11.46662712097168, -10.72780704498291, -9.988987922668457, -9.250168800354004, -8.511348724365234, -7.772529602050781, -7.033710479736328, -6.294891357421875, -5.556071758270264, -4.817252159118652, -4.078433036804199, -3.339613676071167, -2.6007943153381348, -1.8619747161865234, -1.1231536865234375, -0.3843343257904053, 0.35448503494262695, 1.0933043956756592, 1.8321237564086914, 2.5709431171417236, 3.309762477874756, 4.048582077026367, 4.78740119934082, 5.526220321655273, 6.265039920806885, 7.003859519958496, 7.742678642272949, 8.481497764587402, 9.220317840576172, 9.959136962890625, 10.697956085205078, 11.436775207519531, 12.175594329833984, 12.914414405822754, 13.653233528137207, 14.39205265045166, 15.13087272644043, 15.869691848754883, 16.608510971069336, 17.34733009338379, 18.086149215698242, 18.824968338012695, 19.56378936767578, 20.302608489990234, 21.041427612304688, 21.78024673461914, 22.519065856933594]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 8.0, 12.0, 15.0, 31.0, 52.0, 67.0, 153.0, 255.0, 355.0, 614.0, 1019.0, 1538.0, 2530.0, 4083.0, 6750.0, 10562.0, 17110.0, 27698.0, 43928.0, 71077.0, 110780.0, 170863.0, 253181.0, 349052.0, 444258.0, 509210.0, 515828.0, 466010.0, 376856.0, 278874.0, 191128.0, 126022.0, 81140.0, 50968.0, 31437.0, 19793.0, 11808.0, 7426.0, 4469.0, 2781.0, 1761.0, 1056.0, 661.0, 431.0, 219.0, 175.0, 97.0, 57.0, 40.0, 21.0, 14.0, 13.0, 3.0, 0.0, 4.0, 3.0, 1.0], "bins": [-15.0546875, -14.6004638671875, -14.146240234375, -13.6920166015625, -13.23779296875, -12.7835693359375, -12.329345703125, -11.8751220703125, -11.4208984375, -10.9666748046875, -10.512451171875, -10.0582275390625, -9.60400390625, -9.1497802734375, -8.695556640625, -8.2413330078125, -7.787109375, -7.3328857421875, -6.878662109375, -6.4244384765625, -5.97021484375, -5.5159912109375, -5.061767578125, -4.6075439453125, -4.1533203125, -3.6990966796875, -3.244873046875, -2.7906494140625, -2.33642578125, -1.8822021484375, -1.427978515625, -0.9737548828125, -0.51953125, -0.0653076171875, 0.388916015625, 0.8431396484375, 1.29736328125, 1.7515869140625, 2.205810546875, 2.6600341796875, 3.1142578125, 3.5684814453125, 4.022705078125, 4.4769287109375, 4.93115234375, 5.3853759765625, 5.839599609375, 6.2938232421875, 6.748046875, 7.2022705078125, 7.656494140625, 8.1107177734375, 8.56494140625, 9.0191650390625, 9.473388671875, 9.9276123046875, 10.3818359375, 10.8360595703125, 11.290283203125, 11.7445068359375, 12.19873046875, 12.6529541015625, 13.107177734375, 13.5614013671875, 14.015625]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 4.0, 5.0, 2.0, 3.0, 11.0, 5.0, 8.0, 7.0, 4.0, 13.0, 21.0, 13.0, 21.0, 21.0, 24.0, 26.0, 23.0, 26.0, 29.0, 40.0, 49.0, 43.0, 34.0, 36.0, 40.0, 33.0, 39.0, 42.0, 37.0, 34.0, 41.0, 40.0, 30.0, 28.0, 21.0, 31.0, 12.0, 20.0, 12.0, 13.0, 13.0, 14.0, 8.0, 5.0, 7.0, 4.0, 3.0, 6.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-18.0, -17.450927734375, -16.90185546875, -16.352783203125, -15.8037109375, -15.254638671875, -14.70556640625, -14.156494140625, -13.607421875, -13.058349609375, -12.50927734375, -11.960205078125, -11.4111328125, -10.862060546875, -10.31298828125, -9.763916015625, -9.21484375, -8.665771484375, -8.11669921875, -7.567626953125, -7.0185546875, -6.469482421875, -5.92041015625, -5.371337890625, -4.822265625, -4.273193359375, -3.72412109375, -3.175048828125, -2.6259765625, -2.076904296875, -1.52783203125, -0.978759765625, -0.4296875, 0.119384765625, 0.66845703125, 1.217529296875, 1.7666015625, 2.315673828125, 2.86474609375, 3.413818359375, 3.962890625, 4.511962890625, 5.06103515625, 5.610107421875, 6.1591796875, 6.708251953125, 7.25732421875, 7.806396484375, 8.35546875, 8.904541015625, 9.45361328125, 10.002685546875, 10.5517578125, 11.100830078125, 11.64990234375, 12.198974609375, 12.748046875, 13.297119140625, 13.84619140625, 14.395263671875, 14.9443359375, 15.493408203125, 16.04248046875, 16.591552734375, 17.140625]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 10.0, 19.0, 44.0, 59.0, 104.0, 161.0, 251.0, 413.0, 728.0, 1290.0, 2318.0, 3802.0, 6410.0, 10924.0, 18424.0, 29631.0, 49008.0, 77156.0, 119453.0, 178615.0, 255114.0, 344095.0, 426808.0, 486279.0, 494435.0, 452859.0, 373803.0, 284768.0, 203380.0, 137911.0, 89778.0, 56996.0, 35715.0, 21517.0, 13334.0, 7812.0, 4494.0, 2575.0, 1570.0, 868.0, 567.0, 331.0, 200.0, 96.0, 69.0, 39.0, 28.0, 10.0, 7.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0], "bins": [-16.03125, -15.5479736328125, -15.064697265625, -14.5814208984375, -14.09814453125, -13.6148681640625, -13.131591796875, -12.6483154296875, -12.1650390625, -11.6817626953125, -11.198486328125, -10.7152099609375, -10.23193359375, -9.7486572265625, -9.265380859375, -8.7821044921875, -8.298828125, -7.8155517578125, -7.332275390625, -6.8489990234375, -6.36572265625, -5.8824462890625, -5.399169921875, -4.9158935546875, -4.4326171875, -3.9493408203125, -3.466064453125, -2.9827880859375, -2.49951171875, -2.0162353515625, -1.532958984375, -1.0496826171875, -0.56640625, -0.0831298828125, 0.400146484375, 0.8834228515625, 1.36669921875, 1.8499755859375, 2.333251953125, 2.8165283203125, 3.2998046875, 3.7830810546875, 4.266357421875, 4.7496337890625, 5.23291015625, 5.7161865234375, 6.199462890625, 6.6827392578125, 7.166015625, 7.6492919921875, 8.132568359375, 8.6158447265625, 9.09912109375, 9.5823974609375, 10.065673828125, 10.5489501953125, 11.0322265625, 11.5155029296875, 11.998779296875, 12.4820556640625, 12.96533203125, 13.4486083984375, 13.931884765625, 14.4151611328125, 14.8984375]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 8.0, 3.0, 13.0, 13.0, 18.0, 21.0, 30.0, 36.0, 46.0, 50.0, 66.0, 86.0, 85.0, 130.0, 123.0, 155.0, 164.0, 184.0, 197.0, 228.0, 203.0, 252.0, 213.0, 225.0, 215.0, 167.0, 161.0, 168.0, 128.0, 115.0, 114.0, 80.0, 76.0, 70.0, 53.0, 47.0, 35.0, 19.0, 16.0, 16.0, 14.0, 6.0, 6.0, 6.0, 5.0, 3.0, 4.0, 4.0, 4.0, 0.0, 1.0, 2.0], "bins": [-8.171875, -7.9261474609375, -7.680419921875, -7.4346923828125, -7.18896484375, -6.9432373046875, -6.697509765625, -6.4517822265625, -6.2060546875, -5.9603271484375, -5.714599609375, -5.4688720703125, -5.22314453125, -4.9774169921875, -4.731689453125, -4.4859619140625, -4.240234375, -3.9945068359375, -3.748779296875, -3.5030517578125, -3.25732421875, -3.0115966796875, -2.765869140625, -2.5201416015625, -2.2744140625, -2.0286865234375, -1.782958984375, -1.5372314453125, -1.29150390625, -1.0457763671875, -0.800048828125, -0.5543212890625, -0.30859375, -0.0628662109375, 0.182861328125, 0.4285888671875, 0.67431640625, 0.9200439453125, 1.165771484375, 1.4114990234375, 1.6572265625, 1.9029541015625, 2.148681640625, 2.3944091796875, 2.64013671875, 2.8858642578125, 3.131591796875, 3.3773193359375, 3.623046875, 3.8687744140625, 4.114501953125, 4.3602294921875, 4.60595703125, 4.8516845703125, 5.097412109375, 5.3431396484375, 5.5888671875, 5.8345947265625, 6.080322265625, 6.3260498046875, 6.57177734375, 6.8175048828125, 7.063232421875, 7.3089599609375, 7.5546875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 6.0, 5.0, 8.0, 13.0, 10.0, 10.0, 11.0, 14.0, 19.0, 16.0, 23.0, 20.0, 25.0, 29.0, 23.0, 36.0, 41.0, 33.0, 28.0, 42.0, 46.0, 32.0, 35.0, 39.0, 47.0, 31.0, 35.0, 30.0, 20.0, 26.0, 33.0, 28.0, 24.0, 21.0, 15.0, 20.0, 22.0, 8.0, 7.0, 5.0, 8.0, 11.0, 9.0, 2.0, 6.0, 7.0, 7.0, 3.0, 1.0, 3.0, 7.0, 2.0, 2.0], "bins": [-16.19312858581543, -15.700928688049316, -15.208728790283203, -14.71652889251709, -14.224328994750977, -13.732129096984863, -13.23992919921875, -12.747729301452637, -12.255529403686523, -11.76332950592041, -11.271129608154297, -10.778929710388184, -10.28672981262207, -9.794529914855957, -9.302330017089844, -8.81013011932373, -8.317930221557617, -7.825730323791504, -7.333530426025391, -6.841330528259277, -6.349130630493164, -5.856930732727051, -5.3647308349609375, -4.872530937194824, -4.380331039428711, -3.8881311416625977, -3.3959312438964844, -2.903731346130371, -2.411531448364258, -1.9193315505981445, -1.4271316528320312, -0.934931755065918, -0.4427328109741211, 0.04946708679199219, 0.5416669845581055, 1.0338668823242188, 1.526066780090332, 2.0182666778564453, 2.5104665756225586, 3.002666473388672, 3.494866371154785, 3.9870662689208984, 4.479266166687012, 4.971466064453125, 5.463665962219238, 5.955865859985352, 6.448065757751465, 6.940265655517578, 7.432465553283691, 7.924665451049805, 8.416865348815918, 8.909065246582031, 9.401265144348145, 9.893465042114258, 10.385664939880371, 10.877864837646484, 11.370064735412598, 11.862264633178711, 12.354464530944824, 12.846664428710938, 13.33886432647705, 13.831064224243164, 14.323264122009277, 14.81546401977539, 15.307663917541504]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 4.0, 2.0, 3.0, 6.0, 0.0, 2.0, 10.0, 5.0, 6.0, 7.0, 5.0, 8.0, 10.0, 18.0, 14.0, 23.0, 16.0, 20.0, 23.0, 31.0, 22.0, 28.0, 32.0, 34.0, 43.0, 21.0, 37.0, 50.0, 32.0, 35.0, 40.0, 42.0, 33.0, 40.0, 33.0, 33.0, 26.0, 29.0, 25.0, 33.0, 21.0, 20.0, 16.0, 11.0, 12.0, 13.0, 11.0, 9.0, 4.0, 5.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0], "bins": [-19.54261589050293, -18.945056915283203, -18.347496032714844, -17.749937057495117, -17.15237808227539, -16.55481719970703, -15.957258224487305, -15.359699249267578, -14.762139320373535, -14.164579391479492, -13.567020416259766, -12.969460487365723, -12.37190055847168, -11.774341583251953, -11.17678165435791, -10.579221725463867, -9.98166275024414, -9.384102821350098, -8.786543846130371, -8.188983917236328, -7.591424465179443, -6.993865013122559, -6.396305084228516, -5.798745632171631, -5.201186180114746, -4.603626728057861, -4.006067276000977, -3.4085073471069336, -2.810947895050049, -2.213388442993164, -1.6158287525177002, -1.0182690620422363, -0.4207115173339844, 0.17684805393218994, 0.7744076251983643, 1.3719671964645386, 1.969526767730713, 2.5670862197875977, 3.1646459102630615, 3.7622056007385254, 4.35976505279541, 4.957324504852295, 5.55488395690918, 6.152443885803223, 6.750003337860107, 7.347562789916992, 7.945122718811035, 8.542682647705078, 9.140241622924805, 9.737801551818848, 10.335360527038574, 10.932920455932617, 11.530479431152344, 12.128039360046387, 12.72559928894043, 13.323158264160156, 13.9207181930542, 14.518278121948242, 15.115837097167969, 15.713397026062012, 16.310956954956055, 16.90851593017578, 17.506074905395508, 18.103635787963867, 18.701194763183594]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 5.0, 5.0, 11.0, 9.0, 26.0, 19.0, 30.0, 54.0, 67.0, 93.0, 126.0, 198.0, 282.0, 440.0, 636.0, 977.0, 1537.0, 2483.0, 4162.0, 7036.0, 12238.0, 22190.0, 40413.0, 73920.0, 128360.0, 191655.0, 206083.0, 151071.0, 90521.0, 50024.0, 27316.0, 15030.0, 8399.0, 4974.0, 2906.0, 1824.0, 1094.0, 791.0, 491.0, 319.0, 223.0, 167.0, 110.0, 74.0, 54.0, 45.0, 20.0, 21.0, 16.0, 6.0, 7.0, 6.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.234375, -9.883544921875, -9.53271484375, -9.181884765625, -8.8310546875, -8.480224609375, -8.12939453125, -7.778564453125, -7.427734375, -7.076904296875, -6.72607421875, -6.375244140625, -6.0244140625, -5.673583984375, -5.32275390625, -4.971923828125, -4.62109375, -4.270263671875, -3.91943359375, -3.568603515625, -3.2177734375, -2.866943359375, -2.51611328125, -2.165283203125, -1.814453125, -1.463623046875, -1.11279296875, -0.761962890625, -0.4111328125, -0.060302734375, 0.29052734375, 0.641357421875, 0.9921875, 1.343017578125, 1.69384765625, 2.044677734375, 2.3955078125, 2.746337890625, 3.09716796875, 3.447998046875, 3.798828125, 4.149658203125, 4.50048828125, 4.851318359375, 5.2021484375, 5.552978515625, 5.90380859375, 6.254638671875, 6.60546875, 6.956298828125, 7.30712890625, 7.657958984375, 8.0087890625, 8.359619140625, 8.71044921875, 9.061279296875, 9.412109375, 9.762939453125, 10.11376953125, 10.464599609375, 10.8154296875, 11.166259765625, 11.51708984375, 11.867919921875, 12.21875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 3.0, 5.0, 3.0, 3.0, 9.0, 7.0, 9.0, 7.0, 12.0, 11.0, 15.0, 24.0, 19.0, 23.0, 24.0, 26.0, 24.0, 34.0, 33.0, 37.0, 30.0, 33.0, 44.0, 35.0, 40.0, 58.0, 41.0, 34.0, 46.0, 35.0, 36.0, 28.0, 32.0, 25.0, 29.0, 21.0, 16.0, 18.0, 20.0, 10.0, 11.0, 9.0, 6.0, 7.0, 5.0, 3.0, 3.0, 6.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-20.515625, -19.885009765625, -19.25439453125, -18.623779296875, -17.9931640625, -17.362548828125, -16.73193359375, -16.101318359375, -15.470703125, -14.840087890625, -14.20947265625, -13.578857421875, -12.9482421875, -12.317626953125, -11.68701171875, -11.056396484375, -10.42578125, -9.795166015625, -9.16455078125, -8.533935546875, -7.9033203125, -7.272705078125, -6.64208984375, -6.011474609375, -5.380859375, -4.750244140625, -4.11962890625, -3.489013671875, -2.8583984375, -2.227783203125, -1.59716796875, -0.966552734375, -0.3359375, 0.294677734375, 0.92529296875, 1.555908203125, 2.1865234375, 2.817138671875, 3.44775390625, 4.078369140625, 4.708984375, 5.339599609375, 5.97021484375, 6.600830078125, 7.2314453125, 7.862060546875, 8.49267578125, 9.123291015625, 9.75390625, 10.384521484375, 11.01513671875, 11.645751953125, 12.2763671875, 12.906982421875, 13.53759765625, 14.168212890625, 14.798828125, 15.429443359375, 16.06005859375, 16.690673828125, 17.3212890625, 17.951904296875, 18.58251953125, 19.213134765625, 19.84375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 2.0, 2.0, 4.0, 9.0, 8.0, 13.0, 14.0, 37.0, 30.0, 53.0, 81.0, 113.0, 180.0, 225.0, 375.0, 556.0, 904.0, 1525.0, 2741.0, 5482.0, 12152.0, 33178.0, 100862.0, 276421.0, 356530.0, 167130.0, 54593.0, 18797.0, 7632.0, 3653.0, 1950.0, 1162.0, 689.0, 479.0, 294.0, 212.0, 144.0, 100.0, 69.0, 47.0, 31.0, 23.0, 21.0, 11.0, 10.0, 5.0, 5.0, 3.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.671875, -12.29052734375, -11.9091796875, -11.52783203125, -11.146484375, -10.76513671875, -10.3837890625, -10.00244140625, -9.62109375, -9.23974609375, -8.8583984375, -8.47705078125, -8.095703125, -7.71435546875, -7.3330078125, -6.95166015625, -6.5703125, -6.18896484375, -5.8076171875, -5.42626953125, -5.044921875, -4.66357421875, -4.2822265625, -3.90087890625, -3.51953125, -3.13818359375, -2.7568359375, -2.37548828125, -1.994140625, -1.61279296875, -1.2314453125, -0.85009765625, -0.46875, -0.08740234375, 0.2939453125, 0.67529296875, 1.056640625, 1.43798828125, 1.8193359375, 2.20068359375, 2.58203125, 2.96337890625, 3.3447265625, 3.72607421875, 4.107421875, 4.48876953125, 4.8701171875, 5.25146484375, 5.6328125, 6.01416015625, 6.3955078125, 6.77685546875, 7.158203125, 7.53955078125, 7.9208984375, 8.30224609375, 8.68359375, 9.06494140625, 9.4462890625, 9.82763671875, 10.208984375, 10.59033203125, 10.9716796875, 11.35302734375, 11.734375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 6.0, 6.0, 3.0, 6.0, 4.0, 8.0, 13.0, 12.0, 11.0, 16.0, 23.0, 26.0, 33.0, 24.0, 28.0, 36.0, 32.0, 42.0, 41.0, 35.0, 51.0, 50.0, 49.0, 37.0, 41.0, 35.0, 37.0, 27.0, 31.0, 36.0, 36.0, 29.0, 24.0, 20.0, 18.0, 8.0, 15.0, 18.0, 9.0, 7.0, 10.0, 6.0, 5.0, 4.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.5703125, -14.0848388671875, -13.599365234375, -13.1138916015625, -12.62841796875, -12.1429443359375, -11.657470703125, -11.1719970703125, -10.6865234375, -10.2010498046875, -9.715576171875, -9.2301025390625, -8.74462890625, -8.2591552734375, -7.773681640625, -7.2882080078125, -6.802734375, -6.3172607421875, -5.831787109375, -5.3463134765625, -4.86083984375, -4.3753662109375, -3.889892578125, -3.4044189453125, -2.9189453125, -2.4334716796875, -1.947998046875, -1.4625244140625, -0.97705078125, -0.4915771484375, -0.006103515625, 0.4793701171875, 0.96484375, 1.4503173828125, 1.935791015625, 2.4212646484375, 2.90673828125, 3.3922119140625, 3.877685546875, 4.3631591796875, 4.8486328125, 5.3341064453125, 5.819580078125, 6.3050537109375, 6.79052734375, 7.2760009765625, 7.761474609375, 8.2469482421875, 8.732421875, 9.2178955078125, 9.703369140625, 10.1888427734375, 10.67431640625, 11.1597900390625, 11.645263671875, 12.1307373046875, 12.6162109375, 13.1016845703125, 13.587158203125, 14.0726318359375, 14.55810546875, 15.0435791015625, 15.529052734375, 16.0145263671875, 16.5]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 5.0, 6.0, 7.0, 14.0, 14.0, 27.0, 31.0, 45.0, 66.0, 77.0, 120.0, 162.0, 244.0, 407.0, 660.0, 1070.0, 1776.0, 3260.0, 6447.0, 14348.0, 37689.0, 124540.0, 457610.0, 282364.0, 71732.0, 24660.0, 10176.0, 4865.0, 2427.0, 1372.0, 750.0, 502.0, 314.0, 199.0, 139.0, 101.0, 69.0, 61.0, 56.0, 42.0, 31.0, 24.0, 14.0, 12.0, 9.0, 9.0, 5.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.50390625, -5.33074951171875, -5.1575927734375, -4.98443603515625, -4.811279296875, -4.63812255859375, -4.4649658203125, -4.29180908203125, -4.11865234375, -3.94549560546875, -3.7723388671875, -3.59918212890625, -3.426025390625, -3.25286865234375, -3.0797119140625, -2.90655517578125, -2.7333984375, -2.56024169921875, -2.3870849609375, -2.21392822265625, -2.040771484375, -1.86761474609375, -1.6944580078125, -1.52130126953125, -1.34814453125, -1.17498779296875, -1.0018310546875, -0.82867431640625, -0.655517578125, -0.48236083984375, -0.3092041015625, -0.13604736328125, 0.037109375, 0.21026611328125, 0.3834228515625, 0.55657958984375, 0.729736328125, 0.90289306640625, 1.0760498046875, 1.24920654296875, 1.42236328125, 1.59552001953125, 1.7686767578125, 1.94183349609375, 2.114990234375, 2.28814697265625, 2.4613037109375, 2.63446044921875, 2.8076171875, 2.98077392578125, 3.1539306640625, 3.32708740234375, 3.500244140625, 3.67340087890625, 3.8465576171875, 4.01971435546875, 4.19287109375, 4.36602783203125, 4.5391845703125, 4.71234130859375, 4.885498046875, 5.05865478515625, 5.2318115234375, 5.40496826171875, 5.578125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 2.0, 0.0, 4.0, 5.0, 8.0, 8.0, 8.0, 9.0, 19.0, 17.0, 24.0, 29.0, 27.0, 29.0, 53.0, 67.0, 93.0, 95.0, 77.0, 77.0, 59.0, 61.0, 46.0, 33.0, 30.0, 21.0, 20.0, 17.0, 10.0, 7.0, 13.0, 9.0, 8.0, 2.0, 3.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0007414817810058594, -0.0007174909114837646, -0.0006935000419616699, -0.0006695091724395752, -0.0006455183029174805, -0.0006215274333953857, -0.000597536563873291, -0.0005735456943511963, -0.0005495548248291016, -0.0005255639553070068, -0.0005015730857849121, -0.0004775822162628174, -0.00045359134674072266, -0.00042960047721862793, -0.0004056096076965332, -0.0003816187381744385, -0.00035762786865234375, -0.000333636999130249, -0.0003096461296081543, -0.00028565526008605957, -0.00026166439056396484, -0.00023767352104187012, -0.0002136826515197754, -0.00018969178199768066, -0.00016570091247558594, -0.0001417100429534912, -0.00011771917343139648, -9.372830390930176e-05, -6.973743438720703e-05, -4.5746564865112305e-05, -2.1755695343017578e-05, 2.2351741790771484e-06, 2.6226043701171875e-05, 5.02169132232666e-05, 7.420778274536133e-05, 9.819865226745605e-05, 0.00012218952178955078, 0.0001461803913116455, 0.00017017126083374023, 0.00019416213035583496, 0.0002181529998779297, 0.00024214386940002441, 0.00026613473892211914, 0.00029012560844421387, 0.0003141164779663086, 0.0003381073474884033, 0.00036209821701049805, 0.0003860890865325928, 0.0004100799560546875, 0.0004340708255767822, 0.00045806169509887695, 0.0004820525646209717, 0.0005060434341430664, 0.0005300343036651611, 0.0005540251731872559, 0.0005780160427093506, 0.0006020069122314453, 0.00062599778175354, 0.0006499886512756348, 0.0006739795207977295, 0.0006979703903198242, 0.0007219612598419189, 0.0007459521293640137, 0.0007699429988861084, 0.0007939338684082031]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 10.0, 7.0, 14.0, 21.0, 13.0, 37.0, 46.0, 75.0, 119.0, 152.0, 220.0, 352.0, 561.0, 910.0, 1584.0, 2749.0, 4867.0, 10047.0, 20338.0, 43204.0, 96357.0, 219802.0, 324894.0, 176550.0, 76519.0, 34800.0, 16373.0, 8038.0, 4128.0, 2259.0, 1267.0, 798.0, 502.0, 305.0, 201.0, 140.0, 76.0, 60.0, 46.0, 33.0, 25.0, 14.0, 5.0, 13.0, 9.0, 8.0, 2.0, 8.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.578125, -5.358154296875, -5.13818359375, -4.918212890625, -4.6982421875, -4.478271484375, -4.25830078125, -4.038330078125, -3.818359375, -3.598388671875, -3.37841796875, -3.158447265625, -2.9384765625, -2.718505859375, -2.49853515625, -2.278564453125, -2.05859375, -1.838623046875, -1.61865234375, -1.398681640625, -1.1787109375, -0.958740234375, -0.73876953125, -0.518798828125, -0.298828125, -0.078857421875, 0.14111328125, 0.361083984375, 0.5810546875, 0.801025390625, 1.02099609375, 1.240966796875, 1.4609375, 1.680908203125, 1.90087890625, 2.120849609375, 2.3408203125, 2.560791015625, 2.78076171875, 3.000732421875, 3.220703125, 3.440673828125, 3.66064453125, 3.880615234375, 4.1005859375, 4.320556640625, 4.54052734375, 4.760498046875, 4.98046875, 5.200439453125, 5.42041015625, 5.640380859375, 5.8603515625, 6.080322265625, 6.30029296875, 6.520263671875, 6.740234375, 6.960205078125, 7.18017578125, 7.400146484375, 7.6201171875, 7.840087890625, 8.06005859375, 8.280029296875, 8.5]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 10.0, 7.0, 14.0, 17.0, 25.0, 16.0, 27.0, 27.0, 28.0, 51.0, 51.0, 54.0, 62.0, 73.0, 60.0, 63.0, 51.0, 68.0, 67.0, 41.0, 43.0, 22.0, 23.0, 23.0, 18.0, 17.0, 11.0, 8.0, 5.0, 4.0, 3.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.451171875, -1.391754150390625, -1.33233642578125, -1.272918701171875, -1.2135009765625, -1.154083251953125, -1.09466552734375, -1.035247802734375, -0.975830078125, -0.916412353515625, -0.85699462890625, -0.797576904296875, -0.7381591796875, -0.678741455078125, -0.61932373046875, -0.559906005859375, -0.50048828125, -0.441070556640625, -0.38165283203125, -0.322235107421875, -0.2628173828125, -0.203399658203125, -0.14398193359375, -0.084564208984375, -0.025146484375, 0.034271240234375, 0.09368896484375, 0.153106689453125, 0.2125244140625, 0.271942138671875, 0.33135986328125, 0.390777587890625, 0.4501953125, 0.509613037109375, 0.56903076171875, 0.628448486328125, 0.6878662109375, 0.747283935546875, 0.80670166015625, 0.866119384765625, 0.925537109375, 0.984954833984375, 1.04437255859375, 1.103790283203125, 1.1632080078125, 1.222625732421875, 1.28204345703125, 1.341461181640625, 1.40087890625, 1.460296630859375, 1.51971435546875, 1.579132080078125, 1.6385498046875, 1.697967529296875, 1.75738525390625, 1.816802978515625, 1.876220703125, 1.935638427734375, 1.99505615234375, 2.054473876953125, 2.1138916015625, 2.173309326171875, 2.23272705078125, 2.292144775390625, 2.3515625]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 3.0, 2.0, 5.0, 3.0, 7.0, 10.0, 12.0, 14.0, 10.0, 16.0, 17.0, 22.0, 16.0, 28.0, 24.0, 21.0, 32.0, 34.0, 35.0, 42.0, 40.0, 43.0, 48.0, 43.0, 42.0, 34.0, 23.0, 49.0, 34.0, 30.0, 29.0, 39.0, 28.0, 19.0, 21.0, 20.0, 15.0, 10.0, 17.0, 9.0, 7.0, 7.0, 10.0, 4.0, 5.0, 6.0, 4.0, 9.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-16.254413604736328, -15.745338439941406, -15.236262321472168, -14.727187156677246, -14.218111991882324, -13.709035873413086, -13.199960708618164, -12.690885543823242, -12.18181037902832, -11.672735214233398, -11.16365909576416, -10.654583930969238, -10.145508766174316, -9.636432647705078, -9.127357482910156, -8.618282318115234, -8.109206199645996, -7.600130558013916, -7.091055393218994, -6.581979751586914, -6.072904586791992, -5.563828945159912, -5.054753303527832, -4.54567813873291, -4.03660249710083, -3.527527093887329, -3.018451690673828, -2.509376049041748, -2.000300645828247, -1.491225242614746, -0.982149600982666, -0.47307419776916504, 0.03600120544433594, 0.5450766682624817, 1.0541521310806274, 1.563227653503418, 2.072303056716919, 2.58137845993042, 3.0904541015625, 3.599529504776001, 4.108604907989502, 4.617680549621582, 5.126755714416504, 5.635831356048584, 6.144906997680664, 6.653982162475586, 7.163057804107666, 7.672133445739746, 8.181208610534668, 8.69028377532959, 9.199359893798828, 9.70843505859375, 10.217510223388672, 10.726585388183594, 11.235661506652832, 11.744736671447754, 12.253812789916992, 12.762887954711914, 13.271964073181152, 13.781039237976074, 14.290114402770996, 14.799190521240234, 15.308265686035156, 15.817340850830078, 16.326416015625]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 0.0, 5.0, 2.0, 4.0, 2.0, 1.0, 7.0, 9.0, 3.0, 8.0, 6.0, 8.0, 9.0, 11.0, 13.0, 24.0, 16.0, 23.0, 20.0, 23.0, 21.0, 37.0, 23.0, 25.0, 47.0, 26.0, 39.0, 41.0, 40.0, 32.0, 37.0, 38.0, 31.0, 37.0, 29.0, 37.0, 37.0, 17.0, 30.0, 33.0, 26.0, 20.0, 13.0, 21.0, 11.0, 17.0, 7.0, 13.0, 7.0, 6.0, 3.0, 5.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0], "bins": [-18.023099899291992, -17.46468734741211, -16.90627670288086, -16.347864151000977, -15.789453506469727, -15.231040954589844, -14.672629356384277, -14.114217758178711, -13.555806159973145, -12.997394561767578, -12.438982963562012, -11.880571365356445, -11.322158813476562, -10.763748168945312, -10.20533561706543, -9.646924018859863, -9.088512420654297, -8.53010082244873, -7.971689224243164, -7.4132771492004395, -6.854865550994873, -6.296453952789307, -5.738041877746582, -5.179630279541016, -4.621218681335449, -4.062807083129883, -3.5043952465057373, -2.945983409881592, -2.3875718116760254, -1.829160213470459, -1.2707483768463135, -0.712336540222168, -0.15392303466796875, 0.4044886827468872, 0.9629004001617432, 1.5213121175765991, 2.079723834991455, 2.6381354331970215, 3.196547269821167, 3.7549591064453125, 4.313370704650879, 4.871782302856445, 5.430193901062012, 5.988605976104736, 6.547017574310303, 7.105429172515869, 7.663841247558594, 8.22225284576416, 8.780664443969727, 9.339076042175293, 9.89748764038086, 10.455899238586426, 11.014310836791992, 11.572723388671875, 12.131134986877441, 12.689546585083008, 13.247958183288574, 13.80636978149414, 14.364781379699707, 14.923192977905273, 15.481605529785156, 16.040016174316406, 16.59842872619629, 17.156841278076172, 17.715251922607422]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [5.0, 4.0, 13.0, 12.0, 25.0, 28.0, 38.0, 68.0, 93.0, 161.0, 203.0, 336.0, 482.0, 785.0, 1142.0, 1689.0, 2632.0, 3669.0, 5444.0, 8058.0, 11409.0, 16397.0, 22710.0, 30831.0, 41287.0, 52788.0, 64949.0, 76636.0, 86695.0, 91736.0, 91483.0, 86891.0, 77615.0, 66313.0, 53829.0, 42144.0, 31857.0, 23496.0, 16870.0, 11938.0, 8260.0, 5632.0, 3901.0, 2647.0, 1835.0, 1198.0, 791.0, 530.0, 351.0, 205.0, 169.0, 118.0, 63.0, 29.0, 32.0, 24.0, 10.0, 13.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.9921875, -10.6263427734375, -10.260498046875, -9.8946533203125, -9.52880859375, -9.1629638671875, -8.797119140625, -8.4312744140625, -8.0654296875, -7.6995849609375, -7.333740234375, -6.9678955078125, -6.60205078125, -6.2362060546875, -5.870361328125, -5.5045166015625, -5.138671875, -4.7728271484375, -4.406982421875, -4.0411376953125, -3.67529296875, -3.3094482421875, -2.943603515625, -2.5777587890625, -2.2119140625, -1.8460693359375, -1.480224609375, -1.1143798828125, -0.74853515625, -0.3826904296875, -0.016845703125, 0.3489990234375, 0.71484375, 1.0806884765625, 1.446533203125, 1.8123779296875, 2.17822265625, 2.5440673828125, 2.909912109375, 3.2757568359375, 3.6416015625, 4.0074462890625, 4.373291015625, 4.7391357421875, 5.10498046875, 5.4708251953125, 5.836669921875, 6.2025146484375, 6.568359375, 6.9342041015625, 7.300048828125, 7.6658935546875, 8.03173828125, 8.3975830078125, 8.763427734375, 9.1292724609375, 9.4951171875, 9.8609619140625, 10.226806640625, 10.5926513671875, 10.95849609375, 11.3243408203125, 11.690185546875, 12.0560302734375, 12.421875]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 2.0, 5.0, 4.0, 11.0, 8.0, 12.0, 7.0, 9.0, 13.0, 13.0, 14.0, 18.0, 22.0, 24.0, 24.0, 29.0, 41.0, 28.0, 27.0, 36.0, 34.0, 35.0, 42.0, 42.0, 47.0, 32.0, 31.0, 30.0, 31.0, 34.0, 40.0, 31.0, 38.0, 16.0, 19.0, 23.0, 17.0, 14.0, 16.0, 12.0, 11.0, 15.0, 10.0, 4.0, 7.0, 6.0, 8.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-17.5625, -17.0107421875, -16.458984375, -15.9072265625, -15.35546875, -14.8037109375, -14.251953125, -13.7001953125, -13.1484375, -12.5966796875, -12.044921875, -11.4931640625, -10.94140625, -10.3896484375, -9.837890625, -9.2861328125, -8.734375, -8.1826171875, -7.630859375, -7.0791015625, -6.52734375, -5.9755859375, -5.423828125, -4.8720703125, -4.3203125, -3.7685546875, -3.216796875, -2.6650390625, -2.11328125, -1.5615234375, -1.009765625, -0.4580078125, 0.09375, 0.6455078125, 1.197265625, 1.7490234375, 2.30078125, 2.8525390625, 3.404296875, 3.9560546875, 4.5078125, 5.0595703125, 5.611328125, 6.1630859375, 6.71484375, 7.2666015625, 7.818359375, 8.3701171875, 8.921875, 9.4736328125, 10.025390625, 10.5771484375, 11.12890625, 11.6806640625, 12.232421875, 12.7841796875, 13.3359375, 13.8876953125, 14.439453125, 14.9912109375, 15.54296875, 16.0947265625, 16.646484375, 17.1982421875, 17.75]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 5.0, 6.0, 12.0, 9.0, 30.0, 27.0, 59.0, 90.0, 132.0, 203.0, 349.0, 546.0, 830.0, 1332.0, 2156.0, 3304.0, 5241.0, 8106.0, 12514.0, 18827.0, 28025.0, 40125.0, 55617.0, 73233.0, 90695.0, 104478.0, 111087.0, 108531.0, 96725.0, 80446.0, 62988.0, 45932.0, 32790.0, 22266.0, 14991.0, 9693.0, 6216.0, 4094.0, 2480.0, 1573.0, 1016.0, 643.0, 429.0, 276.0, 142.0, 102.0, 66.0, 56.0, 31.0, 12.0, 14.0, 2.0, 4.0, 3.0, 2.0, 0.0, 2.0], "bins": [-16.59375, -16.1014404296875, -15.609130859375, -15.1168212890625, -14.62451171875, -14.1322021484375, -13.639892578125, -13.1475830078125, -12.6552734375, -12.1629638671875, -11.670654296875, -11.1783447265625, -10.68603515625, -10.1937255859375, -9.701416015625, -9.2091064453125, -8.716796875, -8.2244873046875, -7.732177734375, -7.2398681640625, -6.74755859375, -6.2552490234375, -5.762939453125, -5.2706298828125, -4.7783203125, -4.2860107421875, -3.793701171875, -3.3013916015625, -2.80908203125, -2.3167724609375, -1.824462890625, -1.3321533203125, -0.83984375, -0.3475341796875, 0.144775390625, 0.6370849609375, 1.12939453125, 1.6217041015625, 2.114013671875, 2.6063232421875, 3.0986328125, 3.5909423828125, 4.083251953125, 4.5755615234375, 5.06787109375, 5.5601806640625, 6.052490234375, 6.5447998046875, 7.037109375, 7.5294189453125, 8.021728515625, 8.5140380859375, 9.00634765625, 9.4986572265625, 9.990966796875, 10.4832763671875, 10.9755859375, 11.4678955078125, 11.960205078125, 12.4525146484375, 12.94482421875, 13.4371337890625, 13.929443359375, 14.4217529296875, 14.9140625]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 4.0, 4.0, 12.0, 12.0, 9.0, 9.0, 16.0, 29.0, 20.0, 24.0, 29.0, 31.0, 36.0, 25.0, 35.0, 42.0, 35.0, 48.0, 44.0, 38.0, 56.0, 33.0, 37.0, 39.0, 33.0, 41.0, 30.0, 26.0, 38.0, 31.0, 20.0, 21.0, 16.0, 19.0, 16.0, 2.0, 6.0, 13.0, 7.0, 6.0, 2.0, 6.0, 3.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.75, -11.322998046875, -10.89599609375, -10.468994140625, -10.0419921875, -9.614990234375, -9.18798828125, -8.760986328125, -8.333984375, -7.906982421875, -7.47998046875, -7.052978515625, -6.6259765625, -6.198974609375, -5.77197265625, -5.344970703125, -4.91796875, -4.490966796875, -4.06396484375, -3.636962890625, -3.2099609375, -2.782958984375, -2.35595703125, -1.928955078125, -1.501953125, -1.074951171875, -0.64794921875, -0.220947265625, 0.2060546875, 0.633056640625, 1.06005859375, 1.487060546875, 1.9140625, 2.341064453125, 2.76806640625, 3.195068359375, 3.6220703125, 4.049072265625, 4.47607421875, 4.903076171875, 5.330078125, 5.757080078125, 6.18408203125, 6.611083984375, 7.0380859375, 7.465087890625, 7.89208984375, 8.319091796875, 8.74609375, 9.173095703125, 9.60009765625, 10.027099609375, 10.4541015625, 10.881103515625, 11.30810546875, 11.735107421875, 12.162109375, 12.589111328125, 13.01611328125, 13.443115234375, 13.8701171875, 14.297119140625, 14.72412109375, 15.151123046875, 15.578125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 2.0, 10.0, 3.0, 4.0, 6.0, 20.0, 23.0, 32.0, 49.0, 89.0, 119.0, 183.0, 299.0, 421.0, 657.0, 1008.0, 1638.0, 2721.0, 4690.0, 7942.0, 13619.0, 23264.0, 39727.0, 65676.0, 99924.0, 134706.0, 155722.0, 151254.0, 122685.0, 86842.0, 55147.0, 33095.0, 19196.0, 11162.0, 6535.0, 3862.0, 2239.0, 1450.0, 875.0, 566.0, 364.0, 247.0, 179.0, 101.0, 73.0, 47.0, 35.0, 25.0, 12.0, 11.0, 2.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.640625, -5.45147705078125, -5.2623291015625, -5.07318115234375, -4.884033203125, -4.69488525390625, -4.5057373046875, -4.31658935546875, -4.12744140625, -3.93829345703125, -3.7491455078125, -3.55999755859375, -3.370849609375, -3.18170166015625, -2.9925537109375, -2.80340576171875, -2.6142578125, -2.42510986328125, -2.2359619140625, -2.04681396484375, -1.857666015625, -1.66851806640625, -1.4793701171875, -1.29022216796875, -1.10107421875, -0.91192626953125, -0.7227783203125, -0.53363037109375, -0.344482421875, -0.15533447265625, 0.0338134765625, 0.22296142578125, 0.412109375, 0.60125732421875, 0.7904052734375, 0.97955322265625, 1.168701171875, 1.35784912109375, 1.5469970703125, 1.73614501953125, 1.92529296875, 2.11444091796875, 2.3035888671875, 2.49273681640625, 2.681884765625, 2.87103271484375, 3.0601806640625, 3.24932861328125, 3.4384765625, 3.62762451171875, 3.8167724609375, 4.00592041015625, 4.195068359375, 4.38421630859375, 4.5733642578125, 4.76251220703125, 4.95166015625, 5.14080810546875, 5.3299560546875, 5.51910400390625, 5.708251953125, 5.89739990234375, 6.0865478515625, 6.27569580078125, 6.46484375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 5.0, 3.0, 3.0, 2.0, 4.0, 18.0, 13.0, 14.0, 13.0, 17.0, 25.0, 25.0, 30.0, 27.0, 54.0, 44.0, 30.0, 53.0, 43.0, 47.0, 46.0, 37.0, 53.0, 43.0, 51.0, 39.0, 35.0, 29.0, 33.0, 24.0, 19.0, 25.0, 16.0, 20.0, 9.0, 12.0, 8.0, 8.0, 6.0, 5.0, 3.0, 3.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0005345344543457031, -0.0005172118544578552, -0.0004998892545700073, -0.0004825666546821594, -0.0004652440547943115, -0.0004479214549064636, -0.0004305988550186157, -0.0004132762551307678, -0.0003959536552429199, -0.000378631055355072, -0.0003613084554672241, -0.0003439858555793762, -0.0003266632556915283, -0.0003093406558036804, -0.0002920180559158325, -0.0002746954560279846, -0.0002573728561401367, -0.00024005025625228882, -0.00022272765636444092, -0.00020540505647659302, -0.00018808245658874512, -0.00017075985670089722, -0.00015343725681304932, -0.00013611465692520142, -0.00011879205703735352, -0.00010146945714950562, -8.414685726165771e-05, -6.682425737380981e-05, -4.9501657485961914e-05, -3.2179057598114014e-05, -1.4856457710266113e-05, 2.466142177581787e-06, 1.9788742065429688e-05, 3.711134195327759e-05, 5.443394184112549e-05, 7.175654172897339e-05, 8.907914161682129e-05, 0.00010640174150466919, 0.0001237243413925171, 0.000141046941280365, 0.0001583695411682129, 0.0001756921410560608, 0.0001930147409439087, 0.0002103373408317566, 0.0002276599407196045, 0.0002449825406074524, 0.0002623051404953003, 0.0002796277403831482, 0.0002969503402709961, 0.000314272940158844, 0.0003315955400466919, 0.0003489181399345398, 0.0003662407398223877, 0.0003835633397102356, 0.0004008859395980835, 0.0004182085394859314, 0.0004355311393737793, 0.0004528537392616272, 0.0004701763391494751, 0.000487498939037323, 0.0005048215389251709, 0.0005221441388130188, 0.0005394667387008667, 0.0005567893385887146, 0.0005741119384765625]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 10.0, 24.0, 29.0, 58.0, 114.0, 196.0, 388.0, 683.0, 1407.0, 2685.0, 5292.0, 10330.0, 19820.0, 37460.0, 65606.0, 105353.0, 146545.0, 169817.0, 161828.0, 127273.0, 85165.0, 50311.0, 28059.0, 14584.0, 7540.0, 3886.0, 1922.0, 1015.0, 509.0, 295.0, 175.0, 80.0, 52.0, 21.0, 9.0, 7.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.125, -5.919189453125, -5.71337890625, -5.507568359375, -5.3017578125, -5.095947265625, -4.89013671875, -4.684326171875, -4.478515625, -4.272705078125, -4.06689453125, -3.861083984375, -3.6552734375, -3.449462890625, -3.24365234375, -3.037841796875, -2.83203125, -2.626220703125, -2.42041015625, -2.214599609375, -2.0087890625, -1.802978515625, -1.59716796875, -1.391357421875, -1.185546875, -0.979736328125, -0.77392578125, -0.568115234375, -0.3623046875, -0.156494140625, 0.04931640625, 0.255126953125, 0.4609375, 0.666748046875, 0.87255859375, 1.078369140625, 1.2841796875, 1.489990234375, 1.69580078125, 1.901611328125, 2.107421875, 2.313232421875, 2.51904296875, 2.724853515625, 2.9306640625, 3.136474609375, 3.34228515625, 3.548095703125, 3.75390625, 3.959716796875, 4.16552734375, 4.371337890625, 4.5771484375, 4.782958984375, 4.98876953125, 5.194580078125, 5.400390625, 5.606201171875, 5.81201171875, 6.017822265625, 6.2236328125, 6.429443359375, 6.63525390625, 6.841064453125, 7.046875]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 3.0, 5.0, 5.0, 7.0, 7.0, 14.0, 14.0, 20.0, 21.0, 21.0, 21.0, 23.0, 29.0, 27.0, 33.0, 34.0, 33.0, 52.0, 46.0, 37.0, 50.0, 29.0, 50.0, 45.0, 34.0, 39.0, 41.0, 33.0, 36.0, 27.0, 20.0, 23.0, 23.0, 19.0, 13.0, 15.0, 7.0, 7.0, 10.0, 6.0, 4.0, 3.0, 7.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.8115234375, -1.75238037109375, -1.6932373046875, -1.63409423828125, -1.574951171875, -1.51580810546875, -1.4566650390625, -1.39752197265625, -1.33837890625, -1.27923583984375, -1.2200927734375, -1.16094970703125, -1.101806640625, -1.04266357421875, -0.9835205078125, -0.92437744140625, -0.865234375, -0.80609130859375, -0.7469482421875, -0.68780517578125, -0.628662109375, -0.56951904296875, -0.5103759765625, -0.45123291015625, -0.39208984375, -0.33294677734375, -0.2738037109375, -0.21466064453125, -0.155517578125, -0.09637451171875, -0.0372314453125, 0.02191162109375, 0.0810546875, 0.14019775390625, 0.1993408203125, 0.25848388671875, 0.317626953125, 0.37677001953125, 0.4359130859375, 0.49505615234375, 0.55419921875, 0.61334228515625, 0.6724853515625, 0.73162841796875, 0.790771484375, 0.84991455078125, 0.9090576171875, 0.96820068359375, 1.02734375, 1.08648681640625, 1.1456298828125, 1.20477294921875, 1.263916015625, 1.32305908203125, 1.3822021484375, 1.44134521484375, 1.50048828125, 1.55963134765625, 1.6187744140625, 1.67791748046875, 1.737060546875, 1.79620361328125, 1.8553466796875, 1.91448974609375, 1.9736328125]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 1.0, 3.0, 1.0, 6.0, 5.0, 2.0, 8.0, 7.0, 13.0, 12.0, 13.0, 15.0, 12.0, 20.0, 21.0, 31.0, 24.0, 40.0, 31.0, 29.0, 37.0, 32.0, 37.0, 34.0, 36.0, 49.0, 39.0, 41.0, 34.0, 33.0, 30.0, 30.0, 44.0, 29.0, 35.0, 24.0, 27.0, 20.0, 16.0, 14.0, 12.0, 6.0, 7.0, 9.0, 11.0, 9.0, 3.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-16.05389976501465, -15.5481595993042, -15.042420387268066, -14.536680221557617, -14.030940055847168, -13.525199890136719, -13.019460678100586, -12.513720512390137, -12.007980346679688, -11.502240180969238, -10.996500968933105, -10.490760803222656, -9.985020637512207, -9.479280471801758, -8.973541259765625, -8.467801094055176, -7.962061882019043, -7.456322193145752, -6.950582027435303, -6.444842338562012, -5.9391021728515625, -5.4333624839782715, -4.9276227951049805, -4.421882629394531, -3.9161429405212402, -3.41040301322937, -2.9046630859375, -2.398923397064209, -1.8931834697723389, -1.3874435424804688, -0.8817038536071777, -0.3759639263153076, 0.1297760009765625, 0.6355158686637878, 1.1412557363510132, 1.6469955444335938, 2.152735471725464, 2.658475399017334, 3.164215087890625, 3.669955015182495, 4.175694942474365, 4.681434631347656, 5.1871747970581055, 5.6929144859313965, 6.1986541748046875, 6.704394340515137, 7.210134029388428, 7.715873718261719, 8.221613883972168, 8.727354049682617, 9.23309326171875, 9.7388334274292, 10.244573593139648, 10.750312805175781, 11.25605297088623, 11.76179313659668, 12.267532348632812, 12.773272514343262, 13.279011726379395, 13.784751892089844, 14.290492057800293, 14.796232223510742, 15.301971435546875, 15.807711601257324, 16.313451766967773]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 2.0, 6.0, 2.0, 5.0, 5.0, 7.0, 12.0, 10.0, 13.0, 17.0, 21.0, 23.0, 29.0, 34.0, 23.0, 38.0, 44.0, 38.0, 29.0, 35.0, 44.0, 51.0, 30.0, 49.0, 50.0, 43.0, 41.0, 37.0, 38.0, 34.0, 35.0, 29.0, 25.0, 16.0, 21.0, 12.0, 10.0, 10.0, 4.0, 5.0, 10.0, 6.0, 7.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-23.502573013305664, -22.80191421508789, -22.101255416870117, -21.400596618652344, -20.69993782043457, -19.999279022216797, -19.298622131347656, -18.597963333129883, -17.89730453491211, -17.196645736694336, -16.495986938476562, -15.795328140258789, -15.094670295715332, -14.394011497497559, -13.693352699279785, -12.992694854736328, -12.292035102844238, -11.591376304626465, -10.890717506408691, -10.190059661865234, -9.489400863647461, -8.788742065429688, -8.088083267211914, -7.387424945831299, -6.686766147613525, -5.986107349395752, -5.285449028015137, -4.584790229797363, -3.884131669998169, -3.1834731101989746, -2.482814311981201, -1.782155990600586, -1.0814971923828125, -0.3808385729789734, 0.3198200464248657, 1.0204787254333496, 1.721137285232544, 2.4217958450317383, 3.1224546432495117, 3.823112964630127, 4.5237717628479, 5.224430561065674, 5.925088882446289, 6.6257476806640625, 7.326406478881836, 8.02706527709961, 8.727724075317383, 9.42838191986084, 10.129040718078613, 10.829699516296387, 11.53035831451416, 12.231016159057617, 12.93167495727539, 13.632333755493164, 14.332992553710938, 15.033651351928711, 15.734310150146484, 16.434968948364258, 17.13562774658203, 17.836286544799805, 18.536945343017578, 19.23760223388672, 19.938262939453125, 20.638919830322266, 21.33957862854004]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [2.0, 7.0, 5.0, 10.0, 15.0, 25.0, 44.0, 93.0, 136.0, 224.0, 419.0, 667.0, 1155.0, 1975.0, 3418.0, 6007.0, 10591.0, 18634.0, 33088.0, 57899.0, 98267.0, 164404.0, 258805.0, 377733.0, 502103.0, 580568.0, 576183.0, 494413.0, 373236.0, 251456.0, 158074.0, 95210.0, 55161.0, 31918.0, 18138.0, 10345.0, 5913.0, 3354.0, 1984.0, 1101.0, 599.0, 373.0, 233.0, 120.0, 87.0, 52.0, 26.0, 12.0, 4.0, 6.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.2421875, -11.7708740234375, -11.299560546875, -10.8282470703125, -10.35693359375, -9.8856201171875, -9.414306640625, -8.9429931640625, -8.4716796875, -8.0003662109375, -7.529052734375, -7.0577392578125, -6.58642578125, -6.1151123046875, -5.643798828125, -5.1724853515625, -4.701171875, -4.2298583984375, -3.758544921875, -3.2872314453125, -2.81591796875, -2.3446044921875, -1.873291015625, -1.4019775390625, -0.9306640625, -0.4593505859375, 0.011962890625, 0.4832763671875, 0.95458984375, 1.4259033203125, 1.897216796875, 2.3685302734375, 2.83984375, 3.3111572265625, 3.782470703125, 4.2537841796875, 4.72509765625, 5.1964111328125, 5.667724609375, 6.1390380859375, 6.6103515625, 7.0816650390625, 7.552978515625, 8.0242919921875, 8.49560546875, 8.9669189453125, 9.438232421875, 9.9095458984375, 10.380859375, 10.8521728515625, 11.323486328125, 11.7947998046875, 12.26611328125, 12.7374267578125, 13.208740234375, 13.6800537109375, 14.1513671875, 14.6226806640625, 15.093994140625, 15.5653076171875, 16.03662109375, 16.5079345703125, 16.979248046875, 17.4505615234375, 17.921875]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 4.0, 3.0, 7.0, 3.0, 7.0, 13.0, 12.0, 10.0, 15.0, 16.0, 23.0, 32.0, 39.0, 32.0, 26.0, 36.0, 39.0, 41.0, 34.0, 36.0, 44.0, 44.0, 45.0, 40.0, 43.0, 45.0, 47.0, 29.0, 35.0, 36.0, 29.0, 20.0, 20.0, 20.0, 15.0, 11.0, 4.0, 8.0, 9.0, 11.0, 1.0, 3.0, 8.0, 1.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.46875, -15.94384765625, -15.4189453125, -14.89404296875, -14.369140625, -13.84423828125, -13.3193359375, -12.79443359375, -12.26953125, -11.74462890625, -11.2197265625, -10.69482421875, -10.169921875, -9.64501953125, -9.1201171875, -8.59521484375, -8.0703125, -7.54541015625, -7.0205078125, -6.49560546875, -5.970703125, -5.44580078125, -4.9208984375, -4.39599609375, -3.87109375, -3.34619140625, -2.8212890625, -2.29638671875, -1.771484375, -1.24658203125, -0.7216796875, -0.19677734375, 0.328125, 0.85302734375, 1.3779296875, 1.90283203125, 2.427734375, 2.95263671875, 3.4775390625, 4.00244140625, 4.52734375, 5.05224609375, 5.5771484375, 6.10205078125, 6.626953125, 7.15185546875, 7.6767578125, 8.20166015625, 8.7265625, 9.25146484375, 9.7763671875, 10.30126953125, 10.826171875, 11.35107421875, 11.8759765625, 12.40087890625, 12.92578125, 13.45068359375, 13.9755859375, 14.50048828125, 15.025390625, 15.55029296875, 16.0751953125, 16.60009765625, 17.125]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [2.0, 6.0, 5.0, 6.0, 9.0, 18.0, 28.0, 52.0, 84.0, 133.0, 215.0, 338.0, 531.0, 908.0, 1436.0, 2322.0, 3866.0, 6293.0, 9839.0, 15447.0, 24708.0, 37810.0, 57524.0, 85382.0, 122883.0, 169961.0, 228593.0, 289490.0, 349700.0, 393859.0, 415865.0, 406973.0, 370429.0, 316246.0, 253666.0, 193719.0, 142663.0, 99520.0, 68293.0, 44891.0, 29700.0, 19234.0, 11973.0, 7445.0, 4755.0, 2889.0, 1723.0, 1106.0, 691.0, 378.0, 269.0, 180.0, 108.0, 47.0, 32.0, 22.0, 15.0, 10.0, 5.0, 5.0, 0.0, 1.0, 2.0, 1.0], "bins": [-11.171875, -10.80810546875, -10.4443359375, -10.08056640625, -9.716796875, -9.35302734375, -8.9892578125, -8.62548828125, -8.26171875, -7.89794921875, -7.5341796875, -7.17041015625, -6.806640625, -6.44287109375, -6.0791015625, -5.71533203125, -5.3515625, -4.98779296875, -4.6240234375, -4.26025390625, -3.896484375, -3.53271484375, -3.1689453125, -2.80517578125, -2.44140625, -2.07763671875, -1.7138671875, -1.35009765625, -0.986328125, -0.62255859375, -0.2587890625, 0.10498046875, 0.46875, 0.83251953125, 1.1962890625, 1.56005859375, 1.923828125, 2.28759765625, 2.6513671875, 3.01513671875, 3.37890625, 3.74267578125, 4.1064453125, 4.47021484375, 4.833984375, 5.19775390625, 5.5615234375, 5.92529296875, 6.2890625, 6.65283203125, 7.0166015625, 7.38037109375, 7.744140625, 8.10791015625, 8.4716796875, 8.83544921875, 9.19921875, 9.56298828125, 9.9267578125, 10.29052734375, 10.654296875, 11.01806640625, 11.3818359375, 11.74560546875, 12.109375]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 5.0, 5.0, 7.0, 9.0, 11.0, 9.0, 15.0, 22.0, 27.0, 31.0, 35.0, 38.0, 69.0, 73.0, 71.0, 99.0, 116.0, 118.0, 155.0, 170.0, 219.0, 187.0, 210.0, 218.0, 214.0, 182.0, 217.0, 196.0, 168.0, 166.0, 137.0, 164.0, 118.0, 114.0, 95.0, 77.0, 57.0, 56.0, 40.0, 30.0, 33.0, 17.0, 16.0, 30.0, 9.0, 11.0, 4.0, 5.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.42578125, -6.207763671875, -5.98974609375, -5.771728515625, -5.5537109375, -5.335693359375, -5.11767578125, -4.899658203125, -4.681640625, -4.463623046875, -4.24560546875, -4.027587890625, -3.8095703125, -3.591552734375, -3.37353515625, -3.155517578125, -2.9375, -2.719482421875, -2.50146484375, -2.283447265625, -2.0654296875, -1.847412109375, -1.62939453125, -1.411376953125, -1.193359375, -0.975341796875, -0.75732421875, -0.539306640625, -0.3212890625, -0.103271484375, 0.11474609375, 0.332763671875, 0.55078125, 0.768798828125, 0.98681640625, 1.204833984375, 1.4228515625, 1.640869140625, 1.85888671875, 2.076904296875, 2.294921875, 2.512939453125, 2.73095703125, 2.948974609375, 3.1669921875, 3.385009765625, 3.60302734375, 3.821044921875, 4.0390625, 4.257080078125, 4.47509765625, 4.693115234375, 4.9111328125, 5.129150390625, 5.34716796875, 5.565185546875, 5.783203125, 6.001220703125, 6.21923828125, 6.437255859375, 6.6552734375, 6.873291015625, 7.09130859375, 7.309326171875, 7.52734375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 5.0, 4.0, 5.0, 2.0, 7.0, 6.0, 10.0, 10.0, 13.0, 12.0, 23.0, 24.0, 23.0, 15.0, 22.0, 26.0, 23.0, 40.0, 35.0, 41.0, 38.0, 34.0, 45.0, 36.0, 42.0, 47.0, 35.0, 46.0, 40.0, 23.0, 34.0, 25.0, 40.0, 32.0, 24.0, 17.0, 11.0, 14.0, 14.0, 10.0, 13.0, 9.0, 8.0, 10.0, 5.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-15.987288475036621, -15.524848937988281, -15.062409400939941, -14.599970817565918, -14.137531280517578, -13.675091743469238, -13.212652206420898, -12.750213623046875, -12.287774085998535, -11.825334548950195, -11.362895011901855, -10.900456428527832, -10.438016891479492, -9.975577354431152, -9.513137817382812, -9.050699234008789, -8.588258743286133, -8.125819206237793, -7.663380146026611, -7.2009406089782715, -6.73850154876709, -6.27606201171875, -5.81362247467041, -5.3511834144592285, -4.888744354248047, -4.426304817199707, -3.9638657569885254, -3.5014262199401855, -3.038987159729004, -2.576547622680664, -2.1141083240509033, -1.6516690254211426, -1.189229965209961, -0.7267906665802002, -0.2643513083457947, 0.19808804988861084, 0.6605273485183716, 1.1229667663574219, 1.5854060649871826, 2.0478453636169434, 2.510284662246704, 2.972723960876465, 3.4351632595062256, 3.8976025581359863, 4.360042095184326, 4.822481155395508, 5.284920692443848, 5.7473602294921875, 6.209799289703369, 6.672238826751709, 7.134677886962891, 7.5971174240112305, 8.05955696105957, 8.521995544433594, 8.984435081481934, 9.446874618530273, 9.909314155578613, 10.371753692626953, 10.834193229675293, 11.296631813049316, 11.759071350097656, 12.221510887145996, 12.683950424194336, 13.14638900756836, 13.6088285446167]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 5.0, 3.0, 7.0, 4.0, 16.0, 7.0, 13.0, 15.0, 12.0, 14.0, 30.0, 39.0, 25.0, 35.0, 31.0, 38.0, 43.0, 48.0, 49.0, 41.0, 51.0, 52.0, 40.0, 47.0, 43.0, 36.0, 41.0, 32.0, 43.0, 24.0, 20.0, 28.0, 17.0, 7.0, 14.0, 7.0, 7.0, 6.0, 6.0, 4.0, 1.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.085586547851562, -19.4284610748291, -18.771333694458008, -18.114208221435547, -17.457080841064453, -16.799955368041992, -16.14282989501953, -15.485703468322754, -14.828577041625977, -14.1714506149292, -13.514324188232422, -12.857198715209961, -12.200072288513184, -11.542945861816406, -10.885820388793945, -10.228693962097168, -9.57156753540039, -8.914441108703613, -8.257314682006836, -7.600189208984375, -6.943062782287598, -6.28593635559082, -5.628810405731201, -4.971684455871582, -4.314558029174805, -3.6574318408966064, -3.000305652618408, -2.34317946434021, -1.6860532760620117, -1.0289270877838135, -0.37180089950561523, 0.2853250503540039, 0.9424514770507812, 1.5995776653289795, 2.2567038536071777, 2.913830041885376, 3.570956230163574, 4.228082656860352, 4.885208606719971, 5.54233455657959, 6.199460983276367, 6.8565874099731445, 7.513713359832764, 8.170839309692383, 8.82796573638916, 9.485092163085938, 10.142217636108398, 10.799344062805176, 11.456470489501953, 12.11359691619873, 12.770723342895508, 13.427848815917969, 14.084975242614746, 14.742101669311523, 15.399227142333984, 16.056354522705078, 16.71347999572754, 17.37060546875, 18.027732849121094, 18.684858322143555, 19.341983795166016, 19.99911117553711, 20.65623664855957, 21.31336212158203, 21.970489501953125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [5.0, 2.0, 5.0, 5.0, 17.0, 21.0, 26.0, 34.0, 45.0, 87.0, 145.0, 202.0, 282.0, 436.0, 648.0, 1006.0, 1520.0, 2395.0, 3618.0, 5207.0, 8039.0, 12272.0, 18178.0, 27188.0, 40536.0, 57474.0, 78683.0, 103685.0, 123861.0, 129326.0, 117023.0, 93311.0, 70036.0, 49966.0, 34137.0, 23374.0, 15452.0, 10296.0, 6639.0, 4568.0, 3001.0, 1982.0, 1337.0, 850.0, 560.0, 356.0, 253.0, 157.0, 112.0, 74.0, 52.0, 25.0, 22.0, 13.0, 15.0, 5.0, 2.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.296875, -4.15020751953125, -4.0035400390625, -3.85687255859375, -3.710205078125, -3.56353759765625, -3.4168701171875, -3.27020263671875, -3.12353515625, -2.97686767578125, -2.8302001953125, -2.68353271484375, -2.536865234375, -2.39019775390625, -2.2435302734375, -2.09686279296875, -1.9501953125, -1.80352783203125, -1.6568603515625, -1.51019287109375, -1.363525390625, -1.21685791015625, -1.0701904296875, -0.92352294921875, -0.77685546875, -0.63018798828125, -0.4835205078125, -0.33685302734375, -0.190185546875, -0.04351806640625, 0.1031494140625, 0.24981689453125, 0.396484375, 0.54315185546875, 0.6898193359375, 0.83648681640625, 0.983154296875, 1.12982177734375, 1.2764892578125, 1.42315673828125, 1.56982421875, 1.71649169921875, 1.8631591796875, 2.00982666015625, 2.156494140625, 2.30316162109375, 2.4498291015625, 2.59649658203125, 2.7431640625, 2.88983154296875, 3.0364990234375, 3.18316650390625, 3.329833984375, 3.47650146484375, 3.6231689453125, 3.76983642578125, 3.91650390625, 4.06317138671875, 4.2098388671875, 4.35650634765625, 4.503173828125, 4.64984130859375, 4.7965087890625, 4.94317626953125, 5.08984375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 5.0, 6.0, 9.0, 8.0, 10.0, 14.0, 20.0, 11.0, 17.0, 19.0, 23.0, 34.0, 32.0, 27.0, 28.0, 53.0, 46.0, 43.0, 43.0, 45.0, 36.0, 43.0, 43.0, 56.0, 40.0, 38.0, 36.0, 23.0, 33.0, 34.0, 22.0, 23.0, 20.0, 12.0, 12.0, 6.0, 9.0, 5.0, 6.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.890625, -19.249267578125, -18.60791015625, -17.966552734375, -17.3251953125, -16.683837890625, -16.04248046875, -15.401123046875, -14.759765625, -14.118408203125, -13.47705078125, -12.835693359375, -12.1943359375, -11.552978515625, -10.91162109375, -10.270263671875, -9.62890625, -8.987548828125, -8.34619140625, -7.704833984375, -7.0634765625, -6.422119140625, -5.78076171875, -5.139404296875, -4.498046875, -3.856689453125, -3.21533203125, -2.573974609375, -1.9326171875, -1.291259765625, -0.64990234375, -0.008544921875, 0.6328125, 1.274169921875, 1.91552734375, 2.556884765625, 3.1982421875, 3.839599609375, 4.48095703125, 5.122314453125, 5.763671875, 6.405029296875, 7.04638671875, 7.687744140625, 8.3291015625, 8.970458984375, 9.61181640625, 10.253173828125, 10.89453125, 11.535888671875, 12.17724609375, 12.818603515625, 13.4599609375, 14.101318359375, 14.74267578125, 15.384033203125, 16.025390625, 16.666748046875, 17.30810546875, 17.949462890625, 18.5908203125, 19.232177734375, 19.87353515625, 20.514892578125, 21.15625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 5.0, 7.0, 4.0, 4.0, 12.0, 16.0, 28.0, 36.0, 46.0, 85.0, 79.0, 149.0, 195.0, 335.0, 472.0, 711.0, 1097.0, 1613.0, 2543.0, 4244.0, 6885.0, 11722.0, 20632.0, 36185.0, 62497.0, 103488.0, 152846.0, 184081.0, 166551.0, 117134.0, 72828.0, 42529.0, 24279.0, 13857.0, 8139.0, 4813.0, 2928.0, 1919.0, 1188.0, 780.0, 503.0, 330.0, 250.0, 174.0, 103.0, 85.0, 58.0, 34.0, 19.0, 12.0, 12.0, 11.0, 6.0, 1.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.66796875, -4.52044677734375, -4.3729248046875, -4.22540283203125, -4.077880859375, -3.93035888671875, -3.7828369140625, -3.63531494140625, -3.48779296875, -3.34027099609375, -3.1927490234375, -3.04522705078125, -2.897705078125, -2.75018310546875, -2.6026611328125, -2.45513916015625, -2.3076171875, -2.16009521484375, -2.0125732421875, -1.86505126953125, -1.717529296875, -1.57000732421875, -1.4224853515625, -1.27496337890625, -1.12744140625, -0.97991943359375, -0.8323974609375, -0.68487548828125, -0.537353515625, -0.38983154296875, -0.2423095703125, -0.09478759765625, 0.052734375, 0.20025634765625, 0.3477783203125, 0.49530029296875, 0.642822265625, 0.79034423828125, 0.9378662109375, 1.08538818359375, 1.23291015625, 1.38043212890625, 1.5279541015625, 1.67547607421875, 1.822998046875, 1.97052001953125, 2.1180419921875, 2.26556396484375, 2.4130859375, 2.56060791015625, 2.7081298828125, 2.85565185546875, 3.003173828125, 3.15069580078125, 3.2982177734375, 3.44573974609375, 3.59326171875, 3.74078369140625, 3.8883056640625, 4.03582763671875, 4.183349609375, 4.33087158203125, 4.4783935546875, 4.62591552734375, 4.7734375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 8.0, 8.0, 13.0, 16.0, 18.0, 10.0, 13.0, 26.0, 28.0, 24.0, 29.0, 26.0, 32.0, 41.0, 35.0, 37.0, 42.0, 36.0, 46.0, 41.0, 38.0, 39.0, 43.0, 29.0, 30.0, 29.0, 34.0, 21.0, 32.0, 30.0, 23.0, 22.0, 12.0, 18.0, 14.0, 8.0, 8.0, 10.0, 9.0, 3.0, 4.0, 5.0, 0.0, 2.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.1875, -10.7919921875, -10.396484375, -10.0009765625, -9.60546875, -9.2099609375, -8.814453125, -8.4189453125, -8.0234375, -7.6279296875, -7.232421875, -6.8369140625, -6.44140625, -6.0458984375, -5.650390625, -5.2548828125, -4.859375, -4.4638671875, -4.068359375, -3.6728515625, -3.27734375, -2.8818359375, -2.486328125, -2.0908203125, -1.6953125, -1.2998046875, -0.904296875, -0.5087890625, -0.11328125, 0.2822265625, 0.677734375, 1.0732421875, 1.46875, 1.8642578125, 2.259765625, 2.6552734375, 3.05078125, 3.4462890625, 3.841796875, 4.2373046875, 4.6328125, 5.0283203125, 5.423828125, 5.8193359375, 6.21484375, 6.6103515625, 7.005859375, 7.4013671875, 7.796875, 8.1923828125, 8.587890625, 8.9833984375, 9.37890625, 9.7744140625, 10.169921875, 10.5654296875, 10.9609375, 11.3564453125, 11.751953125, 12.1474609375, 12.54296875, 12.9384765625, 13.333984375, 13.7294921875, 14.125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 7.0, 11.0, 17.0, 26.0, 39.0, 73.0, 121.0, 173.0, 311.0, 492.0, 955.0, 1818.0, 3716.0, 7579.0, 17046.0, 41227.0, 110061.0, 295575.0, 342629.0, 137762.0, 50391.0, 20339.0, 8946.0, 4331.0, 2167.0, 1135.0, 653.0, 382.0, 231.0, 137.0, 84.0, 44.0, 28.0, 19.0, 12.0, 11.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.451171875, -2.37237548828125, -2.2935791015625, -2.21478271484375, -2.135986328125, -2.05718994140625, -1.9783935546875, -1.89959716796875, -1.82080078125, -1.74200439453125, -1.6632080078125, -1.58441162109375, -1.505615234375, -1.42681884765625, -1.3480224609375, -1.26922607421875, -1.1904296875, -1.11163330078125, -1.0328369140625, -0.95404052734375, -0.875244140625, -0.79644775390625, -0.7176513671875, -0.63885498046875, -0.56005859375, -0.48126220703125, -0.4024658203125, -0.32366943359375, -0.244873046875, -0.16607666015625, -0.0872802734375, -0.00848388671875, 0.0703125, 0.14910888671875, 0.2279052734375, 0.30670166015625, 0.385498046875, 0.46429443359375, 0.5430908203125, 0.62188720703125, 0.70068359375, 0.77947998046875, 0.8582763671875, 0.93707275390625, 1.015869140625, 1.09466552734375, 1.1734619140625, 1.25225830078125, 1.3310546875, 1.40985107421875, 1.4886474609375, 1.56744384765625, 1.646240234375, 1.72503662109375, 1.8038330078125, 1.88262939453125, 1.96142578125, 2.04022216796875, 2.1190185546875, 2.19781494140625, 2.276611328125, 2.35540771484375, 2.4342041015625, 2.51300048828125, 2.591796875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 6.0, 14.0, 7.0, 10.0, 16.0, 16.0, 17.0, 18.0, 29.0, 28.0, 40.0, 57.0, 61.0, 76.0, 86.0, 105.0, 93.0, 78.0, 54.0, 34.0, 11.0, 29.0, 16.0, 16.0, 15.0, 13.0, 14.0, 7.0, 5.0, 6.0, 3.0, 8.0, 0.0, 2.0, 5.0, 0.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00036072731018066406, -0.0003479085862636566, -0.00033508986234664917, -0.0003222711384296417, -0.0003094524145126343, -0.00029663369059562683, -0.0002838149666786194, -0.00027099624276161194, -0.0002581775188446045, -0.00024535879492759705, -0.0002325400710105896, -0.00021972134709358215, -0.0002069026231765747, -0.00019408389925956726, -0.00018126517534255981, -0.00016844645142555237, -0.00015562772750854492, -0.00014280900359153748, -0.00012999027967453003, -0.00011717155575752258, -0.00010435283184051514, -9.153410792350769e-05, -7.871538400650024e-05, -6.58966600894928e-05, -5.307793617248535e-05, -4.0259212255477905e-05, -2.744048833847046e-05, -1.4621764421463013e-05, -1.8030405044555664e-06, 1.101568341255188e-05, 2.3834407329559326e-05, 3.665313124656677e-05, 4.947185516357422e-05, 6.229057908058167e-05, 7.510930299758911e-05, 8.792802691459656e-05, 0.000100746750831604, 0.00011356547474861145, 0.0001263841986656189, 0.00013920292258262634, 0.0001520216464996338, 0.00016484037041664124, 0.00017765909433364868, 0.00019047781825065613, 0.00020329654216766357, 0.00021611526608467102, 0.00022893399000167847, 0.0002417527139186859, 0.00025457143783569336, 0.0002673901617527008, 0.00028020888566970825, 0.0002930276095867157, 0.00030584633350372314, 0.0003186650574207306, 0.00033148378133773804, 0.0003443025052547455, 0.00035712122917175293, 0.0003699399530887604, 0.0003827586770057678, 0.00039557740092277527, 0.0004083961248397827, 0.00042121484875679016, 0.0004340335726737976, 0.00044685229659080505, 0.0004596710205078125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 8.0, 8.0, 14.0, 25.0, 31.0, 49.0, 68.0, 79.0, 129.0, 211.0, 249.0, 379.0, 579.0, 932.0, 1420.0, 2305.0, 3695.0, 6052.0, 10493.0, 18339.0, 32811.0, 57764.0, 100474.0, 166368.0, 216636.0, 174962.0, 108374.0, 62446.0, 35079.0, 19943.0, 11472.0, 6513.0, 3855.0, 2402.0, 1536.0, 924.0, 644.0, 421.0, 265.0, 183.0, 115.0, 87.0, 56.0, 49.0, 38.0, 24.0, 13.0, 11.0, 10.0, 7.0, 4.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.537109375, -2.4541015625, -2.37109375, -2.2880859375, -2.205078125, -2.1220703125, -2.0390625, -1.9560546875, -1.873046875, -1.7900390625, -1.70703125, -1.6240234375, -1.541015625, -1.4580078125, -1.375, -1.2919921875, -1.208984375, -1.1259765625, -1.04296875, -0.9599609375, -0.876953125, -0.7939453125, -0.7109375, -0.6279296875, -0.544921875, -0.4619140625, -0.37890625, -0.2958984375, -0.212890625, -0.1298828125, -0.046875, 0.0361328125, 0.119140625, 0.2021484375, 0.28515625, 0.3681640625, 0.451171875, 0.5341796875, 0.6171875, 0.7001953125, 0.783203125, 0.8662109375, 0.94921875, 1.0322265625, 1.115234375, 1.1982421875, 1.28125, 1.3642578125, 1.447265625, 1.5302734375, 1.61328125, 1.6962890625, 1.779296875, 1.8623046875, 1.9453125, 2.0283203125, 2.111328125, 2.1943359375, 2.27734375, 2.3603515625, 2.443359375, 2.5263671875, 2.609375, 2.6923828125, 2.775390625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 1.0, 4.0, 3.0, 4.0, 6.0, 6.0, 7.0, 14.0, 10.0, 22.0, 28.0, 24.0, 35.0, 42.0, 37.0, 67.0, 62.0, 62.0, 83.0, 63.0, 75.0, 59.0, 58.0, 47.0, 42.0, 29.0, 26.0, 16.0, 12.0, 10.0, 10.0, 5.0, 8.0, 12.0, 4.0, 1.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.1318359375, -1.095458984375, -1.05908203125, -1.022705078125, -0.986328125, -0.949951171875, -0.91357421875, -0.877197265625, -0.8408203125, -0.804443359375, -0.76806640625, -0.731689453125, -0.6953125, -0.658935546875, -0.62255859375, -0.586181640625, -0.5498046875, -0.513427734375, -0.47705078125, -0.440673828125, -0.404296875, -0.367919921875, -0.33154296875, -0.295166015625, -0.2587890625, -0.222412109375, -0.18603515625, -0.149658203125, -0.11328125, -0.076904296875, -0.04052734375, -0.004150390625, 0.0322265625, 0.068603515625, 0.10498046875, 0.141357421875, 0.177734375, 0.214111328125, 0.25048828125, 0.286865234375, 0.3232421875, 0.359619140625, 0.39599609375, 0.432373046875, 0.46875, 0.505126953125, 0.54150390625, 0.577880859375, 0.6142578125, 0.650634765625, 0.68701171875, 0.723388671875, 0.759765625, 0.796142578125, 0.83251953125, 0.868896484375, 0.9052734375, 0.941650390625, 0.97802734375, 1.014404296875, 1.05078125, 1.087158203125, 1.12353515625, 1.159912109375, 1.1962890625]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 4.0, 7.0, 10.0, 5.0, 8.0, 11.0, 8.0, 16.0, 19.0, 24.0, 11.0, 18.0, 20.0, 17.0, 30.0, 40.0, 29.0, 34.0, 32.0, 37.0, 45.0, 40.0, 40.0, 38.0, 30.0, 53.0, 34.0, 38.0, 32.0, 38.0, 36.0, 27.0, 35.0, 17.0, 21.0, 14.0, 7.0, 15.0, 12.0, 12.0, 6.0, 11.0, 11.0, 6.0, 5.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-15.69510269165039, -15.243623733520508, -14.792144775390625, -14.340665817260742, -13.889187812805176, -13.437708854675293, -12.98622989654541, -12.534750938415527, -12.083272933959961, -11.631793975830078, -11.180315017700195, -10.728836059570312, -10.277358055114746, -9.825879096984863, -9.37440013885498, -8.922921180725098, -8.471442222595215, -8.019963264465332, -7.568484783172607, -7.117005825042725, -6.66552734375, -6.214048385620117, -5.762569427490234, -5.311090469360352, -4.859611988067627, -4.408133029937744, -3.9566545486450195, -3.5051755905151367, -3.053696870803833, -2.6022181510925293, -2.1507391929626465, -1.6992604732513428, -1.2477827072143555, -0.796303927898407, -0.3448251485824585, 0.10665369033813477, 0.5581324100494385, 1.0096111297607422, 1.461090087890625, 1.9125688076019287, 2.3640475273132324, 2.815526247024536, 3.26700496673584, 3.7184839248657227, 4.1699628829956055, 4.62144136428833, 5.072920322418213, 5.5243988037109375, 5.97587776184082, 6.427356719970703, 6.878835201263428, 7.3303141593933105, 7.781792640686035, 8.233271598815918, 8.6847505569458, 9.136229515075684, 9.58770751953125, 10.039186477661133, 10.490665435791016, 10.942144393920898, 11.393622398376465, 11.845101356506348, 12.29658031463623, 12.748059272766113, 13.199538230895996]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 2.0, 8.0, 5.0, 18.0, 11.0, 13.0, 13.0, 9.0, 23.0, 34.0, 35.0, 26.0, 36.0, 34.0, 44.0, 47.0, 48.0, 46.0, 38.0, 56.0, 45.0, 37.0, 43.0, 49.0, 45.0, 29.0, 39.0, 30.0, 19.0, 23.0, 24.0, 10.0, 13.0, 13.0, 10.0, 5.0, 5.0, 5.0, 3.0, 3.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.151615142822266, -18.512569427490234, -17.873523712158203, -17.23447608947754, -16.595430374145508, -15.956384658813477, -15.317338943481445, -14.678293228149414, -14.039246559143066, -13.400200843811035, -12.761154174804688, -12.122108459472656, -11.483062744140625, -10.844016075134277, -10.204970359802246, -9.565923690795898, -8.926877975463867, -8.287832260131836, -7.648785591125488, -7.009739875793457, -6.370693683624268, -5.731647491455078, -5.092601776123047, -4.453555583953857, -3.814509391784668, -3.1754631996154785, -2.536417245864868, -1.8973711729049683, -1.2583250999450684, -0.6192789077758789, 0.019767045974731445, 0.6588129997253418, 1.2978572845458984, 1.9369033575057983, 2.5759494304656982, 3.2149953842163086, 3.854041576385498, 4.4930877685546875, 5.132133483886719, 5.771179676055908, 6.410225868225098, 7.049272060394287, 7.688318252563477, 8.327363967895508, 8.966409683227539, 9.605456352233887, 10.244502067565918, 10.883548736572266, 11.522594451904297, 12.161640167236328, 12.800686836242676, 13.439732551574707, 14.078779220581055, 14.717824935913086, 15.356870651245117, 15.995916366577148, 16.634963989257812, 17.274009704589844, 17.913055419921875, 18.55210304260254, 19.19114875793457, 19.8301944732666, 20.469240188598633, 21.108285903930664, 21.747331619262695]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 7.0, 11.0, 23.0, 40.0, 47.0, 83.0, 139.0, 219.0, 351.0, 547.0, 862.0, 1376.0, 2294.0, 3700.0, 5744.0, 9258.0, 14192.0, 21365.0, 31988.0, 45134.0, 61576.0, 79616.0, 95348.0, 107170.0, 110631.0, 105675.0, 92225.0, 75509.0, 57859.0, 41759.0, 29374.0, 19502.0, 12801.0, 8296.0, 5187.0, 3248.0, 2024.0, 1281.0, 766.0, 516.0, 308.0, 178.0, 119.0, 87.0, 43.0, 37.0, 13.0, 15.0, 11.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.65625, -12.23974609375, -11.8232421875, -11.40673828125, -10.990234375, -10.57373046875, -10.1572265625, -9.74072265625, -9.32421875, -8.90771484375, -8.4912109375, -8.07470703125, -7.658203125, -7.24169921875, -6.8251953125, -6.40869140625, -5.9921875, -5.57568359375, -5.1591796875, -4.74267578125, -4.326171875, -3.90966796875, -3.4931640625, -3.07666015625, -2.66015625, -2.24365234375, -1.8271484375, -1.41064453125, -0.994140625, -0.57763671875, -0.1611328125, 0.25537109375, 0.671875, 1.08837890625, 1.5048828125, 1.92138671875, 2.337890625, 2.75439453125, 3.1708984375, 3.58740234375, 4.00390625, 4.42041015625, 4.8369140625, 5.25341796875, 5.669921875, 6.08642578125, 6.5029296875, 6.91943359375, 7.3359375, 7.75244140625, 8.1689453125, 8.58544921875, 9.001953125, 9.41845703125, 9.8349609375, 10.25146484375, 10.66796875, 11.08447265625, 11.5009765625, 11.91748046875, 12.333984375, 12.75048828125, 13.1669921875, 13.58349609375, 14.0]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 7.0, 4.0, 7.0, 7.0, 9.0, 12.0, 8.0, 17.0, 9.0, 20.0, 15.0, 20.0, 33.0, 29.0, 33.0, 35.0, 52.0, 44.0, 41.0, 49.0, 56.0, 46.0, 35.0, 39.0, 39.0, 45.0, 40.0, 45.0, 37.0, 20.0, 27.0, 34.0, 17.0, 15.0, 17.0, 9.0, 9.0, 3.0, 6.0, 4.0, 6.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.75, -17.1396484375, -16.529296875, -15.9189453125, -15.30859375, -14.6982421875, -14.087890625, -13.4775390625, -12.8671875, -12.2568359375, -11.646484375, -11.0361328125, -10.42578125, -9.8154296875, -9.205078125, -8.5947265625, -7.984375, -7.3740234375, -6.763671875, -6.1533203125, -5.54296875, -4.9326171875, -4.322265625, -3.7119140625, -3.1015625, -2.4912109375, -1.880859375, -1.2705078125, -0.66015625, -0.0498046875, 0.560546875, 1.1708984375, 1.78125, 2.3916015625, 3.001953125, 3.6123046875, 4.22265625, 4.8330078125, 5.443359375, 6.0537109375, 6.6640625, 7.2744140625, 7.884765625, 8.4951171875, 9.10546875, 9.7158203125, 10.326171875, 10.9365234375, 11.546875, 12.1572265625, 12.767578125, 13.3779296875, 13.98828125, 14.5986328125, 15.208984375, 15.8193359375, 16.4296875, 17.0400390625, 17.650390625, 18.2607421875, 18.87109375, 19.4814453125, 20.091796875, 20.7021484375, 21.3125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 7.0, 4.0, 8.0, 17.0, 40.0, 49.0, 75.0, 122.0, 202.0, 336.0, 504.0, 829.0, 1263.0, 1979.0, 3170.0, 4788.0, 7511.0, 11627.0, 17717.0, 26335.0, 37884.0, 52742.0, 69714.0, 87210.0, 102046.0, 110081.0, 108549.0, 99135.0, 83881.0, 66099.0, 48816.0, 35689.0, 24176.0, 16165.0, 10672.0, 6939.0, 4570.0, 2770.0, 1838.0, 1086.0, 685.0, 460.0, 256.0, 194.0, 116.0, 67.0, 50.0, 37.0, 19.0, 10.0, 9.0, 5.0, 3.0, 3.0, 3.0, 0.0, 1.0], "bins": [-14.21875, -13.7864990234375, -13.354248046875, -12.9219970703125, -12.48974609375, -12.0574951171875, -11.625244140625, -11.1929931640625, -10.7607421875, -10.3284912109375, -9.896240234375, -9.4639892578125, -9.03173828125, -8.5994873046875, -8.167236328125, -7.7349853515625, -7.302734375, -6.8704833984375, -6.438232421875, -6.0059814453125, -5.57373046875, -5.1414794921875, -4.709228515625, -4.2769775390625, -3.8447265625, -3.4124755859375, -2.980224609375, -2.5479736328125, -2.11572265625, -1.6834716796875, -1.251220703125, -0.8189697265625, -0.38671875, 0.0455322265625, 0.477783203125, 0.9100341796875, 1.34228515625, 1.7745361328125, 2.206787109375, 2.6390380859375, 3.0712890625, 3.5035400390625, 3.935791015625, 4.3680419921875, 4.80029296875, 5.2325439453125, 5.664794921875, 6.0970458984375, 6.529296875, 6.9615478515625, 7.393798828125, 7.8260498046875, 8.25830078125, 8.6905517578125, 9.122802734375, 9.5550537109375, 9.9873046875, 10.4195556640625, 10.851806640625, 11.2840576171875, 11.71630859375, 12.1485595703125, 12.580810546875, 13.0130615234375, 13.4453125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 5.0, 5.0, 9.0, 12.0, 16.0, 7.0, 17.0, 13.0, 20.0, 19.0, 17.0, 21.0, 24.0, 31.0, 25.0, 27.0, 32.0, 39.0, 32.0, 40.0, 32.0, 41.0, 39.0, 43.0, 39.0, 26.0, 40.0, 26.0, 37.0, 26.0, 29.0, 26.0, 18.0, 24.0, 17.0, 16.0, 16.0, 10.0, 12.0, 12.0, 12.0, 7.0, 9.0, 10.0, 3.0, 2.0, 5.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-9.8515625, -9.522705078125, -9.19384765625, -8.864990234375, -8.5361328125, -8.207275390625, -7.87841796875, -7.549560546875, -7.220703125, -6.891845703125, -6.56298828125, -6.234130859375, -5.9052734375, -5.576416015625, -5.24755859375, -4.918701171875, -4.58984375, -4.260986328125, -3.93212890625, -3.603271484375, -3.2744140625, -2.945556640625, -2.61669921875, -2.287841796875, -1.958984375, -1.630126953125, -1.30126953125, -0.972412109375, -0.6435546875, -0.314697265625, 0.01416015625, 0.343017578125, 0.671875, 1.000732421875, 1.32958984375, 1.658447265625, 1.9873046875, 2.316162109375, 2.64501953125, 2.973876953125, 3.302734375, 3.631591796875, 3.96044921875, 4.289306640625, 4.6181640625, 4.947021484375, 5.27587890625, 5.604736328125, 5.93359375, 6.262451171875, 6.59130859375, 6.920166015625, 7.2490234375, 7.577880859375, 7.90673828125, 8.235595703125, 8.564453125, 8.893310546875, 9.22216796875, 9.551025390625, 9.8798828125, 10.208740234375, 10.53759765625, 10.866455078125, 11.1953125]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 2.0, 6.0, 2.0, 9.0, 8.0, 11.0, 30.0, 32.0, 44.0, 79.0, 99.0, 136.0, 182.0, 294.0, 420.0, 580.0, 882.0, 1361.0, 2055.0, 3123.0, 4857.0, 7472.0, 11691.0, 18530.0, 29742.0, 47680.0, 73726.0, 107493.0, 138447.0, 152840.0, 138906.0, 106550.0, 73089.0, 47489.0, 29191.0, 18466.0, 11512.0, 7427.0, 4814.0, 3072.0, 2010.0, 1346.0, 913.0, 601.0, 408.0, 283.0, 193.0, 132.0, 100.0, 73.0, 36.0, 30.0, 34.0, 18.0, 16.0, 12.0, 4.0, 5.0, 4.0, 2.0], "bins": [-6.84765625, -6.6431884765625, -6.438720703125, -6.2342529296875, -6.02978515625, -5.8253173828125, -5.620849609375, -5.4163818359375, -5.2119140625, -5.0074462890625, -4.802978515625, -4.5985107421875, -4.39404296875, -4.1895751953125, -3.985107421875, -3.7806396484375, -3.576171875, -3.3717041015625, -3.167236328125, -2.9627685546875, -2.75830078125, -2.5538330078125, -2.349365234375, -2.1448974609375, -1.9404296875, -1.7359619140625, -1.531494140625, -1.3270263671875, -1.12255859375, -0.9180908203125, -0.713623046875, -0.5091552734375, -0.3046875, -0.1002197265625, 0.104248046875, 0.3087158203125, 0.51318359375, 0.7176513671875, 0.922119140625, 1.1265869140625, 1.3310546875, 1.5355224609375, 1.739990234375, 1.9444580078125, 2.14892578125, 2.3533935546875, 2.557861328125, 2.7623291015625, 2.966796875, 3.1712646484375, 3.375732421875, 3.5802001953125, 3.78466796875, 3.9891357421875, 4.193603515625, 4.3980712890625, 4.6025390625, 4.8070068359375, 5.011474609375, 5.2159423828125, 5.42041015625, 5.6248779296875, 5.829345703125, 6.0338134765625, 6.23828125]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 0.0, 2.0, 3.0, 3.0, 3.0, 10.0, 9.0, 21.0, 19.0, 12.0, 19.0, 19.0, 19.0, 30.0, 35.0, 47.0, 45.0, 53.0, 60.0, 62.0, 50.0, 58.0, 57.0, 53.0, 40.0, 52.0, 42.0, 38.0, 20.0, 21.0, 21.0, 15.0, 9.0, 12.0, 15.0, 9.0, 7.0, 7.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0007724761962890625, -0.000749543309211731, -0.0007266104221343994, -0.0007036775350570679, -0.0006807446479797363, -0.0006578117609024048, -0.0006348788738250732, -0.0006119459867477417, -0.0005890130996704102, -0.0005660802125930786, -0.0005431473255157471, -0.0005202144384384155, -0.000497281551361084, -0.00047434866428375244, -0.0004514157772064209, -0.00042848289012908936, -0.0004055500030517578, -0.00038261711597442627, -0.0003596842288970947, -0.0003367513418197632, -0.00031381845474243164, -0.0002908855676651001, -0.00026795268058776855, -0.000245019793510437, -0.00022208690643310547, -0.00019915401935577393, -0.00017622113227844238, -0.00015328824520111084, -0.0001303553581237793, -0.00010742247104644775, -8.448958396911621e-05, -6.155669689178467e-05, -3.8623809814453125e-05, -1.5690922737121582e-05, 7.241964340209961e-06, 3.0174851417541504e-05, 5.310773849487305e-05, 7.604062557220459e-05, 9.897351264953613e-05, 0.00012190639972686768, 0.00014483928680419922, 0.00016777217388153076, 0.0001907050609588623, 0.00021363794803619385, 0.0002365708351135254, 0.00025950372219085693, 0.0002824366092681885, 0.00030536949634552, 0.00032830238342285156, 0.0003512352705001831, 0.00037416815757751465, 0.0003971010446548462, 0.00042003393173217773, 0.0004429668188095093, 0.0004658997058868408, 0.0004888325929641724, 0.0005117654800415039, 0.0005346983671188354, 0.000557631254196167, 0.0005805641412734985, 0.0006034970283508301, 0.0006264299154281616, 0.0006493628025054932, 0.0006722956895828247, 0.0006952285766601562]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 3.0, 5.0, 11.0, 21.0, 28.0, 46.0, 74.0, 113.0, 152.0, 246.0, 421.0, 637.0, 1043.0, 1619.0, 2558.0, 3998.0, 6589.0, 10171.0, 16059.0, 25053.0, 38641.0, 57283.0, 80595.0, 106091.0, 126257.0, 131772.0, 121117.0, 99011.0, 73144.0, 51168.0, 33988.0, 22389.0, 14058.0, 9020.0, 5672.0, 3506.0, 2144.0, 1383.0, 921.0, 523.0, 379.0, 244.0, 162.0, 76.0, 61.0, 48.0, 25.0, 14.0, 12.0, 4.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.97265625, -5.7935791015625, -5.614501953125, -5.4354248046875, -5.25634765625, -5.0772705078125, -4.898193359375, -4.7191162109375, -4.5400390625, -4.3609619140625, -4.181884765625, -4.0028076171875, -3.82373046875, -3.6446533203125, -3.465576171875, -3.2864990234375, -3.107421875, -2.9283447265625, -2.749267578125, -2.5701904296875, -2.39111328125, -2.2120361328125, -2.032958984375, -1.8538818359375, -1.6748046875, -1.4957275390625, -1.316650390625, -1.1375732421875, -0.95849609375, -0.7794189453125, -0.600341796875, -0.4212646484375, -0.2421875, -0.0631103515625, 0.115966796875, 0.2950439453125, 0.47412109375, 0.6531982421875, 0.832275390625, 1.0113525390625, 1.1904296875, 1.3695068359375, 1.548583984375, 1.7276611328125, 1.90673828125, 2.0858154296875, 2.264892578125, 2.4439697265625, 2.623046875, 2.8021240234375, 2.981201171875, 3.1602783203125, 3.33935546875, 3.5184326171875, 3.697509765625, 3.8765869140625, 4.0556640625, 4.2347412109375, 4.413818359375, 4.5928955078125, 4.77197265625, 4.9510498046875, 5.130126953125, 5.3092041015625, 5.48828125]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 6.0, 6.0, 7.0, 8.0, 12.0, 11.0, 10.0, 14.0, 25.0, 24.0, 27.0, 33.0, 36.0, 42.0, 38.0, 52.0, 50.0, 58.0, 58.0, 51.0, 68.0, 51.0, 47.0, 39.0, 38.0, 35.0, 23.0, 18.0, 25.0, 17.0, 23.0, 13.0, 11.0, 10.0, 8.0, 4.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.98046875, -2.887420654296875, -2.79437255859375, -2.701324462890625, -2.6082763671875, -2.515228271484375, -2.42218017578125, -2.329132080078125, -2.236083984375, -2.143035888671875, -2.04998779296875, -1.956939697265625, -1.8638916015625, -1.770843505859375, -1.67779541015625, -1.584747314453125, -1.49169921875, -1.398651123046875, -1.30560302734375, -1.212554931640625, -1.1195068359375, -1.026458740234375, -0.93341064453125, -0.840362548828125, -0.747314453125, -0.654266357421875, -0.56121826171875, -0.468170166015625, -0.3751220703125, -0.282073974609375, -0.18902587890625, -0.095977783203125, -0.0029296875, 0.090118408203125, 0.18316650390625, 0.276214599609375, 0.3692626953125, 0.462310791015625, 0.55535888671875, 0.648406982421875, 0.741455078125, 0.834503173828125, 0.92755126953125, 1.020599365234375, 1.1136474609375, 1.206695556640625, 1.29974365234375, 1.392791748046875, 1.48583984375, 1.578887939453125, 1.67193603515625, 1.764984130859375, 1.8580322265625, 1.951080322265625, 2.04412841796875, 2.137176513671875, 2.230224609375, 2.323272705078125, 2.41632080078125, 2.509368896484375, 2.6024169921875, 2.695465087890625, 2.78851318359375, 2.881561279296875, 2.974609375]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 4.0, 2.0, 7.0, 4.0, 11.0, 11.0, 16.0, 18.0, 19.0, 28.0, 20.0, 20.0, 27.0, 30.0, 27.0, 45.0, 48.0, 37.0, 43.0, 57.0, 51.0, 55.0, 56.0, 47.0, 46.0, 32.0, 36.0, 33.0, 32.0, 24.0, 17.0, 17.0, 17.0, 20.0, 11.0, 10.0, 7.0, 6.0, 6.0, 3.0, 3.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.530940055847168, -15.007871627807617, -14.484803199768066, -13.961734771728516, -13.438666343688965, -12.915597915649414, -12.392528533935547, -11.869461059570312, -11.346391677856445, -10.823323249816895, -10.300254821777344, -9.777186393737793, -9.254117965698242, -8.731049537658691, -8.20798110961914, -7.684912204742432, -7.161844253540039, -6.638775825500488, -6.1157073974609375, -5.592638969421387, -5.069570541381836, -4.546502113342285, -4.023433208465576, -3.5003647804260254, -2.9772963523864746, -2.454227924346924, -1.9311593770980835, -1.4080908298492432, -0.8850224018096924, -0.3619539737701416, 0.16111469268798828, 0.6841831207275391, 1.2072525024414062, 1.730320930480957, 2.253389358520508, 2.7764580249786377, 3.2995264530181885, 3.8225948810577393, 4.345663547515869, 4.86873197555542, 5.391800403594971, 5.9148688316345215, 6.437937259674072, 6.961006164550781, 7.484074592590332, 8.007143020629883, 8.530211448669434, 9.053279876708984, 9.576348304748535, 10.099416732788086, 10.622485160827637, 11.145553588867188, 11.668622016906738, 12.191690444946289, 12.714759826660156, 13.23782730102539, 13.760896682739258, 14.283965110778809, 14.80703353881836, 15.33010196685791, 15.853170394897461, 16.376239776611328, 16.899307250976562, 17.42237663269043, 17.945444107055664]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 6.0, 7.0, 6.0, 10.0, 4.0, 10.0, 15.0, 14.0, 21.0, 21.0, 18.0, 21.0, 31.0, 38.0, 31.0, 34.0, 37.0, 40.0, 46.0, 47.0, 43.0, 36.0, 45.0, 47.0, 43.0, 53.0, 44.0, 32.0, 25.0, 22.0, 33.0, 20.0, 17.0, 9.0, 21.0, 17.0, 8.0, 4.0, 8.0, 7.0, 5.0, 7.0, 2.0, 0.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.78479766845703, -19.147563934326172, -18.51032829284668, -17.87309455871582, -17.235858917236328, -16.59862518310547, -15.961389541625977, -15.324155807495117, -14.686920166015625, -14.04968547821045, -13.412450790405273, -12.775216102600098, -12.137981414794922, -11.500746726989746, -10.86351203918457, -10.226278305053711, -9.589043617248535, -8.95180892944336, -8.314574241638184, -7.677339553833008, -7.040104866027832, -6.402870178222656, -5.765635967254639, -5.128401279449463, -4.491166591644287, -3.8539319038391113, -3.2166972160339355, -2.579462766647339, -1.942228078842163, -1.3049933910369873, -0.6677589416503906, -0.030524253845214844, 0.6067104339599609, 1.2439451217651367, 1.881179690361023, 2.518414258956909, 3.155648946762085, 3.7928836345672607, 4.430118083953857, 5.067352771759033, 5.704587459564209, 6.341822147369385, 6.9790568351745605, 7.616291046142578, 8.253525733947754, 8.89076042175293, 9.527995109558105, 10.165229797363281, 10.802464485168457, 11.439699172973633, 12.076933860778809, 12.714168548583984, 13.35140323638916, 13.988637924194336, 14.625871658325195, 15.263107299804688, 15.900341033935547, 16.537574768066406, 17.1748104095459, 17.812044143676758, 18.44927978515625, 19.08651351928711, 19.7237491607666, 20.36098289489746, 20.998218536376953]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [2.0, 4.0, 4.0, 5.0, 8.0, 7.0, 10.0, 13.0, 20.0, 61.0, 101.0, 155.0, 234.0, 417.0, 671.0, 1169.0, 1878.0, 3090.0, 5027.0, 8764.0, 14563.0, 24310.0, 39497.0, 63377.0, 101108.0, 154711.0, 228799.0, 317742.0, 410911.0, 482666.0, 508195.0, 480856.0, 407056.0, 312212.0, 222751.0, 149995.0, 96206.0, 61458.0, 38003.0, 23015.0, 13986.0, 8299.0, 5129.0, 3103.0, 1834.0, 1075.0, 664.0, 447.0, 273.0, 152.0, 98.0, 72.0, 35.0, 21.0, 17.0, 9.0, 6.0, 10.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.640625, -11.2586669921875, -10.876708984375, -10.4947509765625, -10.11279296875, -9.7308349609375, -9.348876953125, -8.9669189453125, -8.5849609375, -8.2030029296875, -7.821044921875, -7.4390869140625, -7.05712890625, -6.6751708984375, -6.293212890625, -5.9112548828125, -5.529296875, -5.1473388671875, -4.765380859375, -4.3834228515625, -4.00146484375, -3.6195068359375, -3.237548828125, -2.8555908203125, -2.4736328125, -2.0916748046875, -1.709716796875, -1.3277587890625, -0.94580078125, -0.5638427734375, -0.181884765625, 0.2000732421875, 0.58203125, 0.9639892578125, 1.345947265625, 1.7279052734375, 2.10986328125, 2.4918212890625, 2.873779296875, 3.2557373046875, 3.6376953125, 4.0196533203125, 4.401611328125, 4.7835693359375, 5.16552734375, 5.5474853515625, 5.929443359375, 6.3114013671875, 6.693359375, 7.0753173828125, 7.457275390625, 7.8392333984375, 8.22119140625, 8.6031494140625, 8.985107421875, 9.3670654296875, 9.7490234375, 10.1309814453125, 10.512939453125, 10.8948974609375, 11.27685546875, 11.6588134765625, 12.040771484375, 12.4227294921875, 12.8046875]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 5.0, 6.0, 4.0, 4.0, 8.0, 5.0, 10.0, 12.0, 16.0, 27.0, 22.0, 31.0, 19.0, 26.0, 30.0, 36.0, 39.0, 38.0, 39.0, 40.0, 38.0, 38.0, 40.0, 46.0, 45.0, 35.0, 48.0, 42.0, 43.0, 32.0, 24.0, 21.0, 26.0, 11.0, 17.0, 19.0, 10.0, 6.0, 12.0, 8.0, 3.0, 6.0, 5.0, 6.0, 2.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.3671875, -12.9053955078125, -12.443603515625, -11.9818115234375, -11.52001953125, -11.0582275390625, -10.596435546875, -10.1346435546875, -9.6728515625, -9.2110595703125, -8.749267578125, -8.2874755859375, -7.82568359375, -7.3638916015625, -6.902099609375, -6.4403076171875, -5.978515625, -5.5167236328125, -5.054931640625, -4.5931396484375, -4.13134765625, -3.6695556640625, -3.207763671875, -2.7459716796875, -2.2841796875, -1.8223876953125, -1.360595703125, -0.8988037109375, -0.43701171875, 0.0247802734375, 0.486572265625, 0.9483642578125, 1.41015625, 1.8719482421875, 2.333740234375, 2.7955322265625, 3.25732421875, 3.7191162109375, 4.180908203125, 4.6427001953125, 5.1044921875, 5.5662841796875, 6.028076171875, 6.4898681640625, 6.95166015625, 7.4134521484375, 7.875244140625, 8.3370361328125, 8.798828125, 9.2606201171875, 9.722412109375, 10.1842041015625, 10.64599609375, 11.1077880859375, 11.569580078125, 12.0313720703125, 12.4931640625, 12.9549560546875, 13.416748046875, 13.8785400390625, 14.34033203125, 14.8021240234375, 15.263916015625, 15.7257080078125, 16.1875]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 7.0, 18.0, 17.0, 26.0, 53.0, 91.0, 126.0, 237.0, 368.0, 634.0, 1098.0, 1745.0, 2853.0, 4702.0, 7520.0, 12377.0, 20120.0, 31733.0, 49787.0, 75187.0, 110413.0, 157735.0, 214909.0, 280260.0, 341432.0, 392349.0, 420767.0, 418210.0, 386854.0, 333944.0, 269651.0, 206354.0, 150687.0, 105407.0, 71127.0, 46869.0, 29677.0, 18986.0, 11705.0, 7335.0, 4374.0, 2602.0, 1580.0, 941.0, 562.0, 371.0, 187.0, 117.0, 82.0, 44.0, 28.0, 19.0, 4.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0], "bins": [-10.8359375, -10.49658203125, -10.1572265625, -9.81787109375, -9.478515625, -9.13916015625, -8.7998046875, -8.46044921875, -8.12109375, -7.78173828125, -7.4423828125, -7.10302734375, -6.763671875, -6.42431640625, -6.0849609375, -5.74560546875, -5.40625, -5.06689453125, -4.7275390625, -4.38818359375, -4.048828125, -3.70947265625, -3.3701171875, -3.03076171875, -2.69140625, -2.35205078125, -2.0126953125, -1.67333984375, -1.333984375, -0.99462890625, -0.6552734375, -0.31591796875, 0.0234375, 0.36279296875, 0.7021484375, 1.04150390625, 1.380859375, 1.72021484375, 2.0595703125, 2.39892578125, 2.73828125, 3.07763671875, 3.4169921875, 3.75634765625, 4.095703125, 4.43505859375, 4.7744140625, 5.11376953125, 5.453125, 5.79248046875, 6.1318359375, 6.47119140625, 6.810546875, 7.14990234375, 7.4892578125, 7.82861328125, 8.16796875, 8.50732421875, 8.8466796875, 9.18603515625, 9.525390625, 9.86474609375, 10.2041015625, 10.54345703125, 10.8828125]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 6.0, 7.0, 8.0, 7.0, 18.0, 16.0, 27.0, 29.0, 45.0, 59.0, 72.0, 69.0, 85.0, 121.0, 124.0, 140.0, 154.0, 170.0, 184.0, 206.0, 219.0, 203.0, 239.0, 220.0, 194.0, 191.0, 190.0, 153.0, 139.0, 143.0, 114.0, 103.0, 81.0, 76.0, 52.0, 53.0, 36.0, 19.0, 22.0, 28.0, 14.0, 7.0, 15.0, 6.0, 4.0, 3.0, 6.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0], "bins": [-6.9140625, -6.70562744140625, -6.4971923828125, -6.28875732421875, -6.080322265625, -5.87188720703125, -5.6634521484375, -5.45501708984375, -5.24658203125, -5.03814697265625, -4.8297119140625, -4.62127685546875, -4.412841796875, -4.20440673828125, -3.9959716796875, -3.78753662109375, -3.5791015625, -3.37066650390625, -3.1622314453125, -2.95379638671875, -2.745361328125, -2.53692626953125, -2.3284912109375, -2.12005615234375, -1.91162109375, -1.70318603515625, -1.4947509765625, -1.28631591796875, -1.077880859375, -0.86944580078125, -0.6610107421875, -0.45257568359375, -0.244140625, -0.03570556640625, 0.1727294921875, 0.38116455078125, 0.589599609375, 0.79803466796875, 1.0064697265625, 1.21490478515625, 1.42333984375, 1.63177490234375, 1.8402099609375, 2.04864501953125, 2.257080078125, 2.46551513671875, 2.6739501953125, 2.88238525390625, 3.0908203125, 3.29925537109375, 3.5076904296875, 3.71612548828125, 3.924560546875, 4.13299560546875, 4.3414306640625, 4.54986572265625, 4.75830078125, 4.96673583984375, 5.1751708984375, 5.38360595703125, 5.592041015625, 5.80047607421875, 6.0089111328125, 6.21734619140625, 6.42578125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 8.0, 6.0, 16.0, 12.0, 14.0, 13.0, 18.0, 15.0, 25.0, 23.0, 37.0, 33.0, 37.0, 50.0, 54.0, 41.0, 65.0, 50.0, 48.0, 36.0, 43.0, 33.0, 37.0, 51.0, 38.0, 29.0, 36.0, 20.0, 19.0, 21.0, 16.0, 11.0, 10.0, 7.0, 5.0, 6.0, 4.0, 4.0, 2.0, 2.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.11312484741211, -12.629949569702148, -12.146774291992188, -11.663599014282227, -11.180423736572266, -10.697248458862305, -10.214073181152344, -9.7308988571167, -9.247723579406738, -8.764548301696777, -8.281373023986816, -7.7981977462768555, -7.315022945404053, -6.831847667694092, -6.348672389984131, -5.865497589111328, -5.382321834564209, -4.899146556854248, -4.415971279144287, -3.9327962398529053, -3.4496212005615234, -2.9664459228515625, -2.4832706451416016, -2.0000956058502197, -1.5169203281402588, -1.0337451696395874, -0.5505699515342712, -0.06739473342895508, 0.4157804250717163, 0.8989555835723877, 1.3821308612823486, 1.8653059005737305, 2.3484811782836914, 2.8316564559936523, 3.314831495285034, 3.798006772994995, 4.281181812286377, 4.764357089996338, 5.247532367706299, 5.730707168579102, 6.2138824462890625, 6.697057723999023, 7.180233001708984, 7.663408279418945, 8.146583557128906, 8.629758834838867, 9.112934112548828, 9.596108436584473, 10.07928466796875, 10.562459945678711, 11.045635223388672, 11.528810501098633, 12.011985778808594, 12.495161056518555, 12.978336334228516, 13.46151065826416, 13.944685935974121, 14.427861213684082, 14.911036491394043, 15.394211769104004, 15.877387046813965, 16.36056137084961, 16.84373664855957, 17.32691192626953, 17.810087203979492]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 6.0, 6.0, 6.0, 7.0, 13.0, 14.0, 13.0, 17.0, 21.0, 20.0, 32.0, 27.0, 42.0, 23.0, 32.0, 35.0, 35.0, 36.0, 53.0, 41.0, 61.0, 32.0, 38.0, 57.0, 25.0, 38.0, 39.0, 28.0, 31.0, 29.0, 23.0, 28.0, 21.0, 13.0, 8.0, 10.0, 7.0, 8.0, 7.0, 6.0, 7.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.314741134643555, -17.746463775634766, -17.17818832397461, -16.60991096496582, -16.04163360595703, -15.473356246948242, -14.90507984161377, -14.336803436279297, -13.768526077270508, -13.200248718261719, -12.631972312927246, -12.063695907592773, -11.495418548583984, -10.927141189575195, -10.358864784240723, -9.79058837890625, -9.222311019897461, -8.654033660888672, -8.0857572555542, -7.517480373382568, -6.9492034912109375, -6.380926609039307, -5.812649726867676, -5.244372844696045, -4.676095962524414, -4.107819080352783, -3.5395421981811523, -2.9712653160095215, -2.4029884338378906, -1.8347115516662598, -1.266434669494629, -0.698157787322998, -0.12987899780273438, 0.4383978843688965, 1.0066747665405273, 1.5749516487121582, 2.143228530883789, 2.71150541305542, 3.279782295227051, 3.8480591773986816, 4.4163360595703125, 4.984612941741943, 5.552889823913574, 6.121166706085205, 6.689443588256836, 7.257720470428467, 7.825997352600098, 8.39427375793457, 8.96255111694336, 9.530828475952148, 10.099104881286621, 10.667381286621094, 11.235658645629883, 11.803936004638672, 12.372212409973145, 12.940488815307617, 13.508766174316406, 14.077043533325195, 14.645319938659668, 15.21359634399414, 15.78187370300293, 16.35015106201172, 16.918426513671875, 17.486703872680664, 18.054981231689453]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 2.0, 5.0, 9.0, 14.0, 10.0, 19.0, 26.0, 34.0, 63.0, 91.0, 166.0, 181.0, 328.0, 507.0, 837.0, 1351.0, 2252.0, 3881.0, 6885.0, 11872.0, 20455.0, 35503.0, 60069.0, 95320.0, 138621.0, 168983.0, 163741.0, 126732.0, 84683.0, 52721.0, 30983.0, 17580.0, 10174.0, 5860.0, 3418.0, 2090.0, 1136.0, 733.0, 421.0, 279.0, 181.0, 112.0, 75.0, 49.0, 33.0, 26.0, 14.0, 7.0, 8.0, 4.0, 9.0, 6.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.15625, -4.01226806640625, -3.8682861328125, -3.72430419921875, -3.580322265625, -3.43634033203125, -3.2923583984375, -3.14837646484375, -3.00439453125, -2.86041259765625, -2.7164306640625, -2.57244873046875, -2.428466796875, -2.28448486328125, -2.1405029296875, -1.99652099609375, -1.8525390625, -1.70855712890625, -1.5645751953125, -1.42059326171875, -1.276611328125, -1.13262939453125, -0.9886474609375, -0.84466552734375, -0.70068359375, -0.55670166015625, -0.4127197265625, -0.26873779296875, -0.124755859375, 0.01922607421875, 0.1632080078125, 0.30718994140625, 0.451171875, 0.59515380859375, 0.7391357421875, 0.88311767578125, 1.027099609375, 1.17108154296875, 1.3150634765625, 1.45904541015625, 1.60302734375, 1.74700927734375, 1.8909912109375, 2.03497314453125, 2.178955078125, 2.32293701171875, 2.4669189453125, 2.61090087890625, 2.7548828125, 2.89886474609375, 3.0428466796875, 3.18682861328125, 3.330810546875, 3.47479248046875, 3.6187744140625, 3.76275634765625, 3.90673828125, 4.05072021484375, 4.1947021484375, 4.33868408203125, 4.482666015625, 4.62664794921875, 4.7706298828125, 4.91461181640625, 5.05859375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 8.0, 11.0, 9.0, 6.0, 5.0, 12.0, 13.0, 19.0, 26.0, 25.0, 21.0, 24.0, 32.0, 43.0, 33.0, 34.0, 36.0, 43.0, 50.0, 39.0, 48.0, 38.0, 35.0, 48.0, 34.0, 35.0, 38.0, 31.0, 29.0, 27.0, 29.0, 19.0, 17.0, 18.0, 12.0, 11.0, 6.0, 12.0, 8.0, 6.0, 5.0, 5.0, 2.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-19.328125, -18.7626953125, -18.197265625, -17.6318359375, -17.06640625, -16.5009765625, -15.935546875, -15.3701171875, -14.8046875, -14.2392578125, -13.673828125, -13.1083984375, -12.54296875, -11.9775390625, -11.412109375, -10.8466796875, -10.28125, -9.7158203125, -9.150390625, -8.5849609375, -8.01953125, -7.4541015625, -6.888671875, -6.3232421875, -5.7578125, -5.1923828125, -4.626953125, -4.0615234375, -3.49609375, -2.9306640625, -2.365234375, -1.7998046875, -1.234375, -0.6689453125, -0.103515625, 0.4619140625, 1.02734375, 1.5927734375, 2.158203125, 2.7236328125, 3.2890625, 3.8544921875, 4.419921875, 4.9853515625, 5.55078125, 6.1162109375, 6.681640625, 7.2470703125, 7.8125, 8.3779296875, 8.943359375, 9.5087890625, 10.07421875, 10.6396484375, 11.205078125, 11.7705078125, 12.3359375, 12.9013671875, 13.466796875, 14.0322265625, 14.59765625, 15.1630859375, 15.728515625, 16.2939453125, 16.859375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 7.0, 7.0, 21.0, 12.0, 18.0, 36.0, 63.0, 78.0, 131.0, 225.0, 326.0, 495.0, 875.0, 1364.0, 2166.0, 3785.0, 6245.0, 10792.0, 18143.0, 30383.0, 49797.0, 77139.0, 111102.0, 142689.0, 156261.0, 140093.0, 106533.0, 72995.0, 46476.0, 28537.0, 17256.0, 9923.0, 5731.0, 3473.0, 2057.0, 1311.0, 766.0, 464.0, 282.0, 184.0, 108.0, 73.0, 52.0, 25.0, 28.0, 10.0, 11.0, 7.0, 6.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.134765625, -3.035064697265625, -2.93536376953125, -2.835662841796875, -2.7359619140625, -2.636260986328125, -2.53656005859375, -2.436859130859375, -2.337158203125, -2.237457275390625, -2.13775634765625, -2.038055419921875, -1.9383544921875, -1.838653564453125, -1.73895263671875, -1.639251708984375, -1.53955078125, -1.439849853515625, -1.34014892578125, -1.240447998046875, -1.1407470703125, -1.041046142578125, -0.94134521484375, -0.841644287109375, -0.741943359375, -0.642242431640625, -0.54254150390625, -0.442840576171875, -0.3431396484375, -0.243438720703125, -0.14373779296875, -0.044036865234375, 0.0556640625, 0.155364990234375, 0.25506591796875, 0.354766845703125, 0.4544677734375, 0.554168701171875, 0.65386962890625, 0.753570556640625, 0.853271484375, 0.952972412109375, 1.05267333984375, 1.152374267578125, 1.2520751953125, 1.351776123046875, 1.45147705078125, 1.551177978515625, 1.65087890625, 1.750579833984375, 1.85028076171875, 1.949981689453125, 2.0496826171875, 2.149383544921875, 2.24908447265625, 2.348785400390625, 2.448486328125, 2.548187255859375, 2.64788818359375, 2.747589111328125, 2.8472900390625, 2.946990966796875, 3.04669189453125, 3.146392822265625, 3.24609375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 6.0, 9.0, 7.0, 9.0, 8.0, 9.0, 12.0, 12.0, 13.0, 17.0, 16.0, 19.0, 26.0, 21.0, 35.0, 28.0, 27.0, 47.0, 41.0, 25.0, 36.0, 53.0, 42.0, 34.0, 36.0, 34.0, 34.0, 34.0, 22.0, 43.0, 29.0, 29.0, 24.0, 22.0, 24.0, 27.0, 21.0, 16.0, 18.0, 9.0, 7.0, 2.0, 5.0, 4.0, 2.0, 2.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.6796875, -11.3209228515625, -10.962158203125, -10.6033935546875, -10.24462890625, -9.8858642578125, -9.527099609375, -9.1683349609375, -8.8095703125, -8.4508056640625, -8.092041015625, -7.7332763671875, -7.37451171875, -7.0157470703125, -6.656982421875, -6.2982177734375, -5.939453125, -5.5806884765625, -5.221923828125, -4.8631591796875, -4.50439453125, -4.1456298828125, -3.786865234375, -3.4281005859375, -3.0693359375, -2.7105712890625, -2.351806640625, -1.9930419921875, -1.63427734375, -1.2755126953125, -0.916748046875, -0.5579833984375, -0.19921875, 0.1595458984375, 0.518310546875, 0.8770751953125, 1.23583984375, 1.5946044921875, 1.953369140625, 2.3121337890625, 2.6708984375, 3.0296630859375, 3.388427734375, 3.7471923828125, 4.10595703125, 4.4647216796875, 4.823486328125, 5.1822509765625, 5.541015625, 5.8997802734375, 6.258544921875, 6.6173095703125, 6.97607421875, 7.3348388671875, 7.693603515625, 8.0523681640625, 8.4111328125, 8.7698974609375, 9.128662109375, 9.4874267578125, 9.84619140625, 10.2049560546875, 10.563720703125, 10.9224853515625, 11.28125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 6.0, 2.0, 5.0, 14.0, 9.0, 20.0, 27.0, 31.0, 48.0, 71.0, 127.0, 182.0, 263.0, 423.0, 604.0, 1017.0, 1510.0, 2443.0, 4025.0, 6733.0, 11698.0, 21043.0, 40164.0, 78118.0, 145912.0, 228209.0, 218778.0, 134157.0, 70498.0, 36620.0, 18931.0, 10819.0, 6189.0, 3563.0, 2220.0, 1486.0, 866.0, 607.0, 378.0, 268.0, 160.0, 114.0, 64.0, 49.0, 37.0, 16.0, 18.0, 8.0, 7.0, 8.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69873046875, -0.6727828979492188, -0.6468353271484375, -0.6208877563476562, -0.594940185546875, -0.5689926147460938, -0.5430450439453125, -0.5170974731445312, -0.49114990234375, -0.46520233154296875, -0.4392547607421875, -0.41330718994140625, -0.387359619140625, -0.36141204833984375, -0.3354644775390625, -0.30951690673828125, -0.2835693359375, -0.25762176513671875, -0.2316741943359375, -0.20572662353515625, -0.179779052734375, -0.15383148193359375, -0.1278839111328125, -0.10193634033203125, -0.07598876953125, -0.05004119873046875, -0.0240936279296875, 0.00185394287109375, 0.027801513671875, 0.05374908447265625, 0.0796966552734375, 0.10564422607421875, 0.131591796875, 0.15753936767578125, 0.1834869384765625, 0.20943450927734375, 0.235382080078125, 0.26132965087890625, 0.2872772216796875, 0.31322479248046875, 0.33917236328125, 0.36511993408203125, 0.3910675048828125, 0.41701507568359375, 0.442962646484375, 0.46891021728515625, 0.4948577880859375, 0.5208053588867188, 0.5467529296875, 0.5727005004882812, 0.5986480712890625, 0.6245956420898438, 0.650543212890625, 0.6764907836914062, 0.7024383544921875, 0.7283859252929688, 0.75433349609375, 0.7802810668945312, 0.8062286376953125, 0.8321762084960938, 0.858123779296875, 0.8840713500976562, 0.9100189208984375, 0.9359664916992188, 0.9619140625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 8.0, 3.0, 5.0, 13.0, 21.0, 16.0, 17.0, 23.0, 35.0, 37.0, 51.0, 67.0, 85.0, 87.0, 95.0, 85.0, 73.0, 64.0, 54.0, 44.0, 36.0, 19.0, 14.0, 15.0, 11.0, 4.0, 10.0, 5.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00024247169494628906, -0.00023613683879375458, -0.0002298019826412201, -0.0002234671264886856, -0.00021713227033615112, -0.00021079741418361664, -0.00020446255803108215, -0.00019812770187854767, -0.00019179284572601318, -0.0001854579895734787, -0.00017912313342094421, -0.00017278827726840973, -0.00016645342111587524, -0.00016011856496334076, -0.00015378370881080627, -0.0001474488526582718, -0.0001411139965057373, -0.00013477914035320282, -0.00012844428420066833, -0.00012210942804813385, -0.00011577457189559937, -0.00010943971574306488, -0.0001031048595905304, -9.677000343799591e-05, -9.043514728546143e-05, -8.410029113292694e-05, -7.776543498039246e-05, -7.143057882785797e-05, -6.509572267532349e-05, -5.8760866522789e-05, -5.2426010370254517e-05, -4.609115421772003e-05, -3.975629806518555e-05, -3.342144191265106e-05, -2.7086585760116577e-05, -2.0751729607582092e-05, -1.4416873455047607e-05, -8.082017302513123e-06, -1.7471611499786377e-06, 4.587695002555847e-06, 1.0922551155090332e-05, 1.7257407307624817e-05, 2.3592263460159302e-05, 2.9927119612693787e-05, 3.626197576522827e-05, 4.2596831917762756e-05, 4.893168807029724e-05, 5.5266544222831726e-05, 6.160140037536621e-05, 6.79362565279007e-05, 7.427111268043518e-05, 8.060596883296967e-05, 8.694082498550415e-05, 9.327568113803864e-05, 9.961053729057312e-05, 0.0001059453934431076, 0.00011228024959564209, 0.00011861510574817657, 0.00012494996190071106, 0.00013128481805324554, 0.00013761967420578003, 0.00014395453035831451, 0.000150289386510849, 0.00015662424266338348, 0.00016295909881591797]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 7.0, 9.0, 15.0, 21.0, 36.0, 52.0, 61.0, 124.0, 187.0, 353.0, 622.0, 812.0, 1386.0, 2137.0, 3474.0, 5448.0, 8643.0, 13793.0, 21741.0, 34838.0, 54314.0, 84622.0, 125523.0, 163853.0, 165207.0, 126360.0, 85461.0, 55283.0, 34866.0, 22068.0, 13750.0, 8504.0, 5615.0, 3478.0, 2220.0, 1377.0, 898.0, 521.0, 335.0, 205.0, 129.0, 83.0, 56.0, 33.0, 23.0, 12.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2001953125, -1.1602020263671875, -1.120208740234375, -1.0802154541015625, -1.04022216796875, -1.0002288818359375, -0.960235595703125, -0.9202423095703125, -0.8802490234375, -0.8402557373046875, -0.800262451171875, -0.7602691650390625, -0.72027587890625, -0.6802825927734375, -0.640289306640625, -0.6002960205078125, -0.560302734375, -0.5203094482421875, -0.480316162109375, -0.4403228759765625, -0.40032958984375, -0.3603363037109375, -0.320343017578125, -0.2803497314453125, -0.2403564453125, -0.2003631591796875, -0.160369873046875, -0.1203765869140625, -0.08038330078125, -0.0403900146484375, -0.000396728515625, 0.0395965576171875, 0.07958984375, 0.1195831298828125, 0.159576416015625, 0.1995697021484375, 0.23956298828125, 0.2795562744140625, 0.319549560546875, 0.3595428466796875, 0.3995361328125, 0.4395294189453125, 0.479522705078125, 0.5195159912109375, 0.55950927734375, 0.5995025634765625, 0.639495849609375, 0.6794891357421875, 0.719482421875, 0.7594757080078125, 0.799468994140625, 0.8394622802734375, 0.87945556640625, 0.9194488525390625, 0.959442138671875, 0.9994354248046875, 1.0394287109375, 1.0794219970703125, 1.119415283203125, 1.1594085693359375, 1.19940185546875, 1.2393951416015625, 1.279388427734375, 1.3193817138671875, 1.359375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 4.0, 6.0, 3.0, 9.0, 7.0, 2.0, 6.0, 14.0, 21.0, 14.0, 22.0, 20.0, 37.0, 32.0, 36.0, 37.0, 41.0, 41.0, 47.0, 56.0, 60.0, 55.0, 50.0, 52.0, 46.0, 37.0, 43.0, 27.0, 29.0, 21.0, 25.0, 16.0, 14.0, 6.0, 15.0, 3.0, 10.0, 10.0, 2.0, 7.0, 4.0, 2.0, 2.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.5283203125, -0.5117645263671875, -0.495208740234375, -0.4786529541015625, -0.46209716796875, -0.4455413818359375, -0.428985595703125, -0.4124298095703125, -0.3958740234375, -0.3793182373046875, -0.362762451171875, -0.3462066650390625, -0.32965087890625, -0.3130950927734375, -0.296539306640625, -0.2799835205078125, -0.263427734375, -0.2468719482421875, -0.230316162109375, -0.2137603759765625, -0.19720458984375, -0.1806488037109375, -0.164093017578125, -0.1475372314453125, -0.1309814453125, -0.1144256591796875, -0.097869873046875, -0.0813140869140625, -0.06475830078125, -0.0482025146484375, -0.031646728515625, -0.0150909423828125, 0.00146484375, 0.0180206298828125, 0.034576416015625, 0.0511322021484375, 0.06768798828125, 0.0842437744140625, 0.100799560546875, 0.1173553466796875, 0.1339111328125, 0.1504669189453125, 0.167022705078125, 0.1835784912109375, 0.20013427734375, 0.2166900634765625, 0.233245849609375, 0.2498016357421875, 0.266357421875, 0.2829132080078125, 0.299468994140625, 0.3160247802734375, 0.33258056640625, 0.3491363525390625, 0.365692138671875, 0.3822479248046875, 0.3988037109375, 0.4153594970703125, 0.431915283203125, 0.4484710693359375, 0.46502685546875, 0.4815826416015625, 0.498138427734375, 0.5146942138671875, 0.53125]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 7.0, 7.0, 11.0, 11.0, 12.0, 17.0, 19.0, 17.0, 15.0, 28.0, 34.0, 24.0, 51.0, 39.0, 49.0, 51.0, 38.0, 61.0, 58.0, 51.0, 36.0, 38.0, 31.0, 40.0, 40.0, 32.0, 29.0, 33.0, 25.0, 15.0, 15.0, 14.0, 13.0, 8.0, 4.0, 8.0, 8.0, 2.0, 0.0, 6.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.565869331359863, -13.09119701385498, -12.616525650024414, -12.141853332519531, -11.667181968688965, -11.192509651184082, -10.717838287353516, -10.243165969848633, -9.76849365234375, -9.293821334838867, -8.8191499710083, -8.344477653503418, -7.869806289672852, -7.395133972167969, -6.920462131500244, -6.4457902908325195, -5.971118927001953, -5.4964470863342285, -5.021775245666504, -4.547102928161621, -4.072431564331055, -3.597759485244751, -3.1230874061584473, -2.6484155654907227, -2.173743724822998, -1.6990718841552734, -1.2243999242782593, -0.7497279644012451, -0.2750561237335205, 0.1996157169342041, 0.6742877960205078, 1.1489596366882324, 1.6236305236816406, 2.0983023643493652, 2.57297420501709, 3.0476462841033936, 3.522318124771118, 3.9969899654388428, 4.4716620445251465, 4.946333885192871, 5.421005725860596, 5.89567756652832, 6.370349407196045, 6.8450212478637695, 7.319693565368652, 7.794364929199219, 8.269037246704102, 8.743709564208984, 9.21838092803955, 9.693053245544434, 10.167724609375, 10.642396926879883, 11.11706829071045, 11.591740608215332, 12.066411972045898, 12.541084289550781, 13.015756607055664, 13.490428924560547, 13.965100288391113, 14.439772605895996, 14.914443969726562, 15.389116287231445, 15.863788604736328, 16.338459014892578, 16.81313133239746]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 5.0, 9.0, 3.0, 9.0, 9.0, 15.0, 12.0, 14.0, 19.0, 22.0, 25.0, 26.0, 41.0, 26.0, 32.0, 34.0, 37.0, 35.0, 41.0, 42.0, 47.0, 52.0, 38.0, 56.0, 31.0, 34.0, 30.0, 39.0, 33.0, 30.0, 22.0, 30.0, 22.0, 17.0, 12.0, 10.0, 9.0, 6.0, 7.0, 4.0, 8.0, 7.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.25825309753418, -17.699724197387695, -17.141193389892578, -16.582664489746094, -16.02413558959961, -15.465606689453125, -14.907076835632324, -14.348546981811523, -13.790018081665039, -13.231489181518555, -12.672959327697754, -12.114429473876953, -11.555900573730469, -10.997371673583984, -10.438841819763184, -9.880311965942383, -9.321783065795898, -8.763254165649414, -8.204724311828613, -7.646194934844971, -7.087665557861328, -6.5291361808776855, -5.970606803894043, -5.4120774269104, -4.853548049926758, -4.295018672943115, -3.7364892959594727, -3.17795991897583, -2.6194305419921875, -2.060901165008545, -1.5023717880249023, -0.9438424110412598, -0.3853111267089844, 0.1732182502746582, 0.7317476272583008, 1.2902770042419434, 1.848806381225586, 2.4073357582092285, 2.965865135192871, 3.5243945121765137, 4.082923889160156, 4.641453266143799, 5.199982643127441, 5.758512020111084, 6.317041397094727, 6.875570774078369, 7.434100151062012, 7.992629528045654, 8.551158905029297, 9.109687805175781, 9.668217658996582, 10.226747512817383, 10.785276412963867, 11.343805313110352, 11.902335166931152, 12.460865020751953, 13.019393920898438, 13.577922821044922, 14.136452674865723, 14.694982528686523, 15.253511428833008, 15.812040328979492, 16.37057113647461, 16.929100036621094, 17.487628936767578]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 7.0, 6.0, 6.0, 8.0, 21.0, 32.0, 54.0, 70.0, 95.0, 177.0, 293.0, 429.0, 688.0, 1051.0, 1625.0, 2480.0, 3780.0, 5446.0, 8160.0, 12098.0, 17008.0, 23679.0, 32461.0, 42735.0, 54988.0, 67524.0, 79137.0, 87392.0, 91795.0, 90766.0, 86059.0, 76744.0, 65102.0, 52884.0, 41025.0, 30543.0, 22416.0, 16027.0, 11205.0, 7636.0, 5110.0, 3463.0, 2196.0, 1453.0, 953.0, 640.0, 363.0, 254.0, 170.0, 98.0, 76.0, 55.0, 38.0, 14.0, 14.0, 5.0, 5.0, 6.0, 1.0, 1.0, 1.0], "bins": [-9.3515625, -9.0584716796875, -8.765380859375, -8.4722900390625, -8.17919921875, -7.8861083984375, -7.593017578125, -7.2999267578125, -7.0068359375, -6.7137451171875, -6.420654296875, -6.1275634765625, -5.83447265625, -5.5413818359375, -5.248291015625, -4.9552001953125, -4.662109375, -4.3690185546875, -4.075927734375, -3.7828369140625, -3.48974609375, -3.1966552734375, -2.903564453125, -2.6104736328125, -2.3173828125, -2.0242919921875, -1.731201171875, -1.4381103515625, -1.14501953125, -0.8519287109375, -0.558837890625, -0.2657470703125, 0.02734375, 0.3204345703125, 0.613525390625, 0.9066162109375, 1.19970703125, 1.4927978515625, 1.785888671875, 2.0789794921875, 2.3720703125, 2.6651611328125, 2.958251953125, 3.2513427734375, 3.54443359375, 3.8375244140625, 4.130615234375, 4.4237060546875, 4.716796875, 5.0098876953125, 5.302978515625, 5.5960693359375, 5.88916015625, 6.1822509765625, 6.475341796875, 6.7684326171875, 7.0615234375, 7.3546142578125, 7.647705078125, 7.9407958984375, 8.23388671875, 8.5269775390625, 8.820068359375, 9.1131591796875, 9.40625]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 6.0, 5.0, 9.0, 6.0, 12.0, 16.0, 11.0, 18.0, 16.0, 20.0, 35.0, 29.0, 35.0, 35.0, 35.0, 42.0, 44.0, 35.0, 42.0, 47.0, 39.0, 44.0, 59.0, 42.0, 30.0, 34.0, 34.0, 29.0, 31.0, 28.0, 28.0, 19.0, 19.0, 12.0, 5.0, 13.0, 10.0, 6.0, 7.0, 5.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-17.78125, -17.221923828125, -16.66259765625, -16.103271484375, -15.5439453125, -14.984619140625, -14.42529296875, -13.865966796875, -13.306640625, -12.747314453125, -12.18798828125, -11.628662109375, -11.0693359375, -10.510009765625, -9.95068359375, -9.391357421875, -8.83203125, -8.272705078125, -7.71337890625, -7.154052734375, -6.5947265625, -6.035400390625, -5.47607421875, -4.916748046875, -4.357421875, -3.798095703125, -3.23876953125, -2.679443359375, -2.1201171875, -1.560791015625, -1.00146484375, -0.442138671875, 0.1171875, 0.676513671875, 1.23583984375, 1.795166015625, 2.3544921875, 2.913818359375, 3.47314453125, 4.032470703125, 4.591796875, 5.151123046875, 5.71044921875, 6.269775390625, 6.8291015625, 7.388427734375, 7.94775390625, 8.507080078125, 9.06640625, 9.625732421875, 10.18505859375, 10.744384765625, 11.3037109375, 11.863037109375, 12.42236328125, 12.981689453125, 13.541015625, 14.100341796875, 14.65966796875, 15.218994140625, 15.7783203125, 16.337646484375, 16.89697265625, 17.456298828125, 18.015625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 2.0, 6.0, 5.0, 17.0, 18.0, 28.0, 46.0, 84.0, 119.0, 183.0, 305.0, 483.0, 757.0, 1301.0, 2020.0, 3259.0, 5061.0, 8079.0, 12318.0, 18776.0, 27914.0, 39742.0, 55232.0, 71225.0, 88326.0, 101776.0, 108186.0, 106336.0, 96791.0, 81818.0, 65911.0, 48388.0, 34845.0, 23994.0, 16271.0, 10543.0, 6730.0, 4432.0, 2793.0, 1672.0, 1050.0, 706.0, 400.0, 247.0, 134.0, 74.0, 64.0, 38.0, 19.0, 17.0, 8.0, 5.0, 6.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.0234375, -10.6656494140625, -10.307861328125, -9.9500732421875, -9.59228515625, -9.2344970703125, -8.876708984375, -8.5189208984375, -8.1611328125, -7.8033447265625, -7.445556640625, -7.0877685546875, -6.72998046875, -6.3721923828125, -6.014404296875, -5.6566162109375, -5.298828125, -4.9410400390625, -4.583251953125, -4.2254638671875, -3.86767578125, -3.5098876953125, -3.152099609375, -2.7943115234375, -2.4365234375, -2.0787353515625, -1.720947265625, -1.3631591796875, -1.00537109375, -0.6475830078125, -0.289794921875, 0.0679931640625, 0.42578125, 0.7835693359375, 1.141357421875, 1.4991455078125, 1.85693359375, 2.2147216796875, 2.572509765625, 2.9302978515625, 3.2880859375, 3.6458740234375, 4.003662109375, 4.3614501953125, 4.71923828125, 5.0770263671875, 5.434814453125, 5.7926025390625, 6.150390625, 6.5081787109375, 6.865966796875, 7.2237548828125, 7.58154296875, 7.9393310546875, 8.297119140625, 8.6549072265625, 9.0126953125, 9.3704833984375, 9.728271484375, 10.0860595703125, 10.44384765625, 10.8016357421875, 11.159423828125, 11.5172119140625, 11.875]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 7.0, 9.0, 13.0, 5.0, 11.0, 14.0, 15.0, 14.0, 15.0, 17.0, 28.0, 36.0, 20.0, 34.0, 46.0, 48.0, 32.0, 52.0, 40.0, 46.0, 32.0, 50.0, 36.0, 46.0, 34.0, 37.0, 36.0, 37.0, 27.0, 21.0, 20.0, 22.0, 15.0, 12.0, 14.0, 17.0, 12.0, 4.0, 9.0, 10.0, 3.0, 4.0, 4.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.4921875, -11.1280517578125, -10.763916015625, -10.3997802734375, -10.03564453125, -9.6715087890625, -9.307373046875, -8.9432373046875, -8.5791015625, -8.2149658203125, -7.850830078125, -7.4866943359375, -7.12255859375, -6.7584228515625, -6.394287109375, -6.0301513671875, -5.666015625, -5.3018798828125, -4.937744140625, -4.5736083984375, -4.20947265625, -3.8453369140625, -3.481201171875, -3.1170654296875, -2.7529296875, -2.3887939453125, -2.024658203125, -1.6605224609375, -1.29638671875, -0.9322509765625, -0.568115234375, -0.2039794921875, 0.16015625, 0.5242919921875, 0.888427734375, 1.2525634765625, 1.61669921875, 1.9808349609375, 2.344970703125, 2.7091064453125, 3.0732421875, 3.4373779296875, 3.801513671875, 4.1656494140625, 4.52978515625, 4.8939208984375, 5.258056640625, 5.6221923828125, 5.986328125, 6.3504638671875, 6.714599609375, 7.0787353515625, 7.44287109375, 7.8070068359375, 8.171142578125, 8.5352783203125, 8.8994140625, 9.2635498046875, 9.627685546875, 9.9918212890625, 10.35595703125, 10.7200927734375, 11.084228515625, 11.4483642578125, 11.8125]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 12.0, 8.0, 15.0, 15.0, 21.0, 39.0, 71.0, 100.0, 181.0, 245.0, 456.0, 651.0, 1122.0, 1905.0, 3098.0, 5236.0, 8348.0, 14203.0, 23137.0, 37859.0, 58725.0, 85977.0, 114871.0, 135375.0, 139338.0, 125610.0, 99753.0, 71130.0, 46994.0, 29229.0, 17724.0, 10679.0, 6405.0, 3939.0, 2355.0, 1406.0, 873.0, 567.0, 337.0, 220.0, 137.0, 69.0, 53.0, 31.0, 15.0, 13.0, 8.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.1328125, -4.97357177734375, -4.8143310546875, -4.65509033203125, -4.495849609375, -4.33660888671875, -4.1773681640625, -4.01812744140625, -3.85888671875, -3.69964599609375, -3.5404052734375, -3.38116455078125, -3.221923828125, -3.06268310546875, -2.9034423828125, -2.74420166015625, -2.5849609375, -2.42572021484375, -2.2664794921875, -2.10723876953125, -1.947998046875, -1.78875732421875, -1.6295166015625, -1.47027587890625, -1.31103515625, -1.15179443359375, -0.9925537109375, -0.83331298828125, -0.674072265625, -0.51483154296875, -0.3555908203125, -0.19635009765625, -0.037109375, 0.12213134765625, 0.2813720703125, 0.44061279296875, 0.599853515625, 0.75909423828125, 0.9183349609375, 1.07757568359375, 1.23681640625, 1.39605712890625, 1.5552978515625, 1.71453857421875, 1.873779296875, 2.03302001953125, 2.1922607421875, 2.35150146484375, 2.5107421875, 2.66998291015625, 2.8292236328125, 2.98846435546875, 3.147705078125, 3.30694580078125, 3.4661865234375, 3.62542724609375, 3.78466796875, 3.94390869140625, 4.1031494140625, 4.26239013671875, 4.421630859375, 4.58087158203125, 4.7401123046875, 4.89935302734375, 5.05859375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 6.0, 3.0, 4.0, 8.0, 6.0, 15.0, 17.0, 14.0, 14.0, 32.0, 33.0, 29.0, 33.0, 32.0, 37.0, 48.0, 50.0, 71.0, 40.0, 46.0, 55.0, 53.0, 56.0, 45.0, 42.0, 36.0, 27.0, 32.0, 25.0, 17.0, 16.0, 15.0, 14.0, 11.0, 5.0, 4.0, 6.0, 3.0, 1.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.000614166259765625, -0.0005970895290374756, -0.0005800127983093262, -0.0005629360675811768, -0.0005458593368530273, -0.0005287826061248779, -0.0005117058753967285, -0.0004946291446685791, -0.0004775524139404297, -0.0004604756832122803, -0.00044339895248413086, -0.00042632222175598145, -0.00040924549102783203, -0.0003921687602996826, -0.0003750920295715332, -0.0003580152988433838, -0.0003409385681152344, -0.00032386183738708496, -0.00030678510665893555, -0.00028970837593078613, -0.0002726316452026367, -0.0002555549144744873, -0.0002384781837463379, -0.00022140145301818848, -0.00020432472229003906, -0.00018724799156188965, -0.00017017126083374023, -0.00015309453010559082, -0.0001360177993774414, -0.00011894106864929199, -0.00010186433792114258, -8.478760719299316e-05, -6.771087646484375e-05, -5.0634145736694336e-05, -3.355741500854492e-05, -1.6480684280395508e-05, 5.960464477539062e-07, 1.767277717590332e-05, 3.4749507904052734e-05, 5.182623863220215e-05, 6.890296936035156e-05, 8.597970008850098e-05, 0.00010305643081665039, 0.0001201331615447998, 0.00013720989227294922, 0.00015428662300109863, 0.00017136335372924805, 0.00018844008445739746, 0.00020551681518554688, 0.0002225935459136963, 0.0002396702766418457, 0.0002567470073699951, 0.00027382373809814453, 0.00029090046882629395, 0.00030797719955444336, 0.0003250539302825928, 0.0003421306610107422, 0.0003592073917388916, 0.000376284122467041, 0.00039336085319519043, 0.00041043758392333984, 0.00042751431465148926, 0.00044459104537963867, 0.0004616677761077881, 0.0004787445068359375]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 9.0, 11.0, 20.0, 24.0, 37.0, 52.0, 92.0, 119.0, 168.0, 259.0, 379.0, 569.0, 868.0, 1260.0, 1901.0, 2976.0, 4717.0, 7334.0, 11498.0, 17746.0, 27259.0, 40781.0, 59544.0, 81876.0, 105063.0, 121662.0, 125908.0, 116185.0, 96307.0, 72984.0, 51461.0, 34769.0, 22899.0, 14741.0, 9496.0, 6150.0, 3877.0, 2466.0, 1728.0, 1065.0, 745.0, 553.0, 317.0, 240.0, 138.0, 95.0, 80.0, 45.0, 34.0, 12.0, 22.0, 8.0, 5.0, 4.0, 2.0, 0.0, 0.0, 2.0], "bins": [-4.84375, -4.69378662109375, -4.5438232421875, -4.39385986328125, -4.243896484375, -4.09393310546875, -3.9439697265625, -3.79400634765625, -3.64404296875, -3.49407958984375, -3.3441162109375, -3.19415283203125, -3.044189453125, -2.89422607421875, -2.7442626953125, -2.59429931640625, -2.4443359375, -2.29437255859375, -2.1444091796875, -1.99444580078125, -1.844482421875, -1.69451904296875, -1.5445556640625, -1.39459228515625, -1.24462890625, -1.09466552734375, -0.9447021484375, -0.79473876953125, -0.644775390625, -0.49481201171875, -0.3448486328125, -0.19488525390625, -0.044921875, 0.10504150390625, 0.2550048828125, 0.40496826171875, 0.554931640625, 0.70489501953125, 0.8548583984375, 1.00482177734375, 1.15478515625, 1.30474853515625, 1.4547119140625, 1.60467529296875, 1.754638671875, 1.90460205078125, 2.0545654296875, 2.20452880859375, 2.3544921875, 2.50445556640625, 2.6544189453125, 2.80438232421875, 2.954345703125, 3.10430908203125, 3.2542724609375, 3.40423583984375, 3.55419921875, 3.70416259765625, 3.8541259765625, 4.00408935546875, 4.154052734375, 4.30401611328125, 4.4539794921875, 4.60394287109375, 4.75390625]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 5.0, 6.0, 2.0, 9.0, 7.0, 7.0, 11.0, 15.0, 17.0, 12.0, 21.0, 20.0, 34.0, 31.0, 28.0, 43.0, 49.0, 53.0, 52.0, 41.0, 69.0, 46.0, 59.0, 43.0, 53.0, 41.0, 32.0, 29.0, 20.0, 21.0, 21.0, 20.0, 12.0, 14.0, 14.0, 5.0, 12.0, 6.0, 4.0, 4.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.310546875, -2.2391357421875, -2.167724609375, -2.0963134765625, -2.02490234375, -1.9534912109375, -1.882080078125, -1.8106689453125, -1.7392578125, -1.6678466796875, -1.596435546875, -1.5250244140625, -1.45361328125, -1.3822021484375, -1.310791015625, -1.2393798828125, -1.16796875, -1.0965576171875, -1.025146484375, -0.9537353515625, -0.88232421875, -0.8109130859375, -0.739501953125, -0.6680908203125, -0.5966796875, -0.5252685546875, -0.453857421875, -0.3824462890625, -0.31103515625, -0.2396240234375, -0.168212890625, -0.0968017578125, -0.025390625, 0.0460205078125, 0.117431640625, 0.1888427734375, 0.26025390625, 0.3316650390625, 0.403076171875, 0.4744873046875, 0.5458984375, 0.6173095703125, 0.688720703125, 0.7601318359375, 0.83154296875, 0.9029541015625, 0.974365234375, 1.0457763671875, 1.1171875, 1.1885986328125, 1.260009765625, 1.3314208984375, 1.40283203125, 1.4742431640625, 1.545654296875, 1.6170654296875, 1.6884765625, 1.7598876953125, 1.831298828125, 1.9027099609375, 1.97412109375, 2.0455322265625, 2.116943359375, 2.1883544921875, 2.259765625]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 1.0, 8.0, 5.0, 7.0, 11.0, 15.0, 17.0, 16.0, 22.0, 22.0, 32.0, 32.0, 34.0, 43.0, 41.0, 37.0, 48.0, 49.0, 44.0, 48.0, 38.0, 42.0, 45.0, 40.0, 38.0, 44.0, 31.0, 29.0, 20.0, 26.0, 25.0, 21.0, 13.0, 8.0, 17.0, 5.0, 8.0, 3.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-14.452465057373047, -13.994357109069824, -13.536249160766602, -13.078141212463379, -12.620033264160156, -12.16192626953125, -11.703817367553711, -11.245710372924805, -10.787602424621582, -10.32949447631836, -9.871386528015137, -9.413278579711914, -8.955170631408691, -8.497062683105469, -8.038955688476562, -7.58084774017334, -7.122739315032959, -6.664631366729736, -6.206523418426514, -5.748415946960449, -5.290307998657227, -4.832200050354004, -4.374092102050781, -3.9159843921661377, -3.457876443862915, -2.9997684955596924, -2.541660785675049, -2.083552837371826, -1.625445008277893, -1.16733717918396, -0.7092292308807373, -0.25112152099609375, 0.2069864273071289, 0.665094256401062, 1.1232020854949951, 1.5813100337982178, 2.0394177436828613, 2.497525691986084, 2.9556336402893066, 3.41374135017395, 3.871849298477173, 4.329957008361816, 4.788064956665039, 5.246172904968262, 5.704280853271484, 6.162388801574707, 6.62049674987793, 7.078604221343994, 7.536712169647217, 7.9948201179504395, 8.452927589416504, 8.911035537719727, 9.36914348602295, 9.827251434326172, 10.285359382629395, 10.743467330932617, 11.20157527923584, 11.659683227539062, 12.117791175842285, 12.575899124145508, 13.03400707244873, 13.492115020751953, 13.95022201538086, 14.408329963684082, 14.866437911987305]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 4.0, 3.0, 0.0, 2.0, 2.0, 4.0, 2.0, 6.0, 1.0, 3.0, 2.0, 6.0, 18.0, 14.0, 11.0, 10.0, 17.0, 9.0, 18.0, 20.0, 22.0, 29.0, 25.0, 31.0, 31.0, 39.0, 26.0, 37.0, 33.0, 30.0, 34.0, 42.0, 40.0, 25.0, 41.0, 26.0, 26.0, 36.0, 28.0, 34.0, 32.0, 24.0, 24.0, 22.0, 24.0, 14.0, 16.0, 14.0, 11.0, 8.0, 13.0, 10.0, 2.0, 5.0, 3.0, 5.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-16.794418334960938, -16.277511596679688, -15.76060676574707, -15.24370002746582, -14.726794242858887, -14.209888458251953, -13.69298267364502, -13.176076889038086, -12.659170150756836, -12.142264366149902, -11.625358581542969, -11.108451843261719, -10.591546058654785, -10.074640274047852, -9.557734489440918, -9.040828704833984, -8.52392292022705, -8.007017135620117, -7.490110874176025, -6.973205089569092, -6.456298828125, -5.939393043518066, -5.422487258911133, -4.905581474304199, -4.388675212860107, -3.8717691898345947, -3.354863166809082, -2.8379573822021484, -2.3210513591766357, -1.804145336151123, -1.2872395515441895, -0.7703335285186768, -0.25342750549316406, 0.26347845792770386, 0.7803844213485718, 1.297290325164795, 1.8141963481903076, 2.3311023712158203, 2.848008155822754, 3.3649141788482666, 3.8818202018737793, 4.398725986480713, 4.915632247924805, 5.432538032531738, 5.949443817138672, 6.466350078582764, 6.983255863189697, 7.500162124633789, 8.017067909240723, 8.533973693847656, 9.05087947845459, 9.567785263061523, 10.084692001342773, 10.601597785949707, 11.11850357055664, 11.635409355163574, 12.152315139770508, 12.669220924377441, 13.186126708984375, 13.703033447265625, 14.219939231872559, 14.736845016479492, 15.253750801086426, 15.77065658569336, 16.28756332397461]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 5.0, 5.0, 10.0, 14.0, 24.0, 42.0, 80.0, 124.0, 176.0, 290.0, 468.0, 749.0, 1097.0, 1750.0, 2652.0, 4207.0, 6729.0, 10363.0, 16080.0, 25173.0, 38260.0, 58031.0, 87264.0, 126985.0, 180052.0, 243232.0, 316650.0, 382017.0, 429160.0, 441813.0, 419845.0, 365774.0, 298043.0, 227373.0, 165489.0, 115934.0, 79223.0, 52307.0, 34352.0, 22447.0, 14536.0, 9164.0, 6043.0, 3730.0, 2403.0, 1540.0, 953.0, 614.0, 381.0, 229.0, 151.0, 110.0, 49.0, 39.0, 20.0, 23.0, 11.0, 6.0, 6.0, 2.0], "bins": [-10.3984375, -10.0867919921875, -9.775146484375, -9.4635009765625, -9.15185546875, -8.8402099609375, -8.528564453125, -8.2169189453125, -7.9052734375, -7.5936279296875, -7.281982421875, -6.9703369140625, -6.65869140625, -6.3470458984375, -6.035400390625, -5.7237548828125, -5.412109375, -5.1004638671875, -4.788818359375, -4.4771728515625, -4.16552734375, -3.8538818359375, -3.542236328125, -3.2305908203125, -2.9189453125, -2.6072998046875, -2.295654296875, -1.9840087890625, -1.67236328125, -1.3607177734375, -1.049072265625, -0.7374267578125, -0.42578125, -0.1141357421875, 0.197509765625, 0.5091552734375, 0.82080078125, 1.1324462890625, 1.444091796875, 1.7557373046875, 2.0673828125, 2.3790283203125, 2.690673828125, 3.0023193359375, 3.31396484375, 3.6256103515625, 3.937255859375, 4.2489013671875, 4.560546875, 4.8721923828125, 5.183837890625, 5.4954833984375, 5.80712890625, 6.1187744140625, 6.430419921875, 6.7420654296875, 7.0537109375, 7.3653564453125, 7.677001953125, 7.9886474609375, 8.30029296875, 8.6119384765625, 8.923583984375, 9.2352294921875, 9.546875]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 3.0, 4.0, 3.0, 6.0, 4.0, 13.0, 5.0, 12.0, 14.0, 14.0, 13.0, 23.0, 20.0, 26.0, 32.0, 37.0, 40.0, 24.0, 40.0, 44.0, 38.0, 38.0, 40.0, 42.0, 40.0, 39.0, 27.0, 29.0, 50.0, 36.0, 30.0, 29.0, 21.0, 29.0, 26.0, 21.0, 25.0, 10.0, 15.0, 11.0, 4.0, 8.0, 6.0, 7.0, 4.0, 1.0, 2.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.0, -13.55029296875, -13.1005859375, -12.65087890625, -12.201171875, -11.75146484375, -11.3017578125, -10.85205078125, -10.40234375, -9.95263671875, -9.5029296875, -9.05322265625, -8.603515625, -8.15380859375, -7.7041015625, -7.25439453125, -6.8046875, -6.35498046875, -5.9052734375, -5.45556640625, -5.005859375, -4.55615234375, -4.1064453125, -3.65673828125, -3.20703125, -2.75732421875, -2.3076171875, -1.85791015625, -1.408203125, -0.95849609375, -0.5087890625, -0.05908203125, 0.390625, 0.84033203125, 1.2900390625, 1.73974609375, 2.189453125, 2.63916015625, 3.0888671875, 3.53857421875, 3.98828125, 4.43798828125, 4.8876953125, 5.33740234375, 5.787109375, 6.23681640625, 6.6865234375, 7.13623046875, 7.5859375, 8.03564453125, 8.4853515625, 8.93505859375, 9.384765625, 9.83447265625, 10.2841796875, 10.73388671875, 11.18359375, 11.63330078125, 12.0830078125, 12.53271484375, 12.982421875, 13.43212890625, 13.8818359375, 14.33154296875, 14.78125]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 13.0, 12.0, 31.0, 28.0, 64.0, 94.0, 158.0, 310.0, 478.0, 732.0, 1221.0, 1976.0, 3153.0, 4968.0, 7983.0, 12599.0, 19555.0, 30006.0, 45333.0, 67045.0, 96038.0, 134593.0, 180966.0, 233373.0, 289246.0, 339823.0, 374938.0, 390599.0, 381863.0, 352201.0, 305466.0, 250994.0, 196589.0, 146640.0, 105599.0, 74493.0, 50804.0, 33817.0, 21954.0, 14238.0, 9067.0, 5820.0, 3571.0, 2158.0, 1415.0, 875.0, 587.0, 329.0, 197.0, 108.0, 77.0, 28.0, 41.0, 12.0, 10.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.09375, -8.7969970703125, -8.500244140625, -8.2034912109375, -7.90673828125, -7.6099853515625, -7.313232421875, -7.0164794921875, -6.7197265625, -6.4229736328125, -6.126220703125, -5.8294677734375, -5.53271484375, -5.2359619140625, -4.939208984375, -4.6424560546875, -4.345703125, -4.0489501953125, -3.752197265625, -3.4554443359375, -3.15869140625, -2.8619384765625, -2.565185546875, -2.2684326171875, -1.9716796875, -1.6749267578125, -1.378173828125, -1.0814208984375, -0.78466796875, -0.4879150390625, -0.191162109375, 0.1055908203125, 0.40234375, 0.6990966796875, 0.995849609375, 1.2926025390625, 1.58935546875, 1.8861083984375, 2.182861328125, 2.4796142578125, 2.7763671875, 3.0731201171875, 3.369873046875, 3.6666259765625, 3.96337890625, 4.2601318359375, 4.556884765625, 4.8536376953125, 5.150390625, 5.4471435546875, 5.743896484375, 6.0406494140625, 6.33740234375, 6.6341552734375, 6.930908203125, 7.2276611328125, 7.5244140625, 7.8211669921875, 8.117919921875, 8.4146728515625, 8.71142578125, 9.0081787109375, 9.304931640625, 9.6016845703125, 9.8984375]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 0.0, 6.0, 7.0, 3.0, 4.0, 12.0, 8.0, 9.0, 19.0, 16.0, 27.0, 33.0, 43.0, 60.0, 60.0, 61.0, 85.0, 114.0, 118.0, 139.0, 163.0, 175.0, 169.0, 162.0, 185.0, 203.0, 195.0, 214.0, 203.0, 187.0, 194.0, 165.0, 173.0, 139.0, 127.0, 98.0, 97.0, 65.0, 61.0, 61.0, 37.0, 36.0, 29.0, 28.0, 25.0, 16.0, 17.0, 3.0, 11.0, 3.0, 5.0, 4.0, 4.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.8359375, -5.644775390625, -5.45361328125, -5.262451171875, -5.0712890625, -4.880126953125, -4.68896484375, -4.497802734375, -4.306640625, -4.115478515625, -3.92431640625, -3.733154296875, -3.5419921875, -3.350830078125, -3.15966796875, -2.968505859375, -2.77734375, -2.586181640625, -2.39501953125, -2.203857421875, -2.0126953125, -1.821533203125, -1.63037109375, -1.439208984375, -1.248046875, -1.056884765625, -0.86572265625, -0.674560546875, -0.4833984375, -0.292236328125, -0.10107421875, 0.090087890625, 0.28125, 0.472412109375, 0.66357421875, 0.854736328125, 1.0458984375, 1.237060546875, 1.42822265625, 1.619384765625, 1.810546875, 2.001708984375, 2.19287109375, 2.384033203125, 2.5751953125, 2.766357421875, 2.95751953125, 3.148681640625, 3.33984375, 3.531005859375, 3.72216796875, 3.913330078125, 4.1044921875, 4.295654296875, 4.48681640625, 4.677978515625, 4.869140625, 5.060302734375, 5.25146484375, 5.442626953125, 5.6337890625, 5.824951171875, 6.01611328125, 6.207275390625, 6.3984375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 9.0, 4.0, 3.0, 5.0, 15.0, 9.0, 11.0, 9.0, 16.0, 13.0, 19.0, 22.0, 30.0, 20.0, 34.0, 30.0, 34.0, 38.0, 35.0, 35.0, 47.0, 52.0, 50.0, 41.0, 44.0, 34.0, 31.0, 25.0, 34.0, 33.0, 26.0, 28.0, 22.0, 21.0, 16.0, 24.0, 20.0, 6.0, 9.0, 5.0, 7.0, 11.0, 9.0, 4.0, 5.0, 5.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-12.84615707397461, -12.451104164123535, -12.056050300598145, -11.66099739074707, -11.265944480895996, -10.870891571044922, -10.475837707519531, -10.080784797668457, -9.685731887817383, -9.290678977966309, -8.895625114440918, -8.500572204589844, -8.10551929473877, -7.710465908050537, -7.315412521362305, -6.9203596115112305, -6.525306224822998, -6.130252838134766, -5.735199928283691, -5.340146541595459, -4.945093631744385, -4.550040245056152, -4.154987335205078, -3.7599339485168457, -3.3648808002471924, -2.969827651977539, -2.5747745037078857, -2.1797213554382324, -1.7846680879592896, -1.3896149396896362, -0.9945616722106934, -0.59950852394104, -0.20445537567138672, 0.190597802400589, 0.5856509804725647, 0.9807041883468628, 1.3757573366165161, 1.7708104848861694, 2.1658637523651123, 2.5609169006347656, 2.955970048904419, 3.3510231971740723, 3.7460763454437256, 4.141129493713379, 4.536182880401611, 4.9312357902526855, 5.326289176940918, 5.721342086791992, 6.116395473480225, 6.511448860168457, 6.906501770019531, 7.301555156707764, 7.696608066558838, 8.09166145324707, 8.486714363098145, 8.881767272949219, 9.27682113647461, 9.671874046325684, 10.066927909851074, 10.461980819702148, 10.857033729553223, 11.252086639404297, 11.647140502929688, 12.042193412780762, 12.437246322631836]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 4.0, 4.0, 6.0, 6.0, 13.0, 16.0, 12.0, 13.0, 16.0, 16.0, 31.0, 23.0, 23.0, 30.0, 28.0, 33.0, 26.0, 35.0, 30.0, 43.0, 29.0, 43.0, 29.0, 42.0, 53.0, 37.0, 32.0, 37.0, 27.0, 42.0, 31.0, 31.0, 23.0, 27.0, 20.0, 17.0, 13.0, 7.0, 11.0, 10.0, 5.0, 8.0, 9.0, 4.0, 3.0, 3.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0], "bins": [-17.186349868774414, -16.683250427246094, -16.18014907836914, -15.677048683166504, -15.173948287963867, -14.670848846435547, -14.16774845123291, -13.664648056030273, -13.161547660827637, -12.658447265625, -12.155346870422363, -11.652246475219727, -11.149147033691406, -10.646045684814453, -10.142946243286133, -9.639845848083496, -9.13674545288086, -8.633645057678223, -8.130544662475586, -7.627444744110107, -7.124344348907471, -6.621243953704834, -6.1181440353393555, -5.615043640136719, -5.111943244934082, -4.608842849731445, -4.105742454528809, -3.60264253616333, -3.0995421409606934, -2.5964417457580566, -2.093341588973999, -1.5902414321899414, -1.087141990661621, -0.5840417146682739, -0.08094143867492676, 0.4221588373184204, 0.9252591133117676, 1.4283595085144043, 1.931459665298462, 2.4345598220825195, 2.9376602172851562, 3.440760612487793, 3.9438607692718506, 4.446960926055908, 4.950061321258545, 5.453161716461182, 5.95626163482666, 6.459362030029297, 6.962462425231934, 7.46556282043457, 7.968663215637207, 8.471763610839844, 8.974863052368164, 9.477964401245117, 9.981063842773438, 10.484164237976074, 10.987264633178711, 11.490365028381348, 11.993465423583984, 12.496565818786621, 12.999666213989258, 13.502765655517578, 14.005866050720215, 14.508966445922852, 15.012066841125488]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 5.0, 6.0, 5.0, 12.0, 5.0, 15.0, 26.0, 37.0, 63.0, 89.0, 143.0, 208.0, 304.0, 441.0, 692.0, 1064.0, 1641.0, 2650.0, 4343.0, 7337.0, 11749.0, 19842.0, 31971.0, 51652.0, 79987.0, 116094.0, 147821.0, 157367.0, 136255.0, 100885.0, 66782.0, 42158.0, 25957.0, 15764.0, 9534.0, 5848.0, 3609.0, 2161.0, 1438.0, 920.0, 595.0, 357.0, 217.0, 177.0, 108.0, 84.0, 50.0, 36.0, 11.0, 21.0, 16.0, 3.0, 9.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-3.521484375, -3.40521240234375, -3.2889404296875, -3.17266845703125, -3.056396484375, -2.94012451171875, -2.8238525390625, -2.70758056640625, -2.59130859375, -2.47503662109375, -2.3587646484375, -2.24249267578125, -2.126220703125, -2.00994873046875, -1.8936767578125, -1.77740478515625, -1.6611328125, -1.54486083984375, -1.4285888671875, -1.31231689453125, -1.196044921875, -1.07977294921875, -0.9635009765625, -0.84722900390625, -0.73095703125, -0.61468505859375, -0.4984130859375, -0.38214111328125, -0.265869140625, -0.14959716796875, -0.0333251953125, 0.08294677734375, 0.19921875, 0.31549072265625, 0.4317626953125, 0.54803466796875, 0.664306640625, 0.78057861328125, 0.8968505859375, 1.01312255859375, 1.12939453125, 1.24566650390625, 1.3619384765625, 1.47821044921875, 1.594482421875, 1.71075439453125, 1.8270263671875, 1.94329833984375, 2.0595703125, 2.17584228515625, 2.2921142578125, 2.40838623046875, 2.524658203125, 2.64093017578125, 2.7572021484375, 2.87347412109375, 2.98974609375, 3.10601806640625, 3.2222900390625, 3.33856201171875, 3.454833984375, 3.57110595703125, 3.6873779296875, 3.80364990234375, 3.919921875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 1.0, 5.0, 3.0, 6.0, 10.0, 10.0, 12.0, 15.0, 15.0, 13.0, 17.0, 33.0, 20.0, 33.0, 23.0, 32.0, 19.0, 28.0, 43.0, 37.0, 40.0, 43.0, 40.0, 30.0, 48.0, 30.0, 46.0, 38.0, 39.0, 41.0, 32.0, 23.0, 26.0, 24.0, 23.0, 21.0, 13.0, 13.0, 8.0, 11.0, 11.0, 4.0, 3.0, 4.0, 6.0, 6.0, 1.0, 4.0, 3.0, 3.0, 0.0, 2.0], "bins": [-18.125, -17.6064453125, -17.087890625, -16.5693359375, -16.05078125, -15.5322265625, -15.013671875, -14.4951171875, -13.9765625, -13.4580078125, -12.939453125, -12.4208984375, -11.90234375, -11.3837890625, -10.865234375, -10.3466796875, -9.828125, -9.3095703125, -8.791015625, -8.2724609375, -7.75390625, -7.2353515625, -6.716796875, -6.1982421875, -5.6796875, -5.1611328125, -4.642578125, -4.1240234375, -3.60546875, -3.0869140625, -2.568359375, -2.0498046875, -1.53125, -1.0126953125, -0.494140625, 0.0244140625, 0.54296875, 1.0615234375, 1.580078125, 2.0986328125, 2.6171875, 3.1357421875, 3.654296875, 4.1728515625, 4.69140625, 5.2099609375, 5.728515625, 6.2470703125, 6.765625, 7.2841796875, 7.802734375, 8.3212890625, 8.83984375, 9.3583984375, 9.876953125, 10.3955078125, 10.9140625, 11.4326171875, 11.951171875, 12.4697265625, 12.98828125, 13.5068359375, 14.025390625, 14.5439453125, 15.0625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 3.0, 4.0, 8.0, 10.0, 19.0, 18.0, 24.0, 40.0, 47.0, 80.0, 127.0, 191.0, 325.0, 495.0, 700.0, 1195.0, 2094.0, 3530.0, 6003.0, 10478.0, 18120.0, 30524.0, 50064.0, 80062.0, 115990.0, 148920.0, 160095.0, 140215.0, 104448.0, 69567.0, 43177.0, 25230.0, 15115.0, 8728.0, 5226.0, 2900.0, 1819.0, 1096.0, 656.0, 421.0, 269.0, 164.0, 129.0, 71.0, 56.0, 33.0, 23.0, 12.0, 11.0, 7.0, 7.0, 8.0, 2.0, 2.0, 5.0, 2.0], "bins": [-3.150390625, -3.05865478515625, -2.9669189453125, -2.87518310546875, -2.783447265625, -2.69171142578125, -2.5999755859375, -2.50823974609375, -2.41650390625, -2.32476806640625, -2.2330322265625, -2.14129638671875, -2.049560546875, -1.95782470703125, -1.8660888671875, -1.77435302734375, -1.6826171875, -1.59088134765625, -1.4991455078125, -1.40740966796875, -1.315673828125, -1.22393798828125, -1.1322021484375, -1.04046630859375, -0.94873046875, -0.85699462890625, -0.7652587890625, -0.67352294921875, -0.581787109375, -0.49005126953125, -0.3983154296875, -0.30657958984375, -0.21484375, -0.12310791015625, -0.0313720703125, 0.06036376953125, 0.152099609375, 0.24383544921875, 0.3355712890625, 0.42730712890625, 0.51904296875, 0.61077880859375, 0.7025146484375, 0.79425048828125, 0.885986328125, 0.97772216796875, 1.0694580078125, 1.16119384765625, 1.2529296875, 1.34466552734375, 1.4364013671875, 1.52813720703125, 1.619873046875, 1.71160888671875, 1.8033447265625, 1.89508056640625, 1.98681640625, 2.07855224609375, 2.1702880859375, 2.26202392578125, 2.353759765625, 2.44549560546875, 2.5372314453125, 2.62896728515625, 2.720703125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 7.0, 12.0, 7.0, 6.0, 13.0, 8.0, 10.0, 14.0, 15.0, 19.0, 14.0, 14.0, 16.0, 27.0, 24.0, 28.0, 27.0, 35.0, 32.0, 42.0, 38.0, 41.0, 37.0, 37.0, 34.0, 33.0, 45.0, 35.0, 20.0, 31.0, 29.0, 38.0, 20.0, 27.0, 21.0, 25.0, 14.0, 16.0, 13.0, 14.0, 15.0, 7.0, 12.0, 7.0, 9.0, 5.0, 5.0, 3.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-10.796875, -10.459228515625, -10.12158203125, -9.783935546875, -9.4462890625, -9.108642578125, -8.77099609375, -8.433349609375, -8.095703125, -7.758056640625, -7.42041015625, -7.082763671875, -6.7451171875, -6.407470703125, -6.06982421875, -5.732177734375, -5.39453125, -5.056884765625, -4.71923828125, -4.381591796875, -4.0439453125, -3.706298828125, -3.36865234375, -3.031005859375, -2.693359375, -2.355712890625, -2.01806640625, -1.680419921875, -1.3427734375, -1.005126953125, -0.66748046875, -0.329833984375, 0.0078125, 0.345458984375, 0.68310546875, 1.020751953125, 1.3583984375, 1.696044921875, 2.03369140625, 2.371337890625, 2.708984375, 3.046630859375, 3.38427734375, 3.721923828125, 4.0595703125, 4.397216796875, 4.73486328125, 5.072509765625, 5.41015625, 5.747802734375, 6.08544921875, 6.423095703125, 6.7607421875, 7.098388671875, 7.43603515625, 7.773681640625, 8.111328125, 8.448974609375, 8.78662109375, 9.124267578125, 9.4619140625, 9.799560546875, 10.13720703125, 10.474853515625, 10.8125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 6.0, 1.0, 5.0, 6.0, 4.0, 17.0, 16.0, 28.0, 38.0, 51.0, 79.0, 117.0, 163.0, 197.0, 287.0, 430.0, 624.0, 917.0, 1387.0, 2215.0, 3540.0, 6392.0, 11509.0, 22195.0, 45177.0, 97124.0, 190961.0, 267997.0, 197197.0, 100302.0, 47363.0, 23130.0, 11793.0, 6341.0, 3856.0, 2379.0, 1566.0, 987.0, 664.0, 467.0, 323.0, 217.0, 148.0, 98.0, 72.0, 56.0, 36.0, 25.0, 21.0, 15.0, 11.0, 5.0, 2.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.7548828125, -0.7293167114257812, -0.7037506103515625, -0.6781845092773438, -0.652618408203125, -0.6270523071289062, -0.6014862060546875, -0.5759201049804688, -0.55035400390625, -0.5247879028320312, -0.4992218017578125, -0.47365570068359375, -0.448089599609375, -0.42252349853515625, -0.3969573974609375, -0.37139129638671875, -0.3458251953125, -0.32025909423828125, -0.2946929931640625, -0.26912689208984375, -0.243560791015625, -0.21799468994140625, -0.1924285888671875, -0.16686248779296875, -0.14129638671875, -0.11573028564453125, -0.0901641845703125, -0.06459808349609375, -0.039031982421875, -0.01346588134765625, 0.0121002197265625, 0.03766632080078125, 0.063232421875, 0.08879852294921875, 0.1143646240234375, 0.13993072509765625, 0.165496826171875, 0.19106292724609375, 0.2166290283203125, 0.24219512939453125, 0.26776123046875, 0.29332733154296875, 0.3188934326171875, 0.34445953369140625, 0.370025634765625, 0.39559173583984375, 0.4211578369140625, 0.44672393798828125, 0.4722900390625, 0.49785614013671875, 0.5234222412109375, 0.5489883422851562, 0.574554443359375, 0.6001205444335938, 0.6256866455078125, 0.6512527465820312, 0.67681884765625, 0.7023849487304688, 0.7279510498046875, 0.7535171508789062, 0.779083251953125, 0.8046493530273438, 0.8302154541015625, 0.8557815551757812, 0.88134765625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 5.0, 1.0, 2.0, 2.0, 9.0, 10.0, 8.0, 14.0, 14.0, 32.0, 35.0, 46.0, 54.0, 79.0, 84.0, 119.0, 123.0, 96.0, 72.0, 49.0, 52.0, 35.0, 24.0, 13.0, 5.0, 7.0, 6.0, 4.0, 1.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00021159648895263672, -0.0002056807279586792, -0.00019976496696472168, -0.00019384920597076416, -0.00018793344497680664, -0.00018201768398284912, -0.0001761019229888916, -0.00017018616199493408, -0.00016427040100097656, -0.00015835464000701904, -0.00015243887901306152, -0.000146523118019104, -0.00014060735702514648, -0.00013469159603118896, -0.00012877583503723145, -0.00012286007404327393, -0.0001169443130493164, -0.00011102855205535889, -0.00010511279106140137, -9.919703006744385e-05, -9.328126907348633e-05, -8.736550807952881e-05, -8.144974708557129e-05, -7.553398609161377e-05, -6.961822509765625e-05, -6.370246410369873e-05, -5.778670310974121e-05, -5.187094211578369e-05, -4.595518112182617e-05, -4.003942012786865e-05, -3.412365913391113e-05, -2.8207898139953613e-05, -2.2292137145996094e-05, -1.6376376152038574e-05, -1.0460615158081055e-05, -4.544854164123535e-06, 1.3709068298339844e-06, 7.286667823791504e-06, 1.3202428817749023e-05, 1.9118189811706543e-05, 2.5033950805664062e-05, 3.094971179962158e-05, 3.68654727935791e-05, 4.278123378753662e-05, 4.869699478149414e-05, 5.461275577545166e-05, 6.052851676940918e-05, 6.64442777633667e-05, 7.236003875732422e-05, 7.827579975128174e-05, 8.419156074523926e-05, 9.010732173919678e-05, 9.60230827331543e-05, 0.00010193884372711182, 0.00010785460472106934, 0.00011377036571502686, 0.00011968612670898438, 0.0001256018877029419, 0.00013151764869689941, 0.00013743340969085693, 0.00014334917068481445, 0.00014926493167877197, 0.0001551806926727295, 0.000161096453666687, 0.00016701221466064453]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 6.0, 5.0, 3.0, 11.0, 11.0, 17.0, 30.0, 51.0, 74.0, 121.0, 164.0, 235.0, 360.0, 531.0, 822.0, 1140.0, 1739.0, 2546.0, 3900.0, 6114.0, 9526.0, 15302.0, 25335.0, 41503.0, 69929.0, 113845.0, 165484.0, 186036.0, 150146.0, 98397.0, 60386.0, 35757.0, 21758.0, 13242.0, 8470.0, 5303.0, 3409.0, 2244.0, 1519.0, 944.0, 692.0, 459.0, 317.0, 193.0, 149.0, 122.0, 67.0, 63.0, 25.0, 18.0, 14.0, 10.0, 10.0, 10.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.1484375, -1.110595703125, -1.07275390625, -1.034912109375, -0.9970703125, -0.959228515625, -0.92138671875, -0.883544921875, -0.845703125, -0.807861328125, -0.77001953125, -0.732177734375, -0.6943359375, -0.656494140625, -0.61865234375, -0.580810546875, -0.54296875, -0.505126953125, -0.46728515625, -0.429443359375, -0.3916015625, -0.353759765625, -0.31591796875, -0.278076171875, -0.240234375, -0.202392578125, -0.16455078125, -0.126708984375, -0.0888671875, -0.051025390625, -0.01318359375, 0.024658203125, 0.0625, 0.100341796875, 0.13818359375, 0.176025390625, 0.2138671875, 0.251708984375, 0.28955078125, 0.327392578125, 0.365234375, 0.403076171875, 0.44091796875, 0.478759765625, 0.5166015625, 0.554443359375, 0.59228515625, 0.630126953125, 0.66796875, 0.705810546875, 0.74365234375, 0.781494140625, 0.8193359375, 0.857177734375, 0.89501953125, 0.932861328125, 0.970703125, 1.008544921875, 1.04638671875, 1.084228515625, 1.1220703125, 1.159912109375, 1.19775390625, 1.235595703125, 1.2734375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 2.0, 5.0, 7.0, 9.0, 10.0, 9.0, 19.0, 19.0, 19.0, 15.0, 37.0, 34.0, 43.0, 61.0, 77.0, 80.0, 87.0, 79.0, 72.0, 74.0, 54.0, 39.0, 27.0, 31.0, 26.0, 16.0, 9.0, 11.0, 6.0, 9.0, 3.0, 4.0, 4.0, 6.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.67138671875, -0.6514053344726562, -0.6314239501953125, -0.6114425659179688, -0.591461181640625, -0.5714797973632812, -0.5514984130859375, -0.5315170288085938, -0.51153564453125, -0.49155426025390625, -0.4715728759765625, -0.45159149169921875, -0.431610107421875, -0.41162872314453125, -0.3916473388671875, -0.37166595458984375, -0.3516845703125, -0.33170318603515625, -0.3117218017578125, -0.29174041748046875, -0.271759033203125, -0.25177764892578125, -0.2317962646484375, -0.21181488037109375, -0.19183349609375, -0.17185211181640625, -0.1518707275390625, -0.13188934326171875, -0.111907958984375, -0.09192657470703125, -0.0719451904296875, -0.05196380615234375, -0.031982421875, -0.01200103759765625, 0.0079803466796875, 0.02796173095703125, 0.047943115234375, 0.06792449951171875, 0.0879058837890625, 0.10788726806640625, 0.12786865234375, 0.14785003662109375, 0.1678314208984375, 0.18781280517578125, 0.207794189453125, 0.22777557373046875, 0.2477569580078125, 0.26773834228515625, 0.2877197265625, 0.30770111083984375, 0.3276824951171875, 0.34766387939453125, 0.367645263671875, 0.38762664794921875, 0.4076080322265625, 0.42758941650390625, 0.44757080078125, 0.46755218505859375, 0.4875335693359375, 0.5075149536132812, 0.527496337890625, 0.5474777221679688, 0.5674591064453125, 0.5874404907226562, 0.607421875]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 4.0, 7.0, 1.0, 6.0, 7.0, 11.0, 8.0, 7.0, 17.0, 10.0, 15.0, 13.0, 21.0, 23.0, 23.0, 38.0, 33.0, 25.0, 33.0, 38.0, 36.0, 31.0, 44.0, 53.0, 49.0, 33.0, 40.0, 37.0, 27.0, 31.0, 24.0, 34.0, 21.0, 28.0, 25.0, 23.0, 17.0, 18.0, 13.0, 16.0, 8.0, 9.0, 8.0, 7.0, 9.0, 2.0, 4.0, 8.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 3.0, 2.0], "bins": [-12.044129371643066, -11.671682357788086, -11.299235343933105, -10.926788330078125, -10.554340362548828, -10.181893348693848, -9.809446334838867, -9.436999320983887, -9.064552307128906, -8.692105293273926, -8.319658279418945, -7.947210788726807, -7.574763774871826, -7.202316761016846, -6.829869270324707, -6.457422256469727, -6.084975242614746, -5.712528228759766, -5.340081214904785, -4.9676337242126465, -4.595186710357666, -4.2227396965026855, -3.850292444229126, -3.4778451919555664, -3.105398178100586, -2.7329511642456055, -2.360503911972046, -1.9880567789077759, -1.6156096458435059, -1.2431625127792358, -0.8707153797149658, -0.49826812744140625, -0.12582015991210938, 0.24662697315216064, 0.6190741062164307, 0.9915212392807007, 1.3639683723449707, 1.7364155054092407, 2.1088626384735107, 2.4813098907470703, 2.853756904602051, 3.2262039184570312, 3.598651170730591, 3.9710984230041504, 4.343545436859131, 4.715992450714111, 5.08843994140625, 5.4608869552612305, 5.833333969116211, 6.205780982971191, 6.578227996826172, 6.9506754875183105, 7.323122501373291, 7.6955695152282715, 8.06801700592041, 8.44046401977539, 8.812911033630371, 9.185358047485352, 9.557805061340332, 9.930252075195312, 10.30270004272461, 10.67514705657959, 11.04759407043457, 11.42004108428955, 11.792488098144531]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 1.0, 1.0, 5.0, 5.0, 5.0, 8.0, 13.0, 13.0, 13.0, 12.0, 18.0, 21.0, 29.0, 17.0, 27.0, 30.0, 30.0, 23.0, 38.0, 28.0, 37.0, 41.0, 32.0, 37.0, 30.0, 47.0, 45.0, 45.0, 40.0, 23.0, 31.0, 37.0, 36.0, 27.0, 26.0, 21.0, 18.0, 17.0, 17.0, 7.0, 8.0, 9.0, 8.0, 9.0, 6.0, 6.0, 3.0, 2.0, 3.0, 3.0, 0.0, 3.0, 2.0], "bins": [-17.543622970581055, -17.04429054260254, -16.54495620727539, -16.045623779296875, -15.546290397644043, -15.046957015991211, -14.547623634338379, -14.048290252685547, -13.548956871032715, -13.049623489379883, -12.55029010772705, -12.050956726074219, -11.551624298095703, -11.052290916442871, -10.552957534790039, -10.053624153137207, -9.554290771484375, -9.054957389831543, -8.555624008178711, -8.056291580200195, -7.556957721710205, -7.057624816894531, -6.558291435241699, -6.058958053588867, -5.559625625610352, -5.0602922439575195, -4.560959339141846, -4.061625957489014, -3.5622925758361816, -3.0629594326019287, -2.563626289367676, -2.0642929077148438, -1.5649595260620117, -1.0656262636184692, -0.5662930607795715, -0.06695985794067383, 0.43237340450286865, 0.9317066669464111, 1.431039810180664, 1.930373191833496, 2.429706335067749, 2.929039478302002, 3.428372859954834, 3.927706003189087, 4.42703914642334, 4.926372528076172, 5.425705909729004, 5.925039291381836, 6.42437219619751, 6.923705577850342, 7.423038482666016, 7.922371864318848, 8.42170524597168, 8.921038627624512, 9.420372009277344, 9.91970443725586, 10.419037818908691, 10.918371200561523, 11.417704582214355, 11.917037963867188, 12.416370391845703, 12.915703773498535, 13.415037155151367, 13.9143705368042, 14.413703918457031]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 6.0, 6.0, 4.0, 10.0, 25.0, 32.0, 40.0, 61.0, 132.0, 194.0, 291.0, 449.0, 721.0, 1078.0, 1830.0, 2759.0, 4234.0, 6572.0, 9517.0, 14558.0, 20712.0, 29396.0, 40324.0, 52433.0, 66152.0, 79647.0, 89528.0, 96201.0, 96259.0, 91389.0, 81311.0, 68577.0, 54538.0, 41806.0, 30714.0, 22050.0, 15056.0, 10260.0, 7025.0, 4433.0, 2978.0, 1948.0, 1228.0, 755.0, 521.0, 282.0, 172.0, 123.0, 80.0, 54.0, 37.0, 20.0, 12.0, 14.0, 5.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-9.3125, -9.0128173828125, -8.713134765625, -8.4134521484375, -8.11376953125, -7.8140869140625, -7.514404296875, -7.2147216796875, -6.9150390625, -6.6153564453125, -6.315673828125, -6.0159912109375, -5.71630859375, -5.4166259765625, -5.116943359375, -4.8172607421875, -4.517578125, -4.2178955078125, -3.918212890625, -3.6185302734375, -3.31884765625, -3.0191650390625, -2.719482421875, -2.4197998046875, -2.1201171875, -1.8204345703125, -1.520751953125, -1.2210693359375, -0.92138671875, -0.6217041015625, -0.322021484375, -0.0223388671875, 0.27734375, 0.5770263671875, 0.876708984375, 1.1763916015625, 1.47607421875, 1.7757568359375, 2.075439453125, 2.3751220703125, 2.6748046875, 2.9744873046875, 3.274169921875, 3.5738525390625, 3.87353515625, 4.1732177734375, 4.472900390625, 4.7725830078125, 5.072265625, 5.3719482421875, 5.671630859375, 5.9713134765625, 6.27099609375, 6.5706787109375, 6.870361328125, 7.1700439453125, 7.4697265625, 7.7694091796875, 8.069091796875, 8.3687744140625, 8.66845703125, 8.9681396484375, 9.267822265625, 9.5675048828125, 9.8671875]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 2.0, 5.0, 7.0, 5.0, 6.0, 12.0, 3.0, 17.0, 13.0, 25.0, 26.0, 21.0, 19.0, 24.0, 20.0, 43.0, 30.0, 29.0, 44.0, 37.0, 33.0, 32.0, 34.0, 42.0, 35.0, 52.0, 37.0, 35.0, 33.0, 37.0, 32.0, 27.0, 25.0, 26.0, 23.0, 24.0, 19.0, 14.0, 13.0, 8.0, 4.0, 8.0, 6.0, 5.0, 7.0, 3.0, 0.0, 4.0, 3.0, 2.0, 2.0], "bins": [-18.015625, -17.51513671875, -17.0146484375, -16.51416015625, -16.013671875, -15.51318359375, -15.0126953125, -14.51220703125, -14.01171875, -13.51123046875, -13.0107421875, -12.51025390625, -12.009765625, -11.50927734375, -11.0087890625, -10.50830078125, -10.0078125, -9.50732421875, -9.0068359375, -8.50634765625, -8.005859375, -7.50537109375, -7.0048828125, -6.50439453125, -6.00390625, -5.50341796875, -5.0029296875, -4.50244140625, -4.001953125, -3.50146484375, -3.0009765625, -2.50048828125, -2.0, -1.49951171875, -0.9990234375, -0.49853515625, 0.001953125, 0.50244140625, 1.0029296875, 1.50341796875, 2.00390625, 2.50439453125, 3.0048828125, 3.50537109375, 4.005859375, 4.50634765625, 5.0068359375, 5.50732421875, 6.0078125, 6.50830078125, 7.0087890625, 7.50927734375, 8.009765625, 8.51025390625, 9.0107421875, 9.51123046875, 10.01171875, 10.51220703125, 11.0126953125, 11.51318359375, 12.013671875, 12.51416015625, 13.0146484375, 13.51513671875, 14.015625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 11.0, 13.0, 8.0, 21.0, 25.0, 37.0, 66.0, 120.0, 194.0, 351.0, 512.0, 1019.0, 1790.0, 3095.0, 5398.0, 9358.0, 16215.0, 26759.0, 43182.0, 65142.0, 90551.0, 115622.0, 132294.0, 133596.0, 120025.0, 95559.0, 69213.0, 46736.0, 29337.0, 17782.0, 10423.0, 6006.0, 3486.0, 1981.0, 1145.0, 603.0, 361.0, 210.0, 109.0, 88.0, 38.0, 25.0, 19.0, 22.0, 8.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.65625, -13.230712890625, -12.80517578125, -12.379638671875, -11.9541015625, -11.528564453125, -11.10302734375, -10.677490234375, -10.251953125, -9.826416015625, -9.40087890625, -8.975341796875, -8.5498046875, -8.124267578125, -7.69873046875, -7.273193359375, -6.84765625, -6.422119140625, -5.99658203125, -5.571044921875, -5.1455078125, -4.719970703125, -4.29443359375, -3.868896484375, -3.443359375, -3.017822265625, -2.59228515625, -2.166748046875, -1.7412109375, -1.315673828125, -0.89013671875, -0.464599609375, -0.0390625, 0.386474609375, 0.81201171875, 1.237548828125, 1.6630859375, 2.088623046875, 2.51416015625, 2.939697265625, 3.365234375, 3.790771484375, 4.21630859375, 4.641845703125, 5.0673828125, 5.492919921875, 5.91845703125, 6.343994140625, 6.76953125, 7.195068359375, 7.62060546875, 8.046142578125, 8.4716796875, 8.897216796875, 9.32275390625, 9.748291015625, 10.173828125, 10.599365234375, 11.02490234375, 11.450439453125, 11.8759765625, 12.301513671875, 12.72705078125, 13.152587890625, 13.578125]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 5.0, 4.0, 8.0, 4.0, 6.0, 7.0, 14.0, 11.0, 15.0, 19.0, 18.0, 21.0, 30.0, 24.0, 24.0, 26.0, 25.0, 39.0, 31.0, 40.0, 38.0, 45.0, 36.0, 42.0, 36.0, 50.0, 34.0, 37.0, 41.0, 28.0, 29.0, 27.0, 21.0, 23.0, 29.0, 22.0, 17.0, 12.0, 16.0, 9.0, 4.0, 5.0, 5.0, 9.0, 7.0, 4.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.4296875, -10.094482421875, -9.75927734375, -9.424072265625, -9.0888671875, -8.753662109375, -8.41845703125, -8.083251953125, -7.748046875, -7.412841796875, -7.07763671875, -6.742431640625, -6.4072265625, -6.072021484375, -5.73681640625, -5.401611328125, -5.06640625, -4.731201171875, -4.39599609375, -4.060791015625, -3.7255859375, -3.390380859375, -3.05517578125, -2.719970703125, -2.384765625, -2.049560546875, -1.71435546875, -1.379150390625, -1.0439453125, -0.708740234375, -0.37353515625, -0.038330078125, 0.296875, 0.632080078125, 0.96728515625, 1.302490234375, 1.6376953125, 1.972900390625, 2.30810546875, 2.643310546875, 2.978515625, 3.313720703125, 3.64892578125, 3.984130859375, 4.3193359375, 4.654541015625, 4.98974609375, 5.324951171875, 5.66015625, 5.995361328125, 6.33056640625, 6.665771484375, 7.0009765625, 7.336181640625, 7.67138671875, 8.006591796875, 8.341796875, 8.677001953125, 9.01220703125, 9.347412109375, 9.6826171875, 10.017822265625, 10.35302734375, 10.688232421875, 11.0234375]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 6.0, 6.0, 12.0, 8.0, 14.0, 23.0, 41.0, 67.0, 104.0, 186.0, 283.0, 486.0, 816.0, 1515.0, 2716.0, 4793.0, 8896.0, 16689.0, 31789.0, 62490.0, 115847.0, 184371.0, 216566.0, 175034.0, 106282.0, 56715.0, 29416.0, 15234.0, 8134.0, 4396.0, 2362.0, 1354.0, 783.0, 448.0, 269.0, 169.0, 98.0, 56.0, 32.0, 19.0, 19.0, 9.0, 6.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.453125, -6.1993408203125, -5.945556640625, -5.6917724609375, -5.43798828125, -5.1842041015625, -4.930419921875, -4.6766357421875, -4.4228515625, -4.1690673828125, -3.915283203125, -3.6614990234375, -3.40771484375, -3.1539306640625, -2.900146484375, -2.6463623046875, -2.392578125, -2.1387939453125, -1.885009765625, -1.6312255859375, -1.37744140625, -1.1236572265625, -0.869873046875, -0.6160888671875, -0.3623046875, -0.1085205078125, 0.145263671875, 0.3990478515625, 0.65283203125, 0.9066162109375, 1.160400390625, 1.4141845703125, 1.66796875, 1.9217529296875, 2.175537109375, 2.4293212890625, 2.68310546875, 2.9368896484375, 3.190673828125, 3.4444580078125, 3.6982421875, 3.9520263671875, 4.205810546875, 4.4595947265625, 4.71337890625, 4.9671630859375, 5.220947265625, 5.4747314453125, 5.728515625, 5.9822998046875, 6.236083984375, 6.4898681640625, 6.74365234375, 6.9974365234375, 7.251220703125, 7.5050048828125, 7.7587890625, 8.0125732421875, 8.266357421875, 8.5201416015625, 8.77392578125, 9.0277099609375, 9.281494140625, 9.5352783203125, 9.7890625]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 8.0, 6.0, 11.0, 5.0, 9.0, 11.0, 29.0, 23.0, 21.0, 33.0, 33.0, 59.0, 65.0, 55.0, 64.0, 87.0, 71.0, 65.0, 65.0, 47.0, 47.0, 32.0, 34.0, 24.0, 25.0, 19.0, 11.0, 10.0, 11.0, 5.0, 6.0, 7.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00078582763671875, -0.0007632747292518616, -0.0007407218217849731, -0.0007181689143180847, -0.0006956160068511963, -0.0006730630993843079, -0.0006505101919174194, -0.000627957284450531, -0.0006054043769836426, -0.0005828514695167542, -0.0005602985620498657, -0.0005377456545829773, -0.0005151927471160889, -0.0004926398396492004, -0.000470086932182312, -0.0004475340247154236, -0.00042498111724853516, -0.00040242820978164673, -0.0003798753023147583, -0.0003573223948478699, -0.00033476948738098145, -0.000312216579914093, -0.0002896636724472046, -0.00026711076498031616, -0.00024455785751342773, -0.0002220049500465393, -0.00019945204257965088, -0.00017689913511276245, -0.00015434622764587402, -0.0001317933201789856, -0.00010924041271209717, -8.668750524520874e-05, -6.413459777832031e-05, -4.1581690311431885e-05, -1.9028782844543457e-05, 3.5241246223449707e-06, 2.60770320892334e-05, 4.8629939556121826e-05, 7.118284702301025e-05, 9.373575448989868e-05, 0.00011628866195678711, 0.00013884156942367554, 0.00016139447689056396, 0.0001839473843574524, 0.00020650029182434082, 0.00022905319929122925, 0.0002516061067581177, 0.0002741590142250061, 0.00029671192169189453, 0.00031926482915878296, 0.0003418177366256714, 0.0003643706440925598, 0.00038692355155944824, 0.00040947645902633667, 0.0004320293664932251, 0.0004545822739601135, 0.00047713518142700195, 0.0004996880888938904, 0.0005222409963607788, 0.0005447939038276672, 0.0005673468112945557, 0.0005898997187614441, 0.0006124526262283325, 0.000635005533695221, 0.0006575584411621094]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 6.0, 9.0, 14.0, 21.0, 30.0, 40.0, 65.0, 79.0, 125.0, 171.0, 246.0, 371.0, 606.0, 922.0, 1404.0, 2260.0, 3479.0, 5610.0, 8975.0, 14031.0, 22929.0, 36064.0, 55781.0, 84522.0, 116412.0, 142454.0, 146557.0, 127362.0, 96514.0, 66107.0, 42654.0, 26958.0, 16973.0, 10624.0, 6539.0, 4117.0, 2593.0, 1733.0, 1120.0, 697.0, 494.0, 291.0, 202.0, 125.0, 90.0, 60.0, 43.0, 27.0, 23.0, 15.0, 8.0, 7.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-5.6171875, -5.43707275390625, -5.2569580078125, -5.07684326171875, -4.896728515625, -4.71661376953125, -4.5364990234375, -4.35638427734375, -4.17626953125, -3.99615478515625, -3.8160400390625, -3.63592529296875, -3.455810546875, -3.27569580078125, -3.0955810546875, -2.91546630859375, -2.7353515625, -2.55523681640625, -2.3751220703125, -2.19500732421875, -2.014892578125, -1.83477783203125, -1.6546630859375, -1.47454833984375, -1.29443359375, -1.11431884765625, -0.9342041015625, -0.75408935546875, -0.573974609375, -0.39385986328125, -0.2137451171875, -0.03363037109375, 0.146484375, 0.32659912109375, 0.5067138671875, 0.68682861328125, 0.866943359375, 1.04705810546875, 1.2271728515625, 1.40728759765625, 1.58740234375, 1.76751708984375, 1.9476318359375, 2.12774658203125, 2.307861328125, 2.48797607421875, 2.6680908203125, 2.84820556640625, 3.0283203125, 3.20843505859375, 3.3885498046875, 3.56866455078125, 3.748779296875, 3.92889404296875, 4.1090087890625, 4.28912353515625, 4.46923828125, 4.64935302734375, 4.8294677734375, 5.00958251953125, 5.189697265625, 5.36981201171875, 5.5499267578125, 5.73004150390625, 5.91015625]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 8.0, 3.0, 4.0, 12.0, 10.0, 14.0, 10.0, 18.0, 22.0, 35.0, 40.0, 47.0, 55.0, 68.0, 69.0, 81.0, 76.0, 71.0, 72.0, 49.0, 41.0, 43.0, 30.0, 22.0, 25.0, 15.0, 15.0, 11.0, 11.0, 1.0, 5.0, 3.0, 2.0, 4.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.048828125, -2.956817626953125, -2.86480712890625, -2.772796630859375, -2.6807861328125, -2.588775634765625, -2.49676513671875, -2.404754638671875, -2.312744140625, -2.220733642578125, -2.12872314453125, -2.036712646484375, -1.9447021484375, -1.852691650390625, -1.76068115234375, -1.668670654296875, -1.57666015625, -1.484649658203125, -1.39263916015625, -1.300628662109375, -1.2086181640625, -1.116607666015625, -1.02459716796875, -0.932586669921875, -0.840576171875, -0.748565673828125, -0.65655517578125, -0.564544677734375, -0.4725341796875, -0.380523681640625, -0.28851318359375, -0.196502685546875, -0.1044921875, -0.012481689453125, 0.07952880859375, 0.171539306640625, 0.2635498046875, 0.355560302734375, 0.44757080078125, 0.539581298828125, 0.631591796875, 0.723602294921875, 0.81561279296875, 0.907623291015625, 0.9996337890625, 1.091644287109375, 1.18365478515625, 1.275665283203125, 1.36767578125, 1.459686279296875, 1.55169677734375, 1.643707275390625, 1.7357177734375, 1.827728271484375, 1.91973876953125, 2.011749267578125, 2.103759765625, 2.195770263671875, 2.28778076171875, 2.379791259765625, 2.4718017578125, 2.563812255859375, 2.65582275390625, 2.747833251953125, 2.83984375]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 3.0, 7.0, 5.0, 7.0, 6.0, 11.0, 14.0, 12.0, 18.0, 9.0, 20.0, 18.0, 26.0, 34.0, 28.0, 26.0, 26.0, 43.0, 41.0, 42.0, 34.0, 45.0, 32.0, 31.0, 37.0, 46.0, 39.0, 30.0, 31.0, 33.0, 31.0, 26.0, 19.0, 19.0, 14.0, 22.0, 17.0, 20.0, 16.0, 10.0, 13.0, 11.0, 8.0, 3.0, 3.0, 5.0, 2.0, 5.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0], "bins": [-11.96922492980957, -11.600311279296875, -11.23139762878418, -10.862483978271484, -10.493569374084473, -10.124655723571777, -9.755742073059082, -9.386828422546387, -9.017913818359375, -8.64900016784668, -8.280086517333984, -7.911172389984131, -7.542258262634277, -7.173344612121582, -6.804430961608887, -6.435517311096191, -6.066603660583496, -5.697690010070801, -5.328775882720947, -4.959862232208252, -4.590948104858398, -4.222034454345703, -3.853120803833008, -3.4842069149017334, -3.115293025970459, -2.7463791370391846, -2.37746524810791, -2.008551597595215, -1.6396377086639404, -1.270723819732666, -0.9018101692199707, -0.5328962802886963, -0.16398239135742188, 0.20493143796920776, 0.5738452672958374, 0.9427590370178223, 1.3116729259490967, 1.680586814880371, 2.0495004653930664, 2.418414354324341, 2.7873282432556152, 3.1562421321868896, 3.525156021118164, 3.8940696716308594, 4.262983322143555, 4.631897449493408, 5.0008111000061035, 5.369725227355957, 5.738638877868652, 6.107552528381348, 6.476466655731201, 6.8453803062438965, 7.21429443359375, 7.583208084106445, 7.952121734619141, 8.321035385131836, 8.689949035644531, 9.058862686157227, 9.427776336669922, 9.796689987182617, 10.165604591369629, 10.534518241882324, 10.90343189239502, 11.272345542907715, 11.641260147094727]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 14.0, 9.0, 9.0, 11.0, 13.0, 19.0, 19.0, 24.0, 19.0, 22.0, 27.0, 40.0, 38.0, 30.0, 29.0, 33.0, 60.0, 47.0, 40.0, 49.0, 31.0, 31.0, 43.0, 30.0, 36.0, 31.0, 37.0, 33.0, 24.0, 27.0, 19.0, 23.0, 19.0, 10.0, 12.0, 11.0, 6.0, 4.0, 6.0, 3.0, 3.0, 4.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0], "bins": [-19.43821907043457, -18.87759017944336, -18.31696128845215, -17.756332397460938, -17.195703506469727, -16.635074615478516, -16.074445724487305, -15.513816833496094, -14.953187942504883, -14.392559051513672, -13.831930160522461, -13.27130126953125, -12.710672378540039, -12.150043487548828, -11.589414596557617, -11.028785705566406, -10.468155860900879, -9.907526969909668, -9.346898078918457, -8.786269187927246, -8.225640296936035, -7.665011405944824, -7.104382038116455, -6.543753147125244, -5.983124256134033, -5.422495365142822, -4.861866474151611, -4.301237106323242, -3.7406084537506104, -3.1799795627593994, -2.6193504333496094, -2.0587215423583984, -1.4980926513671875, -0.9374637007713318, -0.3768347501754761, 0.18379426002502441, 0.7444231510162354, 1.3050520420074463, 1.8656811714172363, 2.4263100624084473, 2.986938953399658, 3.547567844390869, 4.10819673538208, 4.668826103210449, 5.22945499420166, 5.790083885192871, 6.350712776184082, 6.911341667175293, 7.471970558166504, 8.032599449157715, 8.593228340148926, 9.153857231140137, 9.714486122131348, 10.275115013122559, 10.835744857788086, 11.396373748779297, 11.957002639770508, 12.517631530761719, 13.07826042175293, 13.63888931274414, 14.199518203735352, 14.760147094726562, 15.320775985717773, 15.881404876708984, 16.442033767700195]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 9.0, 12.0, 29.0, 33.0, 67.0, 132.0, 237.0, 364.0, 707.0, 1144.0, 1949.0, 3452.0, 5560.0, 9389.0, 15997.0, 26928.0, 43628.0, 70498.0, 111071.0, 169074.0, 245631.0, 333306.0, 420271.0, 482318.0, 496899.0, 463060.0, 387486.0, 298900.0, 215112.0, 145037.0, 94593.0, 59837.0, 36873.0, 22325.0, 13431.0, 7859.0, 4603.0, 2709.0, 1619.0, 860.0, 558.0, 314.0, 184.0, 92.0, 44.0, 36.0, 23.0, 11.0, 11.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.375, -10.032470703125, -9.68994140625, -9.347412109375, -9.0048828125, -8.662353515625, -8.31982421875, -7.977294921875, -7.634765625, -7.292236328125, -6.94970703125, -6.607177734375, -6.2646484375, -5.922119140625, -5.57958984375, -5.237060546875, -4.89453125, -4.552001953125, -4.20947265625, -3.866943359375, -3.5244140625, -3.181884765625, -2.83935546875, -2.496826171875, -2.154296875, -1.811767578125, -1.46923828125, -1.126708984375, -0.7841796875, -0.441650390625, -0.09912109375, 0.243408203125, 0.5859375, 0.928466796875, 1.27099609375, 1.613525390625, 1.9560546875, 2.298583984375, 2.64111328125, 2.983642578125, 3.326171875, 3.668701171875, 4.01123046875, 4.353759765625, 4.6962890625, 5.038818359375, 5.38134765625, 5.723876953125, 6.06640625, 6.408935546875, 6.75146484375, 7.093994140625, 7.4365234375, 7.779052734375, 8.12158203125, 8.464111328125, 8.806640625, 9.149169921875, 9.49169921875, 9.834228515625, 10.1767578125, 10.519287109375, 10.86181640625, 11.204345703125, 11.546875]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 7.0, 7.0, 5.0, 9.0, 10.0, 14.0, 9.0, 10.0, 13.0, 13.0, 20.0, 18.0, 20.0, 29.0, 35.0, 34.0, 33.0, 35.0, 33.0, 44.0, 48.0, 44.0, 42.0, 36.0, 38.0, 34.0, 33.0, 35.0, 46.0, 27.0, 27.0, 24.0, 32.0, 27.0, 19.0, 14.0, 17.0, 13.0, 11.0, 7.0, 11.0, 4.0, 5.0, 4.0, 3.0, 3.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-13.84375, -13.4271240234375, -13.010498046875, -12.5938720703125, -12.17724609375, -11.7606201171875, -11.343994140625, -10.9273681640625, -10.5107421875, -10.0941162109375, -9.677490234375, -9.2608642578125, -8.84423828125, -8.4276123046875, -8.010986328125, -7.5943603515625, -7.177734375, -6.7611083984375, -6.344482421875, -5.9278564453125, -5.51123046875, -5.0946044921875, -4.677978515625, -4.2613525390625, -3.8447265625, -3.4281005859375, -3.011474609375, -2.5948486328125, -2.17822265625, -1.7615966796875, -1.344970703125, -0.9283447265625, -0.51171875, -0.0950927734375, 0.321533203125, 0.7381591796875, 1.15478515625, 1.5714111328125, 1.988037109375, 2.4046630859375, 2.8212890625, 3.2379150390625, 3.654541015625, 4.0711669921875, 4.48779296875, 4.9044189453125, 5.321044921875, 5.7376708984375, 6.154296875, 6.5709228515625, 6.987548828125, 7.4041748046875, 7.82080078125, 8.2374267578125, 8.654052734375, 9.0706787109375, 9.4873046875, 9.9039306640625, 10.320556640625, 10.7371826171875, 11.15380859375, 11.5704345703125, 11.987060546875, 12.4036865234375, 12.8203125]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 5.0, 9.0, 14.0, 38.0, 62.0, 120.0, 162.0, 327.0, 514.0, 926.0, 1654.0, 2921.0, 4805.0, 8144.0, 13543.0, 22286.0, 35443.0, 55348.0, 84447.0, 124053.0, 174697.0, 235221.0, 300208.0, 358654.0, 403349.0, 422268.0, 411426.0, 373833.0, 316970.0, 253351.0, 189836.0, 137698.0, 95071.0, 62663.0, 40578.0, 25446.0, 15363.0, 9500.0, 5561.0, 3352.0, 1843.0, 1115.0, 621.0, 342.0, 246.0, 112.0, 63.0, 33.0, 14.0, 17.0, 6.0, 5.0, 5.0, 0.0, 1.0, 1.0], "bins": [-10.4921875, -10.1802978515625, -9.868408203125, -9.5565185546875, -9.24462890625, -8.9327392578125, -8.620849609375, -8.3089599609375, -7.9970703125, -7.6851806640625, -7.373291015625, -7.0614013671875, -6.74951171875, -6.4376220703125, -6.125732421875, -5.8138427734375, -5.501953125, -5.1900634765625, -4.878173828125, -4.5662841796875, -4.25439453125, -3.9425048828125, -3.630615234375, -3.3187255859375, -3.0068359375, -2.6949462890625, -2.383056640625, -2.0711669921875, -1.75927734375, -1.4473876953125, -1.135498046875, -0.8236083984375, -0.51171875, -0.1998291015625, 0.112060546875, 0.4239501953125, 0.73583984375, 1.0477294921875, 1.359619140625, 1.6715087890625, 1.9833984375, 2.2952880859375, 2.607177734375, 2.9190673828125, 3.23095703125, 3.5428466796875, 3.854736328125, 4.1666259765625, 4.478515625, 4.7904052734375, 5.102294921875, 5.4141845703125, 5.72607421875, 6.0379638671875, 6.349853515625, 6.6617431640625, 6.9736328125, 7.2855224609375, 7.597412109375, 7.9093017578125, 8.22119140625, 8.5330810546875, 8.844970703125, 9.1568603515625, 9.46875]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 4.0, 2.0, 4.0, 5.0, 4.0, 5.0, 5.0, 5.0, 24.0, 27.0, 39.0, 25.0, 37.0, 56.0, 74.0, 85.0, 89.0, 106.0, 118.0, 156.0, 149.0, 186.0, 203.0, 214.0, 189.0, 213.0, 192.0, 218.0, 196.0, 183.0, 177.0, 162.0, 154.0, 123.0, 130.0, 103.0, 86.0, 61.0, 58.0, 55.0, 34.0, 31.0, 31.0, 12.0, 12.0, 17.0, 10.0, 6.0, 7.0, 1.0, 3.0, 1.0, 1.0], "bins": [-6.97265625, -6.7838134765625, -6.594970703125, -6.4061279296875, -6.21728515625, -6.0284423828125, -5.839599609375, -5.6507568359375, -5.4619140625, -5.2730712890625, -5.084228515625, -4.8953857421875, -4.70654296875, -4.5177001953125, -4.328857421875, -4.1400146484375, -3.951171875, -3.7623291015625, -3.573486328125, -3.3846435546875, -3.19580078125, -3.0069580078125, -2.818115234375, -2.6292724609375, -2.4404296875, -2.2515869140625, -2.062744140625, -1.8739013671875, -1.68505859375, -1.4962158203125, -1.307373046875, -1.1185302734375, -0.9296875, -0.7408447265625, -0.552001953125, -0.3631591796875, -0.17431640625, 0.0145263671875, 0.203369140625, 0.3922119140625, 0.5810546875, 0.7698974609375, 0.958740234375, 1.1475830078125, 1.33642578125, 1.5252685546875, 1.714111328125, 1.9029541015625, 2.091796875, 2.2806396484375, 2.469482421875, 2.6583251953125, 2.84716796875, 3.0360107421875, 3.224853515625, 3.4136962890625, 3.6025390625, 3.7913818359375, 3.980224609375, 4.1690673828125, 4.35791015625, 4.5467529296875, 4.735595703125, 4.9244384765625, 5.11328125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 8.0, 5.0, 4.0, 8.0, 8.0, 13.0, 18.0, 18.0, 15.0, 20.0, 36.0, 34.0, 26.0, 30.0, 33.0, 29.0, 32.0, 51.0, 49.0, 39.0, 42.0, 40.0, 38.0, 42.0, 49.0, 42.0, 34.0, 24.0, 31.0, 29.0, 21.0, 28.0, 18.0, 15.0, 16.0, 6.0, 10.0, 6.0, 7.0, 4.0, 6.0, 8.0, 7.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.3630952835083, -10.952713012695312, -10.542329788208008, -10.13194751739502, -9.721565246582031, -9.311182022094727, -8.900799751281738, -8.49041748046875, -8.080034255981445, -7.669651508331299, -7.2592692375183105, -6.848886489868164, -6.438504219055176, -6.028121471405029, -5.617738723754883, -5.2073564529418945, -4.796974182128906, -4.38659143447876, -3.9762091636657715, -3.565826416015625, -3.1554439067840576, -2.7450613975524902, -2.3346786499023438, -1.9242961406707764, -1.513913631439209, -1.1035311222076416, -0.6931484937667847, -0.28276586532592773, 0.12761664390563965, 0.537999153137207, 0.9483819007873535, 1.358764410018921, 1.7691478729248047, 2.179530382156372, 2.5899128913879395, 3.000295639038086, 3.4106781482696533, 3.8210606575012207, 4.231443405151367, 4.6418256759643555, 5.052208423614502, 5.462591171264648, 5.872973442077637, 6.283356189727783, 6.69373893737793, 7.104121208190918, 7.5145039558410645, 7.924886703491211, 8.3352689743042, 8.745651245117188, 9.156034469604492, 9.56641674041748, 9.976799011230469, 10.387182235717773, 10.797564506530762, 11.20794677734375, 11.618330001831055, 12.028712272644043, 12.439095497131348, 12.849477767944336, 13.259860038757324, 13.670242309570312, 14.080625534057617, 14.491007804870605, 14.901390075683594]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 7.0, 1.0, 8.0, 11.0, 4.0, 7.0, 10.0, 14.0, 11.0, 13.0, 22.0, 19.0, 26.0, 28.0, 23.0, 34.0, 22.0, 34.0, 28.0, 36.0, 40.0, 31.0, 38.0, 51.0, 49.0, 42.0, 37.0, 30.0, 29.0, 34.0, 31.0, 37.0, 32.0, 26.0, 26.0, 18.0, 13.0, 12.0, 12.0, 11.0, 18.0, 9.0, 4.0, 9.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 4.0], "bins": [-16.742549896240234, -16.260732650756836, -15.778915405273438, -15.297098159790039, -14.81528091430664, -14.333463668823242, -13.851646423339844, -13.369829177856445, -12.888011932373047, -12.406194686889648, -11.92437744140625, -11.442560195922852, -10.960742950439453, -10.478925704956055, -9.997108459472656, -9.515291213989258, -9.03347396850586, -8.551656723022461, -8.069839477539062, -7.588022232055664, -7.106204986572266, -6.624387741088867, -6.142570495605469, -5.66075325012207, -5.178936004638672, -4.697118759155273, -4.215301513671875, -3.7334842681884766, -3.251667022705078, -2.7698497772216797, -2.2880325317382812, -1.8062152862548828, -1.3243989944458008, -0.8425817489624023, -0.3607645034790039, 0.12105274200439453, 0.602869987487793, 1.0846872329711914, 1.5665044784545898, 2.0483217239379883, 2.5301389694213867, 3.011956214904785, 3.4937734603881836, 3.975590705871582, 4.4574079513549805, 4.939225196838379, 5.421042442321777, 5.902859687805176, 6.384676933288574, 6.866494178771973, 7.348311424255371, 7.8301286697387695, 8.311945915222168, 8.793763160705566, 9.275580406188965, 9.757397651672363, 10.239214897155762, 10.72103214263916, 11.202849388122559, 11.684666633605957, 12.166483879089355, 12.648301124572754, 13.130118370056152, 13.61193561553955, 14.09375286102295]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 3.0, 10.0, 15.0, 16.0, 30.0, 41.0, 47.0, 102.0, 145.0, 226.0, 370.0, 613.0, 977.0, 1605.0, 2661.0, 4641.0, 8149.0, 15383.0, 28335.0, 53429.0, 97302.0, 159134.0, 207525.0, 187331.0, 124614.0, 71716.0, 37924.0, 20416.0, 11139.0, 5986.0, 3470.0, 1984.0, 1176.0, 743.0, 459.0, 290.0, 197.0, 120.0, 76.0, 65.0, 38.0, 18.0, 6.0, 10.0, 8.0, 4.0, 7.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.421875, -4.28253173828125, -4.1431884765625, -4.00384521484375, -3.864501953125, -3.72515869140625, -3.5858154296875, -3.44647216796875, -3.30712890625, -3.16778564453125, -3.0284423828125, -2.88909912109375, -2.749755859375, -2.61041259765625, -2.4710693359375, -2.33172607421875, -2.1923828125, -2.05303955078125, -1.9136962890625, -1.77435302734375, -1.635009765625, -1.49566650390625, -1.3563232421875, -1.21697998046875, -1.07763671875, -0.93829345703125, -0.7989501953125, -0.65960693359375, -0.520263671875, -0.38092041015625, -0.2415771484375, -0.10223388671875, 0.037109375, 0.17645263671875, 0.3157958984375, 0.45513916015625, 0.594482421875, 0.73382568359375, 0.8731689453125, 1.01251220703125, 1.15185546875, 1.29119873046875, 1.4305419921875, 1.56988525390625, 1.709228515625, 1.84857177734375, 1.9879150390625, 2.12725830078125, 2.2666015625, 2.40594482421875, 2.5452880859375, 2.68463134765625, 2.823974609375, 2.96331787109375, 3.1026611328125, 3.24200439453125, 3.38134765625, 3.52069091796875, 3.6600341796875, 3.79937744140625, 3.938720703125, 4.07806396484375, 4.2174072265625, 4.35675048828125, 4.49609375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 9.0, 9.0, 4.0, 11.0, 7.0, 10.0, 14.0, 19.0, 15.0, 25.0, 32.0, 33.0, 28.0, 30.0, 25.0, 46.0, 24.0, 41.0, 54.0, 39.0, 36.0, 50.0, 43.0, 44.0, 26.0, 39.0, 35.0, 39.0, 29.0, 31.0, 30.0, 25.0, 18.0, 17.0, 15.0, 18.0, 9.0, 7.0, 5.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.0625, -17.524658203125, -16.98681640625, -16.448974609375, -15.9111328125, -15.373291015625, -14.83544921875, -14.297607421875, -13.759765625, -13.221923828125, -12.68408203125, -12.146240234375, -11.6083984375, -11.070556640625, -10.53271484375, -9.994873046875, -9.45703125, -8.919189453125, -8.38134765625, -7.843505859375, -7.3056640625, -6.767822265625, -6.22998046875, -5.692138671875, -5.154296875, -4.616455078125, -4.07861328125, -3.540771484375, -3.0029296875, -2.465087890625, -1.92724609375, -1.389404296875, -0.8515625, -0.313720703125, 0.22412109375, 0.761962890625, 1.2998046875, 1.837646484375, 2.37548828125, 2.913330078125, 3.451171875, 3.989013671875, 4.52685546875, 5.064697265625, 5.6025390625, 6.140380859375, 6.67822265625, 7.216064453125, 7.75390625, 8.291748046875, 8.82958984375, 9.367431640625, 9.9052734375, 10.443115234375, 10.98095703125, 11.518798828125, 12.056640625, 12.594482421875, 13.13232421875, 13.670166015625, 14.2080078125, 14.745849609375, 15.28369140625, 15.821533203125, 16.359375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 5.0, 7.0, 7.0, 7.0, 12.0, 19.0, 15.0, 33.0, 33.0, 56.0, 68.0, 79.0, 103.0, 159.0, 228.0, 304.0, 457.0, 702.0, 1126.0, 1798.0, 3198.0, 5917.0, 11174.0, 22082.0, 43973.0, 84203.0, 147145.0, 206636.0, 204327.0, 143559.0, 82032.0, 42751.0, 21435.0, 10878.0, 5572.0, 3152.0, 1800.0, 1154.0, 689.0, 446.0, 331.0, 255.0, 165.0, 100.0, 91.0, 71.0, 56.0, 28.0, 36.0, 28.0, 17.0, 19.0, 8.0, 8.0, 3.0, 5.0, 0.0, 1.0, 3.0, 2.0], "bins": [-3.630859375, -3.517303466796875, -3.40374755859375, -3.290191650390625, -3.1766357421875, -3.063079833984375, -2.94952392578125, -2.835968017578125, -2.722412109375, -2.608856201171875, -2.49530029296875, -2.381744384765625, -2.2681884765625, -2.154632568359375, -2.04107666015625, -1.927520751953125, -1.81396484375, -1.700408935546875, -1.58685302734375, -1.473297119140625, -1.3597412109375, -1.246185302734375, -1.13262939453125, -1.019073486328125, -0.905517578125, -0.791961669921875, -0.67840576171875, -0.564849853515625, -0.4512939453125, -0.337738037109375, -0.22418212890625, -0.110626220703125, 0.0029296875, 0.116485595703125, 0.23004150390625, 0.343597412109375, 0.4571533203125, 0.570709228515625, 0.68426513671875, 0.797821044921875, 0.911376953125, 1.024932861328125, 1.13848876953125, 1.252044677734375, 1.3656005859375, 1.479156494140625, 1.59271240234375, 1.706268310546875, 1.81982421875, 1.933380126953125, 2.04693603515625, 2.160491943359375, 2.2740478515625, 2.387603759765625, 2.50115966796875, 2.614715576171875, 2.728271484375, 2.841827392578125, 2.95538330078125, 3.068939208984375, 3.1824951171875, 3.296051025390625, 3.40960693359375, 3.523162841796875, 3.63671875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 3.0, 10.0, 10.0, 8.0, 10.0, 13.0, 23.0, 24.0, 21.0, 33.0, 25.0, 31.0, 21.0, 33.0, 36.0, 40.0, 29.0, 38.0, 43.0, 45.0, 48.0, 51.0, 36.0, 47.0, 31.0, 41.0, 35.0, 29.0, 27.0, 24.0, 17.0, 19.0, 22.0, 13.0, 10.0, 9.0, 9.0, 8.0, 3.0, 9.0, 3.0, 7.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-12.140625, -11.7838134765625, -11.427001953125, -11.0701904296875, -10.71337890625, -10.3565673828125, -9.999755859375, -9.6429443359375, -9.2861328125, -8.9293212890625, -8.572509765625, -8.2156982421875, -7.85888671875, -7.5020751953125, -7.145263671875, -6.7884521484375, -6.431640625, -6.0748291015625, -5.718017578125, -5.3612060546875, -5.00439453125, -4.6475830078125, -4.290771484375, -3.9339599609375, -3.5771484375, -3.2203369140625, -2.863525390625, -2.5067138671875, -2.14990234375, -1.7930908203125, -1.436279296875, -1.0794677734375, -0.72265625, -0.3658447265625, -0.009033203125, 0.3477783203125, 0.70458984375, 1.0614013671875, 1.418212890625, 1.7750244140625, 2.1318359375, 2.4886474609375, 2.845458984375, 3.2022705078125, 3.55908203125, 3.9158935546875, 4.272705078125, 4.6295166015625, 4.986328125, 5.3431396484375, 5.699951171875, 6.0567626953125, 6.41357421875, 6.7703857421875, 7.127197265625, 7.4840087890625, 7.8408203125, 8.1976318359375, 8.554443359375, 8.9112548828125, 9.26806640625, 9.6248779296875, 9.981689453125, 10.3385009765625, 10.6953125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 8.0, 10.0, 11.0, 10.0, 21.0, 25.0, 34.0, 51.0, 72.0, 101.0, 118.0, 197.0, 223.0, 360.0, 496.0, 660.0, 988.0, 1356.0, 2000.0, 2977.0, 4850.0, 8019.0, 14988.0, 29934.0, 66520.0, 158780.0, 300181.0, 246080.0, 109997.0, 47102.0, 22225.0, 11561.0, 6524.0, 3911.0, 2524.0, 1706.0, 1151.0, 771.0, 580.0, 403.0, 310.0, 206.0, 141.0, 109.0, 83.0, 55.0, 45.0, 19.0, 19.0, 15.0, 8.0, 7.0, 8.0, 6.0, 2.0, 2.0, 5.0], "bins": [-0.84423828125, -0.8192520141601562, -0.7942657470703125, -0.7692794799804688, -0.744293212890625, -0.7193069458007812, -0.6943206787109375, -0.6693344116210938, -0.64434814453125, -0.6193618774414062, -0.5943756103515625, -0.5693893432617188, -0.544403076171875, -0.5194168090820312, -0.4944305419921875, -0.46944427490234375, -0.4444580078125, -0.41947174072265625, -0.3944854736328125, -0.36949920654296875, -0.344512939453125, -0.31952667236328125, -0.2945404052734375, -0.26955413818359375, -0.24456787109375, -0.21958160400390625, -0.1945953369140625, -0.16960906982421875, -0.144622802734375, -0.11963653564453125, -0.0946502685546875, -0.06966400146484375, -0.044677734375, -0.01969146728515625, 0.0052947998046875, 0.03028106689453125, 0.055267333984375, 0.08025360107421875, 0.1052398681640625, 0.13022613525390625, 0.15521240234375, 0.18019866943359375, 0.2051849365234375, 0.23017120361328125, 0.255157470703125, 0.28014373779296875, 0.3051300048828125, 0.33011627197265625, 0.3551025390625, 0.38008880615234375, 0.4050750732421875, 0.43006134033203125, 0.455047607421875, 0.48003387451171875, 0.5050201416015625, 0.5300064086914062, 0.55499267578125, 0.5799789428710938, 0.6049652099609375, 0.6299514770507812, 0.654937744140625, 0.6799240112304688, 0.7049102783203125, 0.7298965454101562, 0.7548828125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 3.0, 10.0, 2.0, 6.0, 7.0, 13.0, 16.0, 16.0, 27.0, 28.0, 37.0, 48.0, 82.0, 111.0, 111.0, 123.0, 81.0, 68.0, 52.0, 34.0, 28.0, 24.0, 14.0, 7.0, 10.0, 8.0, 10.0, 5.0, 4.0, 3.0, 6.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.00021278858184814453, -0.0002070162445306778, -0.00020124390721321106, -0.00019547156989574432, -0.0001896992325782776, -0.00018392689526081085, -0.00017815455794334412, -0.00017238222062587738, -0.00016660988330841064, -0.0001608375459909439, -0.00015506520867347717, -0.00014929287135601044, -0.0001435205340385437, -0.00013774819672107697, -0.00013197585940361023, -0.0001262035220861435, -0.00012043118476867676, -0.00011465884745121002, -0.00010888651013374329, -0.00010311417281627655, -9.734183549880981e-05, -9.156949818134308e-05, -8.579716086387634e-05, -8.002482354640961e-05, -7.425248622894287e-05, -6.848014891147614e-05, -6.27078115940094e-05, -5.6935474276542664e-05, -5.116313695907593e-05, -4.539079964160919e-05, -3.9618462324142456e-05, -3.384612500667572e-05, -2.8073787689208984e-05, -2.230145037174225e-05, -1.6529113054275513e-05, -1.0756775736808777e-05, -4.984438419342041e-06, 7.878988981246948e-07, 6.560236215591431e-06, 1.2332573533058167e-05, 1.8104910850524902e-05, 2.3877248167991638e-05, 2.9649585485458374e-05, 3.542192280292511e-05, 4.1194260120391846e-05, 4.696659743785858e-05, 5.273893475532532e-05, 5.851127207279205e-05, 6.428360939025879e-05, 7.005594670772552e-05, 7.582828402519226e-05, 8.1600621342659e-05, 8.737295866012573e-05, 9.314529597759247e-05, 9.89176332950592e-05, 0.00010468997061252594, 0.00011046230792999268, 0.00011623464524745941, 0.00012200698256492615, 0.00012777931988239288, 0.00013355165719985962, 0.00013932399451732635, 0.0001450963318347931, 0.00015086866915225983, 0.00015664100646972656]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 2.0, 7.0, 14.0, 9.0, 23.0, 32.0, 37.0, 58.0, 90.0, 109.0, 173.0, 294.0, 388.0, 564.0, 813.0, 1282.0, 1891.0, 2836.0, 4406.0, 7146.0, 11670.0, 19917.0, 37755.0, 75170.0, 158713.0, 268999.0, 222343.0, 111257.0, 53863.0, 27829.0, 15479.0, 9075.0, 5646.0, 3583.0, 2395.0, 1567.0, 954.0, 685.0, 465.0, 298.0, 210.0, 167.0, 102.0, 81.0, 45.0, 35.0, 27.0, 13.0, 14.0, 10.0, 6.0, 8.0, 4.0, 3.0, 0.0, 1.0, 1.0], "bins": [-1.4052734375, -1.3623809814453125, -1.319488525390625, -1.2765960693359375, -1.23370361328125, -1.1908111572265625, -1.147918701171875, -1.1050262451171875, -1.0621337890625, -1.0192413330078125, -0.976348876953125, -0.9334564208984375, -0.89056396484375, -0.8476715087890625, -0.804779052734375, -0.7618865966796875, -0.718994140625, -0.6761016845703125, -0.633209228515625, -0.5903167724609375, -0.54742431640625, -0.5045318603515625, -0.461639404296875, -0.4187469482421875, -0.3758544921875, -0.3329620361328125, -0.290069580078125, -0.2471771240234375, -0.20428466796875, -0.1613922119140625, -0.118499755859375, -0.0756072998046875, -0.03271484375, 0.0101776123046875, 0.053070068359375, 0.0959625244140625, 0.13885498046875, 0.1817474365234375, 0.224639892578125, 0.2675323486328125, 0.3104248046875, 0.3533172607421875, 0.396209716796875, 0.4391021728515625, 0.48199462890625, 0.5248870849609375, 0.567779541015625, 0.6106719970703125, 0.653564453125, 0.6964569091796875, 0.739349365234375, 0.7822418212890625, 0.82513427734375, 0.8680267333984375, 0.910919189453125, 0.9538116455078125, 0.9967041015625, 1.0395965576171875, 1.082489013671875, 1.1253814697265625, 1.16827392578125, 1.2111663818359375, 1.254058837890625, 1.2969512939453125, 1.33984375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 5.0, 4.0, 6.0, 15.0, 16.0, 18.0, 38.0, 69.0, 86.0, 151.0, 161.0, 135.0, 100.0, 71.0, 44.0, 21.0, 14.0, 11.0, 8.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.9013671875, -0.8728790283203125, -0.844390869140625, -0.8159027099609375, -0.78741455078125, -0.7589263916015625, -0.730438232421875, -0.7019500732421875, -0.6734619140625, -0.6449737548828125, -0.616485595703125, -0.5879974365234375, -0.55950927734375, -0.5310211181640625, -0.502532958984375, -0.4740447998046875, -0.445556640625, -0.4170684814453125, -0.388580322265625, -0.3600921630859375, -0.33160400390625, -0.3031158447265625, -0.274627685546875, -0.2461395263671875, -0.2176513671875, -0.1891632080078125, -0.160675048828125, -0.1321868896484375, -0.10369873046875, -0.0752105712890625, -0.046722412109375, -0.0182342529296875, 0.01025390625, 0.0387420654296875, 0.067230224609375, 0.0957183837890625, 0.12420654296875, 0.1526947021484375, 0.181182861328125, 0.2096710205078125, 0.2381591796875, 0.2666473388671875, 0.295135498046875, 0.3236236572265625, 0.35211181640625, 0.3805999755859375, 0.409088134765625, 0.4375762939453125, 0.466064453125, 0.4945526123046875, 0.523040771484375, 0.5515289306640625, 0.58001708984375, 0.6085052490234375, 0.636993408203125, 0.6654815673828125, 0.6939697265625, 0.7224578857421875, 0.750946044921875, 0.7794342041015625, 0.80792236328125, 0.8364105224609375, 0.864898681640625, 0.8933868408203125, 0.921875]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 2.0, 1.0, 3.0, 8.0, 2.0, 5.0, 12.0, 10.0, 11.0, 16.0, 16.0, 28.0, 22.0, 36.0, 31.0, 29.0, 30.0, 28.0, 37.0, 39.0, 49.0, 44.0, 41.0, 42.0, 44.0, 39.0, 45.0, 43.0, 38.0, 29.0, 33.0, 32.0, 24.0, 24.0, 21.0, 15.0, 15.0, 13.0, 12.0, 5.0, 5.0, 5.0, 7.0, 6.0, 9.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.873531341552734, -10.458719253540039, -10.043907165527344, -9.629095077514648, -9.214282989501953, -8.799470901489258, -8.384658813476562, -7.969845771789551, -7.5550336837768555, -7.14022159576416, -6.725409507751465, -6.3105974197387695, -5.895784854888916, -5.480972766876221, -5.066160678863525, -4.651348114013672, -4.236536502838135, -3.8217244148254395, -3.406912088394165, -2.9921000003814697, -2.5772876739501953, -2.1624755859375, -1.7476634979248047, -1.3328511714935303, -0.918039083480835, -0.5032268762588501, -0.08841472864151001, 0.3263974189758301, 0.7412096261978149, 1.1560218334197998, 1.5708339214324951, 1.9856462478637695, 2.400458335876465, 2.81527042388916, 3.2300827503204346, 3.64489483833313, 4.059707164764404, 4.4745192527771, 4.889331340789795, 5.304143905639648, 5.718955993652344, 6.133768081665039, 6.548580169677734, 6.96339225769043, 7.378204822540283, 7.7930169105529785, 8.207828521728516, 8.622641563415527, 9.037452697753906, 9.452264785766602, 9.867076873779297, 10.281888961791992, 10.696701049804688, 11.111513137817383, 11.526325225830078, 11.94113826751709, 12.355950355529785, 12.77076244354248, 13.185574531555176, 13.600386619567871, 14.015198707580566, 14.430011749267578, 14.844823837280273, 15.259635925292969, 15.674448013305664]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 3.0, 8.0, 10.0, 6.0, 5.0, 10.0, 14.0, 14.0, 12.0, 22.0, 18.0, 26.0, 23.0, 26.0, 33.0, 22.0, 33.0, 26.0, 39.0, 41.0, 34.0, 36.0, 42.0, 55.0, 41.0, 39.0, 33.0, 30.0, 28.0, 33.0, 41.0, 32.0, 28.0, 19.0, 21.0, 14.0, 11.0, 12.0, 11.0, 20.0, 7.0, 5.0, 7.0, 6.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 4.0], "bins": [-16.54392433166504, -16.06588363647461, -15.587841033935547, -15.1097993850708, -14.631757736206055, -14.153717041015625, -13.675675392150879, -13.197633743286133, -12.719592094421387, -12.24155044555664, -11.763508796691895, -11.285467147827148, -10.807426452636719, -10.329383850097656, -9.851343154907227, -9.37330150604248, -8.895259857177734, -8.417218208312988, -7.939176559448242, -7.461135387420654, -6.983093738555908, -6.505052089691162, -6.027010917663574, -5.548969268798828, -5.070927619934082, -4.592885971069336, -4.11484432220459, -3.636803150177002, -3.158761501312256, -2.6807198524475098, -2.2026784420013428, -1.7246370315551758, -1.246596336364746, -0.7685548067092896, -0.290513277053833, 0.18752825260162354, 0.6655697822570801, 1.1436114311218262, 1.6216528415679932, 2.09969425201416, 2.5777359008789062, 3.0557775497436523, 3.5338189601898193, 4.011860370635986, 4.489902019500732, 4.9679436683654785, 5.445984840393066, 5.9240264892578125, 6.402068138122559, 6.880109786987305, 7.358151435852051, 7.836192607879639, 8.314233779907227, 8.792276382446289, 9.270317077636719, 9.748358726501465, 10.226400375366211, 10.704442024230957, 11.182483673095703, 11.66052532196045, 12.138566970825195, 12.616607666015625, 13.094649314880371, 13.572690963745117, 14.050732612609863]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 5.0, 2.0, 7.0, 13.0, 13.0, 29.0, 47.0, 62.0, 109.0, 175.0, 291.0, 462.0, 758.0, 1177.0, 1729.0, 2838.0, 4459.0, 6724.0, 10249.0, 15071.0, 21936.0, 30502.0, 41517.0, 54067.0, 67766.0, 80416.0, 90743.0, 96725.0, 96681.0, 90590.0, 79953.0, 66827.0, 53063.0, 40514.0, 29572.0, 20885.0, 14428.0, 9981.0, 6476.0, 4254.0, 2689.0, 1756.0, 1124.0, 709.0, 415.0, 291.0, 165.0, 105.0, 83.0, 42.0, 25.0, 21.0, 9.0, 11.0, 3.0, 6.0, 1.0, 2.0, 0.0, 1.0], "bins": [-8.765625, -8.4913330078125, -8.217041015625, -7.9427490234375, -7.66845703125, -7.3941650390625, -7.119873046875, -6.8455810546875, -6.5712890625, -6.2969970703125, -6.022705078125, -5.7484130859375, -5.47412109375, -5.1998291015625, -4.925537109375, -4.6512451171875, -4.376953125, -4.1026611328125, -3.828369140625, -3.5540771484375, -3.27978515625, -3.0054931640625, -2.731201171875, -2.4569091796875, -2.1826171875, -1.9083251953125, -1.634033203125, -1.3597412109375, -1.08544921875, -0.8111572265625, -0.536865234375, -0.2625732421875, 0.01171875, 0.2860107421875, 0.560302734375, 0.8345947265625, 1.10888671875, 1.3831787109375, 1.657470703125, 1.9317626953125, 2.2060546875, 2.4803466796875, 2.754638671875, 3.0289306640625, 3.30322265625, 3.5775146484375, 3.851806640625, 4.1260986328125, 4.400390625, 4.6746826171875, 4.948974609375, 5.2232666015625, 5.49755859375, 5.7718505859375, 6.046142578125, 6.3204345703125, 6.5947265625, 6.8690185546875, 7.143310546875, 7.4176025390625, 7.69189453125, 7.9661865234375, 8.240478515625, 8.5147705078125, 8.7890625]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 8.0, 10.0, 7.0, 5.0, 19.0, 12.0, 17.0, 20.0, 24.0, 24.0, 24.0, 28.0, 36.0, 28.0, 28.0, 47.0, 40.0, 45.0, 55.0, 51.0, 34.0, 50.0, 35.0, 38.0, 35.0, 36.0, 31.0, 32.0, 24.0, 17.0, 26.0, 20.0, 26.0, 11.0, 9.0, 10.0, 16.0, 8.0, 5.0, 4.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-17.828125, -17.3125, -16.796875, -16.28125, -15.765625, -15.25, -14.734375, -14.21875, -13.703125, -13.1875, -12.671875, -12.15625, -11.640625, -11.125, -10.609375, -10.09375, -9.578125, -9.0625, -8.546875, -8.03125, -7.515625, -7.0, -6.484375, -5.96875, -5.453125, -4.9375, -4.421875, -3.90625, -3.390625, -2.875, -2.359375, -1.84375, -1.328125, -0.8125, -0.296875, 0.21875, 0.734375, 1.25, 1.765625, 2.28125, 2.796875, 3.3125, 3.828125, 4.34375, 4.859375, 5.375, 5.890625, 6.40625, 6.921875, 7.4375, 7.953125, 8.46875, 8.984375, 9.5, 10.015625, 10.53125, 11.046875, 11.5625, 12.078125, 12.59375, 13.109375, 13.625, 14.140625, 14.65625, 15.171875]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 5.0, 11.0, 12.0, 34.0, 65.0, 81.0, 124.0, 220.0, 324.0, 528.0, 857.0, 1364.0, 2139.0, 3336.0, 5283.0, 8171.0, 12386.0, 18347.0, 26977.0, 37223.0, 50392.0, 64909.0, 78970.0, 92032.0, 99385.0, 100434.0, 95072.0, 84891.0, 70984.0, 56167.0, 42934.0, 31029.0, 21731.0, 14700.0, 9896.0, 6367.0, 4114.0, 2691.0, 1643.0, 1074.0, 628.0, 416.0, 256.0, 139.0, 87.0, 55.0, 28.0, 25.0, 14.0, 8.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.265625, -7.97265625, -7.6796875, -7.38671875, -7.09375, -6.80078125, -6.5078125, -6.21484375, -5.921875, -5.62890625, -5.3359375, -5.04296875, -4.75, -4.45703125, -4.1640625, -3.87109375, -3.578125, -3.28515625, -2.9921875, -2.69921875, -2.40625, -2.11328125, -1.8203125, -1.52734375, -1.234375, -0.94140625, -0.6484375, -0.35546875, -0.0625, 0.23046875, 0.5234375, 0.81640625, 1.109375, 1.40234375, 1.6953125, 1.98828125, 2.28125, 2.57421875, 2.8671875, 3.16015625, 3.453125, 3.74609375, 4.0390625, 4.33203125, 4.625, 4.91796875, 5.2109375, 5.50390625, 5.796875, 6.08984375, 6.3828125, 6.67578125, 6.96875, 7.26171875, 7.5546875, 7.84765625, 8.140625, 8.43359375, 8.7265625, 9.01953125, 9.3125, 9.60546875, 9.8984375, 10.19140625, 10.484375]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 8.0, 5.0, 6.0, 9.0, 9.0, 11.0, 12.0, 15.0, 15.0, 31.0, 19.0, 21.0, 37.0, 32.0, 37.0, 28.0, 39.0, 46.0, 35.0, 32.0, 50.0, 47.0, 47.0, 51.0, 48.0, 39.0, 25.0, 26.0, 37.0, 29.0, 25.0, 20.0, 22.0, 13.0, 10.0, 15.0, 12.0, 9.0, 5.0, 9.0, 7.0, 4.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.1171875, -10.7918701171875, -10.466552734375, -10.1412353515625, -9.81591796875, -9.4906005859375, -9.165283203125, -8.8399658203125, -8.5146484375, -8.1893310546875, -7.864013671875, -7.5386962890625, -7.21337890625, -6.8880615234375, -6.562744140625, -6.2374267578125, -5.912109375, -5.5867919921875, -5.261474609375, -4.9361572265625, -4.61083984375, -4.2855224609375, -3.960205078125, -3.6348876953125, -3.3095703125, -2.9842529296875, -2.658935546875, -2.3336181640625, -2.00830078125, -1.6829833984375, -1.357666015625, -1.0323486328125, -0.70703125, -0.3817138671875, -0.056396484375, 0.2689208984375, 0.59423828125, 0.9195556640625, 1.244873046875, 1.5701904296875, 1.8955078125, 2.2208251953125, 2.546142578125, 2.8714599609375, 3.19677734375, 3.5220947265625, 3.847412109375, 4.1727294921875, 4.498046875, 4.8233642578125, 5.148681640625, 5.4739990234375, 5.79931640625, 6.1246337890625, 6.449951171875, 6.7752685546875, 7.1005859375, 7.4259033203125, 7.751220703125, 8.0765380859375, 8.40185546875, 8.7271728515625, 9.052490234375, 9.3778076171875, 9.703125]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 5.0, 4.0, 3.0, 7.0, 13.0, 16.0, 31.0, 39.0, 60.0, 76.0, 127.0, 179.0, 304.0, 426.0, 650.0, 966.0, 1505.0, 2268.0, 3327.0, 5170.0, 7833.0, 11791.0, 17705.0, 26549.0, 38917.0, 54889.0, 72532.0, 91587.0, 106714.0, 113852.0, 110873.0, 98899.0, 80369.0, 62232.0, 44791.0, 31017.0, 21233.0, 14082.0, 9431.0, 6064.0, 4039.0, 2758.0, 1769.0, 1135.0, 802.0, 547.0, 347.0, 225.0, 154.0, 93.0, 55.0, 31.0, 19.0, 19.0, 8.0, 7.0, 7.0, 7.0, 6.0, 1.0, 6.0], "bins": [-3.962890625, -3.84173583984375, -3.7205810546875, -3.59942626953125, -3.478271484375, -3.35711669921875, -3.2359619140625, -3.11480712890625, -2.99365234375, -2.87249755859375, -2.7513427734375, -2.63018798828125, -2.509033203125, -2.38787841796875, -2.2667236328125, -2.14556884765625, -2.0244140625, -1.90325927734375, -1.7821044921875, -1.66094970703125, -1.539794921875, -1.41864013671875, -1.2974853515625, -1.17633056640625, -1.05517578125, -0.93402099609375, -0.8128662109375, -0.69171142578125, -0.570556640625, -0.44940185546875, -0.3282470703125, -0.20709228515625, -0.0859375, 0.03521728515625, 0.1563720703125, 0.27752685546875, 0.398681640625, 0.51983642578125, 0.6409912109375, 0.76214599609375, 0.88330078125, 1.00445556640625, 1.1256103515625, 1.24676513671875, 1.367919921875, 1.48907470703125, 1.6102294921875, 1.73138427734375, 1.8525390625, 1.97369384765625, 2.0948486328125, 2.21600341796875, 2.337158203125, 2.45831298828125, 2.5794677734375, 2.70062255859375, 2.82177734375, 2.94293212890625, 3.0640869140625, 3.18524169921875, 3.306396484375, 3.42755126953125, 3.5487060546875, 3.66986083984375, 3.791015625]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 3.0, 3.0, 4.0, 7.0, 5.0, 8.0, 10.0, 11.0, 15.0, 19.0, 22.0, 23.0, 21.0, 40.0, 30.0, 33.0, 42.0, 43.0, 52.0, 46.0, 42.0, 55.0, 42.0, 38.0, 46.0, 44.0, 36.0, 21.0, 45.0, 26.0, 26.0, 22.0, 31.0, 13.0, 16.0, 9.0, 16.0, 8.0, 6.0, 11.0, 3.0, 3.0, 3.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000446319580078125, -0.0004323050379753113, -0.00041829049587249756, -0.00040427595376968384, -0.0003902614116668701, -0.0003762468695640564, -0.0003622323274612427, -0.00034821778535842896, -0.00033420324325561523, -0.0003201887011528015, -0.0003061741590499878, -0.00029215961694717407, -0.00027814507484436035, -0.00026413053274154663, -0.0002501159906387329, -0.0002361014485359192, -0.00022208690643310547, -0.00020807236433029175, -0.00019405782222747803, -0.0001800432801246643, -0.00016602873802185059, -0.00015201419591903687, -0.00013799965381622314, -0.00012398511171340942, -0.0001099705696105957, -9.595602750778198e-05, -8.194148540496826e-05, -6.792694330215454e-05, -5.391240119934082e-05, -3.98978590965271e-05, -2.588331699371338e-05, -1.1868774890899658e-05, 2.1457672119140625e-06, 1.6160309314727783e-05, 3.0174851417541504e-05, 4.4189393520355225e-05, 5.8203935623168945e-05, 7.221847772598267e-05, 8.623301982879639e-05, 0.00010024756193161011, 0.00011426210403442383, 0.00012827664613723755, 0.00014229118824005127, 0.000156305730342865, 0.0001703202724456787, 0.00018433481454849243, 0.00019834935665130615, 0.00021236389875411987, 0.0002263784408569336, 0.00024039298295974731, 0.00025440752506256104, 0.00026842206716537476, 0.0002824366092681885, 0.0002964511513710022, 0.0003104656934738159, 0.00032448023557662964, 0.00033849477767944336, 0.0003525093197822571, 0.0003665238618850708, 0.0003805384039878845, 0.00039455294609069824, 0.00040856748819351196, 0.0004225820302963257, 0.0004365965723991394, 0.0004506111145019531]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 6.0, 9.0, 15.0, 15.0, 29.0, 38.0, 73.0, 105.0, 161.0, 284.0, 459.0, 724.0, 1261.0, 2166.0, 3844.0, 6658.0, 11544.0, 20095.0, 34413.0, 56722.0, 87264.0, 120281.0, 146056.0, 152036.0, 132641.0, 101027.0, 68227.0, 42583.0, 25129.0, 14622.0, 8410.0, 4798.0, 2772.0, 1618.0, 940.0, 613.0, 342.0, 240.0, 127.0, 81.0, 50.0, 32.0, 12.0, 13.0, 11.0, 5.0, 2.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.3125, -5.14227294921875, -4.9720458984375, -4.80181884765625, -4.631591796875, -4.46136474609375, -4.2911376953125, -4.12091064453125, -3.95068359375, -3.78045654296875, -3.6102294921875, -3.44000244140625, -3.269775390625, -3.09954833984375, -2.9293212890625, -2.75909423828125, -2.5888671875, -2.41864013671875, -2.2484130859375, -2.07818603515625, -1.907958984375, -1.73773193359375, -1.5675048828125, -1.39727783203125, -1.22705078125, -1.05682373046875, -0.8865966796875, -0.71636962890625, -0.546142578125, -0.37591552734375, -0.2056884765625, -0.03546142578125, 0.134765625, 0.30499267578125, 0.4752197265625, 0.64544677734375, 0.815673828125, 0.98590087890625, 1.1561279296875, 1.32635498046875, 1.49658203125, 1.66680908203125, 1.8370361328125, 2.00726318359375, 2.177490234375, 2.34771728515625, 2.5179443359375, 2.68817138671875, 2.8583984375, 3.02862548828125, 3.1988525390625, 3.36907958984375, 3.539306640625, 3.70953369140625, 3.8797607421875, 4.04998779296875, 4.22021484375, 4.39044189453125, 4.5606689453125, 4.73089599609375, 4.901123046875, 5.07135009765625, 5.2415771484375, 5.41180419921875, 5.58203125]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 10.0, 4.0, 3.0, 9.0, 8.0, 12.0, 11.0, 19.0, 12.0, 16.0, 29.0, 31.0, 30.0, 40.0, 28.0, 34.0, 30.0, 46.0, 48.0, 49.0, 39.0, 43.0, 48.0, 43.0, 47.0, 48.0, 46.0, 38.0, 38.0, 26.0, 23.0, 13.0, 20.0, 12.0, 15.0, 12.0, 4.0, 3.0, 5.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.095703125, -2.03509521484375, -1.9744873046875, -1.91387939453125, -1.853271484375, -1.79266357421875, -1.7320556640625, -1.67144775390625, -1.61083984375, -1.55023193359375, -1.4896240234375, -1.42901611328125, -1.368408203125, -1.30780029296875, -1.2471923828125, -1.18658447265625, -1.1259765625, -1.06536865234375, -1.0047607421875, -0.94415283203125, -0.883544921875, -0.82293701171875, -0.7623291015625, -0.70172119140625, -0.64111328125, -0.58050537109375, -0.5198974609375, -0.45928955078125, -0.398681640625, -0.33807373046875, -0.2774658203125, -0.21685791015625, -0.15625, -0.09564208984375, -0.0350341796875, 0.02557373046875, 0.086181640625, 0.14678955078125, 0.2073974609375, 0.26800537109375, 0.32861328125, 0.38922119140625, 0.4498291015625, 0.51043701171875, 0.571044921875, 0.63165283203125, 0.6922607421875, 0.75286865234375, 0.8134765625, 0.87408447265625, 0.9346923828125, 0.99530029296875, 1.055908203125, 1.11651611328125, 1.1771240234375, 1.23773193359375, 1.29833984375, 1.35894775390625, 1.4195556640625, 1.48016357421875, 1.540771484375, 1.60137939453125, 1.6619873046875, 1.72259521484375, 1.783203125]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 1.0, 2.0, 4.0, 2.0, 5.0, 7.0, 6.0, 12.0, 12.0, 21.0, 17.0, 18.0, 28.0, 25.0, 27.0, 32.0, 36.0, 38.0, 28.0, 48.0, 36.0, 42.0, 46.0, 45.0, 45.0, 38.0, 47.0, 51.0, 36.0, 41.0, 32.0, 24.0, 23.0, 19.0, 23.0, 17.0, 20.0, 8.0, 7.0, 12.0, 2.0, 7.0, 5.0, 2.0, 7.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.385777473449707, -10.968724250793457, -10.551671028137207, -10.134617805480957, -9.717564582824707, -9.30051040649414, -8.88345718383789, -8.46640396118164, -8.04935073852539, -7.632297515869141, -7.215244293212891, -6.798191070556641, -6.381137371063232, -5.964084148406982, -5.547030925750732, -5.129977226257324, -4.712924480438232, -4.295871257781982, -3.8788177967071533, -3.4617645740509033, -3.044711112976074, -2.627657890319824, -2.210604667663574, -1.7935512065887451, -1.3764979839324951, -0.9594446420669556, -0.5423913598060608, -0.12533807754516602, 0.29171526432037354, 0.7087686061859131, 1.125821828842163, 1.5428752899169922, 1.9599285125732422, 2.376981735229492, 2.7940351963043213, 3.2110884189605713, 3.6281418800354004, 4.04519510269165, 4.4622483253479, 4.879302024841309, 5.296355247497559, 5.713408470153809, 6.130461692810059, 6.547514915466309, 6.964568614959717, 7.381621837615967, 7.798675060272217, 8.215728759765625, 8.632781982421875, 9.049835205078125, 9.466888427734375, 9.883941650390625, 10.300994873046875, 10.718048095703125, 11.135101318359375, 11.552155494689941, 11.969207763671875, 12.386260986328125, 12.803314208984375, 13.220367431640625, 13.637420654296875, 14.054473876953125, 14.471527099609375, 14.888581275939941, 15.305634498596191]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 5.0, 4.0, 4.0, 8.0, 9.0, 6.0, 13.0, 10.0, 8.0, 8.0, 13.0, 29.0, 21.0, 29.0, 21.0, 25.0, 35.0, 39.0, 33.0, 28.0, 34.0, 42.0, 42.0, 31.0, 42.0, 50.0, 27.0, 40.0, 45.0, 35.0, 31.0, 31.0, 26.0, 26.0, 24.0, 19.0, 10.0, 16.0, 21.0, 16.0, 14.0, 9.0, 8.0, 14.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0], "bins": [-17.004196166992188, -16.49961280822754, -15.99502944946289, -15.490447044372559, -14.98586368560791, -14.481280326843262, -13.97669792175293, -13.472114562988281, -12.967531204223633, -12.462947845458984, -11.958364486694336, -11.453782081604004, -10.949198722839355, -10.444615364074707, -9.940032958984375, -9.435449600219727, -8.930866241455078, -8.42628288269043, -7.9217000007629395, -7.417117118835449, -6.912533760070801, -6.407950401306152, -5.903367519378662, -5.398784637451172, -4.894201278686523, -4.389617919921875, -3.8850350379943848, -3.3804519176483154, -2.875868797302246, -2.3712856769561768, -1.8667025566101074, -1.362119436264038, -0.8575363159179688, -0.3529531955718994, 0.15162992477416992, 0.6562130451202393, 1.1607961654663086, 1.665379285812378, 2.1699624061584473, 2.6745455265045166, 3.179128646850586, 3.6837117671966553, 4.188294887542725, 4.692877769470215, 5.197461128234863, 5.702044486999512, 6.206627368927002, 6.711210250854492, 7.215793609619141, 7.720376968383789, 8.224960327148438, 8.72954273223877, 9.234126091003418, 9.738709449768066, 10.243291854858398, 10.747875213623047, 11.252458572387695, 11.757041931152344, 12.261625289916992, 12.766207695007324, 13.270791053771973, 13.775374412536621, 14.279956817626953, 14.784540176391602, 15.28912353515625]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 7.0, 9.0, 14.0, 29.0, 44.0, 75.0, 89.0, 149.0, 225.0, 406.0, 635.0, 1007.0, 1594.0, 2444.0, 4025.0, 6194.0, 9408.0, 14522.0, 22175.0, 33493.0, 49898.0, 73426.0, 105623.0, 146341.0, 198075.0, 256026.0, 315297.0, 366757.0, 398311.0, 405767.0, 382758.0, 339192.0, 282122.0, 223455.0, 168482.0, 123040.0, 86403.0, 60198.0, 40469.0, 26871.0, 17547.0, 11396.0, 7320.0, 4698.0, 3062.0, 1965.0, 1180.0, 756.0, 507.0, 306.0, 189.0, 114.0, 67.0, 59.0, 33.0, 22.0, 9.0, 8.0, 5.0, 2.0, 1.0, 1.0], "bins": [-8.71875, -8.439453125, -8.16015625, -7.880859375, -7.6015625, -7.322265625, -7.04296875, -6.763671875, -6.484375, -6.205078125, -5.92578125, -5.646484375, -5.3671875, -5.087890625, -4.80859375, -4.529296875, -4.25, -3.970703125, -3.69140625, -3.412109375, -3.1328125, -2.853515625, -2.57421875, -2.294921875, -2.015625, -1.736328125, -1.45703125, -1.177734375, -0.8984375, -0.619140625, -0.33984375, -0.060546875, 0.21875, 0.498046875, 0.77734375, 1.056640625, 1.3359375, 1.615234375, 1.89453125, 2.173828125, 2.453125, 2.732421875, 3.01171875, 3.291015625, 3.5703125, 3.849609375, 4.12890625, 4.408203125, 4.6875, 4.966796875, 5.24609375, 5.525390625, 5.8046875, 6.083984375, 6.36328125, 6.642578125, 6.921875, 7.201171875, 7.48046875, 7.759765625, 8.0390625, 8.318359375, 8.59765625, 8.876953125, 9.15625]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 7.0, 5.0, 9.0, 9.0, 10.0, 17.0, 14.0, 18.0, 16.0, 16.0, 25.0, 25.0, 41.0, 34.0, 38.0, 27.0, 30.0, 33.0, 37.0, 42.0, 45.0, 41.0, 39.0, 42.0, 45.0, 33.0, 43.0, 33.0, 32.0, 24.0, 33.0, 28.0, 16.0, 14.0, 10.0, 15.0, 15.0, 11.0, 8.0, 6.0, 5.0, 4.0, 1.0, 4.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.1875, -12.7838134765625, -12.380126953125, -11.9764404296875, -11.57275390625, -11.1690673828125, -10.765380859375, -10.3616943359375, -9.9580078125, -9.5543212890625, -9.150634765625, -8.7469482421875, -8.34326171875, -7.9395751953125, -7.535888671875, -7.1322021484375, -6.728515625, -6.3248291015625, -5.921142578125, -5.5174560546875, -5.11376953125, -4.7100830078125, -4.306396484375, -3.9027099609375, -3.4990234375, -3.0953369140625, -2.691650390625, -2.2879638671875, -1.88427734375, -1.4805908203125, -1.076904296875, -0.6732177734375, -0.26953125, 0.1341552734375, 0.537841796875, 0.9415283203125, 1.34521484375, 1.7489013671875, 2.152587890625, 2.5562744140625, 2.9599609375, 3.3636474609375, 3.767333984375, 4.1710205078125, 4.57470703125, 4.9783935546875, 5.382080078125, 5.7857666015625, 6.189453125, 6.5931396484375, 6.996826171875, 7.4005126953125, 7.80419921875, 8.2078857421875, 8.611572265625, 9.0152587890625, 9.4189453125, 9.8226318359375, 10.226318359375, 10.6300048828125, 11.03369140625, 11.4373779296875, 11.841064453125, 12.2447509765625, 12.6484375]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 4.0, 7.0, 14.0, 21.0, 46.0, 89.0, 151.0, 253.0, 413.0, 703.0, 1191.0, 1964.0, 3387.0, 5427.0, 8982.0, 14448.0, 22147.0, 34376.0, 51579.0, 76790.0, 108425.0, 149880.0, 199003.0, 251721.0, 303389.0, 347589.0, 375683.0, 384098.0, 370292.0, 336536.0, 289488.0, 237189.0, 184194.0, 138374.0, 99243.0, 69058.0, 45974.0, 30688.0, 19661.0, 12526.0, 7599.0, 4760.0, 2752.0, 1724.0, 1037.0, 611.0, 338.0, 191.0, 133.0, 64.0, 36.0, 19.0, 13.0, 6.0, 6.0, 4.0, 1.0], "bins": [-9.78125, -9.49658203125, -9.2119140625, -8.92724609375, -8.642578125, -8.35791015625, -8.0732421875, -7.78857421875, -7.50390625, -7.21923828125, -6.9345703125, -6.64990234375, -6.365234375, -6.08056640625, -5.7958984375, -5.51123046875, -5.2265625, -4.94189453125, -4.6572265625, -4.37255859375, -4.087890625, -3.80322265625, -3.5185546875, -3.23388671875, -2.94921875, -2.66455078125, -2.3798828125, -2.09521484375, -1.810546875, -1.52587890625, -1.2412109375, -0.95654296875, -0.671875, -0.38720703125, -0.1025390625, 0.18212890625, 0.466796875, 0.75146484375, 1.0361328125, 1.32080078125, 1.60546875, 1.89013671875, 2.1748046875, 2.45947265625, 2.744140625, 3.02880859375, 3.3134765625, 3.59814453125, 3.8828125, 4.16748046875, 4.4521484375, 4.73681640625, 5.021484375, 5.30615234375, 5.5908203125, 5.87548828125, 6.16015625, 6.44482421875, 6.7294921875, 7.01416015625, 7.298828125, 7.58349609375, 7.8681640625, 8.15283203125, 8.4375]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 4.0, 2.0, 4.0, 17.0, 10.0, 16.0, 19.0, 24.0, 28.0, 28.0, 38.0, 45.0, 70.0, 73.0, 85.0, 131.0, 135.0, 141.0, 134.0, 173.0, 188.0, 216.0, 203.0, 236.0, 196.0, 196.0, 185.0, 184.0, 194.0, 160.0, 134.0, 134.0, 126.0, 114.0, 93.0, 67.0, 60.0, 47.0, 33.0, 26.0, 28.0, 18.0, 17.0, 10.0, 16.0, 7.0, 6.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-6.1875, -6.00054931640625, -5.8135986328125, -5.62664794921875, -5.439697265625, -5.25274658203125, -5.0657958984375, -4.87884521484375, -4.69189453125, -4.50494384765625, -4.3179931640625, -4.13104248046875, -3.944091796875, -3.75714111328125, -3.5701904296875, -3.38323974609375, -3.1962890625, -3.00933837890625, -2.8223876953125, -2.63543701171875, -2.448486328125, -2.26153564453125, -2.0745849609375, -1.88763427734375, -1.70068359375, -1.51373291015625, -1.3267822265625, -1.13983154296875, -0.952880859375, -0.76593017578125, -0.5789794921875, -0.39202880859375, -0.205078125, -0.01812744140625, 0.1688232421875, 0.35577392578125, 0.542724609375, 0.72967529296875, 0.9166259765625, 1.10357666015625, 1.29052734375, 1.47747802734375, 1.6644287109375, 1.85137939453125, 2.038330078125, 2.22528076171875, 2.4122314453125, 2.59918212890625, 2.7861328125, 2.97308349609375, 3.1600341796875, 3.34698486328125, 3.533935546875, 3.72088623046875, 3.9078369140625, 4.09478759765625, 4.28173828125, 4.46868896484375, 4.6556396484375, 4.84259033203125, 5.029541015625, 5.21649169921875, 5.4034423828125, 5.59039306640625, 5.77734375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 6.0, 7.0, 3.0, 8.0, 10.0, 11.0, 23.0, 27.0, 28.0, 29.0, 29.0, 30.0, 43.0, 42.0, 50.0, 53.0, 54.0, 47.0, 38.0, 47.0, 38.0, 48.0, 52.0, 43.0, 35.0, 25.0, 28.0, 19.0, 19.0, 14.0, 30.0, 10.0, 14.0, 10.0, 7.0, 6.0, 3.0, 3.0, 5.0, 6.0, 0.0, 3.0, 1.0, 0.0, 3.0], "bins": [-15.986053466796875, -15.557334899902344, -15.128615379333496, -14.699896812438965, -14.271178245544434, -13.842458724975586, -13.413740158081055, -12.985021591186523, -12.556303024291992, -12.127584457397461, -11.698864936828613, -11.270146369934082, -10.84142780303955, -10.412708282470703, -9.983989715576172, -9.55527114868164, -9.126551628112793, -8.697833061218262, -8.269113540649414, -7.840394973754883, -7.411676406860352, -6.982957363128662, -6.554238319396973, -6.125519752502441, -5.696800708770752, -5.2680816650390625, -4.839363098144531, -4.410644054412842, -3.9819252490997314, -3.553206443786621, -3.1244874000549316, -2.6957685947418213, -2.2670507431030273, -1.838331937789917, -1.409613013267517, -0.9808940887451172, -0.5521752834320068, -0.12345647811889648, 0.30526256561279297, 0.7339813709259033, 1.1627001762390137, 1.591418981552124, 2.0201377868652344, 2.448856830596924, 2.877575635910034, 3.3062944412231445, 3.735013484954834, 4.163732528686523, 4.592451095581055, 5.021170139312744, 5.449888706207275, 5.878607749938965, 6.307326316833496, 6.7360453605651855, 7.164764404296875, 7.593482971191406, 8.022201538085938, 8.450920104980469, 8.879639625549316, 9.308358192443848, 9.737076759338379, 10.165796279907227, 10.594514846801758, 11.023233413696289, 11.451952934265137]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 3.0, 4.0, 11.0, 5.0, 11.0, 6.0, 17.0, 11.0, 13.0, 19.0, 18.0, 29.0, 27.0, 22.0, 53.0, 34.0, 28.0, 34.0, 41.0, 35.0, 40.0, 48.0, 37.0, 42.0, 45.0, 37.0, 33.0, 44.0, 34.0, 35.0, 28.0, 24.0, 14.0, 21.0, 25.0, 11.0, 16.0, 5.0, 16.0, 5.0, 9.0, 7.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-17.235815048217773, -16.738744735717773, -16.241676330566406, -15.744606018066406, -15.247536659240723, -14.750467300415039, -14.253396987915039, -13.756327629089355, -13.259258270263672, -12.762188911437988, -12.265119552612305, -11.768049240112305, -11.270979881286621, -10.773910522460938, -10.276840209960938, -9.779770851135254, -9.28270149230957, -8.785632133483887, -8.288562774658203, -7.791492462158203, -7.2944231033325195, -6.797353744506836, -6.300283908843994, -5.803214073181152, -5.306144714355469, -4.809075355529785, -4.312005519866943, -3.8149359226226807, -3.317866325378418, -2.8207967281341553, -2.3237271308898926, -1.8266575336456299, -1.3295888900756836, -0.8325192928314209, -0.3354496955871582, 0.1616199016571045, 0.6586894989013672, 1.1557590961456299, 1.6528286933898926, 2.1498982906341553, 2.646967887878418, 3.1440374851226807, 3.6411070823669434, 4.138176918029785, 4.635246276855469, 5.132315635681152, 5.629385471343994, 6.126455307006836, 6.6235246658325195, 7.120594024658203, 7.617663860321045, 8.114733695983887, 8.61180305480957, 9.108872413635254, 9.605941772460938, 10.103012084960938, 10.600081443786621, 11.097150802612305, 11.594221115112305, 12.091290473937988, 12.588359832763672, 13.085429191589355, 13.582498550415039, 14.079568862915039, 14.576638221740723]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 6.0, 12.0, 19.0, 22.0, 26.0, 38.0, 87.0, 118.0, 179.0, 269.0, 406.0, 597.0, 990.0, 1465.0, 2496.0, 3952.0, 6422.0, 10940.0, 18707.0, 32022.0, 55524.0, 90581.0, 136237.0, 174128.0, 171602.0, 130894.0, 85065.0, 51534.0, 30177.0, 17463.0, 10377.0, 6185.0, 3744.0, 2251.0, 1365.0, 910.0, 625.0, 372.0, 276.0, 145.0, 128.0, 75.0, 43.0, 33.0, 23.0, 9.0, 12.0, 5.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.251953125, -3.153228759765625, -3.05450439453125, -2.955780029296875, -2.8570556640625, -2.758331298828125, -2.65960693359375, -2.560882568359375, -2.462158203125, -2.363433837890625, -2.26470947265625, -2.165985107421875, -2.0672607421875, -1.968536376953125, -1.86981201171875, -1.771087646484375, -1.67236328125, -1.573638916015625, -1.47491455078125, -1.376190185546875, -1.2774658203125, -1.178741455078125, -1.08001708984375, -0.981292724609375, -0.882568359375, -0.783843994140625, -0.68511962890625, -0.586395263671875, -0.4876708984375, -0.388946533203125, -0.29022216796875, -0.191497802734375, -0.0927734375, 0.005950927734375, 0.10467529296875, 0.203399658203125, 0.3021240234375, 0.400848388671875, 0.49957275390625, 0.598297119140625, 0.697021484375, 0.795745849609375, 0.89447021484375, 0.993194580078125, 1.0919189453125, 1.190643310546875, 1.28936767578125, 1.388092041015625, 1.48681640625, 1.585540771484375, 1.68426513671875, 1.782989501953125, 1.8817138671875, 1.980438232421875, 2.07916259765625, 2.177886962890625, 2.276611328125, 2.375335693359375, 2.47406005859375, 2.572784423828125, 2.6715087890625, 2.770233154296875, 2.86895751953125, 2.967681884765625, 3.06640625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 3.0, 5.0, 10.0, 6.0, 5.0, 12.0, 13.0, 12.0, 8.0, 14.0, 26.0, 25.0, 28.0, 26.0, 35.0, 41.0, 31.0, 37.0, 34.0, 41.0, 38.0, 45.0, 48.0, 42.0, 55.0, 37.0, 40.0, 30.0, 27.0, 33.0, 42.0, 27.0, 17.0, 23.0, 20.0, 12.0, 12.0, 11.0, 13.0, 9.0, 7.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-18.078125, -17.542724609375, -17.00732421875, -16.471923828125, -15.9365234375, -15.401123046875, -14.86572265625, -14.330322265625, -13.794921875, -13.259521484375, -12.72412109375, -12.188720703125, -11.6533203125, -11.117919921875, -10.58251953125, -10.047119140625, -9.51171875, -8.976318359375, -8.44091796875, -7.905517578125, -7.3701171875, -6.834716796875, -6.29931640625, -5.763916015625, -5.228515625, -4.693115234375, -4.15771484375, -3.622314453125, -3.0869140625, -2.551513671875, -2.01611328125, -1.480712890625, -0.9453125, -0.409912109375, 0.12548828125, 0.660888671875, 1.1962890625, 1.731689453125, 2.26708984375, 2.802490234375, 3.337890625, 3.873291015625, 4.40869140625, 4.944091796875, 5.4794921875, 6.014892578125, 6.55029296875, 7.085693359375, 7.62109375, 8.156494140625, 8.69189453125, 9.227294921875, 9.7626953125, 10.298095703125, 10.83349609375, 11.368896484375, 11.904296875, 12.439697265625, 12.97509765625, 13.510498046875, 14.0458984375, 14.581298828125, 15.11669921875, 15.652099609375, 16.1875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 5.0, 1.0, 8.0, 11.0, 16.0, 30.0, 32.0, 47.0, 57.0, 66.0, 124.0, 179.0, 254.0, 414.0, 557.0, 901.0, 1314.0, 2121.0, 3433.0, 5533.0, 8931.0, 14630.0, 23895.0, 38372.0, 60313.0, 90337.0, 124105.0, 150580.0, 150132.0, 123555.0, 89203.0, 59501.0, 38313.0, 23534.0, 14611.0, 8876.0, 5369.0, 3405.0, 2043.0, 1311.0, 779.0, 527.0, 379.0, 210.0, 168.0, 105.0, 89.0, 51.0, 44.0, 23.0, 22.0, 15.0, 10.0, 8.0, 8.0, 2.0, 1.0, 2.0, 4.0, 2.0], "bins": [-2.41015625, -2.334808349609375, -2.25946044921875, -2.184112548828125, -2.1087646484375, -2.033416748046875, -1.95806884765625, -1.882720947265625, -1.807373046875, -1.732025146484375, -1.65667724609375, -1.581329345703125, -1.5059814453125, -1.430633544921875, -1.35528564453125, -1.279937744140625, -1.20458984375, -1.129241943359375, -1.05389404296875, -0.978546142578125, -0.9031982421875, -0.827850341796875, -0.75250244140625, -0.677154541015625, -0.601806640625, -0.526458740234375, -0.45111083984375, -0.375762939453125, -0.3004150390625, -0.225067138671875, -0.14971923828125, -0.074371337890625, 0.0009765625, 0.076324462890625, 0.15167236328125, 0.227020263671875, 0.3023681640625, 0.377716064453125, 0.45306396484375, 0.528411865234375, 0.603759765625, 0.679107666015625, 0.75445556640625, 0.829803466796875, 0.9051513671875, 0.980499267578125, 1.05584716796875, 1.131195068359375, 1.20654296875, 1.281890869140625, 1.35723876953125, 1.432586669921875, 1.5079345703125, 1.583282470703125, 1.65863037109375, 1.733978271484375, 1.809326171875, 1.884674072265625, 1.96002197265625, 2.035369873046875, 2.1107177734375, 2.186065673828125, 2.26141357421875, 2.336761474609375, 2.412109375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 5.0, 1.0, 4.0, 4.0, 1.0, 7.0, 8.0, 12.0, 18.0, 14.0, 16.0, 13.0, 18.0, 28.0, 17.0, 36.0, 29.0, 38.0, 33.0, 41.0, 45.0, 36.0, 52.0, 41.0, 45.0, 59.0, 37.0, 36.0, 31.0, 37.0, 31.0, 24.0, 27.0, 23.0, 29.0, 14.0, 15.0, 10.0, 16.0, 12.0, 5.0, 3.0, 8.0, 7.0, 3.0, 2.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-10.84375, -10.4979248046875, -10.152099609375, -9.8062744140625, -9.46044921875, -9.1146240234375, -8.768798828125, -8.4229736328125, -8.0771484375, -7.7313232421875, -7.385498046875, -7.0396728515625, -6.69384765625, -6.3480224609375, -6.002197265625, -5.6563720703125, -5.310546875, -4.9647216796875, -4.618896484375, -4.2730712890625, -3.92724609375, -3.5814208984375, -3.235595703125, -2.8897705078125, -2.5439453125, -2.1981201171875, -1.852294921875, -1.5064697265625, -1.16064453125, -0.8148193359375, -0.468994140625, -0.1231689453125, 0.22265625, 0.5684814453125, 0.914306640625, 1.2601318359375, 1.60595703125, 1.9517822265625, 2.297607421875, 2.6434326171875, 2.9892578125, 3.3350830078125, 3.680908203125, 4.0267333984375, 4.37255859375, 4.7183837890625, 5.064208984375, 5.4100341796875, 5.755859375, 6.1016845703125, 6.447509765625, 6.7933349609375, 7.13916015625, 7.4849853515625, 7.830810546875, 8.1766357421875, 8.5224609375, 8.8682861328125, 9.214111328125, 9.5599365234375, 9.90576171875, 10.2515869140625, 10.597412109375, 10.9432373046875, 11.2890625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 5.0, 4.0, 3.0, 5.0, 9.0, 9.0, 19.0, 26.0, 30.0, 43.0, 43.0, 63.0, 101.0, 145.0, 171.0, 230.0, 336.0, 423.0, 680.0, 965.0, 1389.0, 2223.0, 3721.0, 6620.0, 12513.0, 25323.0, 55300.0, 127207.0, 258063.0, 279652.0, 146828.0, 64525.0, 28779.0, 14069.0, 7337.0, 4282.0, 2510.0, 1607.0, 1014.0, 633.0, 478.0, 330.0, 218.0, 157.0, 136.0, 85.0, 76.0, 49.0, 38.0, 23.0, 22.0, 16.0, 6.0, 8.0, 4.0, 9.0, 4.0, 1.0, 4.0, 0.0, 1.0], "bins": [-0.521484375, -0.5052337646484375, -0.488983154296875, -0.4727325439453125, -0.45648193359375, -0.4402313232421875, -0.423980712890625, -0.4077301025390625, -0.3914794921875, -0.3752288818359375, -0.358978271484375, -0.3427276611328125, -0.32647705078125, -0.3102264404296875, -0.293975830078125, -0.2777252197265625, -0.261474609375, -0.2452239990234375, -0.228973388671875, -0.2127227783203125, -0.19647216796875, -0.1802215576171875, -0.163970947265625, -0.1477203369140625, -0.1314697265625, -0.1152191162109375, -0.098968505859375, -0.0827178955078125, -0.06646728515625, -0.0502166748046875, -0.033966064453125, -0.0177154541015625, -0.00146484375, 0.0147857666015625, 0.031036376953125, 0.0472869873046875, 0.06353759765625, 0.0797882080078125, 0.096038818359375, 0.1122894287109375, 0.1285400390625, 0.1447906494140625, 0.161041259765625, 0.1772918701171875, 0.19354248046875, 0.2097930908203125, 0.226043701171875, 0.2422943115234375, 0.258544921875, 0.2747955322265625, 0.291046142578125, 0.3072967529296875, 0.32354736328125, 0.3397979736328125, 0.356048583984375, 0.3722991943359375, 0.3885498046875, 0.4048004150390625, 0.421051025390625, 0.4373016357421875, 0.45355224609375, 0.4698028564453125, 0.486053466796875, 0.5023040771484375, 0.5185546875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 8.0, 5.0, 8.0, 15.0, 22.0, 24.0, 47.0, 75.0, 99.0, 114.0, 123.0, 123.0, 90.0, 75.0, 64.0, 37.0, 25.0, 16.0, 13.0, 6.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.00014781951904296875, -0.00014418642967939377, -0.0001405533403158188, -0.0001369202509522438, -0.00013328716158866882, -0.00012965407222509384, -0.00012602098286151886, -0.00012238789349794388, -0.0001187548041343689, -0.00011512171477079391, -0.00011148862540721893, -0.00010785553604364395, -0.00010422244668006897, -0.00010058935731649399, -9.6956267952919e-05, -9.332317858934402e-05, -8.969008922576904e-05, -8.605699986219406e-05, -8.242391049861908e-05, -7.87908211350441e-05, -7.515773177146912e-05, -7.152464240789413e-05, -6.789155304431915e-05, -6.425846368074417e-05, -6.062537431716919e-05, -5.699228495359421e-05, -5.3359195590019226e-05, -4.9726106226444244e-05, -4.609301686286926e-05, -4.245992749929428e-05, -3.88268381357193e-05, -3.519374877214432e-05, -3.1560659408569336e-05, -2.7927570044994354e-05, -2.4294480681419373e-05, -2.066139131784439e-05, -1.702830195426941e-05, -1.3395212590694427e-05, -9.762123227119446e-06, -6.129033863544464e-06, -2.4959444999694824e-06, 1.1371448636054993e-06, 4.770234227180481e-06, 8.403323590755463e-06, 1.2036412954330444e-05, 1.5669502317905426e-05, 1.9302591681480408e-05, 2.293568104505539e-05, 2.656877040863037e-05, 3.0201859772205353e-05, 3.3834949135780334e-05, 3.7468038499355316e-05, 4.11011278629303e-05, 4.473421722650528e-05, 4.836730659008026e-05, 5.200039595365524e-05, 5.5633485317230225e-05, 5.9266574680805206e-05, 6.289966404438019e-05, 6.653275340795517e-05, 7.016584277153015e-05, 7.379893213510513e-05, 7.743202149868011e-05, 8.10651108622551e-05, 8.469820022583008e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 5.0, 11.0, 12.0, 22.0, 19.0, 30.0, 40.0, 56.0, 93.0, 111.0, 186.0, 268.0, 394.0, 583.0, 873.0, 1403.0, 2401.0, 4715.0, 9913.0, 22794.0, 56673.0, 147755.0, 318115.0, 280215.0, 119330.0, 46056.0, 18517.0, 8148.0, 4061.0, 2103.0, 1228.0, 736.0, 557.0, 346.0, 217.0, 171.0, 114.0, 96.0, 66.0, 44.0, 29.0, 21.0, 12.0, 6.0, 5.0, 4.0, 2.0, 2.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.22265625, -1.1843109130859375, -1.145965576171875, -1.1076202392578125, -1.06927490234375, -1.0309295654296875, -0.992584228515625, -0.9542388916015625, -0.9158935546875, -0.8775482177734375, -0.839202880859375, -0.8008575439453125, -0.76251220703125, -0.7241668701171875, -0.685821533203125, -0.6474761962890625, -0.609130859375, -0.5707855224609375, -0.532440185546875, -0.4940948486328125, -0.45574951171875, -0.4174041748046875, -0.379058837890625, -0.3407135009765625, -0.3023681640625, -0.2640228271484375, -0.225677490234375, -0.1873321533203125, -0.14898681640625, -0.1106414794921875, -0.072296142578125, -0.0339508056640625, 0.00439453125, 0.0427398681640625, 0.081085205078125, 0.1194305419921875, 0.15777587890625, 0.1961212158203125, 0.234466552734375, 0.2728118896484375, 0.3111572265625, 0.3495025634765625, 0.387847900390625, 0.4261932373046875, 0.46453857421875, 0.5028839111328125, 0.541229248046875, 0.5795745849609375, 0.617919921875, 0.6562652587890625, 0.694610595703125, 0.7329559326171875, 0.77130126953125, 0.8096466064453125, 0.847991943359375, 0.8863372802734375, 0.9246826171875, 0.9630279541015625, 1.001373291015625, 1.0397186279296875, 1.07806396484375, 1.1164093017578125, 1.154754638671875, 1.1930999755859375, 1.2314453125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 7.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 2.0, 5.0, 8.0, 10.0, 15.0, 14.0, 18.0, 36.0, 43.0, 55.0, 73.0, 85.0, 101.0, 109.0, 97.0, 68.0, 56.0, 47.0, 34.0, 22.0, 23.0, 16.0, 10.0, 11.0, 5.0, 7.0, 3.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32177734375, -0.31102752685546875, -0.3002777099609375, -0.28952789306640625, -0.278778076171875, -0.26802825927734375, -0.2572784423828125, -0.24652862548828125, -0.23577880859375, -0.22502899169921875, -0.2142791748046875, -0.20352935791015625, -0.192779541015625, -0.18202972412109375, -0.1712799072265625, -0.16053009033203125, -0.1497802734375, -0.13903045654296875, -0.1282806396484375, -0.11753082275390625, -0.106781005859375, -0.09603118896484375, -0.0852813720703125, -0.07453155517578125, -0.06378173828125, -0.05303192138671875, -0.0422821044921875, -0.03153228759765625, -0.020782470703125, -0.01003265380859375, 0.0007171630859375, 0.01146697998046875, 0.022216796875, 0.03296661376953125, 0.0437164306640625, 0.05446624755859375, 0.065216064453125, 0.07596588134765625, 0.0867156982421875, 0.09746551513671875, 0.10821533203125, 0.11896514892578125, 0.1297149658203125, 0.14046478271484375, 0.151214599609375, 0.16196441650390625, 0.1727142333984375, 0.18346405029296875, 0.1942138671875, 0.20496368408203125, 0.2157135009765625, 0.22646331787109375, 0.237213134765625, 0.24796295166015625, 0.2587127685546875, 0.26946258544921875, 0.28021240234375, 0.29096221923828125, 0.3017120361328125, 0.31246185302734375, 0.323211669921875, 0.33396148681640625, 0.3447113037109375, 0.35546112060546875, 0.3662109375]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 5.0, 7.0, 4.0, 7.0, 9.0, 13.0, 13.0, 23.0, 28.0, 31.0, 27.0, 43.0, 35.0, 36.0, 44.0, 52.0, 58.0, 46.0, 40.0, 54.0, 43.0, 43.0, 47.0, 51.0, 36.0, 21.0, 33.0, 20.0, 23.0, 21.0, 27.0, 10.0, 18.0, 8.0, 6.0, 6.0, 4.0, 4.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-16.046205520629883, -15.609572410583496, -15.17293930053711, -14.736307144165039, -14.299674034118652, -13.863040924072266, -13.426407814025879, -12.989774703979492, -12.553141593933105, -12.116508483886719, -11.679875373840332, -11.243242263793945, -10.806610107421875, -10.369976997375488, -9.933343887329102, -9.496710777282715, -9.060077667236328, -8.623444557189941, -8.186811447143555, -7.750178813934326, -7.3135457038879395, -6.876913070678711, -6.440279960632324, -6.0036468505859375, -5.567014694213867, -5.1303815841674805, -4.693748950958252, -4.257115840911865, -3.8204827308654785, -3.383849859237671, -2.9472169876098633, -2.5105838775634766, -2.07395076751709, -1.6373177766799927, -1.2006847858428955, -0.7640519142150879, -0.3274189233779907, 0.10921406745910645, 0.5458469390869141, 0.9824800491333008, 1.4191129207611084, 1.8557459115982056, 2.2923789024353027, 2.7290117740631104, 3.165644645690918, 3.6022777557373047, 4.038910865783691, 4.475543975830078, 4.912176609039307, 5.348809719085693, 5.785442352294922, 6.222075462341309, 6.658708572387695, 7.095341682434082, 7.5319743156433105, 7.968607425689697, 8.405240058898926, 8.841873168945312, 9.2785062789917, 9.715139389038086, 10.151771545410156, 10.588404655456543, 11.02503776550293, 11.461670875549316, 11.898303985595703]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 3.0, 4.0, 9.0, 8.0, 10.0, 6.0, 17.0, 10.0, 14.0, 22.0, 14.0, 29.0, 25.0, 24.0, 50.0, 34.0, 28.0, 33.0, 45.0, 32.0, 42.0, 44.0, 42.0, 38.0, 45.0, 32.0, 37.0, 45.0, 33.0, 40.0, 26.0, 25.0, 16.0, 15.0, 28.0, 13.0, 14.0, 7.0, 12.0, 9.0, 9.0, 7.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-17.06932258605957, -16.576322555541992, -16.08332061767578, -15.590320587158203, -15.097320556640625, -14.60431957244873, -14.111318588256836, -13.618318557739258, -13.12531852722168, -12.632317543029785, -12.139317512512207, -11.646316528320312, -11.153316497802734, -10.66031551361084, -10.167314529418945, -9.674314498901367, -9.181313514709473, -8.688312530517578, -8.1953125, -7.7023115158081055, -7.209311485290527, -6.716310501098633, -6.2233099937438965, -5.73030948638916, -5.237308979034424, -4.7443084716796875, -4.251307964324951, -3.7583072185516357, -3.2653067111968994, -2.772306203842163, -2.2793054580688477, -1.7863049507141113, -1.293304443359375, -0.8003038763999939, -0.3073033094406128, 0.18569731712341309, 0.6786978244781494, 1.1716983318328857, 1.6646990776062012, 2.1576995849609375, 2.650700092315674, 3.14370059967041, 3.6367011070251465, 4.129701614379883, 4.622702598571777, 5.1157026290893555, 5.60870361328125, 6.101704120635986, 6.594704627990723, 7.087705135345459, 7.580705642700195, 8.07370662689209, 8.566706657409668, 9.059707641601562, 9.55270767211914, 10.045708656311035, 10.53870964050293, 11.031710624694824, 11.524710655212402, 12.017711639404297, 12.510711669921875, 13.00371265411377, 13.496713638305664, 13.989713668823242, 14.48271369934082]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 9.0, 29.0, 25.0, 38.0, 76.0, 120.0, 193.0, 369.0, 543.0, 968.0, 1515.0, 2446.0, 4088.0, 6318.0, 9849.0, 15018.0, 21761.0, 31579.0, 43762.0, 57790.0, 72770.0, 87434.0, 97207.0, 102918.0, 100266.0, 91741.0, 78130.0, 63228.0, 49130.0, 35730.0, 25133.0, 17024.0, 11355.0, 7354.0, 4787.0, 3096.0, 1901.0, 1163.0, 655.0, 418.0, 261.0, 152.0, 90.0, 52.0, 22.0, 18.0, 12.0, 10.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3828125, -8.109619140625, -7.83642578125, -7.563232421875, -7.2900390625, -7.016845703125, -6.74365234375, -6.470458984375, -6.197265625, -5.924072265625, -5.65087890625, -5.377685546875, -5.1044921875, -4.831298828125, -4.55810546875, -4.284912109375, -4.01171875, -3.738525390625, -3.46533203125, -3.192138671875, -2.9189453125, -2.645751953125, -2.37255859375, -2.099365234375, -1.826171875, -1.552978515625, -1.27978515625, -1.006591796875, -0.7333984375, -0.460205078125, -0.18701171875, 0.086181640625, 0.359375, 0.632568359375, 0.90576171875, 1.178955078125, 1.4521484375, 1.725341796875, 1.99853515625, 2.271728515625, 2.544921875, 2.818115234375, 3.09130859375, 3.364501953125, 3.6376953125, 3.910888671875, 4.18408203125, 4.457275390625, 4.73046875, 5.003662109375, 5.27685546875, 5.550048828125, 5.8232421875, 6.096435546875, 6.36962890625, 6.642822265625, 6.916015625, 7.189208984375, 7.46240234375, 7.735595703125, 8.0087890625, 8.281982421875, 8.55517578125, 8.828369140625, 9.1015625]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 4.0, 2.0, 2.0, 6.0, 6.0, 6.0, 9.0, 7.0, 12.0, 16.0, 18.0, 18.0, 23.0, 14.0, 23.0, 21.0, 26.0, 37.0, 33.0, 35.0, 25.0, 32.0, 40.0, 36.0, 43.0, 44.0, 36.0, 48.0, 37.0, 34.0, 32.0, 29.0, 31.0, 32.0, 23.0, 26.0, 19.0, 23.0, 20.0, 14.0, 14.0, 13.0, 10.0, 7.0, 8.0, 8.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-16.25, -15.78369140625, -15.3173828125, -14.85107421875, -14.384765625, -13.91845703125, -13.4521484375, -12.98583984375, -12.51953125, -12.05322265625, -11.5869140625, -11.12060546875, -10.654296875, -10.18798828125, -9.7216796875, -9.25537109375, -8.7890625, -8.32275390625, -7.8564453125, -7.39013671875, -6.923828125, -6.45751953125, -5.9912109375, -5.52490234375, -5.05859375, -4.59228515625, -4.1259765625, -3.65966796875, -3.193359375, -2.72705078125, -2.2607421875, -1.79443359375, -1.328125, -0.86181640625, -0.3955078125, 0.07080078125, 0.537109375, 1.00341796875, 1.4697265625, 1.93603515625, 2.40234375, 2.86865234375, 3.3349609375, 3.80126953125, 4.267578125, 4.73388671875, 5.2001953125, 5.66650390625, 6.1328125, 6.59912109375, 7.0654296875, 7.53173828125, 7.998046875, 8.46435546875, 8.9306640625, 9.39697265625, 9.86328125, 10.32958984375, 10.7958984375, 11.26220703125, 11.728515625, 12.19482421875, 12.6611328125, 13.12744140625, 13.59375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 9.0, 17.0, 19.0, 37.0, 49.0, 93.0, 146.0, 191.0, 342.0, 533.0, 865.0, 1312.0, 2120.0, 3281.0, 4903.0, 7664.0, 11376.0, 16651.0, 23854.0, 33380.0, 44608.0, 58309.0, 72653.0, 85343.0, 94591.0, 98220.0, 96130.0, 88195.0, 76560.0, 62063.0, 48195.0, 36100.0, 26079.0, 18168.0, 12606.0, 8435.0, 5495.0, 3622.0, 2276.0, 1501.0, 918.0, 602.0, 384.0, 247.0, 139.0, 100.0, 69.0, 35.0, 28.0, 16.0, 18.0, 5.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.61328125, -7.34735107421875, -7.0814208984375, -6.81549072265625, -6.549560546875, -6.28363037109375, -6.0177001953125, -5.75177001953125, -5.48583984375, -5.21990966796875, -4.9539794921875, -4.68804931640625, -4.422119140625, -4.15618896484375, -3.8902587890625, -3.62432861328125, -3.3583984375, -3.09246826171875, -2.8265380859375, -2.56060791015625, -2.294677734375, -2.02874755859375, -1.7628173828125, -1.49688720703125, -1.23095703125, -0.96502685546875, -0.6990966796875, -0.43316650390625, -0.167236328125, 0.09869384765625, 0.3646240234375, 0.63055419921875, 0.896484375, 1.16241455078125, 1.4283447265625, 1.69427490234375, 1.960205078125, 2.22613525390625, 2.4920654296875, 2.75799560546875, 3.02392578125, 3.28985595703125, 3.5557861328125, 3.82171630859375, 4.087646484375, 4.35357666015625, 4.6195068359375, 4.88543701171875, 5.1513671875, 5.41729736328125, 5.6832275390625, 5.94915771484375, 6.215087890625, 6.48101806640625, 6.7469482421875, 7.01287841796875, 7.27880859375, 7.54473876953125, 7.8106689453125, 8.07659912109375, 8.342529296875, 8.60845947265625, 8.8743896484375, 9.14031982421875, 9.40625]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 3.0, 1.0, 1.0, 6.0, 8.0, 7.0, 7.0, 10.0, 15.0, 18.0, 22.0, 22.0, 26.0, 33.0, 33.0, 35.0, 42.0, 38.0, 36.0, 44.0, 43.0, 38.0, 51.0, 40.0, 40.0, 39.0, 34.0, 33.0, 25.0, 32.0, 26.0, 26.0, 29.0, 19.0, 25.0, 14.0, 10.0, 14.0, 11.0, 7.0, 9.0, 8.0, 7.0, 2.0, 8.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.1484375, -9.8438720703125, -9.539306640625, -9.2347412109375, -8.93017578125, -8.6256103515625, -8.321044921875, -8.0164794921875, -7.7119140625, -7.4073486328125, -7.102783203125, -6.7982177734375, -6.49365234375, -6.1890869140625, -5.884521484375, -5.5799560546875, -5.275390625, -4.9708251953125, -4.666259765625, -4.3616943359375, -4.05712890625, -3.7525634765625, -3.447998046875, -3.1434326171875, -2.8388671875, -2.5343017578125, -2.229736328125, -1.9251708984375, -1.62060546875, -1.3160400390625, -1.011474609375, -0.7069091796875, -0.40234375, -0.0977783203125, 0.206787109375, 0.5113525390625, 0.81591796875, 1.1204833984375, 1.425048828125, 1.7296142578125, 2.0341796875, 2.3387451171875, 2.643310546875, 2.9478759765625, 3.25244140625, 3.5570068359375, 3.861572265625, 4.1661376953125, 4.470703125, 4.7752685546875, 5.079833984375, 5.3843994140625, 5.68896484375, 5.9935302734375, 6.298095703125, 6.6026611328125, 6.9072265625, 7.2117919921875, 7.516357421875, 7.8209228515625, 8.12548828125, 8.4300537109375, 8.734619140625, 9.0391845703125, 9.34375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 3.0, 10.0, 12.0, 17.0, 21.0, 39.0, 53.0, 81.0, 94.0, 136.0, 240.0, 330.0, 554.0, 814.0, 1171.0, 1721.0, 2707.0, 4142.0, 6397.0, 9902.0, 15016.0, 22667.0, 33365.0, 47435.0, 64978.0, 84821.0, 101114.0, 113110.0, 113838.0, 104824.0, 88963.0, 69706.0, 51440.0, 36072.0, 24876.0, 16535.0, 10753.0, 7040.0, 4685.0, 2908.0, 1969.0, 1314.0, 884.0, 577.0, 407.0, 278.0, 167.0, 129.0, 94.0, 60.0, 31.0, 27.0, 11.0, 13.0, 7.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-3.544921875, -3.430999755859375, -3.31707763671875, -3.203155517578125, -3.0892333984375, -2.975311279296875, -2.86138916015625, -2.747467041015625, -2.633544921875, -2.519622802734375, -2.40570068359375, -2.291778564453125, -2.1778564453125, -2.063934326171875, -1.95001220703125, -1.836090087890625, -1.72216796875, -1.608245849609375, -1.49432373046875, -1.380401611328125, -1.2664794921875, -1.152557373046875, -1.03863525390625, -0.924713134765625, -0.810791015625, -0.696868896484375, -0.58294677734375, -0.469024658203125, -0.3551025390625, -0.241180419921875, -0.12725830078125, -0.013336181640625, 0.1005859375, 0.214508056640625, 0.32843017578125, 0.442352294921875, 0.5562744140625, 0.670196533203125, 0.78411865234375, 0.898040771484375, 1.011962890625, 1.125885009765625, 1.23980712890625, 1.353729248046875, 1.4676513671875, 1.581573486328125, 1.69549560546875, 1.809417724609375, 1.92333984375, 2.037261962890625, 2.15118408203125, 2.265106201171875, 2.3790283203125, 2.492950439453125, 2.60687255859375, 2.720794677734375, 2.834716796875, 2.948638916015625, 3.06256103515625, 3.176483154296875, 3.2904052734375, 3.404327392578125, 3.51824951171875, 3.632171630859375, 3.74609375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 1.0, 5.0, 3.0, 12.0, 8.0, 13.0, 14.0, 19.0, 16.0, 33.0, 33.0, 29.0, 29.0, 40.0, 37.0, 47.0, 42.0, 41.0, 41.0, 60.0, 47.0, 47.0, 59.0, 47.0, 41.0, 38.0, 35.0, 27.0, 27.0, 14.0, 18.0, 14.0, 12.0, 5.0, 10.0, 7.0, 5.0, 5.0, 7.0, 2.0, 3.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004107952117919922, -0.0003975033760070801, -0.00038421154022216797, -0.00037091970443725586, -0.00035762786865234375, -0.00034433603286743164, -0.00033104419708251953, -0.0003177523612976074, -0.0003044605255126953, -0.0002911686897277832, -0.0002778768539428711, -0.000264585018157959, -0.0002512931823730469, -0.00023800134658813477, -0.00022470951080322266, -0.00021141767501831055, -0.00019812583923339844, -0.00018483400344848633, -0.00017154216766357422, -0.0001582503318786621, -0.00014495849609375, -0.0001316666603088379, -0.00011837482452392578, -0.00010508298873901367, -9.179115295410156e-05, -7.849931716918945e-05, -6.520748138427734e-05, -5.1915645599365234e-05, -3.8623809814453125e-05, -2.5331974029541016e-05, -1.2040138244628906e-05, 1.2516975402832031e-06, 1.4543533325195312e-05, 2.7835369110107422e-05, 4.112720489501953e-05, 5.441904067993164e-05, 6.771087646484375e-05, 8.100271224975586e-05, 9.429454803466797e-05, 0.00010758638381958008, 0.00012087821960449219, 0.0001341700553894043, 0.0001474618911743164, 0.00016075372695922852, 0.00017404556274414062, 0.00018733739852905273, 0.00020062923431396484, 0.00021392107009887695, 0.00022721290588378906, 0.00024050474166870117, 0.0002537965774536133, 0.0002670884132385254, 0.0002803802490234375, 0.0002936720848083496, 0.0003069639205932617, 0.00032025575637817383, 0.00033354759216308594, 0.00034683942794799805, 0.00036013126373291016, 0.00037342309951782227, 0.0003867149353027344, 0.0004000067710876465, 0.0004132986068725586, 0.0004265904426574707, 0.0004398822784423828]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 5.0, 14.0, 16.0, 20.0, 36.0, 40.0, 65.0, 123.0, 181.0, 270.0, 450.0, 691.0, 1192.0, 1962.0, 3275.0, 5631.0, 9747.0, 16952.0, 28700.0, 47109.0, 73240.0, 104569.0, 134081.0, 148176.0, 139843.0, 114055.0, 82659.0, 54179.0, 33605.0, 19805.0, 11565.0, 6562.0, 3825.0, 2283.0, 1356.0, 820.0, 534.0, 339.0, 192.0, 154.0, 70.0, 55.0, 42.0, 22.0, 17.0, 16.0, 12.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.8359375, -4.67816162109375, -4.5203857421875, -4.36260986328125, -4.204833984375, -4.04705810546875, -3.8892822265625, -3.73150634765625, -3.57373046875, -3.41595458984375, -3.2581787109375, -3.10040283203125, -2.942626953125, -2.78485107421875, -2.6270751953125, -2.46929931640625, -2.3115234375, -2.15374755859375, -1.9959716796875, -1.83819580078125, -1.680419921875, -1.52264404296875, -1.3648681640625, -1.20709228515625, -1.04931640625, -0.89154052734375, -0.7337646484375, -0.57598876953125, -0.418212890625, -0.26043701171875, -0.1026611328125, 0.05511474609375, 0.212890625, 0.37066650390625, 0.5284423828125, 0.68621826171875, 0.843994140625, 1.00177001953125, 1.1595458984375, 1.31732177734375, 1.47509765625, 1.63287353515625, 1.7906494140625, 1.94842529296875, 2.106201171875, 2.26397705078125, 2.4217529296875, 2.57952880859375, 2.7373046875, 2.89508056640625, 3.0528564453125, 3.21063232421875, 3.368408203125, 3.52618408203125, 3.6839599609375, 3.84173583984375, 3.99951171875, 4.15728759765625, 4.3150634765625, 4.47283935546875, 4.630615234375, 4.78839111328125, 4.9461669921875, 5.10394287109375, 5.26171875]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 5.0, 6.0, 3.0, 15.0, 11.0, 24.0, 22.0, 26.0, 23.0, 28.0, 42.0, 59.0, 46.0, 68.0, 55.0, 69.0, 52.0, 44.0, 61.0, 69.0, 44.0, 38.0, 28.0, 27.0, 24.0, 27.0, 28.0, 18.0, 8.0, 5.0, 7.0, 4.0, 6.0, 6.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9619140625, -1.8988189697265625, -1.835723876953125, -1.7726287841796875, -1.70953369140625, -1.6464385986328125, -1.583343505859375, -1.5202484130859375, -1.4571533203125, -1.3940582275390625, -1.330963134765625, -1.2678680419921875, -1.20477294921875, -1.1416778564453125, -1.078582763671875, -1.0154876708984375, -0.952392578125, -0.8892974853515625, -0.826202392578125, -0.7631072998046875, -0.70001220703125, -0.6369171142578125, -0.573822021484375, -0.5107269287109375, -0.4476318359375, -0.3845367431640625, -0.321441650390625, -0.2583465576171875, -0.19525146484375, -0.1321563720703125, -0.069061279296875, -0.0059661865234375, 0.05712890625, 0.1202239990234375, 0.183319091796875, 0.2464141845703125, 0.30950927734375, 0.3726043701171875, 0.435699462890625, 0.4987945556640625, 0.5618896484375, 0.6249847412109375, 0.688079833984375, 0.7511749267578125, 0.81427001953125, 0.8773651123046875, 0.940460205078125, 1.0035552978515625, 1.066650390625, 1.1297454833984375, 1.192840576171875, 1.2559356689453125, 1.31903076171875, 1.3821258544921875, 1.445220947265625, 1.5083160400390625, 1.5714111328125, 1.6345062255859375, 1.697601318359375, 1.7606964111328125, 1.82379150390625, 1.8868865966796875, 1.949981689453125, 2.0130767822265625, 2.076171875]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 5.0, 9.0, 15.0, 13.0, 17.0, 16.0, 31.0, 22.0, 28.0, 22.0, 37.0, 32.0, 33.0, 39.0, 57.0, 45.0, 42.0, 47.0, 34.0, 41.0, 43.0, 43.0, 43.0, 21.0, 37.0, 22.0, 34.0, 22.0, 27.0, 24.0, 18.0, 9.0, 11.0, 10.0, 11.0, 11.0, 4.0, 3.0, 6.0, 1.0, 4.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-12.94345760345459, -12.551535606384277, -12.159614562988281, -11.767692565917969, -11.375770568847656, -10.98384952545166, -10.591927528381348, -10.200006484985352, -9.808084487915039, -9.416162490844727, -9.02424144744873, -8.632319450378418, -8.240398406982422, -7.848476409912109, -7.456554412841797, -7.064632892608643, -6.672711372375488, -6.280789852142334, -5.88886833190918, -5.496946334838867, -5.105024814605713, -4.713103294372559, -4.321181297302246, -3.929259777069092, -3.5373382568359375, -3.145416736602783, -2.75349497795105, -2.3615732192993164, -1.969651699066162, -1.5777300596237183, -1.1858084201812744, -0.793886661529541, -0.4019641876220703, -0.010042548179626465, 0.3818790912628174, 0.7738007307052612, 1.165722370147705, 1.557644009590149, 1.9495656490325928, 2.341487407684326, 2.7334089279174805, 3.1253304481506348, 3.517252206802368, 3.9091739654541016, 4.301095485687256, 4.69301700592041, 5.084939002990723, 5.476860523223877, 5.868782043457031, 6.2607035636901855, 6.65262508392334, 7.044547080993652, 7.436468601226807, 7.828390121459961, 8.220312118530273, 8.612234115600586, 9.004155158996582, 9.396077156066895, 9.78799819946289, 10.179920196533203, 10.571842193603516, 10.963763236999512, 11.355685234069824, 11.74760627746582, 12.139528274536133]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 10.0, 9.0, 9.0, 7.0, 4.0, 12.0, 9.0, 13.0, 17.0, 21.0, 21.0, 21.0, 33.0, 34.0, 36.0, 49.0, 39.0, 39.0, 45.0, 35.0, 49.0, 55.0, 45.0, 28.0, 51.0, 43.0, 32.0, 32.0, 30.0, 25.0, 25.0, 17.0, 17.0, 23.0, 16.0, 14.0, 15.0, 7.0, 7.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-18.820951461791992, -18.276235580444336, -17.731521606445312, -17.186805725097656, -16.64208984375, -16.097373962402344, -15.552659034729004, -15.007944107055664, -14.463228225708008, -13.918512344360352, -13.373797416687012, -12.829082489013672, -12.284366607666016, -11.73965072631836, -11.19493579864502, -10.65022087097168, -10.105504989624023, -9.560789108276367, -9.016074180603027, -8.471359252929688, -7.926643371582031, -7.381927967071533, -6.837212562561035, -6.292497158050537, -5.747781753540039, -5.203066349029541, -4.658350944519043, -4.113635540008545, -3.568920135498047, -3.024204730987549, -2.479489326477051, -1.9347739219665527, -1.3900585174560547, -0.8453431129455566, -0.3006277084350586, 0.24408769607543945, 0.7888031005859375, 1.3335185050964355, 1.8782339096069336, 2.4229493141174316, 2.9676647186279297, 3.5123801231384277, 4.057095527648926, 4.601810932159424, 5.146526336669922, 5.69124174118042, 6.235957145690918, 6.780672550201416, 7.325387954711914, 7.870103359222412, 8.41481876373291, 8.95953369140625, 9.504249572753906, 10.048965454101562, 10.593680381774902, 11.138395309448242, 11.683111190795898, 12.227827072143555, 12.772541999816895, 13.317256927490234, 13.86197280883789, 14.406688690185547, 14.951403617858887, 15.496118545532227, 16.040834426879883]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 6.0, 3.0, 3.0, 11.0, 19.0, 32.0, 45.0, 61.0, 130.0, 171.0, 324.0, 520.0, 894.0, 1417.0, 2397.0, 3926.0, 6386.0, 10318.0, 16344.0, 25979.0, 41028.0, 62543.0, 93834.0, 137140.0, 192507.0, 255326.0, 324834.0, 384098.0, 424541.0, 432459.0, 408027.0, 356862.0, 292858.0, 224363.0, 164197.0, 114644.0, 77580.0, 51566.0, 32807.0, 20683.0, 13035.0, 8070.0, 4955.0, 2980.0, 1753.0, 1056.0, 626.0, 376.0, 227.0, 134.0, 75.0, 52.0, 31.0, 17.0, 12.0, 4.0, 4.0, 6.0, 1.0, 2.0], "bins": [-10.125, -9.8204345703125, -9.515869140625, -9.2113037109375, -8.90673828125, -8.6021728515625, -8.297607421875, -7.9930419921875, -7.6884765625, -7.3839111328125, -7.079345703125, -6.7747802734375, -6.47021484375, -6.1656494140625, -5.861083984375, -5.5565185546875, -5.251953125, -4.9473876953125, -4.642822265625, -4.3382568359375, -4.03369140625, -3.7291259765625, -3.424560546875, -3.1199951171875, -2.8154296875, -2.5108642578125, -2.206298828125, -1.9017333984375, -1.59716796875, -1.2926025390625, -0.988037109375, -0.6834716796875, -0.37890625, -0.0743408203125, 0.230224609375, 0.5347900390625, 0.83935546875, 1.1439208984375, 1.448486328125, 1.7530517578125, 2.0576171875, 2.3621826171875, 2.666748046875, 2.9713134765625, 3.27587890625, 3.5804443359375, 3.885009765625, 4.1895751953125, 4.494140625, 4.7987060546875, 5.103271484375, 5.4078369140625, 5.71240234375, 6.0169677734375, 6.321533203125, 6.6260986328125, 6.9306640625, 7.2352294921875, 7.539794921875, 7.8443603515625, 8.14892578125, 8.4534912109375, 8.758056640625, 9.0626220703125, 9.3671875]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 3.0, 10.0, 7.0, 8.0, 9.0, 8.0, 10.0, 12.0, 17.0, 19.0, 26.0, 23.0, 27.0, 26.0, 32.0, 49.0, 45.0, 54.0, 40.0, 45.0, 51.0, 43.0, 50.0, 50.0, 40.0, 40.0, 34.0, 34.0, 28.0, 31.0, 30.0, 21.0, 21.0, 16.0, 17.0, 10.0, 4.0, 6.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.578125, -15.11083984375, -14.6435546875, -14.17626953125, -13.708984375, -13.24169921875, -12.7744140625, -12.30712890625, -11.83984375, -11.37255859375, -10.9052734375, -10.43798828125, -9.970703125, -9.50341796875, -9.0361328125, -8.56884765625, -8.1015625, -7.63427734375, -7.1669921875, -6.69970703125, -6.232421875, -5.76513671875, -5.2978515625, -4.83056640625, -4.36328125, -3.89599609375, -3.4287109375, -2.96142578125, -2.494140625, -2.02685546875, -1.5595703125, -1.09228515625, -0.625, -0.15771484375, 0.3095703125, 0.77685546875, 1.244140625, 1.71142578125, 2.1787109375, 2.64599609375, 3.11328125, 3.58056640625, 4.0478515625, 4.51513671875, 4.982421875, 5.44970703125, 5.9169921875, 6.38427734375, 6.8515625, 7.31884765625, 7.7861328125, 8.25341796875, 8.720703125, 9.18798828125, 9.6552734375, 10.12255859375, 10.58984375, 11.05712890625, 11.5244140625, 11.99169921875, 12.458984375, 12.92626953125, 13.3935546875, 13.86083984375, 14.328125]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 5.0, 1.0, 4.0, 18.0, 24.0, 48.0, 79.0, 166.0, 289.0, 465.0, 777.0, 1270.0, 2122.0, 3587.0, 5674.0, 9287.0, 14767.0, 22793.0, 35934.0, 52589.0, 76838.0, 108340.0, 147255.0, 191952.0, 242958.0, 290867.0, 331684.0, 362130.0, 371615.0, 362033.0, 334956.0, 292669.0, 245186.0, 195623.0, 148963.0, 109437.0, 78327.0, 54313.0, 35631.0, 23683.0, 15303.0, 9545.0, 5996.0, 3715.0, 2204.0, 1305.0, 766.0, 451.0, 298.0, 163.0, 73.0, 53.0, 29.0, 16.0, 6.0, 8.0, 5.0, 2.0, 1.0, 1.0], "bins": [-9.1875, -8.905029296875, -8.62255859375, -8.340087890625, -8.0576171875, -7.775146484375, -7.49267578125, -7.210205078125, -6.927734375, -6.645263671875, -6.36279296875, -6.080322265625, -5.7978515625, -5.515380859375, -5.23291015625, -4.950439453125, -4.66796875, -4.385498046875, -4.10302734375, -3.820556640625, -3.5380859375, -3.255615234375, -2.97314453125, -2.690673828125, -2.408203125, -2.125732421875, -1.84326171875, -1.560791015625, -1.2783203125, -0.995849609375, -0.71337890625, -0.430908203125, -0.1484375, 0.134033203125, 0.41650390625, 0.698974609375, 0.9814453125, 1.263916015625, 1.54638671875, 1.828857421875, 2.111328125, 2.393798828125, 2.67626953125, 2.958740234375, 3.2412109375, 3.523681640625, 3.80615234375, 4.088623046875, 4.37109375, 4.653564453125, 4.93603515625, 5.218505859375, 5.5009765625, 5.783447265625, 6.06591796875, 6.348388671875, 6.630859375, 6.913330078125, 7.19580078125, 7.478271484375, 7.7607421875, 8.043212890625, 8.32568359375, 8.608154296875, 8.890625]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 4.0, 8.0, 7.0, 5.0, 20.0, 42.0, 33.0, 40.0, 45.0, 60.0, 75.0, 91.0, 103.0, 118.0, 131.0, 144.0, 159.0, 167.0, 196.0, 199.0, 203.0, 198.0, 196.0, 185.0, 213.0, 181.0, 189.0, 170.0, 161.0, 121.0, 121.0, 89.0, 75.0, 68.0, 56.0, 55.0, 30.0, 29.0, 19.0, 12.0, 21.0, 13.0, 8.0, 3.0, 5.0, 3.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.33203125, -6.13909912109375, -5.9461669921875, -5.75323486328125, -5.560302734375, -5.36737060546875, -5.1744384765625, -4.98150634765625, -4.78857421875, -4.59564208984375, -4.4027099609375, -4.20977783203125, -4.016845703125, -3.82391357421875, -3.6309814453125, -3.43804931640625, -3.2451171875, -3.05218505859375, -2.8592529296875, -2.66632080078125, -2.473388671875, -2.28045654296875, -2.0875244140625, -1.89459228515625, -1.70166015625, -1.50872802734375, -1.3157958984375, -1.12286376953125, -0.929931640625, -0.73699951171875, -0.5440673828125, -0.35113525390625, -0.158203125, 0.03472900390625, 0.2276611328125, 0.42059326171875, 0.613525390625, 0.80645751953125, 0.9993896484375, 1.19232177734375, 1.38525390625, 1.57818603515625, 1.7711181640625, 1.96405029296875, 2.156982421875, 2.34991455078125, 2.5428466796875, 2.73577880859375, 2.9287109375, 3.12164306640625, 3.3145751953125, 3.50750732421875, 3.700439453125, 3.89337158203125, 4.0863037109375, 4.27923583984375, 4.47216796875, 4.66510009765625, 4.8580322265625, 5.05096435546875, 5.243896484375, 5.43682861328125, 5.6297607421875, 5.82269287109375, 6.015625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 2.0, 5.0, 6.0, 11.0, 20.0, 17.0, 27.0, 22.0, 32.0, 36.0, 31.0, 40.0, 47.0, 49.0, 58.0, 61.0, 53.0, 59.0, 69.0, 44.0, 50.0, 49.0, 34.0, 31.0, 23.0, 30.0, 23.0, 17.0, 17.0, 9.0, 8.0, 6.0, 5.0, 6.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.849138259887695, -17.3325138092041, -16.815887451171875, -16.29926300048828, -15.782638549804688, -15.266013145446777, -14.749387741088867, -14.232763290405273, -13.71613883972168, -13.19951343536377, -12.682888984680176, -12.166263580322266, -11.649639129638672, -11.133013725280762, -10.616388320922852, -10.099763870239258, -9.583138465881348, -9.066513061523438, -8.549888610839844, -8.033263206481934, -7.51663875579834, -7.00001335144043, -6.483388423919678, -5.966763496398926, -5.450138568878174, -4.933513641357422, -4.41688871383667, -3.900263547897339, -3.383638620376587, -2.867013692855835, -2.350388526916504, -1.833763599395752, -1.3171396255493164, -0.8005146384239197, -0.28388965129852295, 0.23273539543151855, 0.7493603229522705, 1.2659852504730225, 1.7826104164123535, 2.2992353439331055, 2.8158602714538574, 3.3324851989746094, 3.8491101264953613, 4.365735054016113, 4.882360458374023, 5.398984909057617, 5.915610313415527, 6.432235240936279, 6.948860168457031, 7.465485095977783, 7.982110023498535, 8.498735427856445, 9.015359878540039, 9.53198528289795, 10.04861068725586, 10.565235137939453, 11.081859588623047, 11.598484992980957, 12.11510944366455, 12.631734848022461, 13.148359298706055, 13.664984703063965, 14.181610107421875, 14.698234558105469, 15.214859962463379]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 0.0, 4.0, 4.0, 13.0, 13.0, 9.0, 8.0, 14.0, 13.0, 16.0, 22.0, 26.0, 23.0, 23.0, 38.0, 37.0, 38.0, 28.0, 41.0, 51.0, 36.0, 49.0, 52.0, 42.0, 35.0, 34.0, 43.0, 41.0, 41.0, 32.0, 26.0, 22.0, 25.0, 21.0, 17.0, 11.0, 14.0, 7.0, 8.0, 6.0, 3.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-17.520597457885742, -17.01219940185547, -16.503801345825195, -15.995404243469238, -15.487007141113281, -14.978609085083008, -14.470211029052734, -13.961813926696777, -13.45341682434082, -12.945018768310547, -12.43662166595459, -11.928223609924316, -11.41982650756836, -10.911428451538086, -10.403030395507812, -9.894633293151855, -9.386235237121582, -8.877837181091309, -8.369440078735352, -7.861042022705078, -7.352644920349121, -6.844246864318848, -6.335849285125732, -5.827451705932617, -5.319054126739502, -4.810656547546387, -4.3022589683532715, -3.793861150741577, -3.285463571548462, -2.7770659923553467, -2.2686681747436523, -1.760270595550537, -1.2518720626831055, -0.7434744238853455, -0.23507678508758545, 0.27332091331481934, 0.7817184925079346, 1.2901160717010498, 1.7985138893127441, 2.3069114685058594, 2.8153090476989746, 3.32370662689209, 3.832104206085205, 4.34050178527832, 4.848899841308594, 5.357296943664551, 5.865694999694824, 6.3740925788879395, 6.882490158081055, 7.39088773727417, 7.899285316467285, 8.407683372497559, 8.916080474853516, 9.424478530883789, 9.932876586914062, 10.44127368927002, 10.949670791625977, 11.45806884765625, 11.966465950012207, 12.47486400604248, 12.983261108398438, 13.491659164428711, 14.000057220458984, 14.508454322814941, 15.016852378845215]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 2.0, 11.0, 12.0, 16.0, 21.0, 34.0, 62.0, 78.0, 101.0, 181.0, 266.0, 473.0, 623.0, 987.0, 1500.0, 2429.0, 3863.0, 6007.0, 9354.0, 14721.0, 23120.0, 35171.0, 52889.0, 77819.0, 105966.0, 131225.0, 140111.0, 127246.0, 99663.0, 72788.0, 49868.0, 32812.0, 21427.0, 13697.0, 8657.0, 5470.0, 3551.0, 2293.0, 1410.0, 886.0, 610.0, 392.0, 258.0, 152.0, 103.0, 84.0, 47.0, 35.0, 26.0, 15.0, 10.0, 7.0, 5.0, 5.0, 2.0, 1.0], "bins": [-2.466796875, -2.395111083984375, -2.32342529296875, -2.251739501953125, -2.1800537109375, -2.108367919921875, -2.03668212890625, -1.964996337890625, -1.893310546875, -1.821624755859375, -1.74993896484375, -1.678253173828125, -1.6065673828125, -1.534881591796875, -1.46319580078125, -1.391510009765625, -1.31982421875, -1.248138427734375, -1.17645263671875, -1.104766845703125, -1.0330810546875, -0.961395263671875, -0.88970947265625, -0.818023681640625, -0.746337890625, -0.674652099609375, -0.60296630859375, -0.531280517578125, -0.4595947265625, -0.387908935546875, -0.31622314453125, -0.244537353515625, -0.1728515625, -0.101165771484375, -0.02947998046875, 0.042205810546875, 0.1138916015625, 0.185577392578125, 0.25726318359375, 0.328948974609375, 0.400634765625, 0.472320556640625, 0.54400634765625, 0.615692138671875, 0.6873779296875, 0.759063720703125, 0.83074951171875, 0.902435302734375, 0.97412109375, 1.045806884765625, 1.11749267578125, 1.189178466796875, 1.2608642578125, 1.332550048828125, 1.40423583984375, 1.475921630859375, 1.547607421875, 1.619293212890625, 1.69097900390625, 1.762664794921875, 1.8343505859375, 1.906036376953125, 1.97772216796875, 2.049407958984375, 2.12109375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 6.0, 2.0, 3.0, 3.0, 7.0, 4.0, 11.0, 14.0, 24.0, 13.0, 11.0, 11.0, 23.0, 19.0, 12.0, 21.0, 32.0, 38.0, 28.0, 29.0, 46.0, 39.0, 45.0, 41.0, 50.0, 38.0, 42.0, 53.0, 33.0, 47.0, 41.0, 36.0, 23.0, 30.0, 17.0, 17.0, 19.0, 15.0, 9.0, 13.0, 3.0, 8.0, 15.0, 3.0, 7.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-17.921875, -17.4102783203125, -16.898681640625, -16.3870849609375, -15.87548828125, -15.3638916015625, -14.852294921875, -14.3406982421875, -13.8291015625, -13.3175048828125, -12.805908203125, -12.2943115234375, -11.78271484375, -11.2711181640625, -10.759521484375, -10.2479248046875, -9.736328125, -9.2247314453125, -8.713134765625, -8.2015380859375, -7.68994140625, -7.1783447265625, -6.666748046875, -6.1551513671875, -5.6435546875, -5.1319580078125, -4.620361328125, -4.1087646484375, -3.59716796875, -3.0855712890625, -2.573974609375, -2.0623779296875, -1.55078125, -1.0391845703125, -0.527587890625, -0.0159912109375, 0.49560546875, 1.0072021484375, 1.518798828125, 2.0303955078125, 2.5419921875, 3.0535888671875, 3.565185546875, 4.0767822265625, 4.58837890625, 5.0999755859375, 5.611572265625, 6.1231689453125, 6.634765625, 7.1463623046875, 7.657958984375, 8.1695556640625, 8.68115234375, 9.1927490234375, 9.704345703125, 10.2159423828125, 10.7275390625, 11.2391357421875, 11.750732421875, 12.2623291015625, 12.77392578125, 13.2855224609375, 13.797119140625, 14.3087158203125, 14.8203125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 7.0, 12.0, 22.0, 36.0, 38.0, 65.0, 99.0, 128.0, 208.0, 309.0, 548.0, 736.0, 1163.0, 1884.0, 3067.0, 5113.0, 8172.0, 13570.0, 22052.0, 36114.0, 55542.0, 83828.0, 115551.0, 143144.0, 148353.0, 129375.0, 97445.0, 67563.0, 43583.0, 27439.0, 16783.0, 10426.0, 6132.0, 3801.0, 2287.0, 1452.0, 880.0, 565.0, 365.0, 249.0, 149.0, 102.0, 80.0, 41.0, 31.0, 19.0, 14.0, 7.0, 7.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.26953125, -2.19683837890625, -2.1241455078125, -2.05145263671875, -1.978759765625, -1.90606689453125, -1.8333740234375, -1.76068115234375, -1.68798828125, -1.61529541015625, -1.5426025390625, -1.46990966796875, -1.397216796875, -1.32452392578125, -1.2518310546875, -1.17913818359375, -1.1064453125, -1.03375244140625, -0.9610595703125, -0.88836669921875, -0.815673828125, -0.74298095703125, -0.6702880859375, -0.59759521484375, -0.52490234375, -0.45220947265625, -0.3795166015625, -0.30682373046875, -0.234130859375, -0.16143798828125, -0.0887451171875, -0.01605224609375, 0.056640625, 0.12933349609375, 0.2020263671875, 0.27471923828125, 0.347412109375, 0.42010498046875, 0.4927978515625, 0.56549072265625, 0.63818359375, 0.71087646484375, 0.7835693359375, 0.85626220703125, 0.928955078125, 1.00164794921875, 1.0743408203125, 1.14703369140625, 1.2197265625, 1.29241943359375, 1.3651123046875, 1.43780517578125, 1.510498046875, 1.58319091796875, 1.6558837890625, 1.72857666015625, 1.80126953125, 1.87396240234375, 1.9466552734375, 2.01934814453125, 2.092041015625, 2.16473388671875, 2.2374267578125, 2.31011962890625, 2.3828125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 7.0, 9.0, 8.0, 12.0, 13.0, 5.0, 11.0, 10.0, 17.0, 17.0, 16.0, 21.0, 29.0, 33.0, 28.0, 33.0, 32.0, 32.0, 47.0, 31.0, 51.0, 36.0, 34.0, 32.0, 42.0, 30.0, 36.0, 40.0, 24.0, 33.0, 33.0, 21.0, 24.0, 20.0, 25.0, 20.0, 15.0, 16.0, 9.0, 10.0, 11.0, 10.0, 0.0, 6.0, 5.0, 2.0, 0.0, 1.0, 5.0, 1.0, 1.0, 3.0], "bins": [-10.265625, -9.9615478515625, -9.657470703125, -9.3533935546875, -9.04931640625, -8.7452392578125, -8.441162109375, -8.1370849609375, -7.8330078125, -7.5289306640625, -7.224853515625, -6.9207763671875, -6.61669921875, -6.3126220703125, -6.008544921875, -5.7044677734375, -5.400390625, -5.0963134765625, -4.792236328125, -4.4881591796875, -4.18408203125, -3.8800048828125, -3.575927734375, -3.2718505859375, -2.9677734375, -2.6636962890625, -2.359619140625, -2.0555419921875, -1.75146484375, -1.4473876953125, -1.143310546875, -0.8392333984375, -0.53515625, -0.2310791015625, 0.072998046875, 0.3770751953125, 0.68115234375, 0.9852294921875, 1.289306640625, 1.5933837890625, 1.8974609375, 2.2015380859375, 2.505615234375, 2.8096923828125, 3.11376953125, 3.4178466796875, 3.721923828125, 4.0260009765625, 4.330078125, 4.6341552734375, 4.938232421875, 5.2423095703125, 5.54638671875, 5.8504638671875, 6.154541015625, 6.4586181640625, 6.7626953125, 7.0667724609375, 7.370849609375, 7.6749267578125, 7.97900390625, 8.2830810546875, 8.587158203125, 8.8912353515625, 9.1953125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 7.0, 2.0, 7.0, 6.0, 9.0, 12.0, 24.0, 29.0, 44.0, 49.0, 79.0, 107.0, 172.0, 268.0, 381.0, 629.0, 1113.0, 1985.0, 3996.0, 8287.0, 18623.0, 47583.0, 127254.0, 283968.0, 308059.0, 148888.0, 56203.0, 21766.0, 9325.0, 4336.0, 2221.0, 1197.0, 689.0, 431.0, 276.0, 189.0, 111.0, 58.0, 55.0, 39.0, 21.0, 19.0, 11.0, 9.0, 11.0, 8.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50732421875, -0.49100494384765625, -0.4746856689453125, -0.45836639404296875, -0.442047119140625, -0.42572784423828125, -0.4094085693359375, -0.39308929443359375, -0.37677001953125, -0.36045074462890625, -0.3441314697265625, -0.32781219482421875, -0.311492919921875, -0.29517364501953125, -0.2788543701171875, -0.26253509521484375, -0.2462158203125, -0.22989654541015625, -0.2135772705078125, -0.19725799560546875, -0.180938720703125, -0.16461944580078125, -0.1483001708984375, -0.13198089599609375, -0.11566162109375, -0.09934234619140625, -0.0830230712890625, -0.06670379638671875, -0.050384521484375, -0.03406524658203125, -0.0177459716796875, -0.00142669677734375, 0.014892578125, 0.03121185302734375, 0.0475311279296875, 0.06385040283203125, 0.080169677734375, 0.09648895263671875, 0.1128082275390625, 0.12912750244140625, 0.14544677734375, 0.16176605224609375, 0.1780853271484375, 0.19440460205078125, 0.210723876953125, 0.22704315185546875, 0.2433624267578125, 0.25968170166015625, 0.2760009765625, 0.29232025146484375, 0.3086395263671875, 0.32495880126953125, 0.341278076171875, 0.35759735107421875, 0.3739166259765625, 0.39023590087890625, 0.40655517578125, 0.42287445068359375, 0.4391937255859375, 0.45551300048828125, 0.471832275390625, 0.48815155029296875, 0.5044708251953125, 0.5207901000976562, 0.537109375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 4.0, 2.0, 5.0, 4.0, 4.0, 7.0, 5.0, 9.0, 11.0, 17.0, 28.0, 27.0, 41.0, 44.0, 77.0, 95.0, 111.0, 98.0, 99.0, 87.0, 71.0, 41.0, 26.0, 28.0, 14.0, 11.0, 6.0, 11.0, 5.0, 3.0, 6.0, 2.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.053945541381836e-05, -8.772220462560654e-05, -8.490495383739471e-05, -8.208770304918289e-05, -7.927045226097107e-05, -7.645320147275925e-05, -7.363595068454742e-05, -7.08186998963356e-05, -6.800144910812378e-05, -6.518419831991196e-05, -6.236694753170013e-05, -5.954969674348831e-05, -5.673244595527649e-05, -5.391519516706467e-05, -5.1097944378852844e-05, -4.828069359064102e-05, -4.54634428024292e-05, -4.264619201421738e-05, -3.9828941226005554e-05, -3.701169043779373e-05, -3.419443964958191e-05, -3.137718886137009e-05, -2.8559938073158264e-05, -2.574268728494644e-05, -2.292543649673462e-05, -2.0108185708522797e-05, -1.7290934920310974e-05, -1.4473684132099152e-05, -1.1656433343887329e-05, -8.839182555675507e-06, -6.021931767463684e-06, -3.2046809792518616e-06, -3.8743019104003906e-07, 2.4298205971717834e-06, 5.247071385383606e-06, 8.064322173595428e-06, 1.0881572961807251e-05, 1.3698823750019073e-05, 1.6516074538230896e-05, 1.933332532644272e-05, 2.215057611465454e-05, 2.4967826902866364e-05, 2.7785077691078186e-05, 3.060232847929001e-05, 3.341957926750183e-05, 3.6236830055713654e-05, 3.9054080843925476e-05, 4.18713316321373e-05, 4.468858242034912e-05, 4.7505833208560944e-05, 5.0323083996772766e-05, 5.314033478498459e-05, 5.595758557319641e-05, 5.8774836361408234e-05, 6.159208714962006e-05, 6.440933793783188e-05, 6.72265887260437e-05, 7.004383951425552e-05, 7.286109030246735e-05, 7.567834109067917e-05, 7.849559187889099e-05, 8.131284266710281e-05, 8.413009345531464e-05, 8.694734424352646e-05, 8.976459503173828e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 4.0, 5.0, 3.0, 7.0, 8.0, 9.0, 28.0, 31.0, 64.0, 64.0, 92.0, 121.0, 203.0, 269.0, 434.0, 550.0, 887.0, 1377.0, 2076.0, 3377.0, 5449.0, 9640.0, 17418.0, 33076.0, 67358.0, 136367.0, 241682.0, 244162.0, 138766.0, 68479.0, 34110.0, 17662.0, 9553.0, 5538.0, 3476.0, 2051.0, 1328.0, 899.0, 633.0, 390.0, 279.0, 185.0, 126.0, 86.0, 80.0, 42.0, 34.0, 26.0, 23.0, 17.0, 6.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.875, -0.849273681640625, -0.82354736328125, -0.797821044921875, -0.7720947265625, -0.746368408203125, -0.72064208984375, -0.694915771484375, -0.669189453125, -0.643463134765625, -0.61773681640625, -0.592010498046875, -0.5662841796875, -0.540557861328125, -0.51483154296875, -0.489105224609375, -0.46337890625, -0.437652587890625, -0.41192626953125, -0.386199951171875, -0.3604736328125, -0.334747314453125, -0.30902099609375, -0.283294677734375, -0.257568359375, -0.231842041015625, -0.20611572265625, -0.180389404296875, -0.1546630859375, -0.128936767578125, -0.10321044921875, -0.077484130859375, -0.0517578125, -0.026031494140625, -0.00030517578125, 0.025421142578125, 0.0511474609375, 0.076873779296875, 0.10260009765625, 0.128326416015625, 0.154052734375, 0.179779052734375, 0.20550537109375, 0.231231689453125, 0.2569580078125, 0.282684326171875, 0.30841064453125, 0.334136962890625, 0.35986328125, 0.385589599609375, 0.41131591796875, 0.437042236328125, 0.4627685546875, 0.488494873046875, 0.51422119140625, 0.539947509765625, 0.565673828125, 0.591400146484375, 0.61712646484375, 0.642852783203125, 0.6685791015625, 0.694305419921875, 0.72003173828125, 0.745758056640625, 0.771484375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 5.0, 3.0, 4.0, 3.0, 4.0, 9.0, 12.0, 14.0, 12.0, 16.0, 17.0, 29.0, 30.0, 29.0, 36.0, 42.0, 50.0, 50.0, 49.0, 66.0, 64.0, 49.0, 54.0, 45.0, 44.0, 37.0, 32.0, 36.0, 19.0, 14.0, 22.0, 23.0, 16.0, 11.0, 6.0, 8.0, 11.0, 8.0, 4.0, 3.0, 2.0, 4.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0], "bins": [-0.22265625, -0.21608352661132812, -0.20951080322265625, -0.20293807983398438, -0.1963653564453125, -0.18979263305664062, -0.18321990966796875, -0.17664718627929688, -0.170074462890625, -0.16350173950195312, -0.15692901611328125, -0.15035629272460938, -0.1437835693359375, -0.13721084594726562, -0.13063812255859375, -0.12406539916992188, -0.11749267578125, -0.11091995239257812, -0.10434722900390625, -0.09777450561523438, -0.0912017822265625, -0.08462905883789062, -0.07805633544921875, -0.07148361206054688, -0.064910888671875, -0.058338165283203125, -0.05176544189453125, -0.045192718505859375, -0.0386199951171875, -0.032047271728515625, -0.02547454833984375, -0.018901824951171875, -0.0123291015625, -0.005756378173828125, 0.00081634521484375, 0.007389068603515625, 0.0139617919921875, 0.020534515380859375, 0.02710723876953125, 0.033679962158203125, 0.040252685546875, 0.046825408935546875, 0.05339813232421875, 0.059970855712890625, 0.0665435791015625, 0.07311630249023438, 0.07968902587890625, 0.08626174926757812, 0.09283447265625, 0.09940719604492188, 0.10597991943359375, 0.11255264282226562, 0.1191253662109375, 0.12569808959960938, 0.13227081298828125, 0.13884353637695312, 0.145416259765625, 0.15198898315429688, 0.15856170654296875, 0.16513442993164062, 0.1717071533203125, 0.17827987670898438, 0.18485260009765625, 0.19142532348632812, 0.197998046875]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 5.0, 3.0, 3.0, 9.0, 17.0, 13.0, 21.0, 28.0, 24.0, 32.0, 38.0, 33.0, 42.0, 42.0, 56.0, 62.0, 57.0, 59.0, 53.0, 65.0, 44.0, 51.0, 44.0, 34.0, 24.0, 29.0, 29.0, 22.0, 15.0, 16.0, 9.0, 7.0, 6.0, 4.0, 6.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.706798553466797, -17.189796447753906, -16.672792434692383, -16.155790328979492, -15.638788223266602, -15.121785163879395, -14.604782104492188, -14.087779998779297, -13.57077693939209, -13.053773880004883, -12.536771774291992, -12.019768714904785, -11.502765655517578, -10.985763549804688, -10.46876049041748, -9.951757431030273, -9.434755325317383, -8.917752265930176, -8.400750160217285, -7.883747100830078, -7.366744518280029, -6.8497419357299805, -6.332738876342773, -5.815736293792725, -5.298733711242676, -4.781731128692627, -4.264728546142578, -3.747725486755371, -3.2307229042053223, -2.7137203216552734, -2.1967175006866455, -1.6797146797180176, -1.162710189819336, -0.6457074880599976, -0.12870478630065918, 0.3882979154586792, 0.9053006172180176, 1.4223031997680664, 1.9393060207366943, 2.4563088417053223, 2.973311424255371, 3.49031400680542, 4.007316589355469, 4.524319648742676, 5.041322231292725, 5.558324813842773, 6.0753278732299805, 6.592330455780029, 7.109333038330078, 7.626335620880127, 8.143338203430176, 8.660341262817383, 9.177343368530273, 9.69434642791748, 10.211349487304688, 10.728351593017578, 11.245354652404785, 11.762357711791992, 12.279359817504883, 12.79636287689209, 13.313365936279297, 13.830368041992188, 14.347371101379395, 14.864374160766602, 15.381376266479492]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 0.0, 0.0, 4.0, 10.0, 11.0, 11.0, 7.0, 11.0, 12.0, 15.0, 15.0, 24.0, 24.0, 23.0, 27.0, 38.0, 39.0, 37.0, 26.0, 39.0, 49.0, 38.0, 53.0, 53.0, 36.0, 39.0, 31.0, 46.0, 41.0, 39.0, 32.0, 23.0, 23.0, 22.0, 22.0, 15.0, 13.0, 14.0, 7.0, 9.0, 5.0, 3.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.27195930480957, -16.76767921447754, -16.263399124145508, -15.75911808013916, -15.254837036132812, -14.750556945800781, -14.24627685546875, -13.741995811462402, -13.237714767456055, -12.733434677124023, -12.229153633117676, -11.724873542785645, -11.220592498779297, -10.716312408447266, -10.212032318115234, -9.707751274108887, -9.203471183776855, -8.699191093444824, -8.194910049438477, -7.690629959106445, -7.186348915100098, -6.682068824768066, -6.177788257598877, -5.6735076904296875, -5.169227123260498, -4.664946556091309, -4.160665988922119, -3.656385660171509, -3.1521050930023193, -2.64782452583313, -2.1435441970825195, -1.63926362991333, -1.1349821090698242, -0.6307016015052795, -0.12642109394073486, 0.37785935401916504, 0.8821399211883545, 1.386420488357544, 1.8907008171081543, 2.3949813842773438, 2.899261951446533, 3.4035425186157227, 3.907823085784912, 4.412103652954102, 4.916383743286133, 5.4206647872924805, 5.924944877624512, 6.429225444793701, 6.933506011962891, 7.43778657913208, 7.9420671463012695, 8.4463472366333, 8.950628280639648, 9.45490837097168, 9.959188461303711, 10.463469505310059, 10.967750549316406, 11.472030639648438, 11.976311683654785, 12.480591773986816, 12.984872817993164, 13.489152908325195, 13.993432998657227, 14.497714042663574, 15.001994132995605]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 5.0, 13.0, 22.0, 28.0, 41.0, 82.0, 89.0, 171.0, 230.0, 386.0, 668.0, 1029.0, 1648.0, 2484.0, 3718.0, 6034.0, 8833.0, 13091.0, 19132.0, 26699.0, 36459.0, 48101.0, 60826.0, 73757.0, 84821.0, 92462.0, 94994.0, 92184.0, 84109.0, 72572.0, 59700.0, 47336.0, 35509.0, 25579.0, 18333.0, 12623.0, 8512.0, 5901.0, 3677.0, 2415.0, 1538.0, 1022.0, 651.0, 404.0, 245.0, 147.0, 111.0, 66.0, 36.0, 25.0, 15.0, 8.0, 8.0, 5.0, 5.0, 2.0, 1.0], "bins": [-8.390625, -8.13983154296875, -7.8890380859375, -7.63824462890625, -7.387451171875, -7.13665771484375, -6.8858642578125, -6.63507080078125, -6.38427734375, -6.13348388671875, -5.8826904296875, -5.63189697265625, -5.381103515625, -5.13031005859375, -4.8795166015625, -4.62872314453125, -4.3779296875, -4.12713623046875, -3.8763427734375, -3.62554931640625, -3.374755859375, -3.12396240234375, -2.8731689453125, -2.62237548828125, -2.37158203125, -2.12078857421875, -1.8699951171875, -1.61920166015625, -1.368408203125, -1.11761474609375, -0.8668212890625, -0.61602783203125, -0.365234375, -0.11444091796875, 0.1363525390625, 0.38714599609375, 0.637939453125, 0.88873291015625, 1.1395263671875, 1.39031982421875, 1.64111328125, 1.89190673828125, 2.1427001953125, 2.39349365234375, 2.644287109375, 2.89508056640625, 3.1458740234375, 3.39666748046875, 3.6474609375, 3.89825439453125, 4.1490478515625, 4.39984130859375, 4.650634765625, 4.90142822265625, 5.1522216796875, 5.40301513671875, 5.65380859375, 5.90460205078125, 6.1553955078125, 6.40618896484375, 6.656982421875, 6.90777587890625, 7.1585693359375, 7.40936279296875, 7.66015625]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 7.0, 0.0, 3.0, 6.0, 12.0, 7.0, 8.0, 13.0, 19.0, 17.0, 16.0, 15.0, 27.0, 22.0, 28.0, 28.0, 40.0, 31.0, 44.0, 43.0, 52.0, 43.0, 40.0, 53.0, 34.0, 43.0, 41.0, 34.0, 41.0, 24.0, 38.0, 31.0, 27.0, 21.0, 22.0, 11.0, 14.0, 12.0, 10.0, 7.0, 5.0, 2.0, 7.0, 4.0, 1.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.71875, -16.200927734375, -15.68310546875, -15.165283203125, -14.6474609375, -14.129638671875, -13.61181640625, -13.093994140625, -12.576171875, -12.058349609375, -11.54052734375, -11.022705078125, -10.5048828125, -9.987060546875, -9.46923828125, -8.951416015625, -8.43359375, -7.915771484375, -7.39794921875, -6.880126953125, -6.3623046875, -5.844482421875, -5.32666015625, -4.808837890625, -4.291015625, -3.773193359375, -3.25537109375, -2.737548828125, -2.2197265625, -1.701904296875, -1.18408203125, -0.666259765625, -0.1484375, 0.369384765625, 0.88720703125, 1.405029296875, 1.9228515625, 2.440673828125, 2.95849609375, 3.476318359375, 3.994140625, 4.511962890625, 5.02978515625, 5.547607421875, 6.0654296875, 6.583251953125, 7.10107421875, 7.618896484375, 8.13671875, 8.654541015625, 9.17236328125, 9.690185546875, 10.2080078125, 10.725830078125, 11.24365234375, 11.761474609375, 12.279296875, 12.797119140625, 13.31494140625, 13.832763671875, 14.3505859375, 14.868408203125, 15.38623046875, 15.904052734375, 16.421875]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 8.0, 9.0, 16.0, 26.0, 44.0, 62.0, 123.0, 187.0, 352.0, 583.0, 934.0, 1553.0, 2629.0, 4262.0, 6725.0, 10608.0, 16497.0, 24861.0, 36316.0, 50237.0, 66804.0, 84756.0, 98129.0, 106625.0, 108138.0, 100517.0, 87807.0, 70753.0, 53868.0, 39042.0, 26969.0, 17868.0, 11712.0, 7427.0, 4790.0, 2958.0, 1765.0, 1041.0, 617.0, 396.0, 235.0, 135.0, 73.0, 52.0, 24.0, 12.0, 13.0, 4.0, 6.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.375, -9.0830078125, -8.791015625, -8.4990234375, -8.20703125, -7.9150390625, -7.623046875, -7.3310546875, -7.0390625, -6.7470703125, -6.455078125, -6.1630859375, -5.87109375, -5.5791015625, -5.287109375, -4.9951171875, -4.703125, -4.4111328125, -4.119140625, -3.8271484375, -3.53515625, -3.2431640625, -2.951171875, -2.6591796875, -2.3671875, -2.0751953125, -1.783203125, -1.4912109375, -1.19921875, -0.9072265625, -0.615234375, -0.3232421875, -0.03125, 0.2607421875, 0.552734375, 0.8447265625, 1.13671875, 1.4287109375, 1.720703125, 2.0126953125, 2.3046875, 2.5966796875, 2.888671875, 3.1806640625, 3.47265625, 3.7646484375, 4.056640625, 4.3486328125, 4.640625, 4.9326171875, 5.224609375, 5.5166015625, 5.80859375, 6.1005859375, 6.392578125, 6.6845703125, 6.9765625, 7.2685546875, 7.560546875, 7.8525390625, 8.14453125, 8.4365234375, 8.728515625, 9.0205078125, 9.3125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 5.0, 4.0, 7.0, 11.0, 11.0, 15.0, 23.0, 21.0, 24.0, 27.0, 39.0, 43.0, 36.0, 32.0, 44.0, 49.0, 43.0, 45.0, 32.0, 41.0, 32.0, 41.0, 43.0, 39.0, 34.0, 29.0, 36.0, 32.0, 23.0, 26.0, 19.0, 18.0, 11.0, 21.0, 18.0, 8.0, 4.0, 6.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.3984375, -11.048828125, -10.69921875, -10.349609375, -10.0, -9.650390625, -9.30078125, -8.951171875, -8.6015625, -8.251953125, -7.90234375, -7.552734375, -7.203125, -6.853515625, -6.50390625, -6.154296875, -5.8046875, -5.455078125, -5.10546875, -4.755859375, -4.40625, -4.056640625, -3.70703125, -3.357421875, -3.0078125, -2.658203125, -2.30859375, -1.958984375, -1.609375, -1.259765625, -0.91015625, -0.560546875, -0.2109375, 0.138671875, 0.48828125, 0.837890625, 1.1875, 1.537109375, 1.88671875, 2.236328125, 2.5859375, 2.935546875, 3.28515625, 3.634765625, 3.984375, 4.333984375, 4.68359375, 5.033203125, 5.3828125, 5.732421875, 6.08203125, 6.431640625, 6.78125, 7.130859375, 7.48046875, 7.830078125, 8.1796875, 8.529296875, 8.87890625, 9.228515625, 9.578125, 9.927734375, 10.27734375, 10.626953125, 10.9765625]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 14.0, 9.0, 26.0, 37.0, 69.0, 92.0, 184.0, 288.0, 600.0, 1011.0, 1629.0, 2833.0, 4962.0, 8573.0, 14464.0, 23983.0, 37318.0, 56368.0, 79681.0, 103234.0, 120714.0, 127692.0, 121830.0, 103809.0, 81547.0, 57865.0, 38808.0, 24686.0, 15114.0, 8796.0, 5265.0, 2973.0, 1733.0, 968.0, 557.0, 359.0, 189.0, 112.0, 72.0, 36.0, 23.0, 13.0, 8.0, 6.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0], "bins": [-4.25, -4.130401611328125, -4.01080322265625, -3.891204833984375, -3.7716064453125, -3.652008056640625, -3.53240966796875, -3.412811279296875, -3.293212890625, -3.173614501953125, -3.05401611328125, -2.934417724609375, -2.8148193359375, -2.695220947265625, -2.57562255859375, -2.456024169921875, -2.33642578125, -2.216827392578125, -2.09722900390625, -1.977630615234375, -1.8580322265625, -1.738433837890625, -1.61883544921875, -1.499237060546875, -1.379638671875, -1.260040283203125, -1.14044189453125, -1.020843505859375, -0.9012451171875, -0.781646728515625, -0.66204833984375, -0.542449951171875, -0.4228515625, -0.303253173828125, -0.18365478515625, -0.064056396484375, 0.0555419921875, 0.175140380859375, 0.29473876953125, 0.414337158203125, 0.533935546875, 0.653533935546875, 0.77313232421875, 0.892730712890625, 1.0123291015625, 1.131927490234375, 1.25152587890625, 1.371124267578125, 1.49072265625, 1.610321044921875, 1.72991943359375, 1.849517822265625, 1.9691162109375, 2.088714599609375, 2.20831298828125, 2.327911376953125, 2.447509765625, 2.567108154296875, 2.68670654296875, 2.806304931640625, 2.9259033203125, 3.045501708984375, 3.16510009765625, 3.284698486328125, 3.404296875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 5.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 5.0, 5.0, 6.0, 4.0, 9.0, 10.0, 11.0, 11.0, 19.0, 26.0, 19.0, 23.0, 33.0, 24.0, 33.0, 37.0, 39.0, 44.0, 42.0, 48.0, 42.0, 53.0, 42.0, 41.0, 31.0, 35.0, 43.0, 22.0, 29.0, 28.0, 22.0, 28.0, 22.0, 23.0, 16.0, 13.0, 9.0, 12.0, 9.0, 4.0, 2.0, 5.0, 3.0, 4.0, 5.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0003452301025390625, -0.00033386796712875366, -0.0003225058317184448, -0.000311143696308136, -0.00029978156089782715, -0.0002884194254875183, -0.00027705729007720947, -0.00026569515466690063, -0.0002543330192565918, -0.00024297088384628296, -0.00023160874843597412, -0.00022024661302566528, -0.00020888447761535645, -0.0001975223422050476, -0.00018616020679473877, -0.00017479807138442993, -0.0001634359359741211, -0.00015207380056381226, -0.00014071166515350342, -0.00012934952974319458, -0.00011798739433288574, -0.0001066252589225769, -9.526312351226807e-05, -8.390098810195923e-05, -7.253885269165039e-05, -6.117671728134155e-05, -4.9814581871032715e-05, -3.845244646072388e-05, -2.709031105041504e-05, -1.57281756401062e-05, -4.366040229797363e-06, 6.996095180511475e-06, 1.8358230590820312e-05, 2.972036600112915e-05, 4.108250141143799e-05, 5.2444636821746826e-05, 6.380677223205566e-05, 7.51689076423645e-05, 8.653104305267334e-05, 9.789317846298218e-05, 0.00010925531387329102, 0.00012061744928359985, 0.0001319795846939087, 0.00014334172010421753, 0.00015470385551452637, 0.0001660659909248352, 0.00017742812633514404, 0.00018879026174545288, 0.00020015239715576172, 0.00021151453256607056, 0.0002228766679763794, 0.00023423880338668823, 0.00024560093879699707, 0.0002569630742073059, 0.00026832520961761475, 0.0002796873450279236, 0.0002910494804382324, 0.00030241161584854126, 0.0003137737512588501, 0.00032513588666915894, 0.0003364980220794678, 0.0003478601574897766, 0.00035922229290008545, 0.0003705844283103943, 0.0003819465637207031]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 3.0, 7.0, 6.0, 10.0, 28.0, 23.0, 51.0, 82.0, 126.0, 226.0, 394.0, 640.0, 1109.0, 2092.0, 3587.0, 6393.0, 10830.0, 17864.0, 29482.0, 46154.0, 68897.0, 94677.0, 118792.0, 132755.0, 131173.0, 115499.0, 90913.0, 65362.0, 43974.0, 27667.0, 16451.0, 9973.0, 5556.0, 3315.0, 1879.0, 1089.0, 627.0, 342.0, 201.0, 113.0, 85.0, 52.0, 24.0, 13.0, 11.0, 5.0, 3.0, 0.0, 0.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.24609375, -4.11309814453125, -3.9801025390625, -3.84710693359375, -3.714111328125, -3.58111572265625, -3.4481201171875, -3.31512451171875, -3.18212890625, -3.04913330078125, -2.9161376953125, -2.78314208984375, -2.650146484375, -2.51715087890625, -2.3841552734375, -2.25115966796875, -2.1181640625, -1.98516845703125, -1.8521728515625, -1.71917724609375, -1.586181640625, -1.45318603515625, -1.3201904296875, -1.18719482421875, -1.05419921875, -0.92120361328125, -0.7882080078125, -0.65521240234375, -0.522216796875, -0.38922119140625, -0.2562255859375, -0.12322998046875, 0.009765625, 0.14276123046875, 0.2757568359375, 0.40875244140625, 0.541748046875, 0.67474365234375, 0.8077392578125, 0.94073486328125, 1.07373046875, 1.20672607421875, 1.3397216796875, 1.47271728515625, 1.605712890625, 1.73870849609375, 1.8717041015625, 2.00469970703125, 2.1376953125, 2.27069091796875, 2.4036865234375, 2.53668212890625, 2.669677734375, 2.80267333984375, 2.9356689453125, 3.06866455078125, 3.20166015625, 3.33465576171875, 3.4676513671875, 3.60064697265625, 3.733642578125, 3.86663818359375, 3.9996337890625, 4.13262939453125, 4.265625]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 2.0, 5.0, 6.0, 7.0, 9.0, 16.0, 13.0, 13.0, 15.0, 22.0, 27.0, 30.0, 30.0, 20.0, 43.0, 37.0, 51.0, 37.0, 50.0, 45.0, 52.0, 56.0, 42.0, 51.0, 46.0, 38.0, 24.0, 28.0, 29.0, 26.0, 21.0, 18.0, 19.0, 16.0, 13.0, 12.0, 3.0, 4.0, 4.0, 4.0, 5.0, 3.0, 7.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5712890625, -1.5214385986328125, -1.471588134765625, -1.4217376708984375, -1.37188720703125, -1.3220367431640625, -1.272186279296875, -1.2223358154296875, -1.1724853515625, -1.1226348876953125, -1.072784423828125, -1.0229339599609375, -0.97308349609375, -0.9232330322265625, -0.873382568359375, -0.8235321044921875, -0.773681640625, -0.7238311767578125, -0.673980712890625, -0.6241302490234375, -0.57427978515625, -0.5244293212890625, -0.474578857421875, -0.4247283935546875, -0.3748779296875, -0.3250274658203125, -0.275177001953125, -0.2253265380859375, -0.17547607421875, -0.1256256103515625, -0.075775146484375, -0.0259246826171875, 0.02392578125, 0.0737762451171875, 0.123626708984375, 0.1734771728515625, 0.22332763671875, 0.2731781005859375, 0.323028564453125, 0.3728790283203125, 0.4227294921875, 0.4725799560546875, 0.522430419921875, 0.5722808837890625, 0.62213134765625, 0.6719818115234375, 0.721832275390625, 0.7716827392578125, 0.821533203125, 0.8713836669921875, 0.921234130859375, 0.9710845947265625, 1.02093505859375, 1.0707855224609375, 1.120635986328125, 1.1704864501953125, 1.2203369140625, 1.2701873779296875, 1.320037841796875, 1.3698883056640625, 1.41973876953125, 1.4695892333984375, 1.519439697265625, 1.5692901611328125, 1.619140625]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 3.0, 6.0, 13.0, 10.0, 21.0, 27.0, 36.0, 17.0, 43.0, 46.0, 47.0, 41.0, 53.0, 60.0, 69.0, 63.0, 68.0, 63.0, 44.0, 46.0, 35.0, 37.0, 31.0, 28.0, 29.0, 20.0, 8.0, 9.0, 11.0, 12.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.5992431640625, -18.036405563354492, -17.473567962646484, -16.910730361938477, -16.34789276123047, -15.785055160522461, -15.222217559814453, -14.659379959106445, -14.096542358398438, -13.53370475769043, -12.970867156982422, -12.408029556274414, -11.845191955566406, -11.282354354858398, -10.71951675415039, -10.156679153442383, -9.593842506408691, -9.031004905700684, -8.468167304992676, -7.905329704284668, -7.34249210357666, -6.779654502868652, -6.216817378997803, -5.653979778289795, -5.091142177581787, -4.528304576873779, -3.9654669761657715, -3.4026296138763428, -2.839792013168335, -2.276954412460327, -1.7141170501708984, -1.1512794494628906, -0.5884418487548828, -0.025604307651519775, 0.5372332334518433, 1.1000707149505615, 1.6629083156585693, 2.225745916366577, 2.788583278656006, 3.3514208793640137, 3.9142584800720215, 4.477096080780029, 5.039933681488037, 5.602770805358887, 6.1656084060668945, 6.728446006774902, 7.29128360748291, 7.854121208190918, 8.416958808898926, 8.979796409606934, 9.542634010314941, 10.10547161102295, 10.668309211730957, 11.231146812438965, 11.793983459472656, 12.356821060180664, 12.919658660888672, 13.48249626159668, 14.045333862304688, 14.608171463012695, 15.171009063720703, 15.733846664428711, 16.29668426513672, 16.859521865844727, 17.422359466552734]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 0.0, 1.0, 2.0, 2.0, 7.0, 13.0, 4.0, 5.0, 14.0, 18.0, 18.0, 16.0, 13.0, 23.0, 29.0, 27.0, 35.0, 34.0, 50.0, 51.0, 48.0, 47.0, 46.0, 54.0, 48.0, 39.0, 51.0, 32.0, 40.0, 45.0, 31.0, 24.0, 36.0, 21.0, 14.0, 7.0, 20.0, 13.0, 10.0, 5.0, 4.0, 3.0, 3.0, 4.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.871850967407227, -17.271791458129883, -16.67173194885254, -16.071670532226562, -15.471611022949219, -14.871551513671875, -14.271492004394531, -13.671432495117188, -13.071372032165527, -12.471312522888184, -11.871252059936523, -11.27119255065918, -10.671133041381836, -10.071072578430176, -9.471013069152832, -8.870952606201172, -8.270893096923828, -7.670833110809326, -7.070773124694824, -6.4707136154174805, -5.8706536293029785, -5.270593643188477, -4.670534133911133, -4.070474147796631, -3.470414161682129, -2.870354175567627, -2.270294427871704, -1.6702345609664917, -1.0701746940612793, -0.47011470794677734, 0.1299450397491455, 0.7300047874450684, 1.3300666809082031, 1.9301265478134155, 2.530186414718628, 3.130246162414551, 3.7303061485290527, 4.330366134643555, 4.930425643920898, 5.5304856300354, 6.130545616149902, 6.730605602264404, 7.330665588378906, 7.93072509765625, 8.530784606933594, 9.130845069885254, 9.730904579162598, 10.330965042114258, 10.931024551391602, 11.531084060668945, 12.131144523620605, 12.73120403289795, 13.33126449584961, 13.931324005126953, 14.531383514404297, 15.13144302368164, 15.7315034866333, 16.33156394958496, 16.931623458862305, 17.53168296813965, 18.131742477416992, 18.73180389404297, 19.331863403320312, 19.931922912597656, 20.531982421875]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 17.0, 26.0, 37.0, 90.0, 130.0, 187.0, 328.0, 594.0, 925.0, 1619.0, 2498.0, 4162.0, 6696.0, 10928.0, 17160.0, 27099.0, 41124.0, 62619.0, 91985.0, 132055.0, 179879.0, 237172.0, 297296.0, 352547.0, 390698.0, 406870.0, 395603.0, 360604.0, 307524.0, 248377.0, 190261.0, 138978.0, 97723.0, 67057.0, 45006.0, 29376.0, 18832.0, 11915.0, 7392.0, 4375.0, 2604.0, 1613.0, 949.0, 583.0, 343.0, 178.0, 113.0, 70.0, 33.0, 27.0, 7.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-9.859375, -9.556884765625, -9.25439453125, -8.951904296875, -8.6494140625, -8.346923828125, -8.04443359375, -7.741943359375, -7.439453125, -7.136962890625, -6.83447265625, -6.531982421875, -6.2294921875, -5.927001953125, -5.62451171875, -5.322021484375, -5.01953125, -4.717041015625, -4.41455078125, -4.112060546875, -3.8095703125, -3.507080078125, -3.20458984375, -2.902099609375, -2.599609375, -2.297119140625, -1.99462890625, -1.692138671875, -1.3896484375, -1.087158203125, -0.78466796875, -0.482177734375, -0.1796875, 0.122802734375, 0.42529296875, 0.727783203125, 1.0302734375, 1.332763671875, 1.63525390625, 1.937744140625, 2.240234375, 2.542724609375, 2.84521484375, 3.147705078125, 3.4501953125, 3.752685546875, 4.05517578125, 4.357666015625, 4.66015625, 4.962646484375, 5.26513671875, 5.567626953125, 5.8701171875, 6.172607421875, 6.47509765625, 6.777587890625, 7.080078125, 7.382568359375, 7.68505859375, 7.987548828125, 8.2900390625, 8.592529296875, 8.89501953125, 9.197509765625, 9.5]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 0.0, 5.0, 4.0, 6.0, 4.0, 7.0, 6.0, 9.0, 8.0, 13.0, 15.0, 20.0, 25.0, 29.0, 20.0, 48.0, 31.0, 35.0, 47.0, 47.0, 64.0, 45.0, 50.0, 50.0, 39.0, 44.0, 45.0, 42.0, 42.0, 32.0, 20.0, 33.0, 21.0, 23.0, 22.0, 7.0, 13.0, 8.0, 12.0, 9.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.828125, -14.339111328125, -13.85009765625, -13.361083984375, -12.8720703125, -12.383056640625, -11.89404296875, -11.405029296875, -10.916015625, -10.427001953125, -9.93798828125, -9.448974609375, -8.9599609375, -8.470947265625, -7.98193359375, -7.492919921875, -7.00390625, -6.514892578125, -6.02587890625, -5.536865234375, -5.0478515625, -4.558837890625, -4.06982421875, -3.580810546875, -3.091796875, -2.602783203125, -2.11376953125, -1.624755859375, -1.1357421875, -0.646728515625, -0.15771484375, 0.331298828125, 0.8203125, 1.309326171875, 1.79833984375, 2.287353515625, 2.7763671875, 3.265380859375, 3.75439453125, 4.243408203125, 4.732421875, 5.221435546875, 5.71044921875, 6.199462890625, 6.6884765625, 7.177490234375, 7.66650390625, 8.155517578125, 8.64453125, 9.133544921875, 9.62255859375, 10.111572265625, 10.6005859375, 11.089599609375, 11.57861328125, 12.067626953125, 12.556640625, 13.045654296875, 13.53466796875, 14.023681640625, 14.5126953125, 15.001708984375, 15.49072265625, 15.979736328125, 16.46875]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 4.0, 1.0, 10.0, 13.0, 26.0, 32.0, 79.0, 117.0, 238.0, 371.0, 589.0, 998.0, 1865.0, 2979.0, 5077.0, 8205.0, 13124.0, 21008.0, 32613.0, 48783.0, 72960.0, 102716.0, 142112.0, 186394.0, 237821.0, 286686.0, 330217.0, 360527.0, 373490.0, 366472.0, 340812.0, 299855.0, 252942.0, 201233.0, 155105.0, 113235.0, 80920.0, 55397.0, 36789.0, 23795.0, 15153.0, 9340.0, 5759.0, 3373.0, 2181.0, 1205.0, 726.0, 403.0, 239.0, 135.0, 69.0, 56.0, 28.0, 12.0, 7.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-9.8671875, -9.56494140625, -9.2626953125, -8.96044921875, -8.658203125, -8.35595703125, -8.0537109375, -7.75146484375, -7.44921875, -7.14697265625, -6.8447265625, -6.54248046875, -6.240234375, -5.93798828125, -5.6357421875, -5.33349609375, -5.03125, -4.72900390625, -4.4267578125, -4.12451171875, -3.822265625, -3.52001953125, -3.2177734375, -2.91552734375, -2.61328125, -2.31103515625, -2.0087890625, -1.70654296875, -1.404296875, -1.10205078125, -0.7998046875, -0.49755859375, -0.1953125, 0.10693359375, 0.4091796875, 0.71142578125, 1.013671875, 1.31591796875, 1.6181640625, 1.92041015625, 2.22265625, 2.52490234375, 2.8271484375, 3.12939453125, 3.431640625, 3.73388671875, 4.0361328125, 4.33837890625, 4.640625, 4.94287109375, 5.2451171875, 5.54736328125, 5.849609375, 6.15185546875, 6.4541015625, 6.75634765625, 7.05859375, 7.36083984375, 7.6630859375, 7.96533203125, 8.267578125, 8.56982421875, 8.8720703125, 9.17431640625, 9.4765625]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 4.0, 5.0, 7.0, 8.0, 11.0, 12.0, 14.0, 23.0, 23.0, 30.0, 59.0, 60.0, 59.0, 72.0, 97.0, 79.0, 111.0, 141.0, 143.0, 160.0, 175.0, 179.0, 197.0, 181.0, 191.0, 201.0, 185.0, 177.0, 191.0, 155.0, 169.0, 150.0, 108.0, 102.0, 100.0, 97.0, 64.0, 67.0, 55.0, 46.0, 41.0, 30.0, 24.0, 21.0, 14.0, 8.0, 7.0, 10.0, 4.0, 5.0, 4.0, 0.0, 4.0, 2.0, 3.0], "bins": [-6.37890625, -6.1907958984375, -6.002685546875, -5.8145751953125, -5.62646484375, -5.4383544921875, -5.250244140625, -5.0621337890625, -4.8740234375, -4.6859130859375, -4.497802734375, -4.3096923828125, -4.12158203125, -3.9334716796875, -3.745361328125, -3.5572509765625, -3.369140625, -3.1810302734375, -2.992919921875, -2.8048095703125, -2.61669921875, -2.4285888671875, -2.240478515625, -2.0523681640625, -1.8642578125, -1.6761474609375, -1.488037109375, -1.2999267578125, -1.11181640625, -0.9237060546875, -0.735595703125, -0.5474853515625, -0.359375, -0.1712646484375, 0.016845703125, 0.2049560546875, 0.39306640625, 0.5811767578125, 0.769287109375, 0.9573974609375, 1.1455078125, 1.3336181640625, 1.521728515625, 1.7098388671875, 1.89794921875, 2.0860595703125, 2.274169921875, 2.4622802734375, 2.650390625, 2.8385009765625, 3.026611328125, 3.2147216796875, 3.40283203125, 3.5909423828125, 3.779052734375, 3.9671630859375, 4.1552734375, 4.3433837890625, 4.531494140625, 4.7196044921875, 4.90771484375, 5.0958251953125, 5.283935546875, 5.4720458984375, 5.66015625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 8.0, 10.0, 5.0, 14.0, 8.0, 21.0, 16.0, 17.0, 25.0, 36.0, 28.0, 35.0, 40.0, 43.0, 39.0, 51.0, 52.0, 57.0, 47.0, 52.0, 56.0, 34.0, 53.0, 50.0, 31.0, 25.0, 32.0, 25.0, 18.0, 11.0, 19.0, 9.0, 16.0, 7.0, 4.0, 1.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.374584197998047, -14.856935501098633, -14.339285850524902, -13.821637153625488, -13.303987503051758, -12.786338806152344, -12.26869010925293, -11.7510404586792, -11.233390808105469, -10.715742111206055, -10.198092460632324, -9.68044376373291, -9.16279411315918, -8.645145416259766, -8.127496719360352, -7.609847068786621, -7.092198371887207, -6.574549198150635, -6.0569000244140625, -5.539251327514648, -5.021601676940918, -4.503952980041504, -3.9863038063049316, -3.4686546325683594, -2.951005458831787, -2.433356285095215, -1.9157072305679321, -1.3980581760406494, -0.8804090023040771, -0.3627598285675049, 0.15488910675048828, 0.6725382804870605, 1.1901874542236328, 1.707836627960205, 2.2254858016967773, 2.7431347370147705, 3.2607839107513428, 3.778433084487915, 4.296082019805908, 4.8137311935424805, 5.331380367279053, 5.849029541015625, 6.366678714752197, 6.8843278884887695, 7.401976585388184, 7.919626235961914, 8.437274932861328, 8.954923629760742, 9.472573280334473, 9.990221977233887, 10.507871627807617, 11.025520324707031, 11.543169975280762, 12.060818672180176, 12.578468322753906, 13.09611701965332, 13.613765716552734, 14.131414413452148, 14.649064064025879, 15.166712760925293, 15.684362411499023, 16.202011108398438, 16.71965980529785, 17.237308502197266, 17.754959106445312]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 6.0, 3.0, 4.0, 12.0, 12.0, 18.0, 10.0, 13.0, 12.0, 23.0, 27.0, 29.0, 41.0, 39.0, 32.0, 39.0, 53.0, 42.0, 54.0, 44.0, 49.0, 54.0, 48.0, 43.0, 33.0, 38.0, 37.0, 35.0, 26.0, 15.0, 18.0, 20.0, 17.0, 12.0, 12.0, 8.0, 10.0, 8.0, 5.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.725248336791992, -17.14628791809082, -16.56732749938965, -15.988367080688477, -15.409406661987305, -14.830446243286133, -14.251485824584961, -13.672525405883789, -13.093564987182617, -12.514604568481445, -11.935644149780273, -11.356683731079102, -10.77772331237793, -10.198762893676758, -9.619802474975586, -9.040842056274414, -8.461881637573242, -7.88292121887207, -7.303960800170898, -6.725000381469727, -6.146039962768555, -5.567079544067383, -4.988119125366211, -4.409158706665039, -3.830198287963867, -3.2512378692626953, -2.6722774505615234, -2.0933170318603516, -1.5143566131591797, -0.9353961944580078, -0.35643577575683594, 0.22252464294433594, 0.8014850616455078, 1.3804454803466797, 1.9594058990478516, 2.5383663177490234, 3.1173267364501953, 3.696287155151367, 4.275247573852539, 4.854207992553711, 5.433168411254883, 6.012128829956055, 6.591089248657227, 7.170049667358398, 7.74901008605957, 8.327970504760742, 8.906930923461914, 9.485891342163086, 10.064851760864258, 10.64381217956543, 11.222772598266602, 11.801733016967773, 12.380693435668945, 12.959653854370117, 13.538614273071289, 14.117574691772461, 14.696535110473633, 15.275495529174805, 15.854455947875977, 16.43341636657715, 17.01237678527832, 17.591337203979492, 18.170297622680664, 18.749258041381836, 19.328218460083008]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 9.0, 9.0, 9.0, 23.0, 28.0, 39.0, 72.0, 129.0, 209.0, 316.0, 460.0, 720.0, 1153.0, 1849.0, 2802.0, 4400.0, 7222.0, 11705.0, 18266.0, 29523.0, 46542.0, 72185.0, 105084.0, 140463.0, 156603.0, 141083.0, 106570.0, 73533.0, 47459.0, 29954.0, 18923.0, 11584.0, 7224.0, 4650.0, 2770.0, 1767.0, 1153.0, 744.0, 493.0, 293.0, 198.0, 129.0, 95.0, 49.0, 25.0, 20.0, 11.0, 10.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.71875, -2.63763427734375, -2.5565185546875, -2.47540283203125, -2.394287109375, -2.31317138671875, -2.2320556640625, -2.15093994140625, -2.06982421875, -1.98870849609375, -1.9075927734375, -1.82647705078125, -1.745361328125, -1.66424560546875, -1.5831298828125, -1.50201416015625, -1.4208984375, -1.33978271484375, -1.2586669921875, -1.17755126953125, -1.096435546875, -1.01531982421875, -0.9342041015625, -0.85308837890625, -0.77197265625, -0.69085693359375, -0.6097412109375, -0.52862548828125, -0.447509765625, -0.36639404296875, -0.2852783203125, -0.20416259765625, -0.123046875, -0.04193115234375, 0.0391845703125, 0.12030029296875, 0.201416015625, 0.28253173828125, 0.3636474609375, 0.44476318359375, 0.52587890625, 0.60699462890625, 0.6881103515625, 0.76922607421875, 0.850341796875, 0.93145751953125, 1.0125732421875, 1.09368896484375, 1.1748046875, 1.25592041015625, 1.3370361328125, 1.41815185546875, 1.499267578125, 1.58038330078125, 1.6614990234375, 1.74261474609375, 1.82373046875, 1.90484619140625, 1.9859619140625, 2.06707763671875, 2.148193359375, 2.22930908203125, 2.3104248046875, 2.39154052734375, 2.47265625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 7.0, 3.0, 6.0, 9.0, 7.0, 8.0, 14.0, 14.0, 18.0, 19.0, 21.0, 30.0, 32.0, 37.0, 35.0, 48.0, 41.0, 43.0, 50.0, 51.0, 44.0, 43.0, 47.0, 58.0, 36.0, 35.0, 33.0, 30.0, 27.0, 20.0, 33.0, 28.0, 12.0, 16.0, 10.0, 7.0, 11.0, 8.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.828125, -17.235595703125, -16.64306640625, -16.050537109375, -15.4580078125, -14.865478515625, -14.27294921875, -13.680419921875, -13.087890625, -12.495361328125, -11.90283203125, -11.310302734375, -10.7177734375, -10.125244140625, -9.53271484375, -8.940185546875, -8.34765625, -7.755126953125, -7.16259765625, -6.570068359375, -5.9775390625, -5.385009765625, -4.79248046875, -4.199951171875, -3.607421875, -3.014892578125, -2.42236328125, -1.829833984375, -1.2373046875, -0.644775390625, -0.05224609375, 0.540283203125, 1.1328125, 1.725341796875, 2.31787109375, 2.910400390625, 3.5029296875, 4.095458984375, 4.68798828125, 5.280517578125, 5.873046875, 6.465576171875, 7.05810546875, 7.650634765625, 8.2431640625, 8.835693359375, 9.42822265625, 10.020751953125, 10.61328125, 11.205810546875, 11.79833984375, 12.390869140625, 12.9833984375, 13.575927734375, 14.16845703125, 14.760986328125, 15.353515625, 15.946044921875, 16.53857421875, 17.131103515625, 17.7236328125, 18.316162109375, 18.90869140625, 19.501220703125, 20.09375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 10.0, 9.0, 13.0, 30.0, 33.0, 62.0, 78.0, 94.0, 168.0, 277.0, 374.0, 580.0, 943.0, 1417.0, 2203.0, 3224.0, 4977.0, 7682.0, 11988.0, 18282.0, 28983.0, 43959.0, 64437.0, 90665.0, 117510.0, 136148.0, 135174.0, 114243.0, 86526.0, 61511.0, 41110.0, 27008.0, 17240.0, 11104.0, 7167.0, 4586.0, 2941.0, 1964.0, 1262.0, 871.0, 574.0, 377.0, 244.0, 169.0, 92.0, 97.0, 44.0, 42.0, 21.0, 14.0, 13.0, 4.0, 9.0, 4.0, 1.0, 2.0, 2.0], "bins": [-2.431640625, -2.3577880859375, -2.283935546875, -2.2100830078125, -2.13623046875, -2.0623779296875, -1.988525390625, -1.9146728515625, -1.8408203125, -1.7669677734375, -1.693115234375, -1.6192626953125, -1.54541015625, -1.4715576171875, -1.397705078125, -1.3238525390625, -1.25, -1.1761474609375, -1.102294921875, -1.0284423828125, -0.95458984375, -0.8807373046875, -0.806884765625, -0.7330322265625, -0.6591796875, -0.5853271484375, -0.511474609375, -0.4376220703125, -0.36376953125, -0.2899169921875, -0.216064453125, -0.1422119140625, -0.068359375, 0.0054931640625, 0.079345703125, 0.1531982421875, 0.22705078125, 0.3009033203125, 0.374755859375, 0.4486083984375, 0.5224609375, 0.5963134765625, 0.670166015625, 0.7440185546875, 0.81787109375, 0.8917236328125, 0.965576171875, 1.0394287109375, 1.11328125, 1.1871337890625, 1.260986328125, 1.3348388671875, 1.40869140625, 1.4825439453125, 1.556396484375, 1.6302490234375, 1.7041015625, 1.7779541015625, 1.851806640625, 1.9256591796875, 1.99951171875, 2.0733642578125, 2.147216796875, 2.2210693359375, 2.294921875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 5.0, 3.0, 1.0, 2.0, 8.0, 2.0, 6.0, 10.0, 7.0, 10.0, 3.0, 11.0, 13.0, 10.0, 13.0, 21.0, 26.0, 24.0, 25.0, 33.0, 19.0, 24.0, 36.0, 27.0, 42.0, 40.0, 29.0, 42.0, 29.0, 37.0, 37.0, 21.0, 47.0, 43.0, 30.0, 38.0, 36.0, 22.0, 27.0, 19.0, 20.0, 18.0, 16.0, 20.0, 7.0, 11.0, 4.0, 10.0, 9.0, 6.0, 2.0, 6.0, 2.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.765625, -9.451904296875, -9.13818359375, -8.824462890625, -8.5107421875, -8.197021484375, -7.88330078125, -7.569580078125, -7.255859375, -6.942138671875, -6.62841796875, -6.314697265625, -6.0009765625, -5.687255859375, -5.37353515625, -5.059814453125, -4.74609375, -4.432373046875, -4.11865234375, -3.804931640625, -3.4912109375, -3.177490234375, -2.86376953125, -2.550048828125, -2.236328125, -1.922607421875, -1.60888671875, -1.295166015625, -0.9814453125, -0.667724609375, -0.35400390625, -0.040283203125, 0.2734375, 0.587158203125, 0.90087890625, 1.214599609375, 1.5283203125, 1.842041015625, 2.15576171875, 2.469482421875, 2.783203125, 3.096923828125, 3.41064453125, 3.724365234375, 4.0380859375, 4.351806640625, 4.66552734375, 4.979248046875, 5.29296875, 5.606689453125, 5.92041015625, 6.234130859375, 6.5478515625, 6.861572265625, 7.17529296875, 7.489013671875, 7.802734375, 8.116455078125, 8.43017578125, 8.743896484375, 9.0576171875, 9.371337890625, 9.68505859375, 9.998779296875, 10.3125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 5.0, 6.0, 5.0, 9.0, 14.0, 18.0, 12.0, 31.0, 34.0, 36.0, 52.0, 56.0, 86.0, 92.0, 94.0, 155.0, 178.0, 210.0, 296.0, 410.0, 560.0, 836.0, 1239.0, 2233.0, 4446.0, 11282.0, 34994.0, 133127.0, 384414.0, 327399.0, 99560.0, 27387.0, 9319.0, 3884.0, 2006.0, 1125.0, 777.0, 513.0, 378.0, 288.0, 214.0, 162.0, 156.0, 104.0, 92.0, 62.0, 44.0, 41.0, 28.0, 25.0, 16.0, 14.0, 12.0, 14.0, 3.0, 2.0, 8.0, 3.0, 1.0, 2.0, 2.0], "bins": [-0.7333984375, -0.7104034423828125, -0.687408447265625, -0.6644134521484375, -0.64141845703125, -0.6184234619140625, -0.595428466796875, -0.5724334716796875, -0.5494384765625, -0.5264434814453125, -0.503448486328125, -0.4804534912109375, -0.45745849609375, -0.4344635009765625, -0.411468505859375, -0.3884735107421875, -0.365478515625, -0.3424835205078125, -0.319488525390625, -0.2964935302734375, -0.27349853515625, -0.2505035400390625, -0.227508544921875, -0.2045135498046875, -0.1815185546875, -0.1585235595703125, -0.135528564453125, -0.1125335693359375, -0.08953857421875, -0.0665435791015625, -0.043548583984375, -0.0205535888671875, 0.00244140625, 0.0254364013671875, 0.048431396484375, 0.0714263916015625, 0.09442138671875, 0.1174163818359375, 0.140411376953125, 0.1634063720703125, 0.1864013671875, 0.2093963623046875, 0.232391357421875, 0.2553863525390625, 0.27838134765625, 0.3013763427734375, 0.324371337890625, 0.3473663330078125, 0.370361328125, 0.3933563232421875, 0.416351318359375, 0.4393463134765625, 0.46234130859375, 0.4853363037109375, 0.508331298828125, 0.5313262939453125, 0.5543212890625, 0.5773162841796875, 0.600311279296875, 0.6233062744140625, 0.64630126953125, 0.6692962646484375, 0.692291259765625, 0.7152862548828125, 0.73828125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 6.0, 10.0, 12.0, 18.0, 37.0, 35.0, 53.0, 73.0, 107.0, 107.0, 114.0, 122.0, 87.0, 81.0, 50.0, 28.0, 17.0, 20.0, 8.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.189678192138672e-05, -7.908884435892105e-05, -7.628090679645538e-05, -7.347296923398972e-05, -7.066503167152405e-05, -6.785709410905838e-05, -6.504915654659271e-05, -6.224121898412704e-05, -5.943328142166138e-05, -5.662534385919571e-05, -5.381740629673004e-05, -5.1009468734264374e-05, -4.8201531171798706e-05, -4.539359360933304e-05, -4.258565604686737e-05, -3.97777184844017e-05, -3.6969780921936035e-05, -3.416184335947037e-05, -3.13539057970047e-05, -2.8545968234539032e-05, -2.5738030672073364e-05, -2.2930093109607697e-05, -2.012215554714203e-05, -1.731421798467636e-05, -1.4506280422210693e-05, -1.1698342859745026e-05, -8.890405297279358e-06, -6.08246773481369e-06, -3.2745301723480225e-06, -4.6659260988235474e-07, 2.341344952583313e-06, 5.149282515048981e-06, 7.957220077514648e-06, 1.0765157639980316e-05, 1.3573095202445984e-05, 1.638103276491165e-05, 1.918897032737732e-05, 2.1996907889842987e-05, 2.4804845452308655e-05, 2.7612783014774323e-05, 3.042072057723999e-05, 3.322865813970566e-05, 3.6036595702171326e-05, 3.8844533264636993e-05, 4.165247082710266e-05, 4.446040838956833e-05, 4.7268345952033997e-05, 5.0076283514499664e-05, 5.288422107696533e-05, 5.5692158639431e-05, 5.850009620189667e-05, 6.130803376436234e-05, 6.4115971326828e-05, 6.692390888929367e-05, 6.973184645175934e-05, 7.2539784014225e-05, 7.534772157669067e-05, 7.815565913915634e-05, 8.096359670162201e-05, 8.377153426408768e-05, 8.657947182655334e-05, 8.938740938901901e-05, 9.219534695148468e-05, 9.500328451395035e-05, 9.781122207641602e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 2.0, 3.0, 4.0, 3.0, 6.0, 21.0, 25.0, 30.0, 47.0, 53.0, 86.0, 120.0, 162.0, 233.0, 349.0, 493.0, 752.0, 1140.0, 1896.0, 3049.0, 5352.0, 9559.0, 17340.0, 34266.0, 68869.0, 138628.0, 237377.0, 239910.0, 141206.0, 70877.0, 35108.0, 17952.0, 9640.0, 5298.0, 3162.0, 1856.0, 1237.0, 780.0, 512.0, 362.0, 249.0, 160.0, 110.0, 80.0, 53.0, 34.0, 43.0, 20.0, 10.0, 8.0, 12.0, 6.0, 7.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.74658203125, -0.721710205078125, -0.69683837890625, -0.671966552734375, -0.6470947265625, -0.622222900390625, -0.59735107421875, -0.572479248046875, -0.547607421875, -0.522735595703125, -0.49786376953125, -0.472991943359375, -0.4481201171875, -0.423248291015625, -0.39837646484375, -0.373504638671875, -0.3486328125, -0.323760986328125, -0.29888916015625, -0.274017333984375, -0.2491455078125, -0.224273681640625, -0.19940185546875, -0.174530029296875, -0.149658203125, -0.124786376953125, -0.09991455078125, -0.075042724609375, -0.0501708984375, -0.025299072265625, -0.00042724609375, 0.024444580078125, 0.04931640625, 0.074188232421875, 0.09906005859375, 0.123931884765625, 0.1488037109375, 0.173675537109375, 0.19854736328125, 0.223419189453125, 0.248291015625, 0.273162841796875, 0.29803466796875, 0.322906494140625, 0.3477783203125, 0.372650146484375, 0.39752197265625, 0.422393798828125, 0.447265625, 0.472137451171875, 0.49700927734375, 0.521881103515625, 0.5467529296875, 0.571624755859375, 0.59649658203125, 0.621368408203125, 0.646240234375, 0.671112060546875, 0.69598388671875, 0.720855712890625, 0.7457275390625, 0.770599365234375, 0.79547119140625, 0.820343017578125, 0.84521484375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 6.0, 0.0, 2.0, 2.0, 10.0, 4.0, 10.0, 6.0, 16.0, 6.0, 20.0, 23.0, 22.0, 40.0, 41.0, 44.0, 65.0, 55.0, 65.0, 81.0, 76.0, 57.0, 69.0, 48.0, 38.0, 42.0, 31.0, 24.0, 21.0, 13.0, 10.0, 14.0, 4.0, 13.0, 4.0, 4.0, 5.0, 3.0, 3.0, 3.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.257568359375, -0.24787521362304688, -0.23818206787109375, -0.22848892211914062, -0.2187957763671875, -0.20910263061523438, -0.19940948486328125, -0.18971633911132812, -0.180023193359375, -0.17033004760742188, -0.16063690185546875, -0.15094375610351562, -0.1412506103515625, -0.13155746459960938, -0.12186431884765625, -0.11217117309570312, -0.10247802734375, -0.09278488159179688, -0.08309173583984375, -0.07339859008789062, -0.0637054443359375, -0.054012298583984375, -0.04431915283203125, -0.034626007080078125, -0.024932861328125, -0.015239715576171875, -0.00554656982421875, 0.004146575927734375, 0.0138397216796875, 0.023532867431640625, 0.03322601318359375, 0.042919158935546875, 0.0526123046875, 0.062305450439453125, 0.07199859619140625, 0.08169174194335938, 0.0913848876953125, 0.10107803344726562, 0.11077117919921875, 0.12046432495117188, 0.130157470703125, 0.13985061645507812, 0.14954376220703125, 0.15923690795898438, 0.1689300537109375, 0.17862319946289062, 0.18831634521484375, 0.19800949096679688, 0.20770263671875, 0.21739578247070312, 0.22708892822265625, 0.23678207397460938, 0.2464752197265625, 0.2561683654785156, 0.26586151123046875, 0.2755546569824219, 0.285247802734375, 0.2949409484863281, 0.30463409423828125, 0.3143272399902344, 0.3240203857421875, 0.3337135314941406, 0.34340667724609375, 0.3530998229980469, 0.36279296875]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 6.0, 6.0, 8.0, 8.0, 14.0, 12.0, 18.0, 20.0, 15.0, 26.0, 36.0, 35.0, 38.0, 35.0, 50.0, 33.0, 53.0, 53.0, 56.0, 45.0, 57.0, 51.0, 38.0, 53.0, 47.0, 23.0, 27.0, 30.0, 25.0, 18.0, 13.0, 14.0, 15.0, 11.0, 5.0, 3.0, 2.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.235774040222168, -14.71944522857666, -14.203116416931152, -13.686787605285645, -13.170458793640137, -12.654129981994629, -12.137802124023438, -11.62147331237793, -11.105144500732422, -10.588815689086914, -10.072486877441406, -9.556158065795898, -9.03982925415039, -8.523500442504883, -8.007171630859375, -7.490843296051025, -6.974514007568359, -6.458185195922852, -5.941856384277344, -5.425527572631836, -4.909198760986328, -4.39286994934082, -3.8765416145324707, -3.360212802886963, -2.843883991241455, -2.3275551795959473, -1.811226487159729, -1.2948977947235107, -0.7785689830780029, -0.2622401714324951, 0.2540884017944336, 0.7704172134399414, 1.2867469787597656, 1.8030757904052734, 2.3194046020507812, 2.83573317527771, 3.3520619869232178, 3.8683907985687256, 4.384719371795654, 4.901048183441162, 5.41737699508667, 5.933705806732178, 6.4500346183776855, 6.966362953186035, 7.482691764831543, 7.999020576477051, 8.515349388122559, 9.031678199768066, 9.548007011413574, 10.064335823059082, 10.58066463470459, 11.096993446350098, 11.613322257995605, 12.129651069641113, 12.645978927612305, 13.162307739257812, 13.67863655090332, 14.194965362548828, 14.711294174194336, 15.227622985839844, 15.743951797485352, 16.26028060913086, 16.776609420776367, 17.292938232421875, 17.809267044067383]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 6.0, 4.0, 4.0, 13.0, 10.0, 19.0, 10.0, 12.0, 13.0, 26.0, 23.0, 27.0, 45.0, 35.0, 35.0, 40.0, 49.0, 43.0, 54.0, 49.0, 45.0, 55.0, 43.0, 43.0, 33.0, 37.0, 38.0, 32.0, 27.0, 20.0, 18.0, 20.0, 16.0, 14.0, 12.0, 7.0, 10.0, 9.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.608219146728516, -17.03321647644043, -16.458213806152344, -15.883211135864258, -15.308208465576172, -14.733205795288086, -14.158204078674316, -13.58320140838623, -13.008198738098145, -12.433196067810059, -11.858193397521973, -11.283190727233887, -10.708189010620117, -10.133186340332031, -9.558183670043945, -8.98318099975586, -8.408178329467773, -7.8331756591796875, -7.258172988891602, -6.683170795440674, -6.108168125152588, -5.533165454864502, -4.958163261413574, -4.383160591125488, -3.8081579208374023, -3.2331552505493164, -2.6581528186798096, -2.0831503868103027, -1.5081477165222168, -0.9331450462341309, -0.358142614364624, 0.2168598175048828, 0.7918643951416016, 1.366866946220398, 1.9418694972991943, 2.516871929168701, 3.091874599456787, 3.666877269744873, 4.241879463195801, 4.816882133483887, 5.391884803771973, 5.966887474060059, 6.5418901443481445, 7.116892337799072, 7.691895008087158, 8.266897201538086, 8.841899871826172, 9.416902542114258, 9.991905212402344, 10.56690788269043, 11.141910552978516, 11.716913223266602, 12.291915893554688, 12.866918563842773, 13.441920280456543, 14.016922950744629, 14.591925621032715, 15.1669282913208, 15.741930961608887, 16.316932678222656, 16.891935348510742, 17.466938018798828, 18.041940689086914, 18.616943359375, 19.191946029663086]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 6.0, 13.0, 17.0, 31.0, 49.0, 84.0, 138.0, 213.0, 367.0, 560.0, 956.0, 1445.0, 2313.0, 3618.0, 5623.0, 8311.0, 12238.0, 18150.0, 25494.0, 35163.0, 46850.0, 59776.0, 72305.0, 84396.0, 92681.0, 95212.0, 92784.0, 85785.0, 73866.0, 61221.0, 48493.0, 36882.0, 26671.0, 18923.0, 13032.0, 8888.0, 5769.0, 3754.0, 2346.0, 1565.0, 996.0, 645.0, 366.0, 226.0, 126.0, 88.0, 44.0, 27.0, 21.0, 18.0, 7.0, 6.0, 2.0, 2.0, 1.0], "bins": [-8.6875, -8.4361572265625, -8.184814453125, -7.9334716796875, -7.68212890625, -7.4307861328125, -7.179443359375, -6.9281005859375, -6.6767578125, -6.4254150390625, -6.174072265625, -5.9227294921875, -5.67138671875, -5.4200439453125, -5.168701171875, -4.9173583984375, -4.666015625, -4.4146728515625, -4.163330078125, -3.9119873046875, -3.66064453125, -3.4093017578125, -3.157958984375, -2.9066162109375, -2.6552734375, -2.4039306640625, -2.152587890625, -1.9012451171875, -1.64990234375, -1.3985595703125, -1.147216796875, -0.8958740234375, -0.64453125, -0.3931884765625, -0.141845703125, 0.1094970703125, 0.36083984375, 0.6121826171875, 0.863525390625, 1.1148681640625, 1.3662109375, 1.6175537109375, 1.868896484375, 2.1202392578125, 2.37158203125, 2.6229248046875, 2.874267578125, 3.1256103515625, 3.376953125, 3.6282958984375, 3.879638671875, 4.1309814453125, 4.38232421875, 4.6336669921875, 4.885009765625, 5.1363525390625, 5.3876953125, 5.6390380859375, 5.890380859375, 6.1417236328125, 6.39306640625, 6.6444091796875, 6.895751953125, 7.1470947265625, 7.3984375]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 11.0, 7.0, 4.0, 8.0, 9.0, 13.0, 20.0, 13.0, 13.0, 28.0, 25.0, 26.0, 25.0, 34.0, 37.0, 46.0, 34.0, 38.0, 55.0, 35.0, 54.0, 43.0, 40.0, 42.0, 42.0, 36.0, 38.0, 29.0, 36.0, 24.0, 21.0, 16.0, 27.0, 13.0, 10.0, 12.0, 10.0, 8.0, 8.0, 2.0, 5.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.84375, -16.28564453125, -15.7275390625, -15.16943359375, -14.611328125, -14.05322265625, -13.4951171875, -12.93701171875, -12.37890625, -11.82080078125, -11.2626953125, -10.70458984375, -10.146484375, -9.58837890625, -9.0302734375, -8.47216796875, -7.9140625, -7.35595703125, -6.7978515625, -6.23974609375, -5.681640625, -5.12353515625, -4.5654296875, -4.00732421875, -3.44921875, -2.89111328125, -2.3330078125, -1.77490234375, -1.216796875, -0.65869140625, -0.1005859375, 0.45751953125, 1.015625, 1.57373046875, 2.1318359375, 2.68994140625, 3.248046875, 3.80615234375, 4.3642578125, 4.92236328125, 5.48046875, 6.03857421875, 6.5966796875, 7.15478515625, 7.712890625, 8.27099609375, 8.8291015625, 9.38720703125, 9.9453125, 10.50341796875, 11.0615234375, 11.61962890625, 12.177734375, 12.73583984375, 13.2939453125, 13.85205078125, 14.41015625, 14.96826171875, 15.5263671875, 16.08447265625, 16.642578125, 17.20068359375, 17.7587890625, 18.31689453125, 18.875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 4.0, 11.0, 13.0, 19.0, 34.0, 74.0, 87.0, 173.0, 311.0, 479.0, 748.0, 1238.0, 2001.0, 3271.0, 5259.0, 8056.0, 12437.0, 18639.0, 27236.0, 38219.0, 52054.0, 67030.0, 81631.0, 94071.0, 101823.0, 102506.0, 96026.0, 84469.0, 69714.0, 54453.0, 40656.0, 28941.0, 19737.0, 13453.0, 8806.0, 5614.0, 3533.0, 2147.0, 1407.0, 841.0, 542.0, 316.0, 191.0, 111.0, 73.0, 41.0, 24.0, 16.0, 14.0, 9.0, 2.0, 1.0, 2.0, 2.0], "bins": [-9.71875, -9.4417724609375, -9.164794921875, -8.8878173828125, -8.61083984375, -8.3338623046875, -8.056884765625, -7.7799072265625, -7.5029296875, -7.2259521484375, -6.948974609375, -6.6719970703125, -6.39501953125, -6.1180419921875, -5.841064453125, -5.5640869140625, -5.287109375, -5.0101318359375, -4.733154296875, -4.4561767578125, -4.17919921875, -3.9022216796875, -3.625244140625, -3.3482666015625, -3.0712890625, -2.7943115234375, -2.517333984375, -2.2403564453125, -1.96337890625, -1.6864013671875, -1.409423828125, -1.1324462890625, -0.85546875, -0.5784912109375, -0.301513671875, -0.0245361328125, 0.25244140625, 0.5294189453125, 0.806396484375, 1.0833740234375, 1.3603515625, 1.6373291015625, 1.914306640625, 2.1912841796875, 2.46826171875, 2.7452392578125, 3.022216796875, 3.2991943359375, 3.576171875, 3.8531494140625, 4.130126953125, 4.4071044921875, 4.68408203125, 4.9610595703125, 5.238037109375, 5.5150146484375, 5.7919921875, 6.0689697265625, 6.345947265625, 6.6229248046875, 6.89990234375, 7.1768798828125, 7.453857421875, 7.7308349609375, 8.0078125]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 2.0, 2.0, 4.0, 7.0, 13.0, 14.0, 16.0, 17.0, 22.0, 26.0, 18.0, 23.0, 38.0, 36.0, 32.0, 51.0, 45.0, 50.0, 42.0, 37.0, 37.0, 50.0, 44.0, 44.0, 49.0, 41.0, 34.0, 18.0, 31.0, 25.0, 20.0, 20.0, 21.0, 20.0, 15.0, 8.0, 7.0, 10.0, 8.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.2421875, -10.896484375, -10.55078125, -10.205078125, -9.859375, -9.513671875, -9.16796875, -8.822265625, -8.4765625, -8.130859375, -7.78515625, -7.439453125, -7.09375, -6.748046875, -6.40234375, -6.056640625, -5.7109375, -5.365234375, -5.01953125, -4.673828125, -4.328125, -3.982421875, -3.63671875, -3.291015625, -2.9453125, -2.599609375, -2.25390625, -1.908203125, -1.5625, -1.216796875, -0.87109375, -0.525390625, -0.1796875, 0.166015625, 0.51171875, 0.857421875, 1.203125, 1.548828125, 1.89453125, 2.240234375, 2.5859375, 2.931640625, 3.27734375, 3.623046875, 3.96875, 4.314453125, 4.66015625, 5.005859375, 5.3515625, 5.697265625, 6.04296875, 6.388671875, 6.734375, 7.080078125, 7.42578125, 7.771484375, 8.1171875, 8.462890625, 8.80859375, 9.154296875, 9.5, 9.845703125, 10.19140625, 10.537109375, 10.8828125]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 9.0, 14.0, 25.0, 52.0, 74.0, 113.0, 183.0, 288.0, 474.0, 768.0, 1292.0, 1981.0, 3080.0, 5082.0, 8177.0, 12622.0, 19392.0, 29477.0, 41516.0, 57425.0, 75010.0, 91465.0, 103860.0, 109592.0, 106993.0, 95929.0, 80514.0, 62869.0, 46381.0, 32674.0, 22172.0, 14251.0, 9205.0, 5943.0, 3629.0, 2268.0, 1407.0, 877.0, 547.0, 332.0, 214.0, 141.0, 74.0, 50.0, 41.0, 27.0, 23.0, 12.0, 5.0, 3.0, 2.0, 1.0, 1.0], "bins": [-3.45703125, -3.357269287109375, -3.25750732421875, -3.157745361328125, -3.0579833984375, -2.958221435546875, -2.85845947265625, -2.758697509765625, -2.658935546875, -2.559173583984375, -2.45941162109375, -2.359649658203125, -2.2598876953125, -2.160125732421875, -2.06036376953125, -1.960601806640625, -1.86083984375, -1.761077880859375, -1.66131591796875, -1.561553955078125, -1.4617919921875, -1.362030029296875, -1.26226806640625, -1.162506103515625, -1.062744140625, -0.962982177734375, -0.86322021484375, -0.763458251953125, -0.6636962890625, -0.563934326171875, -0.46417236328125, -0.364410400390625, -0.2646484375, -0.164886474609375, -0.06512451171875, 0.034637451171875, 0.1343994140625, 0.234161376953125, 0.33392333984375, 0.433685302734375, 0.533447265625, 0.633209228515625, 0.73297119140625, 0.832733154296875, 0.9324951171875, 1.032257080078125, 1.13201904296875, 1.231781005859375, 1.33154296875, 1.431304931640625, 1.53106689453125, 1.630828857421875, 1.7305908203125, 1.830352783203125, 1.93011474609375, 2.029876708984375, 2.129638671875, 2.229400634765625, 2.32916259765625, 2.428924560546875, 2.5286865234375, 2.628448486328125, 2.72821044921875, 2.827972412109375, 2.927734375]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 8.0, 6.0, 10.0, 10.0, 16.0, 12.0, 17.0, 20.0, 27.0, 26.0, 40.0, 34.0, 52.0, 52.0, 54.0, 44.0, 46.0, 54.0, 43.0, 66.0, 54.0, 46.0, 33.0, 43.0, 29.0, 36.0, 19.0, 23.0, 17.0, 16.0, 13.0, 11.0, 7.0, 4.0, 9.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003731250762939453, -0.00035999715328216553, -0.00034686923027038574, -0.00033374130725860596, -0.00032061338424682617, -0.0003074854612350464, -0.0002943575382232666, -0.0002812296152114868, -0.00026810169219970703, -0.00025497376918792725, -0.00024184584617614746, -0.00022871792316436768, -0.0002155900001525879, -0.0002024620771408081, -0.00018933415412902832, -0.00017620623111724854, -0.00016307830810546875, -0.00014995038509368896, -0.00013682246208190918, -0.0001236945390701294, -0.00011056661605834961, -9.743869304656982e-05, -8.431077003479004e-05, -7.118284702301025e-05, -5.805492401123047e-05, -4.4927000999450684e-05, -3.17990779876709e-05, -1.8671154975891113e-05, -5.543231964111328e-06, 7.584691047668457e-06, 2.0712614059448242e-05, 3.384053707122803e-05, 4.696846008300781e-05, 6.00963830947876e-05, 7.322430610656738e-05, 8.635222911834717e-05, 9.948015213012695e-05, 0.00011260807514190674, 0.00012573599815368652, 0.0001388639211654663, 0.0001519918441772461, 0.00016511976718902588, 0.00017824769020080566, 0.00019137561321258545, 0.00020450353622436523, 0.00021763145923614502, 0.0002307593822479248, 0.0002438873052597046, 0.0002570152282714844, 0.00027014315128326416, 0.00028327107429504395, 0.00029639899730682373, 0.0003095269203186035, 0.0003226548433303833, 0.0003357827663421631, 0.00034891068935394287, 0.00036203861236572266, 0.00037516653537750244, 0.0003882944583892822, 0.000401422381401062, 0.0004145503044128418, 0.0004276782274246216, 0.00044080615043640137, 0.00045393407344818115, 0.00046706199645996094]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 4.0, 7.0, 9.0, 9.0, 18.0, 33.0, 69.0, 76.0, 128.0, 191.0, 330.0, 496.0, 866.0, 1416.0, 2398.0, 4015.0, 6724.0, 11014.0, 17838.0, 28873.0, 44328.0, 63711.0, 87031.0, 109280.0, 122514.0, 125235.0, 115357.0, 95393.0, 72011.0, 50617.0, 33786.0, 21419.0, 13298.0, 8033.0, 4678.0, 3012.0, 1646.0, 1082.0, 623.0, 358.0, 208.0, 169.0, 100.0, 52.0, 28.0, 34.0, 22.0, 7.0, 10.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.86328125, -3.7393798828125, -3.615478515625, -3.4915771484375, -3.36767578125, -3.2437744140625, -3.119873046875, -2.9959716796875, -2.8720703125, -2.7481689453125, -2.624267578125, -2.5003662109375, -2.37646484375, -2.2525634765625, -2.128662109375, -2.0047607421875, -1.880859375, -1.7569580078125, -1.633056640625, -1.5091552734375, -1.38525390625, -1.2613525390625, -1.137451171875, -1.0135498046875, -0.8896484375, -0.7657470703125, -0.641845703125, -0.5179443359375, -0.39404296875, -0.2701416015625, -0.146240234375, -0.0223388671875, 0.1015625, 0.2254638671875, 0.349365234375, 0.4732666015625, 0.59716796875, 0.7210693359375, 0.844970703125, 0.9688720703125, 1.0927734375, 1.2166748046875, 1.340576171875, 1.4644775390625, 1.58837890625, 1.7122802734375, 1.836181640625, 1.9600830078125, 2.083984375, 2.2078857421875, 2.331787109375, 2.4556884765625, 2.57958984375, 2.7034912109375, 2.827392578125, 2.9512939453125, 3.0751953125, 3.1990966796875, 3.322998046875, 3.4468994140625, 3.57080078125, 3.6947021484375, 3.818603515625, 3.9425048828125, 4.06640625]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 6.0, 9.0, 8.0, 16.0, 15.0, 20.0, 26.0, 22.0, 31.0, 47.0, 40.0, 49.0, 58.0, 49.0, 51.0, 60.0, 63.0, 66.0, 43.0, 60.0, 53.0, 39.0, 32.0, 33.0, 29.0, 14.0, 17.0, 12.0, 5.0, 14.0, 6.0, 7.0, 2.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-2.439453125, -2.377777099609375, -2.31610107421875, -2.254425048828125, -2.1927490234375, -2.131072998046875, -2.06939697265625, -2.007720947265625, -1.946044921875, -1.884368896484375, -1.82269287109375, -1.761016845703125, -1.6993408203125, -1.637664794921875, -1.57598876953125, -1.514312744140625, -1.45263671875, -1.390960693359375, -1.32928466796875, -1.267608642578125, -1.2059326171875, -1.144256591796875, -1.08258056640625, -1.020904541015625, -0.959228515625, -0.897552490234375, -0.83587646484375, -0.774200439453125, -0.7125244140625, -0.650848388671875, -0.58917236328125, -0.527496337890625, -0.4658203125, -0.404144287109375, -0.34246826171875, -0.280792236328125, -0.2191162109375, -0.157440185546875, -0.09576416015625, -0.034088134765625, 0.027587890625, 0.089263916015625, 0.15093994140625, 0.212615966796875, 0.2742919921875, 0.335968017578125, 0.39764404296875, 0.459320068359375, 0.52099609375, 0.582672119140625, 0.64434814453125, 0.706024169921875, 0.7677001953125, 0.829376220703125, 0.89105224609375, 0.952728271484375, 1.014404296875, 1.076080322265625, 1.13775634765625, 1.199432373046875, 1.2611083984375, 1.322784423828125, 1.38446044921875, 1.446136474609375, 1.5078125]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 6.0, 3.0, 2.0, 10.0, 11.0, 12.0, 11.0, 19.0, 16.0, 15.0, 27.0, 25.0, 37.0, 37.0, 34.0, 25.0, 40.0, 39.0, 45.0, 50.0, 48.0, 44.0, 52.0, 40.0, 52.0, 44.0, 38.0, 34.0, 26.0, 27.0, 22.0, 26.0, 23.0, 14.0, 11.0, 11.0, 10.0, 7.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.720953941345215, -14.254154205322266, -13.787353515625, -13.32055377960205, -12.853754043579102, -12.386953353881836, -11.920153617858887, -11.453353881835938, -10.986553192138672, -10.519753456115723, -10.052952766418457, -9.586153030395508, -9.119353294372559, -8.65255355834961, -8.185752868652344, -7.7189531326293945, -7.252153396606445, -6.785353183746338, -6.318553447723389, -5.851753234863281, -5.384953498840332, -4.918153285980225, -4.451353073120117, -3.984553098678589, -3.5177531242370605, -3.0509531497955322, -2.584153175354004, -2.1173529624938965, -1.6505529880523682, -1.1837530136108398, -0.7169528007507324, -0.2501528263092041, 0.21664714813232422, 0.6834471821784973, 1.1502472162246704, 1.6170473098754883, 2.0838472843170166, 2.550647258758545, 3.0174474716186523, 3.4842474460601807, 3.951047420501709, 4.417847633361816, 4.884647369384766, 5.351447582244873, 5.8182477951049805, 6.28504753112793, 6.751847743988037, 7.2186479568481445, 7.685447692871094, 8.152247428894043, 8.619048118591309, 9.085847854614258, 9.552647590637207, 10.019447326660156, 10.486248016357422, 10.953047752380371, 11.41984748840332, 11.88664722442627, 12.353447914123535, 12.820247650146484, 13.287047386169434, 13.753847122192383, 14.220647811889648, 14.687447547912598, 15.154248237609863]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 6.0, 2.0, 4.0, 7.0, 7.0, 6.0, 7.0, 14.0, 9.0, 17.0, 18.0, 13.0, 21.0, 34.0, 32.0, 28.0, 37.0, 38.0, 47.0, 54.0, 64.0, 30.0, 49.0, 56.0, 43.0, 54.0, 47.0, 37.0, 25.0, 28.0, 26.0, 17.0, 26.0, 31.0, 13.0, 18.0, 16.0, 8.0, 10.0, 5.0, 5.0, 2.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.77967071533203, -17.148536682128906, -16.517404556274414, -15.886271476745605, -15.255138397216797, -14.624004364013672, -13.992871284484863, -13.361738204956055, -12.730605125427246, -12.099472045898438, -11.468338966369629, -10.83720588684082, -10.206071853637695, -9.574939727783203, -8.943805694580078, -8.31267261505127, -7.681539535522461, -7.050406455993652, -6.419273376464844, -5.788139820098877, -5.157006740570068, -4.52587366104126, -3.894740343093872, -3.2636070251464844, -2.632473945617676, -2.001340866088867, -1.3702075481414795, -0.7390743494033813, -0.1079411506652832, 0.5231919288635254, 1.154325246810913, 1.7854585647583008, 2.4165916442871094, 3.047724723815918, 3.6788580417633057, 4.309991359710693, 4.941124439239502, 5.5722575187683105, 6.203391075134277, 6.834524154663086, 7.4656572341918945, 8.096790313720703, 8.727923393249512, 9.35905647277832, 9.990190505981445, 10.621322631835938, 11.252456665039062, 11.883589744567871, 12.51472282409668, 13.145855903625488, 13.776988983154297, 14.408122062683105, 15.039255142211914, 15.670389175415039, 16.30152130126953, 16.932655334472656, 17.56378936767578, 18.194923400878906, 18.8260555267334, 19.457189559936523, 20.088321685791016, 20.71945571899414, 21.350587844848633, 21.981721878051758, 22.61285400390625]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 6.0, 5.0, 17.0, 15.0, 43.0, 93.0, 128.0, 254.0, 400.0, 739.0, 1259.0, 2130.0, 3587.0, 6121.0, 9847.0, 16083.0, 25238.0, 39372.0, 60384.0, 89104.0, 127647.0, 176091.0, 231642.0, 291078.0, 345135.0, 386214.0, 404904.0, 396291.0, 363837.0, 312891.0, 256054.0, 197169.0, 145344.0, 104094.0, 71348.0, 47318.0, 30959.0, 19903.0, 12267.0, 7693.0, 4668.0, 2823.0, 1629.0, 1002.0, 623.0, 360.0, 209.0, 111.0, 70.0, 47.0, 33.0, 8.0, 5.0, 2.0, 0.0, 1.0, 3.0], "bins": [-11.125, -10.794921875, -10.46484375, -10.134765625, -9.8046875, -9.474609375, -9.14453125, -8.814453125, -8.484375, -8.154296875, -7.82421875, -7.494140625, -7.1640625, -6.833984375, -6.50390625, -6.173828125, -5.84375, -5.513671875, -5.18359375, -4.853515625, -4.5234375, -4.193359375, -3.86328125, -3.533203125, -3.203125, -2.873046875, -2.54296875, -2.212890625, -1.8828125, -1.552734375, -1.22265625, -0.892578125, -0.5625, -0.232421875, 0.09765625, 0.427734375, 0.7578125, 1.087890625, 1.41796875, 1.748046875, 2.078125, 2.408203125, 2.73828125, 3.068359375, 3.3984375, 3.728515625, 4.05859375, 4.388671875, 4.71875, 5.048828125, 5.37890625, 5.708984375, 6.0390625, 6.369140625, 6.69921875, 7.029296875, 7.359375, 7.689453125, 8.01953125, 8.349609375, 8.6796875, 9.009765625, 9.33984375, 9.669921875, 10.0]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 6.0, 3.0, 5.0, 4.0, 10.0, 8.0, 14.0, 17.0, 15.0, 11.0, 15.0, 36.0, 19.0, 39.0, 35.0, 32.0, 43.0, 49.0, 55.0, 41.0, 48.0, 55.0, 53.0, 49.0, 37.0, 36.0, 39.0, 38.0, 29.0, 31.0, 11.0, 28.0, 21.0, 21.0, 10.0, 12.0, 10.0, 7.0, 4.0, 3.0, 7.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.609375, -15.087890625, -14.56640625, -14.044921875, -13.5234375, -13.001953125, -12.48046875, -11.958984375, -11.4375, -10.916015625, -10.39453125, -9.873046875, -9.3515625, -8.830078125, -8.30859375, -7.787109375, -7.265625, -6.744140625, -6.22265625, -5.701171875, -5.1796875, -4.658203125, -4.13671875, -3.615234375, -3.09375, -2.572265625, -2.05078125, -1.529296875, -1.0078125, -0.486328125, 0.03515625, 0.556640625, 1.078125, 1.599609375, 2.12109375, 2.642578125, 3.1640625, 3.685546875, 4.20703125, 4.728515625, 5.25, 5.771484375, 6.29296875, 6.814453125, 7.3359375, 7.857421875, 8.37890625, 8.900390625, 9.421875, 9.943359375, 10.46484375, 10.986328125, 11.5078125, 12.029296875, 12.55078125, 13.072265625, 13.59375, 14.115234375, 14.63671875, 15.158203125, 15.6796875, 16.201171875, 16.72265625, 17.244140625, 17.765625]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 6.0, 7.0, 24.0, 32.0, 70.0, 99.0, 201.0, 391.0, 604.0, 1066.0, 1876.0, 3216.0, 5871.0, 9526.0, 15517.0, 25198.0, 39398.0, 60128.0, 88556.0, 125151.0, 171395.0, 222625.0, 276698.0, 325164.0, 363913.0, 383450.0, 382102.0, 359446.0, 320340.0, 270123.0, 217317.0, 164764.0, 120209.0, 85311.0, 57335.0, 37200.0, 23760.0, 14856.0, 8947.0, 5242.0, 3060.0, 1718.0, 1069.0, 563.0, 335.0, 185.0, 102.0, 59.0, 34.0, 10.0, 11.0, 6.0, 5.0, 1.0], "bins": [-12.328125, -11.985107421875, -11.64208984375, -11.299072265625, -10.9560546875, -10.613037109375, -10.27001953125, -9.927001953125, -9.583984375, -9.240966796875, -8.89794921875, -8.554931640625, -8.2119140625, -7.868896484375, -7.52587890625, -7.182861328125, -6.83984375, -6.496826171875, -6.15380859375, -5.810791015625, -5.4677734375, -5.124755859375, -4.78173828125, -4.438720703125, -4.095703125, -3.752685546875, -3.40966796875, -3.066650390625, -2.7236328125, -2.380615234375, -2.03759765625, -1.694580078125, -1.3515625, -1.008544921875, -0.66552734375, -0.322509765625, 0.0205078125, 0.363525390625, 0.70654296875, 1.049560546875, 1.392578125, 1.735595703125, 2.07861328125, 2.421630859375, 2.7646484375, 3.107666015625, 3.45068359375, 3.793701171875, 4.13671875, 4.479736328125, 4.82275390625, 5.165771484375, 5.5087890625, 5.851806640625, 6.19482421875, 6.537841796875, 6.880859375, 7.223876953125, 7.56689453125, 7.909912109375, 8.2529296875, 8.595947265625, 8.93896484375, 9.281982421875, 9.625]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 3.0, 5.0, 5.0, 10.0, 11.0, 15.0, 16.0, 24.0, 34.0, 29.0, 29.0, 58.0, 60.0, 87.0, 107.0, 101.0, 129.0, 138.0, 133.0, 153.0, 160.0, 166.0, 188.0, 183.0, 212.0, 193.0, 213.0, 154.0, 168.0, 176.0, 146.0, 156.0, 137.0, 109.0, 96.0, 82.0, 80.0, 71.0, 43.0, 30.0, 36.0, 25.0, 23.0, 23.0, 12.0, 15.0, 8.0, 5.0, 6.0, 3.0, 6.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-6.5, -6.29461669921875, -6.0892333984375, -5.88385009765625, -5.678466796875, -5.47308349609375, -5.2677001953125, -5.06231689453125, -4.85693359375, -4.65155029296875, -4.4461669921875, -4.24078369140625, -4.035400390625, -3.83001708984375, -3.6246337890625, -3.41925048828125, -3.2138671875, -3.00848388671875, -2.8031005859375, -2.59771728515625, -2.392333984375, -2.18695068359375, -1.9815673828125, -1.77618408203125, -1.57080078125, -1.36541748046875, -1.1600341796875, -0.95465087890625, -0.749267578125, -0.54388427734375, -0.3385009765625, -0.13311767578125, 0.072265625, 0.27764892578125, 0.4830322265625, 0.68841552734375, 0.893798828125, 1.09918212890625, 1.3045654296875, 1.50994873046875, 1.71533203125, 1.92071533203125, 2.1260986328125, 2.33148193359375, 2.536865234375, 2.74224853515625, 2.9476318359375, 3.15301513671875, 3.3583984375, 3.56378173828125, 3.7691650390625, 3.97454833984375, 4.179931640625, 4.38531494140625, 4.5906982421875, 4.79608154296875, 5.00146484375, 5.20684814453125, 5.4122314453125, 5.61761474609375, 5.822998046875, 6.02838134765625, 6.2337646484375, 6.43914794921875, 6.64453125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 6.0, 11.0, 8.0, 9.0, 9.0, 15.0, 21.0, 30.0, 23.0, 23.0, 41.0, 35.0, 36.0, 42.0, 44.0, 42.0, 47.0, 61.0, 42.0, 45.0, 45.0, 48.0, 41.0, 29.0, 35.0, 32.0, 28.0, 31.0, 17.0, 29.0, 14.0, 14.0, 15.0, 8.0, 6.0, 6.0, 3.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.612018585205078, -17.076082229614258, -16.540143966674805, -16.004207611083984, -15.468269348144531, -14.932332992553711, -14.396395683288574, -13.860458374023438, -13.3245210647583, -12.788583755493164, -12.252646446228027, -11.71670913696289, -11.18077278137207, -10.644834518432617, -10.108898162841797, -9.57296085357666, -9.037023544311523, -8.501086235046387, -7.96514892578125, -7.4292120933532715, -6.893274784088135, -6.357337474822998, -5.8214006423950195, -5.285463333129883, -4.749526023864746, -4.213588714599609, -3.6776516437530518, -3.141714572906494, -2.6057772636413574, -2.0698399543762207, -1.533902883529663, -0.9979658126831055, -0.46203041076660156, 0.0739067792892456, 0.6098439693450928, 1.14578115940094, 1.681718349456787, 2.217655658721924, 2.7535927295684814, 3.289529800415039, 3.825467109680176, 4.3614044189453125, 4.897341728210449, 5.433278560638428, 5.9692158699035645, 6.505153179168701, 7.04109001159668, 7.577027320861816, 8.112964630126953, 8.64890193939209, 9.184839248657227, 9.720776557922363, 10.2567138671875, 10.79265022277832, 11.328587532043457, 11.864524841308594, 12.40046215057373, 12.936399459838867, 13.472336769104004, 14.00827407836914, 14.544210433959961, 15.080148696899414, 15.616085052490234, 16.152023315429688, 16.687959671020508]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 6.0, 5.0, 6.0, 3.0, 7.0, 9.0, 11.0, 14.0, 21.0, 25.0, 27.0, 30.0, 32.0, 32.0, 38.0, 43.0, 49.0, 39.0, 42.0, 53.0, 59.0, 52.0, 55.0, 47.0, 42.0, 33.0, 39.0, 42.0, 26.0, 24.0, 18.0, 20.0, 17.0, 11.0, 7.0, 7.0, 7.0, 3.0, 6.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.404544830322266, -18.736053466796875, -18.067562103271484, -17.399070739746094, -16.730579376220703, -16.062088012695312, -15.393597602844238, -14.725106239318848, -14.056614875793457, -13.388123512268066, -12.719632148742676, -12.051141738891602, -11.382650375366211, -10.71415901184082, -10.04566764831543, -9.377176284790039, -8.708684921264648, -8.040193557739258, -7.371702194213867, -6.703211307525635, -6.034719944000244, -5.3662285804748535, -4.697737693786621, -4.0292463302612305, -3.36075496673584, -2.692263603210449, -2.0237724781036377, -1.3552813529968262, -0.6867899894714355, -0.018298625946044922, 0.6501922607421875, 1.3186836242675781, 1.987173080444336, 2.6556644439697266, 3.324155569076538, 3.9926466941833496, 4.66113805770874, 5.329629421234131, 5.998120307922363, 6.666611671447754, 7.3351030349731445, 8.003594398498535, 8.672085762023926, 9.340576171875, 10.00906753540039, 10.677558898925781, 11.346050262451172, 12.014541625976562, 12.683032989501953, 13.351524353027344, 14.020015716552734, 14.688507080078125, 15.356998443603516, 16.025489807128906, 16.693981170654297, 17.362472534179688, 18.030963897705078, 18.69945526123047, 19.36794662475586, 20.03643798828125, 20.70492935180664, 21.37342071533203, 22.041912078857422, 22.710403442382812, 23.37889289855957]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 4.0, 8.0, 18.0, 36.0, 36.0, 52.0, 76.0, 134.0, 220.0, 339.0, 502.0, 822.0, 1313.0, 1917.0, 2989.0, 4796.0, 7474.0, 12010.0, 18644.0, 29426.0, 45755.0, 69854.0, 101362.0, 132664.0, 150358.0, 139694.0, 109386.0, 77183.0, 51500.0, 32880.0, 20900.0, 13149.0, 8241.0, 5334.0, 3443.0, 2153.0, 1406.0, 871.0, 586.0, 348.0, 235.0, 155.0, 106.0, 68.0, 48.0, 22.0, 12.0, 10.0, 9.0, 9.0, 6.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.62890625, -2.55072021484375, -2.4725341796875, -2.39434814453125, -2.316162109375, -2.23797607421875, -2.1597900390625, -2.08160400390625, -2.00341796875, -1.92523193359375, -1.8470458984375, -1.76885986328125, -1.690673828125, -1.61248779296875, -1.5343017578125, -1.45611572265625, -1.3779296875, -1.29974365234375, -1.2215576171875, -1.14337158203125, -1.065185546875, -0.98699951171875, -0.9088134765625, -0.83062744140625, -0.75244140625, -0.67425537109375, -0.5960693359375, -0.51788330078125, -0.439697265625, -0.36151123046875, -0.2833251953125, -0.20513916015625, -0.126953125, -0.04876708984375, 0.0294189453125, 0.10760498046875, 0.185791015625, 0.26397705078125, 0.3421630859375, 0.42034912109375, 0.49853515625, 0.57672119140625, 0.6549072265625, 0.73309326171875, 0.811279296875, 0.88946533203125, 0.9676513671875, 1.04583740234375, 1.1240234375, 1.20220947265625, 1.2803955078125, 1.35858154296875, 1.436767578125, 1.51495361328125, 1.5931396484375, 1.67132568359375, 1.74951171875, 1.82769775390625, 1.9058837890625, 1.98406982421875, 2.062255859375, 2.14044189453125, 2.2186279296875, 2.29681396484375, 2.375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 4.0, 6.0, 7.0, 3.0, 6.0, 11.0, 18.0, 22.0, 18.0, 16.0, 27.0, 34.0, 35.0, 36.0, 35.0, 32.0, 26.0, 28.0, 57.0, 61.0, 53.0, 36.0, 52.0, 48.0, 45.0, 41.0, 32.0, 30.0, 32.0, 26.0, 18.0, 27.0, 14.0, 19.0, 10.0, 6.0, 13.0, 6.0, 0.0, 6.0, 5.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.71875, -19.0908203125, -18.462890625, -17.8349609375, -17.20703125, -16.5791015625, -15.951171875, -15.3232421875, -14.6953125, -14.0673828125, -13.439453125, -12.8115234375, -12.18359375, -11.5556640625, -10.927734375, -10.2998046875, -9.671875, -9.0439453125, -8.416015625, -7.7880859375, -7.16015625, -6.5322265625, -5.904296875, -5.2763671875, -4.6484375, -4.0205078125, -3.392578125, -2.7646484375, -2.13671875, -1.5087890625, -0.880859375, -0.2529296875, 0.375, 1.0029296875, 1.630859375, 2.2587890625, 2.88671875, 3.5146484375, 4.142578125, 4.7705078125, 5.3984375, 6.0263671875, 6.654296875, 7.2822265625, 7.91015625, 8.5380859375, 9.166015625, 9.7939453125, 10.421875, 11.0498046875, 11.677734375, 12.3056640625, 12.93359375, 13.5615234375, 14.189453125, 14.8173828125, 15.4453125, 16.0732421875, 16.701171875, 17.3291015625, 17.95703125, 18.5849609375, 19.212890625, 19.8408203125, 20.46875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 9.0, 14.0, 14.0, 24.0, 41.0, 58.0, 109.0, 186.0, 251.0, 428.0, 643.0, 1173.0, 1754.0, 2914.0, 4720.0, 7662.0, 12766.0, 20998.0, 33836.0, 53282.0, 80444.0, 113255.0, 142361.0, 150591.0, 132480.0, 100865.0, 69997.0, 44984.0, 28104.0, 17318.0, 10493.0, 6395.0, 3956.0, 2406.0, 1496.0, 906.0, 612.0, 340.0, 256.0, 148.0, 104.0, 62.0, 43.0, 19.0, 22.0, 7.0, 5.0, 7.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.80859375, -2.7216796875, -2.634765625, -2.5478515625, -2.4609375, -2.3740234375, -2.287109375, -2.2001953125, -2.11328125, -2.0263671875, -1.939453125, -1.8525390625, -1.765625, -1.6787109375, -1.591796875, -1.5048828125, -1.41796875, -1.3310546875, -1.244140625, -1.1572265625, -1.0703125, -0.9833984375, -0.896484375, -0.8095703125, -0.72265625, -0.6357421875, -0.548828125, -0.4619140625, -0.375, -0.2880859375, -0.201171875, -0.1142578125, -0.02734375, 0.0595703125, 0.146484375, 0.2333984375, 0.3203125, 0.4072265625, 0.494140625, 0.5810546875, 0.66796875, 0.7548828125, 0.841796875, 0.9287109375, 1.015625, 1.1025390625, 1.189453125, 1.2763671875, 1.36328125, 1.4501953125, 1.537109375, 1.6240234375, 1.7109375, 1.7978515625, 1.884765625, 1.9716796875, 2.05859375, 2.1455078125, 2.232421875, 2.3193359375, 2.40625, 2.4931640625, 2.580078125, 2.6669921875, 2.75390625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 4.0, 3.0, 4.0, 10.0, 11.0, 8.0, 25.0, 18.0, 21.0, 28.0, 25.0, 42.0, 39.0, 39.0, 34.0, 46.0, 35.0, 36.0, 44.0, 38.0, 58.0, 42.0, 50.0, 53.0, 32.0, 33.0, 41.0, 29.0, 21.0, 13.0, 18.0, 20.0, 14.0, 14.0, 11.0, 11.0, 9.0, 6.0, 4.0, 4.0, 3.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.8515625, -11.423583984375, -10.99560546875, -10.567626953125, -10.1396484375, -9.711669921875, -9.28369140625, -8.855712890625, -8.427734375, -7.999755859375, -7.57177734375, -7.143798828125, -6.7158203125, -6.287841796875, -5.85986328125, -5.431884765625, -5.00390625, -4.575927734375, -4.14794921875, -3.719970703125, -3.2919921875, -2.864013671875, -2.43603515625, -2.008056640625, -1.580078125, -1.152099609375, -0.72412109375, -0.296142578125, 0.1318359375, 0.559814453125, 0.98779296875, 1.415771484375, 1.84375, 2.271728515625, 2.69970703125, 3.127685546875, 3.5556640625, 3.983642578125, 4.41162109375, 4.839599609375, 5.267578125, 5.695556640625, 6.12353515625, 6.551513671875, 6.9794921875, 7.407470703125, 7.83544921875, 8.263427734375, 8.69140625, 9.119384765625, 9.54736328125, 9.975341796875, 10.4033203125, 10.831298828125, 11.25927734375, 11.687255859375, 12.115234375, 12.543212890625, 12.97119140625, 13.399169921875, 13.8271484375, 14.255126953125, 14.68310546875, 15.111083984375, 15.5390625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 5.0, 11.0, 9.0, 19.0, 25.0, 24.0, 38.0, 72.0, 87.0, 99.0, 182.0, 267.0, 383.0, 618.0, 963.0, 1486.0, 2481.0, 4180.0, 7021.0, 12280.0, 21670.0, 38974.0, 68937.0, 116190.0, 175531.0, 200601.0, 159245.0, 100852.0, 58696.0, 32836.0, 18763.0, 10530.0, 6023.0, 3502.0, 2177.0, 1337.0, 826.0, 533.0, 331.0, 222.0, 162.0, 100.0, 75.0, 67.0, 37.0, 40.0, 17.0, 10.0, 14.0, 6.0, 4.0, 3.0, 2.0, 1.0], "bins": [-0.30859375, -0.29986572265625, -0.2911376953125, -0.28240966796875, -0.273681640625, -0.26495361328125, -0.2562255859375, -0.24749755859375, -0.23876953125, -0.23004150390625, -0.2213134765625, -0.21258544921875, -0.203857421875, -0.19512939453125, -0.1864013671875, -0.17767333984375, -0.1689453125, -0.16021728515625, -0.1514892578125, -0.14276123046875, -0.134033203125, -0.12530517578125, -0.1165771484375, -0.10784912109375, -0.09912109375, -0.09039306640625, -0.0816650390625, -0.07293701171875, -0.064208984375, -0.05548095703125, -0.0467529296875, -0.03802490234375, -0.029296875, -0.02056884765625, -0.0118408203125, -0.00311279296875, 0.005615234375, 0.01434326171875, 0.0230712890625, 0.03179931640625, 0.04052734375, 0.04925537109375, 0.0579833984375, 0.06671142578125, 0.075439453125, 0.08416748046875, 0.0928955078125, 0.10162353515625, 0.1103515625, 0.11907958984375, 0.1278076171875, 0.13653564453125, 0.145263671875, 0.15399169921875, 0.1627197265625, 0.17144775390625, 0.18017578125, 0.18890380859375, 0.1976318359375, 0.20635986328125, 0.215087890625, 0.22381591796875, 0.2325439453125, 0.24127197265625, 0.25]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 5.0, 5.0, 5.0, 17.0, 9.0, 15.0, 19.0, 27.0, 34.0, 41.0, 30.0, 40.0, 50.0, 61.0, 59.0, 51.0, 46.0, 54.0, 45.0, 56.0, 57.0, 40.0, 37.0, 27.0, 29.0, 31.0, 27.0, 20.0, 18.0, 10.0, 8.0, 7.0, 10.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.4405460357666016e-05, -4.319287836551666e-05, -4.198029637336731e-05, -4.0767714381217957e-05, -3.9555132389068604e-05, -3.834255039691925e-05, -3.71299684047699e-05, -3.5917386412620544e-05, -3.470480442047119e-05, -3.349222242832184e-05, -3.2279640436172485e-05, -3.106705844402313e-05, -2.985447645187378e-05, -2.8641894459724426e-05, -2.7429312467575073e-05, -2.621673047542572e-05, -2.5004148483276367e-05, -2.3791566491127014e-05, -2.257898449897766e-05, -2.1366402506828308e-05, -2.0153820514678955e-05, -1.8941238522529602e-05, -1.772865653038025e-05, -1.6516074538230896e-05, -1.5303492546081543e-05, -1.409091055393219e-05, -1.2878328561782837e-05, -1.1665746569633484e-05, -1.0453164577484131e-05, -9.240582585334778e-06, -8.028000593185425e-06, -6.815418601036072e-06, -5.602836608886719e-06, -4.390254616737366e-06, -3.1776726245880127e-06, -1.9650906324386597e-06, -7.525086402893066e-07, 4.600733518600464e-07, 1.6726553440093994e-06, 2.8852373361587524e-06, 4.0978193283081055e-06, 5.3104013204574585e-06, 6.5229833126068115e-06, 7.735565304756165e-06, 8.948147296905518e-06, 1.016072928905487e-05, 1.1373311281204224e-05, 1.2585893273353577e-05, 1.379847526550293e-05, 1.5011057257652283e-05, 1.6223639249801636e-05, 1.743622124195099e-05, 1.8648803234100342e-05, 1.9861385226249695e-05, 2.1073967218399048e-05, 2.22865492105484e-05, 2.3499131202697754e-05, 2.4711713194847107e-05, 2.592429518699646e-05, 2.7136877179145813e-05, 2.8349459171295166e-05, 2.956204116344452e-05, 3.077462315559387e-05, 3.1987205147743225e-05, 3.319978713989258e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 9.0, 8.0, 11.0, 14.0, 15.0, 22.0, 40.0, 61.0, 81.0, 109.0, 174.0, 248.0, 328.0, 502.0, 789.0, 1305.0, 2162.0, 3487.0, 6412.0, 12354.0, 24739.0, 53296.0, 114416.0, 222790.0, 274244.0, 171004.0, 82197.0, 37733.0, 18222.0, 9222.0, 4917.0, 2781.0, 1752.0, 1034.0, 673.0, 428.0, 308.0, 221.0, 129.0, 95.0, 62.0, 51.0, 35.0, 27.0, 17.0, 14.0, 8.0, 6.0, 4.0, 1.0, 5.0, 1.0, 1.0], "bins": [-0.7900390625, -0.7676467895507812, -0.7452545166015625, -0.7228622436523438, -0.700469970703125, -0.6780776977539062, -0.6556854248046875, -0.6332931518554688, -0.61090087890625, -0.5885086059570312, -0.5661163330078125, -0.5437240600585938, -0.521331787109375, -0.49893951416015625, -0.4765472412109375, -0.45415496826171875, -0.4317626953125, -0.40937042236328125, -0.3869781494140625, -0.36458587646484375, -0.342193603515625, -0.31980133056640625, -0.2974090576171875, -0.27501678466796875, -0.25262451171875, -0.23023223876953125, -0.2078399658203125, -0.18544769287109375, -0.163055419921875, -0.14066314697265625, -0.1182708740234375, -0.09587860107421875, -0.073486328125, -0.05109405517578125, -0.0287017822265625, -0.00630950927734375, 0.016082763671875, 0.03847503662109375, 0.0608673095703125, 0.08325958251953125, 0.10565185546875, 0.12804412841796875, 0.1504364013671875, 0.17282867431640625, 0.195220947265625, 0.21761322021484375, 0.2400054931640625, 0.26239776611328125, 0.2847900390625, 0.30718231201171875, 0.3295745849609375, 0.35196685791015625, 0.374359130859375, 0.39675140380859375, 0.4191436767578125, 0.44153594970703125, 0.46392822265625, 0.48632049560546875, 0.5087127685546875, 0.5311050415039062, 0.553497314453125, 0.5758895874023438, 0.5982818603515625, 0.6206741333007812, 0.64306640625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 1.0, 3.0, 7.0, 6.0, 15.0, 18.0, 22.0, 23.0, 27.0, 36.0, 55.0, 64.0, 73.0, 83.0, 107.0, 92.0, 71.0, 51.0, 41.0, 42.0, 32.0, 23.0, 23.0, 23.0, 4.0, 17.0, 11.0, 7.0, 3.0, 6.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.420654296875, -0.4088172912597656, -0.39698028564453125, -0.3851432800292969, -0.3733062744140625, -0.3614692687988281, -0.34963226318359375, -0.3377952575683594, -0.325958251953125, -0.3141212463378906, -0.30228424072265625, -0.2904472351074219, -0.2786102294921875, -0.2667732238769531, -0.25493621826171875, -0.24309921264648438, -0.23126220703125, -0.21942520141601562, -0.20758819580078125, -0.19575119018554688, -0.1839141845703125, -0.17207717895507812, -0.16024017333984375, -0.14840316772460938, -0.136566162109375, -0.12472915649414062, -0.11289215087890625, -0.10105514526367188, -0.0892181396484375, -0.07738113403320312, -0.06554412841796875, -0.053707122802734375, -0.0418701171875, -0.030033111572265625, -0.01819610595703125, -0.006359100341796875, 0.0054779052734375, 0.017314910888671875, 0.02915191650390625, 0.040988922119140625, 0.052825927734375, 0.06466293334960938, 0.07649993896484375, 0.08833694458007812, 0.1001739501953125, 0.11201095581054688, 0.12384796142578125, 0.13568496704101562, 0.14752197265625, 0.15935897827148438, 0.17119598388671875, 0.18303298950195312, 0.1948699951171875, 0.20670700073242188, 0.21854400634765625, 0.23038101196289062, 0.242218017578125, 0.2540550231933594, 0.26589202880859375, 0.2777290344238281, 0.2895660400390625, 0.3014030456542969, 0.31324005126953125, 0.3250770568847656, 0.3369140625]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 5.0, 4.0, 6.0, 9.0, 8.0, 10.0, 11.0, 14.0, 26.0, 24.0, 22.0, 31.0, 40.0, 32.0, 36.0, 51.0, 43.0, 45.0, 57.0, 49.0, 49.0, 43.0, 47.0, 46.0, 41.0, 22.0, 35.0, 35.0, 29.0, 25.0, 27.0, 18.0, 15.0, 16.0, 9.0, 10.0, 2.0, 4.0, 4.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.778034210205078, -17.23383903503418, -16.68964385986328, -16.145448684692383, -15.601253509521484, -15.057058334350586, -14.512862205505371, -13.968667030334473, -13.424471855163574, -12.880276679992676, -12.336081504821777, -11.791886329650879, -11.247690200805664, -10.703495025634766, -10.159299850463867, -9.615104675292969, -9.07090950012207, -8.526714324951172, -7.982519149780273, -7.438323497772217, -6.894128322601318, -6.34993314743042, -5.805737495422363, -5.261542320251465, -4.717347145080566, -4.173151969909668, -3.6289565563201904, -3.084761142730713, -2.5405659675598145, -1.996370792388916, -1.4521753787994385, -0.9079799652099609, -0.3637847900390625, 0.1804105043411255, 0.7246057987213135, 1.2688010931015015, 1.8129963874816895, 2.357191562652588, 2.9013869762420654, 3.445582389831543, 3.9897775650024414, 4.53397274017334, 5.078167915344238, 5.622363567352295, 6.166558742523193, 6.710753917694092, 7.254949569702148, 7.799144744873047, 8.343339920043945, 8.887535095214844, 9.431730270385742, 9.97592544555664, 10.520120620727539, 11.064315795898438, 11.608511924743652, 12.15270709991455, 12.69690227508545, 13.241097450256348, 13.785292625427246, 14.329487800598145, 14.87368392944336, 15.417879104614258, 15.962074279785156, 16.506269454956055, 17.050464630126953]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 7.0, 5.0, 3.0, 6.0, 10.0, 11.0, 13.0, 22.0, 24.0, 26.0, 31.0, 32.0, 33.0, 34.0, 44.0, 51.0, 35.0, 46.0, 50.0, 59.0, 50.0, 55.0, 51.0, 41.0, 34.0, 40.0, 40.0, 25.0, 27.0, 20.0, 17.0, 20.0, 10.0, 6.0, 8.0, 7.0, 3.0, 6.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.389698028564453, -18.723114013671875, -18.05653190612793, -17.38994789123535, -16.723365783691406, -16.056781768798828, -15.390199661254883, -14.723615646362305, -14.05703353881836, -13.390450477600098, -12.723867416381836, -12.057284355163574, -11.390701293945312, -10.72411823272705, -10.057535171508789, -9.390951156616211, -8.72436809539795, -8.057785034179688, -7.391201972961426, -6.724618911743164, -6.058035850524902, -5.391452789306641, -4.724869251251221, -4.058286190032959, -3.3917031288146973, -2.7251200675964355, -2.058537006378174, -1.391953706741333, -0.7253706455230713, -0.05878758430480957, 0.6077957153320312, 1.274378776550293, 1.9409618377685547, 2.6075448989868164, 3.274127960205078, 3.940711259841919, 4.607294082641602, 5.273877143859863, 5.940460681915283, 6.607043743133545, 7.273626804351807, 7.940209865570068, 8.606793403625488, 9.27337646484375, 9.939959526062012, 10.606542587280273, 11.273125648498535, 11.939708709716797, 12.606291770935059, 13.27287483215332, 13.939457893371582, 14.606040954589844, 15.272624015808105, 15.939207077026367, 16.605791091918945, 17.27237319946289, 17.93895721435547, 18.605541229248047, 19.272123336791992, 19.93870735168457, 20.605289459228516, 21.271873474121094, 21.93845558166504, 22.605039596557617, 23.271621704101562]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 7.0, 9.0, 28.0, 34.0, 44.0, 69.0, 131.0, 209.0, 390.0, 608.0, 968.0, 1511.0, 2444.0, 3918.0, 5841.0, 8979.0, 13574.0, 19417.0, 27345.0, 37418.0, 49109.0, 61328.0, 75089.0, 85624.0, 92832.0, 93954.0, 91100.0, 83682.0, 72807.0, 59037.0, 46500.0, 35527.0, 25664.0, 18017.0, 12371.0, 8100.0, 5395.0, 3512.0, 2289.0, 1377.0, 888.0, 517.0, 351.0, 211.0, 129.0, 77.0, 46.0, 34.0, 13.0, 19.0, 7.0, 4.0, 5.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-7.96875, -7.7149658203125, -7.461181640625, -7.2073974609375, -6.95361328125, -6.6998291015625, -6.446044921875, -6.1922607421875, -5.9384765625, -5.6846923828125, -5.430908203125, -5.1771240234375, -4.92333984375, -4.6695556640625, -4.415771484375, -4.1619873046875, -3.908203125, -3.6544189453125, -3.400634765625, -3.1468505859375, -2.89306640625, -2.6392822265625, -2.385498046875, -2.1317138671875, -1.8779296875, -1.6241455078125, -1.370361328125, -1.1165771484375, -0.86279296875, -0.6090087890625, -0.355224609375, -0.1014404296875, 0.15234375, 0.4061279296875, 0.659912109375, 0.9136962890625, 1.16748046875, 1.4212646484375, 1.675048828125, 1.9288330078125, 2.1826171875, 2.4364013671875, 2.690185546875, 2.9439697265625, 3.19775390625, 3.4515380859375, 3.705322265625, 3.9591064453125, 4.212890625, 4.4666748046875, 4.720458984375, 4.9742431640625, 5.22802734375, 5.4818115234375, 5.735595703125, 5.9893798828125, 6.2431640625, 6.4969482421875, 6.750732421875, 7.0045166015625, 7.25830078125, 7.5120849609375, 7.765869140625, 8.0196533203125, 8.2734375]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 8.0, 5.0, 6.0, 5.0, 10.0, 11.0, 16.0, 17.0, 26.0, 18.0, 21.0, 30.0, 35.0, 28.0, 38.0, 37.0, 43.0, 44.0, 43.0, 45.0, 48.0, 49.0, 43.0, 55.0, 40.0, 47.0, 31.0, 36.0, 30.0, 20.0, 25.0, 20.0, 16.0, 12.0, 8.0, 8.0, 6.0, 10.0, 5.0, 7.0, 6.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.484375, -15.849853515625, -15.21533203125, -14.580810546875, -13.9462890625, -13.311767578125, -12.67724609375, -12.042724609375, -11.408203125, -10.773681640625, -10.13916015625, -9.504638671875, -8.8701171875, -8.235595703125, -7.60107421875, -6.966552734375, -6.33203125, -5.697509765625, -5.06298828125, -4.428466796875, -3.7939453125, -3.159423828125, -2.52490234375, -1.890380859375, -1.255859375, -0.621337890625, 0.01318359375, 0.647705078125, 1.2822265625, 1.916748046875, 2.55126953125, 3.185791015625, 3.8203125, 4.454833984375, 5.08935546875, 5.723876953125, 6.3583984375, 6.992919921875, 7.62744140625, 8.261962890625, 8.896484375, 9.531005859375, 10.16552734375, 10.800048828125, 11.4345703125, 12.069091796875, 12.70361328125, 13.338134765625, 13.97265625, 14.607177734375, 15.24169921875, 15.876220703125, 16.5107421875, 17.145263671875, 17.77978515625, 18.414306640625, 19.048828125, 19.683349609375, 20.31787109375, 20.952392578125, 21.5869140625, 22.221435546875, 22.85595703125, 23.490478515625, 24.125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 9.0, 12.0, 12.0, 16.0, 37.0, 43.0, 62.0, 121.0, 219.0, 333.0, 500.0, 843.0, 1340.0, 2176.0, 3276.0, 5130.0, 7725.0, 11416.0, 16601.0, 24223.0, 33270.0, 44278.0, 57490.0, 70214.0, 82341.0, 91493.0, 95068.0, 93965.0, 87583.0, 76528.0, 63553.0, 50346.0, 38632.0, 28371.0, 20185.0, 13924.0, 9632.0, 6234.0, 4058.0, 2644.0, 1709.0, 1123.0, 693.0, 437.0, 259.0, 189.0, 97.0, 59.0, 37.0, 23.0, 19.0, 7.0, 5.0, 1.0, 2.0, 3.0, 0.0, 1.0], "bins": [-8.6953125, -8.4298095703125, -8.164306640625, -7.8988037109375, -7.63330078125, -7.3677978515625, -7.102294921875, -6.8367919921875, -6.5712890625, -6.3057861328125, -6.040283203125, -5.7747802734375, -5.50927734375, -5.2437744140625, -4.978271484375, -4.7127685546875, -4.447265625, -4.1817626953125, -3.916259765625, -3.6507568359375, -3.38525390625, -3.1197509765625, -2.854248046875, -2.5887451171875, -2.3232421875, -2.0577392578125, -1.792236328125, -1.5267333984375, -1.26123046875, -0.9957275390625, -0.730224609375, -0.4647216796875, -0.19921875, 0.0662841796875, 0.331787109375, 0.5972900390625, 0.86279296875, 1.1282958984375, 1.393798828125, 1.6593017578125, 1.9248046875, 2.1903076171875, 2.455810546875, 2.7213134765625, 2.98681640625, 3.2523193359375, 3.517822265625, 3.7833251953125, 4.048828125, 4.3143310546875, 4.579833984375, 4.8453369140625, 5.11083984375, 5.3763427734375, 5.641845703125, 5.9073486328125, 6.1728515625, 6.4383544921875, 6.703857421875, 6.9693603515625, 7.23486328125, 7.5003662109375, 7.765869140625, 8.0313720703125, 8.296875]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 2.0, 1.0, 3.0, 2.0, 4.0, 7.0, 8.0, 14.0, 26.0, 8.0, 16.0, 18.0, 10.0, 24.0, 27.0, 30.0, 28.0, 37.0, 36.0, 37.0, 49.0, 44.0, 36.0, 52.0, 34.0, 29.0, 31.0, 35.0, 34.0, 27.0, 33.0, 42.0, 24.0, 22.0, 27.0, 17.0, 16.0, 17.0, 17.0, 10.0, 10.0, 15.0, 12.0, 8.0, 9.0, 3.0, 8.0, 2.0, 1.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.71875, -10.374267578125, -10.02978515625, -9.685302734375, -9.3408203125, -8.996337890625, -8.65185546875, -8.307373046875, -7.962890625, -7.618408203125, -7.27392578125, -6.929443359375, -6.5849609375, -6.240478515625, -5.89599609375, -5.551513671875, -5.20703125, -4.862548828125, -4.51806640625, -4.173583984375, -3.8291015625, -3.484619140625, -3.14013671875, -2.795654296875, -2.451171875, -2.106689453125, -1.76220703125, -1.417724609375, -1.0732421875, -0.728759765625, -0.38427734375, -0.039794921875, 0.3046875, 0.649169921875, 0.99365234375, 1.338134765625, 1.6826171875, 2.027099609375, 2.37158203125, 2.716064453125, 3.060546875, 3.405029296875, 3.74951171875, 4.093994140625, 4.4384765625, 4.782958984375, 5.12744140625, 5.471923828125, 5.81640625, 6.160888671875, 6.50537109375, 6.849853515625, 7.1943359375, 7.538818359375, 7.88330078125, 8.227783203125, 8.572265625, 8.916748046875, 9.26123046875, 9.605712890625, 9.9501953125, 10.294677734375, 10.63916015625, 10.983642578125, 11.328125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 8.0, 19.0, 16.0, 29.0, 57.0, 72.0, 136.0, 214.0, 345.0, 598.0, 946.0, 1704.0, 3070.0, 5357.0, 9297.0, 16023.0, 26991.0, 41715.0, 62129.0, 84717.0, 107090.0, 122046.0, 127091.0, 117501.0, 100355.0, 76594.0, 54493.0, 35942.0, 22599.0, 13288.0, 7819.0, 4421.0, 2530.0, 1449.0, 767.0, 454.0, 264.0, 157.0, 89.0, 58.0, 37.0, 23.0, 23.0, 6.0, 8.0, 7.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.732421875, -3.609344482421875, -3.48626708984375, -3.363189697265625, -3.2401123046875, -3.117034912109375, -2.99395751953125, -2.870880126953125, -2.747802734375, -2.624725341796875, -2.50164794921875, -2.378570556640625, -2.2554931640625, -2.132415771484375, -2.00933837890625, -1.886260986328125, -1.76318359375, -1.640106201171875, -1.51702880859375, -1.393951416015625, -1.2708740234375, -1.147796630859375, -1.02471923828125, -0.901641845703125, -0.778564453125, -0.655487060546875, -0.53240966796875, -0.409332275390625, -0.2862548828125, -0.163177490234375, -0.04010009765625, 0.082977294921875, 0.2060546875, 0.329132080078125, 0.45220947265625, 0.575286865234375, 0.6983642578125, 0.821441650390625, 0.94451904296875, 1.067596435546875, 1.190673828125, 1.313751220703125, 1.43682861328125, 1.559906005859375, 1.6829833984375, 1.806060791015625, 1.92913818359375, 2.052215576171875, 2.17529296875, 2.298370361328125, 2.42144775390625, 2.544525146484375, 2.6676025390625, 2.790679931640625, 2.91375732421875, 3.036834716796875, 3.159912109375, 3.282989501953125, 3.40606689453125, 3.529144287109375, 3.6522216796875, 3.775299072265625, 3.89837646484375, 4.021453857421875, 4.14453125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 5.0, 4.0, 14.0, 11.0, 16.0, 19.0, 28.0, 42.0, 39.0, 52.0, 53.0, 62.0, 65.0, 57.0, 65.0, 58.0, 54.0, 57.0, 61.0, 36.0, 37.0, 31.0, 29.0, 24.0, 21.0, 20.0, 15.0, 2.0, 8.0, 7.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000537872314453125, -0.0005202814936637878, -0.0005026906728744507, -0.0004850998520851135, -0.00046750903129577637, -0.0004499182105064392, -0.00043232738971710205, -0.0004147365689277649, -0.00039714574813842773, -0.0003795549273490906, -0.0003619641065597534, -0.00034437328577041626, -0.0003267824649810791, -0.00030919164419174194, -0.0002916008234024048, -0.0002740100026130676, -0.00025641918182373047, -0.0002388283610343933, -0.00022123754024505615, -0.000203646719455719, -0.00018605589866638184, -0.00016846507787704468, -0.00015087425708770752, -0.00013328343629837036, -0.0001156926155090332, -9.810179471969604e-05, -8.051097393035889e-05, -6.292015314102173e-05, -4.532933235168457e-05, -2.7738511562347412e-05, -1.0147690773010254e-05, 7.443130016326904e-06, 2.5033950805664062e-05, 4.262477159500122e-05, 6.021559238433838e-05, 7.780641317367554e-05, 9.53972339630127e-05, 0.00011298805475234985, 0.000130578875541687, 0.00014816969633102417, 0.00016576051712036133, 0.00018335133790969849, 0.00020094215869903564, 0.0002185329794883728, 0.00023612380027770996, 0.0002537146210670471, 0.0002713054418563843, 0.00028889626264572144, 0.0003064870834350586, 0.00032407790422439575, 0.0003416687250137329, 0.00035925954580307007, 0.0003768503665924072, 0.0003944411873817444, 0.00041203200817108154, 0.0004296228289604187, 0.00044721364974975586, 0.000464804470539093, 0.0004823952913284302, 0.0004999861121177673, 0.0005175769329071045, 0.0005351677536964417, 0.0005527585744857788, 0.000570349395275116, 0.0005879402160644531]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 7.0, 10.0, 13.0, 20.0, 41.0, 62.0, 93.0, 148.0, 235.0, 375.0, 569.0, 1106.0, 1796.0, 3079.0, 5498.0, 9192.0, 15419.0, 25951.0, 41219.0, 62180.0, 86327.0, 110643.0, 126919.0, 130879.0, 120563.0, 98900.0, 74602.0, 50875.0, 32745.0, 20291.0, 11754.0, 7118.0, 4030.0, 2368.0, 1363.0, 829.0, 522.0, 297.0, 187.0, 121.0, 78.0, 45.0, 36.0, 17.0, 14.0, 8.0, 4.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.01171875, -3.87457275390625, -3.7374267578125, -3.60028076171875, -3.463134765625, -3.32598876953125, -3.1888427734375, -3.05169677734375, -2.91455078125, -2.77740478515625, -2.6402587890625, -2.50311279296875, -2.365966796875, -2.22882080078125, -2.0916748046875, -1.95452880859375, -1.8173828125, -1.68023681640625, -1.5430908203125, -1.40594482421875, -1.268798828125, -1.13165283203125, -0.9945068359375, -0.85736083984375, -0.72021484375, -0.58306884765625, -0.4459228515625, -0.30877685546875, -0.171630859375, -0.03448486328125, 0.1026611328125, 0.23980712890625, 0.376953125, 0.51409912109375, 0.6512451171875, 0.78839111328125, 0.925537109375, 1.06268310546875, 1.1998291015625, 1.33697509765625, 1.47412109375, 1.61126708984375, 1.7484130859375, 1.88555908203125, 2.022705078125, 2.15985107421875, 2.2969970703125, 2.43414306640625, 2.5712890625, 2.70843505859375, 2.8455810546875, 2.98272705078125, 3.119873046875, 3.25701904296875, 3.3941650390625, 3.53131103515625, 3.66845703125, 3.80560302734375, 3.9427490234375, 4.07989501953125, 4.217041015625, 4.35418701171875, 4.4913330078125, 4.62847900390625, 4.765625]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 4.0, 6.0, 2.0, 5.0, 4.0, 9.0, 9.0, 15.0, 27.0, 24.0, 31.0, 28.0, 40.0, 46.0, 33.0, 54.0, 47.0, 51.0, 54.0, 49.0, 45.0, 50.0, 55.0, 39.0, 33.0, 30.0, 33.0, 25.0, 24.0, 19.0, 17.0, 15.0, 19.0, 6.0, 15.0, 10.0, 7.0, 4.0, 4.0, 1.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.6943359375, -1.6351470947265625, -1.575958251953125, -1.5167694091796875, -1.45758056640625, -1.3983917236328125, -1.339202880859375, -1.2800140380859375, -1.2208251953125, -1.1616363525390625, -1.102447509765625, -1.0432586669921875, -0.98406982421875, -0.9248809814453125, -0.865692138671875, -0.8065032958984375, -0.747314453125, -0.6881256103515625, -0.628936767578125, -0.5697479248046875, -0.51055908203125, -0.4513702392578125, -0.392181396484375, -0.3329925537109375, -0.2738037109375, -0.2146148681640625, -0.155426025390625, -0.0962371826171875, -0.03704833984375, 0.0221405029296875, 0.081329345703125, 0.1405181884765625, 0.19970703125, 0.2588958740234375, 0.318084716796875, 0.3772735595703125, 0.43646240234375, 0.4956512451171875, 0.554840087890625, 0.6140289306640625, 0.6732177734375, 0.7324066162109375, 0.791595458984375, 0.8507843017578125, 0.90997314453125, 0.9691619873046875, 1.028350830078125, 1.0875396728515625, 1.146728515625, 1.2059173583984375, 1.265106201171875, 1.3242950439453125, 1.38348388671875, 1.4426727294921875, 1.501861572265625, 1.5610504150390625, 1.6202392578125, 1.6794281005859375, 1.738616943359375, 1.7978057861328125, 1.85699462890625, 1.9161834716796875, 1.975372314453125, 2.0345611572265625, 2.09375]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 4.0, 2.0, 3.0, 6.0, 9.0, 6.0, 7.0, 12.0, 13.0, 26.0, 17.0, 21.0, 32.0, 27.0, 34.0, 35.0, 42.0, 48.0, 33.0, 50.0, 60.0, 48.0, 35.0, 42.0, 53.0, 34.0, 44.0, 31.0, 32.0, 42.0, 29.0, 24.0, 14.0, 14.0, 18.0, 8.0, 17.0, 10.0, 7.0, 3.0, 4.0, 1.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.086942672729492, -17.560914993286133, -17.034887313842773, -16.508859634399414, -15.982831954956055, -15.456804275512695, -14.930777549743652, -14.404749870300293, -13.878722190856934, -13.352694511413574, -12.826666831970215, -12.300639152526855, -11.774612426757812, -11.248584747314453, -10.722557067871094, -10.196529388427734, -9.670501708984375, -9.144474029541016, -8.618446350097656, -8.092418670654297, -7.566391468048096, -7.040363788604736, -6.514336585998535, -5.988308906555176, -5.462281227111816, -4.936253547668457, -4.410225868225098, -3.8841986656188965, -3.358170986175537, -2.8321433067321777, -2.3061158657073975, -1.7800884246826172, -1.2540626525878906, -0.7280350923538208, -0.20200753211975098, 0.32402002811431885, 0.8500475883483887, 1.376075267791748, 1.9021027088165283, 2.4281301498413086, 2.954157829284668, 3.4801855087280273, 4.006213188171387, 4.532240390777588, 5.058268070220947, 5.584295749664307, 6.110322952270508, 6.636350631713867, 7.162378311157227, 7.688405990600586, 8.214433670043945, 8.740461349487305, 9.266489028930664, 9.792516708374023, 10.318543434143066, 10.844571113586426, 11.370598793029785, 11.896626472473145, 12.422654151916504, 12.948681831359863, 13.474708557128906, 14.000736236572266, 14.526763916015625, 15.052791595458984, 15.578819274902344]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 7.0, 4.0, 3.0, 6.0, 5.0, 10.0, 13.0, 17.0, 17.0, 26.0, 24.0, 25.0, 33.0, 34.0, 39.0, 40.0, 48.0, 40.0, 47.0, 56.0, 59.0, 41.0, 50.0, 37.0, 50.0, 38.0, 41.0, 32.0, 22.0, 32.0, 26.0, 17.0, 11.0, 14.0, 8.0, 13.0, 9.0, 5.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.4061222076416, -21.68741226196289, -20.96870231628418, -20.24999237060547, -19.531280517578125, -18.812570571899414, -18.093860626220703, -17.375150680541992, -16.65644073486328, -15.93773078918457, -15.219019889831543, -14.500309944152832, -13.781599044799805, -13.062889099121094, -12.344179153442383, -11.625469207763672, -10.906757354736328, -10.188047409057617, -9.46933650970459, -8.750626564025879, -8.031915664672852, -7.313205718994141, -6.59449577331543, -5.8757853507995605, -5.157074928283691, -4.438364505767822, -3.7196543216705322, -3.000944137573242, -2.282233715057373, -1.563523292541504, -0.844813346862793, -0.12610292434692383, 0.5926094055175781, 1.3113197088241577, 2.0300300121307373, 2.7487401962280273, 3.4674506187438965, 4.186161041259766, 4.904870986938477, 5.623581409454346, 6.342291831970215, 7.061002254486084, 7.779712677001953, 8.498422622680664, 9.217132568359375, 9.935843467712402, 10.654553413391113, 11.37326431274414, 12.091974258422852, 12.810684204101562, 13.52939510345459, 14.2481050491333, 14.966815948486328, 15.685525894165039, 16.40423583984375, 17.12294578552246, 17.841655731201172, 18.560365676879883, 19.279075622558594, 19.997787475585938, 20.71649742126465, 21.43520736694336, 22.15391731262207, 22.87262725830078, 23.591339111328125]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 11.0, 16.0, 29.0, 44.0, 88.0, 154.0, 236.0, 390.0, 582.0, 1015.0, 1723.0, 2680.0, 4361.0, 6782.0, 10669.0, 16837.0, 25305.0, 38028.0, 55033.0, 78360.0, 108239.0, 145426.0, 189166.0, 236433.0, 281995.0, 322045.0, 350568.0, 360728.0, 353185.0, 329240.0, 292441.0, 245553.0, 199344.0, 155027.0, 116065.0, 84697.0, 60077.0, 41899.0, 28030.0, 18461.0, 12079.0, 7854.0, 4947.0, 3190.0, 2047.0, 1206.0, 766.0, 488.0, 281.0, 204.0, 104.0, 69.0, 41.0, 24.0, 19.0, 4.0, 3.0, 4.0], "bins": [-11.4296875, -11.08984375, -10.75, -10.41015625, -10.0703125, -9.73046875, -9.390625, -9.05078125, -8.7109375, -8.37109375, -8.03125, -7.69140625, -7.3515625, -7.01171875, -6.671875, -6.33203125, -5.9921875, -5.65234375, -5.3125, -4.97265625, -4.6328125, -4.29296875, -3.953125, -3.61328125, -3.2734375, -2.93359375, -2.59375, -2.25390625, -1.9140625, -1.57421875, -1.234375, -0.89453125, -0.5546875, -0.21484375, 0.125, 0.46484375, 0.8046875, 1.14453125, 1.484375, 1.82421875, 2.1640625, 2.50390625, 2.84375, 3.18359375, 3.5234375, 3.86328125, 4.203125, 4.54296875, 4.8828125, 5.22265625, 5.5625, 5.90234375, 6.2421875, 6.58203125, 6.921875, 7.26171875, 7.6015625, 7.94140625, 8.28125, 8.62109375, 8.9609375, 9.30078125, 9.640625, 9.98046875, 10.3203125]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 7.0, 5.0, 2.0, 6.0, 7.0, 14.0, 17.0, 17.0, 14.0, 16.0, 42.0, 44.0, 42.0, 42.0, 42.0, 44.0, 48.0, 35.0, 44.0, 61.0, 63.0, 36.0, 57.0, 48.0, 33.0, 34.0, 29.0, 21.0, 26.0, 27.0, 22.0, 9.0, 12.0, 14.0, 8.0, 6.0, 4.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.234375, -20.591796875, -19.94921875, -19.306640625, -18.6640625, -18.021484375, -17.37890625, -16.736328125, -16.09375, -15.451171875, -14.80859375, -14.166015625, -13.5234375, -12.880859375, -12.23828125, -11.595703125, -10.953125, -10.310546875, -9.66796875, -9.025390625, -8.3828125, -7.740234375, -7.09765625, -6.455078125, -5.8125, -5.169921875, -4.52734375, -3.884765625, -3.2421875, -2.599609375, -1.95703125, -1.314453125, -0.671875, -0.029296875, 0.61328125, 1.255859375, 1.8984375, 2.541015625, 3.18359375, 3.826171875, 4.46875, 5.111328125, 5.75390625, 6.396484375, 7.0390625, 7.681640625, 8.32421875, 8.966796875, 9.609375, 10.251953125, 10.89453125, 11.537109375, 12.1796875, 12.822265625, 13.46484375, 14.107421875, 14.75, 15.392578125, 16.03515625, 16.677734375, 17.3203125, 17.962890625, 18.60546875, 19.248046875, 19.890625]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 7.0, 6.0, 24.0, 21.0, 33.0, 76.0, 122.0, 190.0, 325.0, 591.0, 950.0, 1641.0, 2668.0, 4399.0, 7004.0, 11076.0, 17258.0, 26425.0, 39756.0, 57988.0, 82266.0, 113210.0, 150238.0, 192727.0, 236756.0, 279876.0, 314764.0, 340602.0, 351359.0, 344318.0, 322604.0, 289513.0, 247816.0, 202009.0, 159017.0, 120904.0, 88762.0, 63078.0, 43311.0, 29126.0, 19319.0, 12215.0, 7700.0, 4890.0, 2881.0, 1810.0, 1099.0, 628.0, 390.0, 222.0, 148.0, 66.0, 43.0, 33.0, 11.0, 12.0, 4.0, 4.0, 1.0, 3.0, 1.0], "bins": [-11.484375, -11.12109375, -10.7578125, -10.39453125, -10.03125, -9.66796875, -9.3046875, -8.94140625, -8.578125, -8.21484375, -7.8515625, -7.48828125, -7.125, -6.76171875, -6.3984375, -6.03515625, -5.671875, -5.30859375, -4.9453125, -4.58203125, -4.21875, -3.85546875, -3.4921875, -3.12890625, -2.765625, -2.40234375, -2.0390625, -1.67578125, -1.3125, -0.94921875, -0.5859375, -0.22265625, 0.140625, 0.50390625, 0.8671875, 1.23046875, 1.59375, 1.95703125, 2.3203125, 2.68359375, 3.046875, 3.41015625, 3.7734375, 4.13671875, 4.5, 4.86328125, 5.2265625, 5.58984375, 5.953125, 6.31640625, 6.6796875, 7.04296875, 7.40625, 7.76953125, 8.1328125, 8.49609375, 8.859375, 9.22265625, 9.5859375, 9.94921875, 10.3125, 10.67578125, 11.0390625, 11.40234375, 11.765625]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 4.0, 4.0, 8.0, 14.0, 30.0, 21.0, 28.0, 30.0, 46.0, 54.0, 65.0, 68.0, 101.0, 102.0, 104.0, 154.0, 173.0, 163.0, 169.0, 210.0, 210.0, 206.0, 215.0, 188.0, 203.0, 194.0, 156.0, 185.0, 165.0, 111.0, 133.0, 107.0, 90.0, 83.0, 61.0, 46.0, 42.0, 45.0, 23.0, 15.0, 14.0, 13.0, 10.0, 6.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.953125, -7.6968994140625, -7.440673828125, -7.1844482421875, -6.92822265625, -6.6719970703125, -6.415771484375, -6.1595458984375, -5.9033203125, -5.6470947265625, -5.390869140625, -5.1346435546875, -4.87841796875, -4.6221923828125, -4.365966796875, -4.1097412109375, -3.853515625, -3.5972900390625, -3.341064453125, -3.0848388671875, -2.82861328125, -2.5723876953125, -2.316162109375, -2.0599365234375, -1.8037109375, -1.5474853515625, -1.291259765625, -1.0350341796875, -0.77880859375, -0.5225830078125, -0.266357421875, -0.0101318359375, 0.24609375, 0.5023193359375, 0.758544921875, 1.0147705078125, 1.27099609375, 1.5272216796875, 1.783447265625, 2.0396728515625, 2.2958984375, 2.5521240234375, 2.808349609375, 3.0645751953125, 3.32080078125, 3.5770263671875, 3.833251953125, 4.0894775390625, 4.345703125, 4.6019287109375, 4.858154296875, 5.1143798828125, 5.37060546875, 5.6268310546875, 5.883056640625, 6.1392822265625, 6.3955078125, 6.6517333984375, 6.907958984375, 7.1641845703125, 7.42041015625, 7.6766357421875, 7.932861328125, 8.1890869140625, 8.4453125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 3.0, 5.0, 3.0, 4.0, 6.0, 13.0, 14.0, 17.0, 23.0, 24.0, 25.0, 43.0, 29.0, 36.0, 34.0, 58.0, 48.0, 53.0, 35.0, 48.0, 45.0, 34.0, 39.0, 55.0, 45.0, 46.0, 37.0, 21.0, 22.0, 22.0, 22.0, 17.0, 16.0, 20.0, 8.0, 3.0, 8.0, 7.0, 0.0, 7.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.027252197265625, -19.412723541259766, -18.798194885253906, -18.183666229248047, -17.569137573242188, -16.954608917236328, -16.34008026123047, -15.725553512573242, -15.111024856567383, -14.496496200561523, -13.881967544555664, -13.267438888549805, -12.652911186218262, -12.038382530212402, -11.423853874206543, -10.809326171875, -10.194796562194824, -9.580267906188965, -8.965739250183105, -8.351211547851562, -7.736682891845703, -7.122154235839844, -6.507625579833984, -5.893097400665283, -5.278568744659424, -4.6640400886535645, -4.049511909484863, -3.434983253479004, -2.8204548358917236, -2.2059264183044434, -1.591397762298584, -0.9768695831298828, -0.36234092712402344, 0.2521875500679016, 0.8667160272598267, 1.4812445640563965, 2.0957729816436768, 2.710301399230957, 3.3248300552368164, 3.9393582344055176, 4.553886890411377, 5.168415546417236, 5.7829437255859375, 6.397472381591797, 7.012001037597656, 7.626529216766357, 8.241058349609375, 8.855586051940918, 9.470114707946777, 10.084643363952637, 10.699172019958496, 11.313699722290039, 11.928228378295898, 12.542757034301758, 13.157285690307617, 13.771814346313477, 14.386343002319336, 15.000871658325195, 15.615400314331055, 16.229928970336914, 16.844457626342773, 17.458984375, 18.07351303100586, 18.68804168701172, 19.302570343017578]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 2.0, 3.0, 5.0, 5.0, 14.0, 10.0, 11.0, 15.0, 12.0, 25.0, 19.0, 21.0, 27.0, 23.0, 33.0, 32.0, 38.0, 44.0, 50.0, 44.0, 51.0, 52.0, 46.0, 51.0, 45.0, 38.0, 31.0, 37.0, 22.0, 33.0, 23.0, 26.0, 19.0, 26.0, 21.0, 7.0, 13.0, 6.0, 8.0, 9.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.068527221679688, -19.354019165039062, -18.639509201049805, -17.92500114440918, -17.210491180419922, -16.495983123779297, -15.781474113464355, -15.066965103149414, -14.352456092834473, -13.637947082519531, -12.92343807220459, -12.208929061889648, -11.494421005249023, -10.779911041259766, -10.06540298461914, -9.3508939743042, -8.636384963989258, -7.921875953674316, -7.207366943359375, -6.492858409881592, -5.77834939956665, -5.063840389251709, -4.349331855773926, -3.6348228454589844, -2.920313835144043, -2.2058048248291016, -1.4912960529327393, -0.776787281036377, -0.06227827072143555, 0.6522307395935059, 1.366739273071289, 2.0812482833862305, 2.795755386352539, 3.5102643966674805, 4.224773406982422, 4.939281940460205, 5.6537909507751465, 6.368299961090088, 7.082808494567871, 7.7973175048828125, 8.511826515197754, 9.226335525512695, 9.940844535827637, 10.655353546142578, 11.369861602783203, 12.084371566772461, 12.798879623413086, 13.513388633728027, 14.227897644042969, 14.94240665435791, 15.656915664672852, 16.371423721313477, 17.085933685302734, 17.80044174194336, 18.514949798583984, 19.229459762573242, 19.9439697265625, 20.658477783203125, 21.372987747192383, 22.087495803833008, 22.802005767822266, 23.51651382446289, 24.231021881103516, 24.945531845092773, 25.6600399017334]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 4.0, 6.0, 8.0, 11.0, 20.0, 22.0, 44.0, 79.0, 132.0, 214.0, 408.0, 658.0, 1142.0, 1883.0, 3282.0, 5854.0, 10440.0, 18940.0, 33288.0, 58428.0, 97039.0, 144974.0, 180940.0, 172413.0, 128302.0, 81032.0, 47649.0, 26782.0, 14970.0, 8389.0, 4777.0, 2684.0, 1524.0, 867.0, 552.0, 304.0, 203.0, 116.0, 73.0, 39.0, 18.0, 25.0, 12.0, 10.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.126953125, -3.0184326171875, -2.909912109375, -2.8013916015625, -2.69287109375, -2.5843505859375, -2.475830078125, -2.3673095703125, -2.2587890625, -2.1502685546875, -2.041748046875, -1.9332275390625, -1.82470703125, -1.7161865234375, -1.607666015625, -1.4991455078125, -1.390625, -1.2821044921875, -1.173583984375, -1.0650634765625, -0.95654296875, -0.8480224609375, -0.739501953125, -0.6309814453125, -0.5224609375, -0.4139404296875, -0.305419921875, -0.1968994140625, -0.08837890625, 0.0201416015625, 0.128662109375, 0.2371826171875, 0.345703125, 0.4542236328125, 0.562744140625, 0.6712646484375, 0.77978515625, 0.8883056640625, 0.996826171875, 1.1053466796875, 1.2138671875, 1.3223876953125, 1.430908203125, 1.5394287109375, 1.64794921875, 1.7564697265625, 1.864990234375, 1.9735107421875, 2.08203125, 2.1905517578125, 2.299072265625, 2.4075927734375, 2.51611328125, 2.6246337890625, 2.733154296875, 2.8416748046875, 2.9501953125, 3.0587158203125, 3.167236328125, 3.2757568359375, 3.38427734375, 3.4927978515625, 3.601318359375, 3.7098388671875, 3.818359375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 3.0, 4.0, 4.0, 7.0, 9.0, 13.0, 8.0, 13.0, 17.0, 16.0, 25.0, 18.0, 23.0, 25.0, 30.0, 34.0, 29.0, 41.0, 41.0, 39.0, 41.0, 55.0, 49.0, 58.0, 41.0, 34.0, 35.0, 36.0, 23.0, 34.0, 32.0, 30.0, 18.0, 28.0, 20.0, 19.0, 10.0, 13.0, 7.0, 6.0, 6.0, 5.0, 4.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.015625, -20.28955078125, -19.5634765625, -18.83740234375, -18.111328125, -17.38525390625, -16.6591796875, -15.93310546875, -15.20703125, -14.48095703125, -13.7548828125, -13.02880859375, -12.302734375, -11.57666015625, -10.8505859375, -10.12451171875, -9.3984375, -8.67236328125, -7.9462890625, -7.22021484375, -6.494140625, -5.76806640625, -5.0419921875, -4.31591796875, -3.58984375, -2.86376953125, -2.1376953125, -1.41162109375, -0.685546875, 0.04052734375, 0.7666015625, 1.49267578125, 2.21875, 2.94482421875, 3.6708984375, 4.39697265625, 5.123046875, 5.84912109375, 6.5751953125, 7.30126953125, 8.02734375, 8.75341796875, 9.4794921875, 10.20556640625, 10.931640625, 11.65771484375, 12.3837890625, 13.10986328125, 13.8359375, 14.56201171875, 15.2880859375, 16.01416015625, 16.740234375, 17.46630859375, 18.1923828125, 18.91845703125, 19.64453125, 20.37060546875, 21.0966796875, 21.82275390625, 22.548828125, 23.27490234375, 24.0009765625, 24.72705078125, 25.453125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 6.0, 8.0, 13.0, 9.0, 18.0, 42.0, 58.0, 90.0, 154.0, 196.0, 320.0, 404.0, 676.0, 1103.0, 1510.0, 2449.0, 3477.0, 5676.0, 8292.0, 12620.0, 18986.0, 27648.0, 40783.0, 57939.0, 78922.0, 101194.0, 118747.0, 124217.0, 114380.0, 95073.0, 72195.0, 51801.0, 36123.0, 24705.0, 16438.0, 11062.0, 7205.0, 4831.0, 3085.0, 2063.0, 1349.0, 936.0, 588.0, 413.0, 261.0, 184.0, 120.0, 80.0, 43.0, 28.0, 16.0, 11.0, 9.0, 6.0, 1.0, 5.0, 1.0, 0.0, 1.0], "bins": [-2.62890625, -2.547637939453125, -2.46636962890625, -2.385101318359375, -2.3038330078125, -2.222564697265625, -2.14129638671875, -2.060028076171875, -1.978759765625, -1.897491455078125, -1.81622314453125, -1.734954833984375, -1.6536865234375, -1.572418212890625, -1.49114990234375, -1.409881591796875, -1.32861328125, -1.247344970703125, -1.16607666015625, -1.084808349609375, -1.0035400390625, -0.922271728515625, -0.84100341796875, -0.759735107421875, -0.678466796875, -0.597198486328125, -0.51593017578125, -0.434661865234375, -0.3533935546875, -0.272125244140625, -0.19085693359375, -0.109588623046875, -0.0283203125, 0.052947998046875, 0.13421630859375, 0.215484619140625, 0.2967529296875, 0.378021240234375, 0.45928955078125, 0.540557861328125, 0.621826171875, 0.703094482421875, 0.78436279296875, 0.865631103515625, 0.9468994140625, 1.028167724609375, 1.10943603515625, 1.190704345703125, 1.27197265625, 1.353240966796875, 1.43450927734375, 1.515777587890625, 1.5970458984375, 1.678314208984375, 1.75958251953125, 1.840850830078125, 1.922119140625, 2.003387451171875, 2.08465576171875, 2.165924072265625, 2.2471923828125, 2.328460693359375, 2.40972900390625, 2.490997314453125, 2.572265625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 3.0, 0.0, 0.0, 6.0, 6.0, 5.0, 8.0, 5.0, 20.0, 12.0, 14.0, 12.0, 24.0, 22.0, 18.0, 29.0, 31.0, 27.0, 31.0, 36.0, 40.0, 43.0, 44.0, 46.0, 39.0, 37.0, 41.0, 45.0, 35.0, 45.0, 28.0, 32.0, 28.0, 31.0, 27.0, 25.0, 21.0, 24.0, 11.0, 15.0, 11.0, 6.0, 7.0, 5.0, 4.0, 6.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.484375, -13.014404296875, -12.54443359375, -12.074462890625, -11.6044921875, -11.134521484375, -10.66455078125, -10.194580078125, -9.724609375, -9.254638671875, -8.78466796875, -8.314697265625, -7.8447265625, -7.374755859375, -6.90478515625, -6.434814453125, -5.96484375, -5.494873046875, -5.02490234375, -4.554931640625, -4.0849609375, -3.614990234375, -3.14501953125, -2.675048828125, -2.205078125, -1.735107421875, -1.26513671875, -0.795166015625, -0.3251953125, 0.144775390625, 0.61474609375, 1.084716796875, 1.5546875, 2.024658203125, 2.49462890625, 2.964599609375, 3.4345703125, 3.904541015625, 4.37451171875, 4.844482421875, 5.314453125, 5.784423828125, 6.25439453125, 6.724365234375, 7.1943359375, 7.664306640625, 8.13427734375, 8.604248046875, 9.07421875, 9.544189453125, 10.01416015625, 10.484130859375, 10.9541015625, 11.424072265625, 11.89404296875, 12.364013671875, 12.833984375, 13.303955078125, 13.77392578125, 14.243896484375, 14.7138671875, 15.183837890625, 15.65380859375, 16.123779296875, 16.59375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [5.0, 1.0, 4.0, 3.0, 3.0, 6.0, 17.0, 17.0, 20.0, 38.0, 61.0, 86.0, 112.0, 197.0, 245.0, 372.0, 555.0, 843.0, 1205.0, 1813.0, 2739.0, 3976.0, 5924.0, 9085.0, 13667.0, 20706.0, 31518.0, 47260.0, 68321.0, 94857.0, 122216.0, 138711.0, 130963.0, 106799.0, 79761.0, 55177.0, 37626.0, 24909.0, 16019.0, 10884.0, 7143.0, 4760.0, 3208.0, 2131.0, 1529.0, 946.0, 715.0, 446.0, 316.0, 239.0, 145.0, 92.0, 54.0, 43.0, 32.0, 17.0, 14.0, 9.0, 8.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.2164306640625, -0.20960426330566406, -0.20277786254882812, -0.1959514617919922, -0.18912506103515625, -0.1822986602783203, -0.17547225952148438, -0.16864585876464844, -0.1618194580078125, -0.15499305725097656, -0.14816665649414062, -0.1413402557373047, -0.13451385498046875, -0.1276874542236328, -0.12086105346679688, -0.11403465270996094, -0.107208251953125, -0.10038185119628906, -0.09355545043945312, -0.08672904968261719, -0.07990264892578125, -0.07307624816894531, -0.06624984741210938, -0.05942344665527344, -0.0525970458984375, -0.04577064514160156, -0.038944244384765625, -0.03211784362792969, -0.02529144287109375, -0.018465042114257812, -0.011638641357421875, -0.0048122406005859375, 0.00201416015625, 0.008840560913085938, 0.015666961669921875, 0.022493362426757812, 0.02931976318359375, 0.03614616394042969, 0.042972564697265625, 0.04979896545410156, 0.0566253662109375, 0.06345176696777344, 0.07027816772460938, 0.07710456848144531, 0.08393096923828125, 0.09075736999511719, 0.09758377075195312, 0.10441017150878906, 0.111236572265625, 0.11806297302246094, 0.12488937377929688, 0.1317157745361328, 0.13854217529296875, 0.1453685760498047, 0.15219497680664062, 0.15902137756347656, 0.1658477783203125, 0.17267417907714844, 0.17950057983398438, 0.1863269805908203, 0.19315338134765625, 0.1999797821044922, 0.20680618286132812, 0.21363258361816406, 0.220458984375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 6.0, 3.0, 8.0, 3.0, 2.0, 14.0, 13.0, 21.0, 14.0, 13.0, 27.0, 22.0, 26.0, 36.0, 37.0, 36.0, 50.0, 46.0, 43.0, 50.0, 46.0, 50.0, 49.0, 38.0, 47.0, 43.0, 42.0, 46.0, 28.0, 21.0, 27.0, 22.0, 19.0, 8.0, 9.0, 12.0, 7.0, 5.0, 6.0, 3.0, 3.0, 4.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.641843795776367e-05, -3.528594970703125e-05, -3.415346145629883e-05, -3.3020973205566406e-05, -3.1888484954833984e-05, -3.075599670410156e-05, -2.962350845336914e-05, -2.849102020263672e-05, -2.7358531951904297e-05, -2.6226043701171875e-05, -2.5093555450439453e-05, -2.396106719970703e-05, -2.282857894897461e-05, -2.1696090698242188e-05, -2.0563602447509766e-05, -1.9431114196777344e-05, -1.8298625946044922e-05, -1.71661376953125e-05, -1.6033649444580078e-05, -1.4901161193847656e-05, -1.3768672943115234e-05, -1.2636184692382812e-05, -1.150369644165039e-05, -1.0371208190917969e-05, -9.238719940185547e-06, -8.106231689453125e-06, -6.973743438720703e-06, -5.841255187988281e-06, -4.708766937255859e-06, -3.5762786865234375e-06, -2.4437904357910156e-06, -1.3113021850585938e-06, -1.7881393432617188e-07, 9.5367431640625e-07, 2.086162567138672e-06, 3.2186508178710938e-06, 4.351139068603516e-06, 5.4836273193359375e-06, 6.616115570068359e-06, 7.748603820800781e-06, 8.881092071533203e-06, 1.0013580322265625e-05, 1.1146068572998047e-05, 1.2278556823730469e-05, 1.341104507446289e-05, 1.4543533325195312e-05, 1.5676021575927734e-05, 1.6808509826660156e-05, 1.7940998077392578e-05, 1.9073486328125e-05, 2.0205974578857422e-05, 2.1338462829589844e-05, 2.2470951080322266e-05, 2.3603439331054688e-05, 2.473592758178711e-05, 2.586841583251953e-05, 2.7000904083251953e-05, 2.8133392333984375e-05, 2.9265880584716797e-05, 3.039836883544922e-05, 3.153085708618164e-05, 3.266334533691406e-05, 3.3795833587646484e-05, 3.4928321838378906e-05, 3.606081008911133e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 5.0, 3.0, 4.0, 9.0, 16.0, 8.0, 15.0, 18.0, 33.0, 57.0, 102.0, 154.0, 199.0, 321.0, 455.0, 687.0, 1007.0, 1578.0, 2255.0, 3391.0, 5148.0, 7816.0, 11783.0, 17991.0, 27338.0, 41200.0, 61750.0, 89427.0, 121036.0, 144989.0, 142284.0, 115147.0, 83076.0, 56963.0, 38240.0, 25168.0, 16467.0, 10883.0, 7261.0, 4707.0, 3096.0, 2090.0, 1483.0, 955.0, 668.0, 410.0, 290.0, 215.0, 129.0, 74.0, 58.0, 38.0, 20.0, 20.0, 11.0, 10.0, 6.0, 4.0, 4.0, 1.0, 2.0], "bins": [-0.440673828125, -0.4272804260253906, -0.41388702392578125, -0.4004936218261719, -0.3871002197265625, -0.3737068176269531, -0.36031341552734375, -0.3469200134277344, -0.333526611328125, -0.3201332092285156, -0.30673980712890625, -0.2933464050292969, -0.2799530029296875, -0.2665596008300781, -0.25316619873046875, -0.23977279663085938, -0.22637939453125, -0.21298599243164062, -0.19959259033203125, -0.18619918823242188, -0.1728057861328125, -0.15941238403320312, -0.14601898193359375, -0.13262557983398438, -0.119232177734375, -0.10583877563476562, -0.09244537353515625, -0.07905197143554688, -0.0656585693359375, -0.052265167236328125, -0.03887176513671875, -0.025478363037109375, -0.0120849609375, 0.001308441162109375, 0.01470184326171875, 0.028095245361328125, 0.0414886474609375, 0.054882049560546875, 0.06827545166015625, 0.08166885375976562, 0.095062255859375, 0.10845565795898438, 0.12184906005859375, 0.13524246215820312, 0.1486358642578125, 0.16202926635742188, 0.17542266845703125, 0.18881607055664062, 0.20220947265625, 0.21560287475585938, 0.22899627685546875, 0.24238967895507812, 0.2557830810546875, 0.2691764831542969, 0.28256988525390625, 0.2959632873535156, 0.309356689453125, 0.3227500915527344, 0.33614349365234375, 0.3495368957519531, 0.3629302978515625, 0.3763236999511719, 0.38971710205078125, 0.4031105041503906, 0.41650390625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 10.0, 9.0, 6.0, 10.0, 9.0, 14.0, 12.0, 10.0, 10.0, 16.0, 27.0, 37.0, 32.0, 51.0, 52.0, 85.0, 77.0, 69.0, 72.0, 58.0, 55.0, 49.0, 50.0, 38.0, 21.0, 32.0, 16.0, 14.0, 12.0, 10.0, 8.0, 6.0, 8.0, 5.0, 6.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2213134765625, -0.2126331329345703, -0.20395278930664062, -0.19527244567871094, -0.18659210205078125, -0.17791175842285156, -0.16923141479492188, -0.1605510711669922, -0.1518707275390625, -0.1431903839111328, -0.13451004028320312, -0.12582969665527344, -0.11714935302734375, -0.10846900939941406, -0.09978866577148438, -0.09110832214355469, -0.082427978515625, -0.07374763488769531, -0.06506729125976562, -0.05638694763183594, -0.04770660400390625, -0.03902626037597656, -0.030345916748046875, -0.021665573120117188, -0.0129852294921875, -0.0043048858642578125, 0.004375457763671875, 0.013055801391601562, 0.02173614501953125, 0.030416488647460938, 0.039096832275390625, 0.04777717590332031, 0.05645751953125, 0.06513786315917969, 0.07381820678710938, 0.08249855041503906, 0.09117889404296875, 0.09985923767089844, 0.10853958129882812, 0.11721992492675781, 0.1259002685546875, 0.1345806121826172, 0.14326095581054688, 0.15194129943847656, 0.16062164306640625, 0.16930198669433594, 0.17798233032226562, 0.1866626739501953, 0.195343017578125, 0.2040233612060547, 0.21270370483398438, 0.22138404846191406, 0.23006439208984375, 0.23874473571777344, 0.24742507934570312, 0.2561054229736328, 0.2647857666015625, 0.2734661102294922, 0.2821464538574219, 0.29082679748535156, 0.29950714111328125, 0.30818748474121094, 0.3168678283691406, 0.3255481719970703, 0.334228515625]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 3.0, 1.0, 2.0, 7.0, 5.0, 3.0, 5.0, 15.0, 8.0, 13.0, 28.0, 26.0, 26.0, 34.0, 36.0, 36.0, 37.0, 48.0, 58.0, 38.0, 45.0, 53.0, 45.0, 36.0, 29.0, 58.0, 52.0, 44.0, 34.0, 22.0, 25.0, 23.0, 18.0, 17.0, 21.0, 18.0, 4.0, 6.0, 6.0, 8.0, 1.0, 6.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.251113891601562, -19.63152503967285, -19.01193618774414, -18.39234733581543, -17.77275848388672, -17.153169631958008, -16.533580780029297, -15.91399097442627, -15.294402122497559, -14.674813270568848, -14.055224418640137, -13.435635566711426, -12.816045761108398, -12.196456909179688, -11.576868057250977, -10.957279205322266, -10.337690353393555, -9.718101501464844, -9.098512649536133, -8.478923797607422, -7.859334468841553, -7.239745616912842, -6.620156288146973, -6.000567436218262, -5.380978584289551, -4.76138973236084, -4.141800880432129, -3.5222115516662598, -2.902622699737549, -2.283033847808838, -1.6634447574615479, -1.0438556671142578, -0.4242687225341797, 0.1953202486038208, 0.8149092197418213, 1.4344981908798218, 2.0540871620178223, 2.673676013946533, 3.2932651042938232, 3.9128541946411133, 4.532443046569824, 5.152031898498535, 5.771620750427246, 6.391210079193115, 7.010798931121826, 7.630387783050537, 8.249977111816406, 8.869565963745117, 9.489154815673828, 10.108743667602539, 10.72833251953125, 11.347921371459961, 11.967510223388672, 12.587099075317383, 13.20668888092041, 13.826277732849121, 14.445866584777832, 15.065455436706543, 15.685044288635254, 16.30463409423828, 16.924222946166992, 17.543811798095703, 18.163400650024414, 18.782989501953125, 19.402578353881836]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 2.0, 3.0, 5.0, 5.0, 12.0, 11.0, 13.0, 13.0, 14.0, 23.0, 20.0, 22.0, 26.0, 22.0, 33.0, 31.0, 39.0, 47.0, 46.0, 46.0, 49.0, 55.0, 42.0, 55.0, 44.0, 36.0, 31.0, 38.0, 24.0, 29.0, 26.0, 25.0, 19.0, 30.0, 17.0, 7.0, 15.0, 5.0, 9.0, 8.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.15969467163086, -19.44611167907715, -18.732526779174805, -18.018943786621094, -17.305360794067383, -16.591777801513672, -15.878192901611328, -15.164609909057617, -14.45102596282959, -13.737442016601562, -13.023859024047852, -12.310275077819824, -11.596691131591797, -10.883108139038086, -10.169524192810059, -9.455940246582031, -8.74235725402832, -8.028773307800293, -7.315190315246582, -6.601606369018555, -5.8880228996276855, -5.174439430236816, -4.460855484008789, -3.74727201461792, -3.033688545227051, -2.3201050758361816, -1.6065213680267334, -0.8929376602172852, -0.17935419082641602, 0.5342292785644531, 1.2478132247924805, 1.9613966941833496, 2.6749801635742188, 3.388563632965088, 4.102147102355957, 4.815731048583984, 5.5293145179748535, 6.242897987365723, 6.95648193359375, 7.670065402984619, 8.383648872375488, 9.097232818603516, 9.810815811157227, 10.524399757385254, 11.237983703613281, 11.951566696166992, 12.66515064239502, 13.378734588623047, 14.092317581176758, 14.805901527404785, 15.519484519958496, 16.233068466186523, 16.946651458740234, 17.660236358642578, 18.37381935119629, 19.08740234375, 19.800987243652344, 20.514570236206055, 21.2281551361084, 21.94173812866211, 22.65532112121582, 23.36890411376953, 24.082489013671875, 24.796072006225586, 25.509654998779297]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 14.0, 9.0, 14.0, 39.0, 42.0, 76.0, 112.0, 205.0, 307.0, 479.0, 778.0, 1231.0, 1993.0, 3005.0, 4376.0, 6943.0, 10165.0, 14581.0, 21117.0, 28688.0, 38454.0, 49283.0, 61294.0, 72789.0, 82085.0, 88408.0, 90607.0, 88222.0, 81048.0, 70486.0, 59095.0, 47327.0, 36586.0, 27174.0, 19688.0, 13849.0, 9591.0, 6447.0, 4170.0, 2775.0, 1760.0, 1177.0, 763.0, 506.0, 298.0, 202.0, 107.0, 78.0, 59.0, 23.0, 15.0, 8.0, 3.0, 6.0, 3.0, 3.0], "bins": [-9.515625, -9.2391357421875, -8.962646484375, -8.6861572265625, -8.40966796875, -8.1331787109375, -7.856689453125, -7.5802001953125, -7.3037109375, -7.0272216796875, -6.750732421875, -6.4742431640625, -6.19775390625, -5.9212646484375, -5.644775390625, -5.3682861328125, -5.091796875, -4.8153076171875, -4.538818359375, -4.2623291015625, -3.98583984375, -3.7093505859375, -3.432861328125, -3.1563720703125, -2.8798828125, -2.6033935546875, -2.326904296875, -2.0504150390625, -1.77392578125, -1.4974365234375, -1.220947265625, -0.9444580078125, -0.66796875, -0.3914794921875, -0.114990234375, 0.1614990234375, 0.43798828125, 0.7144775390625, 0.990966796875, 1.2674560546875, 1.5439453125, 1.8204345703125, 2.096923828125, 2.3734130859375, 2.64990234375, 2.9263916015625, 3.202880859375, 3.4793701171875, 3.755859375, 4.0323486328125, 4.308837890625, 4.5853271484375, 4.86181640625, 5.1383056640625, 5.414794921875, 5.6912841796875, 5.9677734375, 6.2442626953125, 6.520751953125, 6.7972412109375, 7.07373046875, 7.3502197265625, 7.626708984375, 7.9031982421875, 8.1796875]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 8.0, 15.0, 15.0, 11.0, 16.0, 23.0, 16.0, 28.0, 23.0, 35.0, 28.0, 29.0, 43.0, 36.0, 40.0, 49.0, 40.0, 42.0, 37.0, 60.0, 48.0, 33.0, 36.0, 37.0, 30.0, 27.0, 30.0, 25.0, 18.0, 22.0, 23.0, 15.0, 18.0, 5.0, 15.0, 6.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.71875, -19.0078125, -18.296875, -17.5859375, -16.875, -16.1640625, -15.453125, -14.7421875, -14.03125, -13.3203125, -12.609375, -11.8984375, -11.1875, -10.4765625, -9.765625, -9.0546875, -8.34375, -7.6328125, -6.921875, -6.2109375, -5.5, -4.7890625, -4.078125, -3.3671875, -2.65625, -1.9453125, -1.234375, -0.5234375, 0.1875, 0.8984375, 1.609375, 2.3203125, 3.03125, 3.7421875, 4.453125, 5.1640625, 5.875, 6.5859375, 7.296875, 8.0078125, 8.71875, 9.4296875, 10.140625, 10.8515625, 11.5625, 12.2734375, 12.984375, 13.6953125, 14.40625, 15.1171875, 15.828125, 16.5390625, 17.25, 17.9609375, 18.671875, 19.3828125, 20.09375, 20.8046875, 21.515625, 22.2265625, 22.9375, 23.6484375, 24.359375, 25.0703125, 25.78125]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 9.0, 5.0, 27.0, 16.0, 36.0, 64.0, 94.0, 160.0, 230.0, 397.0, 620.0, 978.0, 1653.0, 2582.0, 4005.0, 6127.0, 9355.0, 14039.0, 20227.0, 28816.0, 39158.0, 51758.0, 65399.0, 77946.0, 88041.0, 95172.0, 95737.0, 91479.0, 82339.0, 69803.0, 56335.0, 43599.0, 32278.0, 23143.0, 15979.0, 10893.0, 7213.0, 4641.0, 2980.0, 1880.0, 1299.0, 820.0, 476.0, 320.0, 192.0, 90.0, 61.0, 39.0, 22.0, 9.0, 13.0, 7.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.671875, -9.3616943359375, -9.051513671875, -8.7413330078125, -8.43115234375, -8.1209716796875, -7.810791015625, -7.5006103515625, -7.1904296875, -6.8802490234375, -6.570068359375, -6.2598876953125, -5.94970703125, -5.6395263671875, -5.329345703125, -5.0191650390625, -4.708984375, -4.3988037109375, -4.088623046875, -3.7784423828125, -3.46826171875, -3.1580810546875, -2.847900390625, -2.5377197265625, -2.2275390625, -1.9173583984375, -1.607177734375, -1.2969970703125, -0.98681640625, -0.6766357421875, -0.366455078125, -0.0562744140625, 0.25390625, 0.5640869140625, 0.874267578125, 1.1844482421875, 1.49462890625, 1.8048095703125, 2.114990234375, 2.4251708984375, 2.7353515625, 3.0455322265625, 3.355712890625, 3.6658935546875, 3.97607421875, 4.2862548828125, 4.596435546875, 4.9066162109375, 5.216796875, 5.5269775390625, 5.837158203125, 6.1473388671875, 6.45751953125, 6.7677001953125, 7.077880859375, 7.3880615234375, 7.6982421875, 8.0084228515625, 8.318603515625, 8.6287841796875, 8.93896484375, 9.2491455078125, 9.559326171875, 9.8695068359375, 10.1796875]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 5.0, 13.0, 11.0, 6.0, 7.0, 14.0, 18.0, 17.0, 22.0, 28.0, 23.0, 24.0, 32.0, 22.0, 31.0, 38.0, 22.0, 40.0, 36.0, 40.0, 43.0, 44.0, 33.0, 33.0, 34.0, 36.0, 47.0, 43.0, 33.0, 28.0, 23.0, 26.0, 19.0, 28.0, 20.0, 12.0, 12.0, 7.0, 8.0, 5.0, 6.0, 1.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.859375, -11.4283447265625, -10.997314453125, -10.5662841796875, -10.13525390625, -9.7042236328125, -9.273193359375, -8.8421630859375, -8.4111328125, -7.9801025390625, -7.549072265625, -7.1180419921875, -6.68701171875, -6.2559814453125, -5.824951171875, -5.3939208984375, -4.962890625, -4.5318603515625, -4.100830078125, -3.6697998046875, -3.23876953125, -2.8077392578125, -2.376708984375, -1.9456787109375, -1.5146484375, -1.0836181640625, -0.652587890625, -0.2215576171875, 0.20947265625, 0.6405029296875, 1.071533203125, 1.5025634765625, 1.93359375, 2.3646240234375, 2.795654296875, 3.2266845703125, 3.65771484375, 4.0887451171875, 4.519775390625, 4.9508056640625, 5.3818359375, 5.8128662109375, 6.243896484375, 6.6749267578125, 7.10595703125, 7.5369873046875, 7.968017578125, 8.3990478515625, 8.830078125, 9.2611083984375, 9.692138671875, 10.1231689453125, 10.55419921875, 10.9852294921875, 11.416259765625, 11.8472900390625, 12.2783203125, 12.7093505859375, 13.140380859375, 13.5714111328125, 14.00244140625, 14.4334716796875, 14.864501953125, 15.2955322265625, 15.7265625]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 7.0, 14.0, 21.0, 34.0, 66.0, 111.0, 172.0, 269.0, 410.0, 681.0, 1117.0, 1934.0, 3310.0, 5462.0, 9280.0, 15158.0, 24748.0, 37615.0, 54948.0, 75414.0, 95477.0, 112528.0, 119862.0, 117222.0, 103589.0, 84349.0, 63122.0, 44335.0, 29602.0, 19039.0, 11247.0, 6986.0, 4116.0, 2479.0, 1550.0, 889.0, 510.0, 313.0, 213.0, 137.0, 89.0, 50.0, 29.0, 20.0, 15.0, 7.0, 5.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.25, -4.11163330078125, -3.9732666015625, -3.83489990234375, -3.696533203125, -3.55816650390625, -3.4197998046875, -3.28143310546875, -3.14306640625, -3.00469970703125, -2.8663330078125, -2.72796630859375, -2.589599609375, -2.45123291015625, -2.3128662109375, -2.17449951171875, -2.0361328125, -1.89776611328125, -1.7593994140625, -1.62103271484375, -1.482666015625, -1.34429931640625, -1.2059326171875, -1.06756591796875, -0.92919921875, -0.79083251953125, -0.6524658203125, -0.51409912109375, -0.375732421875, -0.23736572265625, -0.0989990234375, 0.03936767578125, 0.177734375, 0.31610107421875, 0.4544677734375, 0.59283447265625, 0.731201171875, 0.86956787109375, 1.0079345703125, 1.14630126953125, 1.28466796875, 1.42303466796875, 1.5614013671875, 1.69976806640625, 1.838134765625, 1.97650146484375, 2.1148681640625, 2.25323486328125, 2.3916015625, 2.52996826171875, 2.6683349609375, 2.80670166015625, 2.945068359375, 3.08343505859375, 3.2218017578125, 3.36016845703125, 3.49853515625, 3.63690185546875, 3.7752685546875, 3.91363525390625, 4.052001953125, 4.19036865234375, 4.3287353515625, 4.46710205078125, 4.60546875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 5.0, 8.0, 9.0, 6.0, 15.0, 17.0, 12.0, 27.0, 26.0, 34.0, 23.0, 35.0, 36.0, 43.0, 41.0, 34.0, 61.0, 43.0, 45.0, 35.0, 35.0, 39.0, 43.0, 48.0, 41.0, 32.0, 31.0, 19.0, 18.0, 22.0, 21.0, 19.0, 13.0, 16.0, 15.0, 6.0, 3.0, 5.0, 4.0, 2.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0005240440368652344, -0.0005087852478027344, -0.0004935264587402344, -0.0004782676696777344, -0.0004630088806152344, -0.0004477500915527344, -0.0004324913024902344, -0.0004172325134277344, -0.0004019737243652344, -0.0003867149353027344, -0.0003714561462402344, -0.0003561973571777344, -0.0003409385681152344, -0.0003256797790527344, -0.0003104209899902344, -0.0002951622009277344, -0.0002799034118652344, -0.0002646446228027344, -0.0002493858337402344, -0.00023412704467773438, -0.00021886825561523438, -0.00020360946655273438, -0.00018835067749023438, -0.00017309188842773438, -0.00015783309936523438, -0.00014257431030273438, -0.00012731552124023438, -0.00011205673217773438, -9.679794311523438e-05, -8.153915405273438e-05, -6.628036499023438e-05, -5.1021575927734375e-05, -3.5762786865234375e-05, -2.0503997802734375e-05, -5.245208740234375e-06, 1.0013580322265625e-05, 2.5272369384765625e-05, 4.0531158447265625e-05, 5.5789947509765625e-05, 7.104873657226562e-05, 8.630752563476562e-05, 0.00010156631469726562, 0.00011682510375976562, 0.00013208389282226562, 0.00014734268188476562, 0.00016260147094726562, 0.00017786026000976562, 0.00019311904907226562, 0.00020837783813476562, 0.00022363662719726562, 0.00023889541625976562, 0.0002541542053222656, 0.0002694129943847656, 0.0002846717834472656, 0.0002999305725097656, 0.0003151893615722656, 0.0003304481506347656, 0.0003457069396972656, 0.0003609657287597656, 0.0003762245178222656, 0.0003914833068847656, 0.0004067420959472656, 0.0004220008850097656, 0.0004372596740722656, 0.0004525184631347656]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 9.0, 9.0, 10.0, 28.0, 27.0, 40.0, 59.0, 94.0, 107.0, 188.0, 266.0, 429.0, 614.0, 943.0, 1536.0, 2435.0, 3961.0, 6200.0, 9733.0, 15429.0, 23570.0, 34660.0, 50109.0, 67767.0, 86114.0, 101441.0, 110715.0, 111486.0, 102968.0, 88101.0, 69759.0, 52831.0, 37021.0, 25213.0, 16255.0, 10359.0, 6661.0, 4101.0, 2620.0, 1676.0, 1035.0, 700.0, 442.0, 281.0, 205.0, 122.0, 75.0, 59.0, 42.0, 19.0, 10.0, 11.0, 8.0, 7.0, 4.0, 1.0, 2.0, 1.0, 3.0], "bins": [-4.4296875, -4.29156494140625, -4.1534423828125, -4.01531982421875, -3.877197265625, -3.73907470703125, -3.6009521484375, -3.46282958984375, -3.32470703125, -3.18658447265625, -3.0484619140625, -2.91033935546875, -2.772216796875, -2.63409423828125, -2.4959716796875, -2.35784912109375, -2.2197265625, -2.08160400390625, -1.9434814453125, -1.80535888671875, -1.667236328125, -1.52911376953125, -1.3909912109375, -1.25286865234375, -1.11474609375, -0.97662353515625, -0.8385009765625, -0.70037841796875, -0.562255859375, -0.42413330078125, -0.2860107421875, -0.14788818359375, -0.009765625, 0.12835693359375, 0.2664794921875, 0.40460205078125, 0.542724609375, 0.68084716796875, 0.8189697265625, 0.95709228515625, 1.09521484375, 1.23333740234375, 1.3714599609375, 1.50958251953125, 1.647705078125, 1.78582763671875, 1.9239501953125, 2.06207275390625, 2.2001953125, 2.33831787109375, 2.4764404296875, 2.61456298828125, 2.752685546875, 2.89080810546875, 3.0289306640625, 3.16705322265625, 3.30517578125, 3.44329833984375, 3.5814208984375, 3.71954345703125, 3.857666015625, 3.99578857421875, 4.1339111328125, 4.27203369140625, 4.41015625]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 2.0, 4.0, 10.0, 12.0, 10.0, 13.0, 20.0, 18.0, 30.0, 37.0, 46.0, 49.0, 51.0, 57.0, 50.0, 66.0, 65.0, 63.0, 54.0, 46.0, 46.0, 45.0, 39.0, 26.0, 33.0, 21.0, 17.0, 25.0, 10.0, 10.0, 6.0, 7.0, 6.0, 1.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.353515625, -2.278472900390625, -2.20343017578125, -2.128387451171875, -2.0533447265625, -1.978302001953125, -1.90325927734375, -1.828216552734375, -1.753173828125, -1.678131103515625, -1.60308837890625, -1.528045654296875, -1.4530029296875, -1.377960205078125, -1.30291748046875, -1.227874755859375, -1.15283203125, -1.077789306640625, -1.00274658203125, -0.927703857421875, -0.8526611328125, -0.777618408203125, -0.70257568359375, -0.627532958984375, -0.552490234375, -0.477447509765625, -0.40240478515625, -0.327362060546875, -0.2523193359375, -0.177276611328125, -0.10223388671875, -0.027191162109375, 0.0478515625, 0.122894287109375, 0.19793701171875, 0.272979736328125, 0.3480224609375, 0.423065185546875, 0.49810791015625, 0.573150634765625, 0.648193359375, 0.723236083984375, 0.79827880859375, 0.873321533203125, 0.9483642578125, 1.023406982421875, 1.09844970703125, 1.173492431640625, 1.24853515625, 1.323577880859375, 1.39862060546875, 1.473663330078125, 1.5487060546875, 1.623748779296875, 1.69879150390625, 1.773834228515625, 1.848876953125, 1.923919677734375, 1.99896240234375, 2.074005126953125, 2.1490478515625, 2.224090576171875, 2.29913330078125, 2.374176025390625, 2.44921875]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 4.0, 4.0, 3.0, 6.0, 5.0, 6.0, 8.0, 10.0, 10.0, 15.0, 12.0, 17.0, 32.0, 28.0, 35.0, 25.0, 47.0, 33.0, 42.0, 44.0, 49.0, 44.0, 47.0, 47.0, 43.0, 37.0, 41.0, 35.0, 37.0, 37.0, 31.0, 30.0, 16.0, 24.0, 15.0, 18.0, 10.0, 13.0, 10.0, 7.0, 9.0, 6.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-19.210351943969727, -18.620548248291016, -18.030744552612305, -17.440940856933594, -16.851137161254883, -16.261333465576172, -15.671530723571777, -15.081727981567383, -14.491924285888672, -13.902120590209961, -13.31231689453125, -12.722513198852539, -12.132710456848145, -11.542906761169434, -10.953103065490723, -10.363300323486328, -9.7734956741333, -9.18369197845459, -8.593888282775879, -8.004085540771484, -7.414281845092773, -6.8244781494140625, -6.234674453735352, -5.644871234893799, -5.055067539215088, -4.465263843536377, -3.875460624694824, -3.2856569290161133, -2.6958534717559814, -2.1060500144958496, -1.5162463188171387, -0.9264430999755859, -0.336639404296875, 0.2531641125679016, 0.8429676294326782, 1.4327712059020996, 2.0225746631622314, 2.6123781204223633, 3.202181816101074, 3.791985034942627, 4.381788730621338, 4.971592426300049, 5.561395645141602, 6.1511993408203125, 6.741003036499023, 7.330806255340576, 7.920609951019287, 8.51041316986084, 9.10021686553955, 9.690020561218262, 10.279824256896973, 10.869626998901367, 11.459430694580078, 12.049234390258789, 12.6390380859375, 13.228841781616211, 13.818645477294922, 14.408449172973633, 14.998252868652344, 15.588056564331055, 16.177860260009766, 16.767662048339844, 17.357467651367188, 17.947269439697266, 18.537073135375977]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 6.0, 5.0, 3.0, 9.0, 12.0, 13.0, 12.0, 16.0, 16.0, 21.0, 24.0, 34.0, 30.0, 26.0, 40.0, 35.0, 40.0, 44.0, 38.0, 48.0, 57.0, 53.0, 49.0, 41.0, 40.0, 27.0, 41.0, 19.0, 24.0, 34.0, 23.0, 25.0, 23.0, 19.0, 9.0, 7.0, 12.0, 7.0, 7.0, 4.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-25.008621215820312, -24.212242126464844, -23.415864944458008, -22.61948585510254, -21.82310676574707, -21.026729583740234, -20.230350494384766, -19.433971405029297, -18.637592315673828, -17.84121322631836, -17.044836044311523, -16.248456954956055, -15.452077865600586, -14.655699729919434, -13.859321594238281, -13.062942504882812, -12.266565322875977, -11.470187187194824, -10.673808097839355, -9.877429962158203, -9.081050872802734, -8.284672737121582, -7.48829460144043, -6.691915988922119, -5.895537376403809, -5.099158763885498, -4.3027801513671875, -3.506402015686035, -2.7100234031677246, -1.913644790649414, -1.1172666549682617, -0.32088804244995117, 0.4754924774169922, 1.2718709707260132, 2.068249464035034, 2.8646278381347656, 3.661006450653076, 4.457385063171387, 5.253763198852539, 6.05014181137085, 6.84652042388916, 7.642899036407471, 8.439277648925781, 9.235655784606934, 10.032033920288086, 10.828413009643555, 11.624791145324707, 12.42116928100586, 13.217548370361328, 14.01392650604248, 14.81030559539795, 15.606683731079102, 16.40306282043457, 17.199440002441406, 17.995819091796875, 18.792198181152344, 19.588577270507812, 20.38495635986328, 21.181333541870117, 21.977712631225586, 22.774091720581055, 23.57046890258789, 24.36684799194336, 25.163227081298828, 25.959604263305664]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 3.0, 9.0, 19.0, 32.0, 33.0, 84.0, 133.0, 216.0, 391.0, 697.0, 1066.0, 1778.0, 2738.0, 4719.0, 7545.0, 11672.0, 18333.0, 28848.0, 42713.0, 63257.0, 91163.0, 127900.0, 171148.0, 222109.0, 275129.0, 323481.0, 360235.0, 380323.0, 378960.0, 355602.0, 315179.0, 265175.0, 211282.0, 162617.0, 118935.0, 84358.0, 57736.0, 39295.0, 25605.0, 16178.0, 10440.0, 6483.0, 4092.0, 2518.0, 1616.0, 953.0, 589.0, 355.0, 199.0, 139.0, 77.0, 53.0, 32.0, 22.0, 18.0, 2.0, 1.0, 5.0, 1.0, 1.0, 3.0], "bins": [-13.96875, -13.51708984375, -13.0654296875, -12.61376953125, -12.162109375, -11.71044921875, -11.2587890625, -10.80712890625, -10.35546875, -9.90380859375, -9.4521484375, -9.00048828125, -8.548828125, -8.09716796875, -7.6455078125, -7.19384765625, -6.7421875, -6.29052734375, -5.8388671875, -5.38720703125, -4.935546875, -4.48388671875, -4.0322265625, -3.58056640625, -3.12890625, -2.67724609375, -2.2255859375, -1.77392578125, -1.322265625, -0.87060546875, -0.4189453125, 0.03271484375, 0.484375, 0.93603515625, 1.3876953125, 1.83935546875, 2.291015625, 2.74267578125, 3.1943359375, 3.64599609375, 4.09765625, 4.54931640625, 5.0009765625, 5.45263671875, 5.904296875, 6.35595703125, 6.8076171875, 7.25927734375, 7.7109375, 8.16259765625, 8.6142578125, 9.06591796875, 9.517578125, 9.96923828125, 10.4208984375, 10.87255859375, 11.32421875, 11.77587890625, 12.2275390625, 12.67919921875, 13.130859375, 13.58251953125, 14.0341796875, 14.48583984375, 14.9375]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 7.0, 6.0, 7.0, 11.0, 9.0, 18.0, 15.0, 22.0, 20.0, 27.0, 31.0, 30.0, 30.0, 41.0, 42.0, 43.0, 60.0, 54.0, 49.0, 43.0, 61.0, 44.0, 55.0, 36.0, 26.0, 31.0, 39.0, 27.0, 22.0, 27.0, 18.0, 10.0, 9.0, 9.0, 7.0, 7.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.28125, -23.460693359375, -22.64013671875, -21.819580078125, -20.9990234375, -20.178466796875, -19.35791015625, -18.537353515625, -17.716796875, -16.896240234375, -16.07568359375, -15.255126953125, -14.4345703125, -13.614013671875, -12.79345703125, -11.972900390625, -11.15234375, -10.331787109375, -9.51123046875, -8.690673828125, -7.8701171875, -7.049560546875, -6.22900390625, -5.408447265625, -4.587890625, -3.767333984375, -2.94677734375, -2.126220703125, -1.3056640625, -0.485107421875, 0.33544921875, 1.156005859375, 1.9765625, 2.797119140625, 3.61767578125, 4.438232421875, 5.2587890625, 6.079345703125, 6.89990234375, 7.720458984375, 8.541015625, 9.361572265625, 10.18212890625, 11.002685546875, 11.8232421875, 12.643798828125, 13.46435546875, 14.284912109375, 15.10546875, 15.926025390625, 16.74658203125, 17.567138671875, 18.3876953125, 19.208251953125, 20.02880859375, 20.849365234375, 21.669921875, 22.490478515625, 23.31103515625, 24.131591796875, 24.9521484375, 25.772705078125, 26.59326171875, 27.413818359375, 28.234375]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 14.0, 16.0, 44.0, 71.0, 125.0, 236.0, 403.0, 758.0, 1286.0, 2119.0, 3817.0, 6609.0, 11372.0, 19164.0, 31287.0, 49612.0, 76882.0, 114512.0, 163466.0, 221435.0, 284619.0, 344011.0, 389662.0, 414948.0, 411032.0, 382601.0, 332920.0, 272654.0, 210752.0, 153137.0, 106948.0, 71584.0, 45803.0, 28879.0, 17209.0, 10151.0, 5919.0, 3493.0, 2106.0, 1184.0, 635.0, 348.0, 215.0, 121.0, 55.0, 31.0, 22.0, 8.0, 5.0, 7.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.40625, -17.846923828125, -17.28759765625, -16.728271484375, -16.1689453125, -15.609619140625, -15.05029296875, -14.490966796875, -13.931640625, -13.372314453125, -12.81298828125, -12.253662109375, -11.6943359375, -11.135009765625, -10.57568359375, -10.016357421875, -9.45703125, -8.897705078125, -8.33837890625, -7.779052734375, -7.2197265625, -6.660400390625, -6.10107421875, -5.541748046875, -4.982421875, -4.423095703125, -3.86376953125, -3.304443359375, -2.7451171875, -2.185791015625, -1.62646484375, -1.067138671875, -0.5078125, 0.051513671875, 0.61083984375, 1.170166015625, 1.7294921875, 2.288818359375, 2.84814453125, 3.407470703125, 3.966796875, 4.526123046875, 5.08544921875, 5.644775390625, 6.2041015625, 6.763427734375, 7.32275390625, 7.882080078125, 8.44140625, 9.000732421875, 9.56005859375, 10.119384765625, 10.6787109375, 11.238037109375, 11.79736328125, 12.356689453125, 12.916015625, 13.475341796875, 14.03466796875, 14.593994140625, 15.1533203125, 15.712646484375, 16.27197265625, 16.831298828125, 17.390625]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 9.0, 5.0, 10.0, 14.0, 19.0, 31.0, 21.0, 40.0, 39.0, 55.0, 74.0, 74.0, 93.0, 120.0, 115.0, 163.0, 161.0, 170.0, 183.0, 206.0, 191.0, 210.0, 208.0, 216.0, 199.0, 200.0, 180.0, 180.0, 141.0, 132.0, 120.0, 99.0, 87.0, 78.0, 45.0, 43.0, 41.0, 30.0, 24.0, 18.0, 8.0, 7.0, 7.0, 7.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.3125, -9.96484375, -9.6171875, -9.26953125, -8.921875, -8.57421875, -8.2265625, -7.87890625, -7.53125, -7.18359375, -6.8359375, -6.48828125, -6.140625, -5.79296875, -5.4453125, -5.09765625, -4.75, -4.40234375, -4.0546875, -3.70703125, -3.359375, -3.01171875, -2.6640625, -2.31640625, -1.96875, -1.62109375, -1.2734375, -0.92578125, -0.578125, -0.23046875, 0.1171875, 0.46484375, 0.8125, 1.16015625, 1.5078125, 1.85546875, 2.203125, 2.55078125, 2.8984375, 3.24609375, 3.59375, 3.94140625, 4.2890625, 4.63671875, 4.984375, 5.33203125, 5.6796875, 6.02734375, 6.375, 6.72265625, 7.0703125, 7.41796875, 7.765625, 8.11328125, 8.4609375, 8.80859375, 9.15625, 9.50390625, 9.8515625, 10.19921875, 10.546875, 10.89453125, 11.2421875, 11.58984375, 11.9375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 5.0, 5.0, 13.0, 9.0, 15.0, 12.0, 16.0, 25.0, 27.0, 36.0, 49.0, 39.0, 38.0, 62.0, 62.0, 50.0, 58.0, 44.0, 47.0, 41.0, 48.0, 44.0, 33.0, 47.0, 31.0, 32.0, 16.0, 22.0, 22.0, 8.0, 17.0, 6.0, 4.0, 5.0, 4.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.577030181884766, -30.613937377929688, -29.65084457397461, -28.68775177001953, -27.724658966064453, -26.761566162109375, -25.798473358154297, -24.83538055419922, -23.87228775024414, -22.909194946289062, -21.946102142333984, -20.983009338378906, -20.019916534423828, -19.05682373046875, -18.093730926513672, -17.130638122558594, -16.16754722595215, -15.20445442199707, -14.241361618041992, -13.278268814086914, -12.315176010131836, -11.352083206176758, -10.388991355895996, -9.425898551940918, -8.46280574798584, -7.499712944030762, -6.536620140075684, -5.573527812957764, -4.6104350090026855, -3.6473422050476074, -2.6842498779296875, -1.7211570739746094, -0.7580642700195312, 0.20502841472625732, 1.168121099472046, 2.131213665008545, 3.094306468963623, 4.057399272918701, 5.020491600036621, 5.983584403991699, 6.946677207946777, 7.9097700119018555, 8.872862815856934, 9.835954666137695, 10.799047470092773, 11.762140274047852, 12.72523307800293, 13.688325881958008, 14.651418685913086, 15.614511489868164, 16.577604293823242, 17.54069709777832, 18.5037899017334, 19.466882705688477, 20.429973602294922, 21.39306640625, 22.356159210205078, 23.319252014160156, 24.282344818115234, 25.245437622070312, 26.20853042602539, 27.17162322998047, 28.134716033935547, 29.097808837890625, 30.060901641845703]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 5.0, 4.0, 1.0, 3.0, 8.0, 9.0, 16.0, 17.0, 19.0, 12.0, 30.0, 22.0, 32.0, 38.0, 35.0, 33.0, 40.0, 58.0, 52.0, 44.0, 41.0, 41.0, 51.0, 33.0, 35.0, 47.0, 44.0, 33.0, 21.0, 30.0, 36.0, 26.0, 19.0, 13.0, 15.0, 10.0, 12.0, 7.0, 5.0, 5.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-35.46427917480469, -34.44151306152344, -33.41874313354492, -32.39597702026367, -31.37320899963379, -30.350440979003906, -29.327674865722656, -28.304906845092773, -27.28213882446289, -26.259370803833008, -25.236602783203125, -24.213836669921875, -23.191068649291992, -22.16830062866211, -21.14553451538086, -20.122766494750977, -19.099998474121094, -18.07723045349121, -17.054462432861328, -16.031696319580078, -15.008928298950195, -13.986160278320312, -12.963393211364746, -11.94062614440918, -10.917858123779297, -9.895090103149414, -8.872323036193848, -7.849555492401123, -6.826787948608398, -5.804020404815674, -4.781252861022949, -3.7584853172302246, -2.7357139587402344, -1.7129464149475098, -0.6901788711547852, 0.33258867263793945, 1.355356216430664, 2.3781237602233887, 3.4008913040161133, 4.423658847808838, 5.4464263916015625, 6.469193935394287, 7.491961479187012, 8.514728546142578, 9.537496566772461, 10.560264587402344, 11.58303165435791, 12.605798721313477, 13.62856674194336, 14.651334762573242, 15.674101829528809, 16.696868896484375, 17.719636917114258, 18.74240493774414, 19.76517105102539, 20.787939071655273, 21.810707092285156, 22.83347511291504, 23.856243133544922, 24.879009246826172, 25.901777267456055, 26.924545288085938, 27.947311401367188, 28.97007942199707, 29.992847442626953]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 1.0, 12.0, 16.0, 17.0, 26.0, 51.0, 85.0, 115.0, 190.0, 300.0, 450.0, 725.0, 1180.0, 1926.0, 3108.0, 5443.0, 9340.0, 16154.0, 28211.0, 48811.0, 80772.0, 123981.0, 163005.0, 173114.0, 142854.0, 99699.0, 62447.0, 36342.0, 21026.0, 11894.0, 6870.0, 4064.0, 2442.0, 1403.0, 894.0, 552.0, 368.0, 242.0, 149.0, 90.0, 59.0, 39.0, 34.0, 15.0, 10.0, 12.0, 5.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0], "bins": [-4.88671875, -4.74395751953125, -4.6011962890625, -4.45843505859375, -4.315673828125, -4.17291259765625, -4.0301513671875, -3.88739013671875, -3.74462890625, -3.60186767578125, -3.4591064453125, -3.31634521484375, -3.173583984375, -3.03082275390625, -2.8880615234375, -2.74530029296875, -2.6025390625, -2.45977783203125, -2.3170166015625, -2.17425537109375, -2.031494140625, -1.88873291015625, -1.7459716796875, -1.60321044921875, -1.46044921875, -1.31768798828125, -1.1749267578125, -1.03216552734375, -0.889404296875, -0.74664306640625, -0.6038818359375, -0.46112060546875, -0.318359375, -0.17559814453125, -0.0328369140625, 0.10992431640625, 0.252685546875, 0.39544677734375, 0.5382080078125, 0.68096923828125, 0.82373046875, 0.96649169921875, 1.1092529296875, 1.25201416015625, 1.394775390625, 1.53753662109375, 1.6802978515625, 1.82305908203125, 1.9658203125, 2.10858154296875, 2.2513427734375, 2.39410400390625, 2.536865234375, 2.67962646484375, 2.8223876953125, 2.96514892578125, 3.10791015625, 3.25067138671875, 3.3934326171875, 3.53619384765625, 3.678955078125, 3.82171630859375, 3.9644775390625, 4.10723876953125, 4.25]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 7.0, 7.0, 3.0, 15.0, 13.0, 17.0, 16.0, 12.0, 32.0, 23.0, 25.0, 41.0, 43.0, 38.0, 49.0, 37.0, 40.0, 37.0, 47.0, 50.0, 47.0, 45.0, 41.0, 36.0, 40.0, 33.0, 31.0, 29.0, 32.0, 21.0, 19.0, 16.0, 15.0, 13.0, 12.0, 7.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-37.0625, -35.9921875, -34.921875, -33.8515625, -32.78125, -31.7109375, -30.640625, -29.5703125, -28.5, -27.4296875, -26.359375, -25.2890625, -24.21875, -23.1484375, -22.078125, -21.0078125, -19.9375, -18.8671875, -17.796875, -16.7265625, -15.65625, -14.5859375, -13.515625, -12.4453125, -11.375, -10.3046875, -9.234375, -8.1640625, -7.09375, -6.0234375, -4.953125, -3.8828125, -2.8125, -1.7421875, -0.671875, 0.3984375, 1.46875, 2.5390625, 3.609375, 4.6796875, 5.75, 6.8203125, 7.890625, 8.9609375, 10.03125, 11.1015625, 12.171875, 13.2421875, 14.3125, 15.3828125, 16.453125, 17.5234375, 18.59375, 19.6640625, 20.734375, 21.8046875, 22.875, 23.9453125, 25.015625, 26.0859375, 27.15625, 28.2265625, 29.296875, 30.3671875, 31.4375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 5.0, 6.0, 9.0, 20.0, 36.0, 42.0, 82.0, 106.0, 151.0, 229.0, 401.0, 578.0, 839.0, 1390.0, 1930.0, 2946.0, 4433.0, 6630.0, 9734.0, 14906.0, 22036.0, 33016.0, 48295.0, 68988.0, 93823.0, 117820.0, 131299.0, 124732.0, 105989.0, 80424.0, 57229.0, 39530.0, 27209.0, 17725.0, 12151.0, 7941.0, 5386.0, 3440.0, 2407.0, 1593.0, 1046.0, 673.0, 469.0, 293.0, 220.0, 123.0, 83.0, 49.0, 37.0, 23.0, 11.0, 13.0, 11.0, 6.0, 1.0, 1.0, 1.0], "bins": [-3.7890625, -3.676727294921875, -3.56439208984375, -3.452056884765625, -3.3397216796875, -3.227386474609375, -3.11505126953125, -3.002716064453125, -2.890380859375, -2.778045654296875, -2.66571044921875, -2.553375244140625, -2.4410400390625, -2.328704833984375, -2.21636962890625, -2.104034423828125, -1.99169921875, -1.879364013671875, -1.76702880859375, -1.654693603515625, -1.5423583984375, -1.430023193359375, -1.31768798828125, -1.205352783203125, -1.093017578125, -0.980682373046875, -0.86834716796875, -0.756011962890625, -0.6436767578125, -0.531341552734375, -0.41900634765625, -0.306671142578125, -0.1943359375, -0.082000732421875, 0.03033447265625, 0.142669677734375, 0.2550048828125, 0.367340087890625, 0.47967529296875, 0.592010498046875, 0.704345703125, 0.816680908203125, 0.92901611328125, 1.041351318359375, 1.1536865234375, 1.266021728515625, 1.37835693359375, 1.490692138671875, 1.60302734375, 1.715362548828125, 1.82769775390625, 1.940032958984375, 2.0523681640625, 2.164703369140625, 2.27703857421875, 2.389373779296875, 2.501708984375, 2.614044189453125, 2.72637939453125, 2.838714599609375, 2.9510498046875, 3.063385009765625, 3.17572021484375, 3.288055419921875, 3.400390625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 5.0, 5.0, 7.0, 10.0, 15.0, 6.0, 8.0, 8.0, 19.0, 12.0, 19.0, 17.0, 17.0, 21.0, 21.0, 28.0, 39.0, 26.0, 34.0, 39.0, 34.0, 43.0, 37.0, 38.0, 38.0, 32.0, 28.0, 36.0, 29.0, 33.0, 33.0, 26.0, 32.0, 21.0, 16.0, 16.0, 26.0, 20.0, 13.0, 14.0, 15.0, 6.0, 8.0, 12.0, 7.0, 9.0, 7.0, 8.0, 3.0, 2.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0], "bins": [-17.140625, -16.609130859375, -16.07763671875, -15.546142578125, -15.0146484375, -14.483154296875, -13.95166015625, -13.420166015625, -12.888671875, -12.357177734375, -11.82568359375, -11.294189453125, -10.7626953125, -10.231201171875, -9.69970703125, -9.168212890625, -8.63671875, -8.105224609375, -7.57373046875, -7.042236328125, -6.5107421875, -5.979248046875, -5.44775390625, -4.916259765625, -4.384765625, -3.853271484375, -3.32177734375, -2.790283203125, -2.2587890625, -1.727294921875, -1.19580078125, -0.664306640625, -0.1328125, 0.398681640625, 0.93017578125, 1.461669921875, 1.9931640625, 2.524658203125, 3.05615234375, 3.587646484375, 4.119140625, 4.650634765625, 5.18212890625, 5.713623046875, 6.2451171875, 6.776611328125, 7.30810546875, 7.839599609375, 8.37109375, 8.902587890625, 9.43408203125, 9.965576171875, 10.4970703125, 11.028564453125, 11.56005859375, 12.091552734375, 12.623046875, 13.154541015625, 13.68603515625, 14.217529296875, 14.7490234375, 15.280517578125, 15.81201171875, 16.343505859375, 16.875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 4.0, 4.0, 16.0, 12.0, 23.0, 28.0, 36.0, 56.0, 78.0, 127.0, 187.0, 329.0, 477.0, 631.0, 1174.0, 1646.0, 2581.0, 4131.0, 6437.0, 10351.0, 16286.0, 26193.0, 41569.0, 65272.0, 98306.0, 136082.0, 161153.0, 148991.0, 113790.0, 77336.0, 50330.0, 31283.0, 19721.0, 12340.0, 7823.0, 4991.0, 3067.0, 1994.0, 1261.0, 839.0, 533.0, 345.0, 228.0, 176.0, 97.0, 76.0, 42.0, 36.0, 18.0, 19.0, 15.0, 10.0, 4.0, 5.0, 2.0, 1.0, 3.0], "bins": [-0.38916015625, -0.3776130676269531, -0.36606597900390625, -0.3545188903808594, -0.3429718017578125, -0.3314247131347656, -0.31987762451171875, -0.3083305358886719, -0.296783447265625, -0.2852363586425781, -0.27368927001953125, -0.2621421813964844, -0.2505950927734375, -0.23904800415039062, -0.22750091552734375, -0.21595382690429688, -0.20440673828125, -0.19285964965820312, -0.18131256103515625, -0.16976547241210938, -0.1582183837890625, -0.14667129516601562, -0.13512420654296875, -0.12357711791992188, -0.112030029296875, -0.10048294067382812, -0.08893585205078125, -0.07738876342773438, -0.0658416748046875, -0.054294586181640625, -0.04274749755859375, -0.031200408935546875, -0.0196533203125, -0.008106231689453125, 0.00344085693359375, 0.014987945556640625, 0.0265350341796875, 0.038082122802734375, 0.04962921142578125, 0.061176300048828125, 0.072723388671875, 0.08427047729492188, 0.09581756591796875, 0.10736465454101562, 0.1189117431640625, 0.13045883178710938, 0.14200592041015625, 0.15355300903320312, 0.16510009765625, 0.17664718627929688, 0.18819427490234375, 0.19974136352539062, 0.2112884521484375, 0.22283554077148438, 0.23438262939453125, 0.24592971801757812, 0.257476806640625, 0.2690238952636719, 0.28057098388671875, 0.2921180725097656, 0.3036651611328125, 0.3152122497558594, 0.32675933837890625, 0.3383064270019531, 0.349853515625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 3.0, 2.0, 7.0, 6.0, 5.0, 13.0, 11.0, 24.0, 26.0, 31.0, 31.0, 34.0, 44.0, 43.0, 51.0, 53.0, 57.0, 48.0, 36.0, 66.0, 52.0, 52.0, 43.0, 30.0, 35.0, 41.0, 27.0, 39.0, 30.0, 22.0, 13.0, 11.0, 10.0, 1.0, 7.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.65648078918457e-05, -5.482882261276245e-05, -5.30928373336792e-05, -5.135685205459595e-05, -4.9620866775512695e-05, -4.788488149642944e-05, -4.614889621734619e-05, -4.441291093826294e-05, -4.267692565917969e-05, -4.0940940380096436e-05, -3.9204955101013184e-05, -3.746896982192993e-05, -3.573298454284668e-05, -3.399699926376343e-05, -3.2261013984680176e-05, -3.0525028705596924e-05, -2.8789043426513672e-05, -2.705305814743042e-05, -2.5317072868347168e-05, -2.3581087589263916e-05, -2.1845102310180664e-05, -2.0109117031097412e-05, -1.837313175201416e-05, -1.6637146472930908e-05, -1.4901161193847656e-05, -1.3165175914764404e-05, -1.1429190635681152e-05, -9.6932053565979e-06, -7.957220077514648e-06, -6.2212347984313965e-06, -4.4852495193481445e-06, -2.7492642402648926e-06, -1.0132789611816406e-06, 7.227063179016113e-07, 2.4586915969848633e-06, 4.194676876068115e-06, 5.930662155151367e-06, 7.666647434234619e-06, 9.402632713317871e-06, 1.1138617992401123e-05, 1.2874603271484375e-05, 1.4610588550567627e-05, 1.634657382965088e-05, 1.808255910873413e-05, 1.9818544387817383e-05, 2.1554529666900635e-05, 2.3290514945983887e-05, 2.502650022506714e-05, 2.676248550415039e-05, 2.8498470783233643e-05, 3.0234456062316895e-05, 3.1970441341400146e-05, 3.37064266204834e-05, 3.544241189956665e-05, 3.71783971786499e-05, 3.8914382457733154e-05, 4.0650367736816406e-05, 4.238635301589966e-05, 4.412233829498291e-05, 4.585832357406616e-05, 4.7594308853149414e-05, 4.9330294132232666e-05, 5.106627941131592e-05, 5.280226469039917e-05, 5.453824996948242e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 3.0, 13.0, 16.0, 31.0, 45.0, 62.0, 107.0, 174.0, 290.0, 421.0, 723.0, 1156.0, 1891.0, 3150.0, 5182.0, 9005.0, 15396.0, 27503.0, 49094.0, 86679.0, 146943.0, 208455.0, 194382.0, 127292.0, 73847.0, 41207.0, 23283.0, 13127.0, 7601.0, 4481.0, 2670.0, 1669.0, 1023.0, 625.0, 371.0, 233.0, 158.0, 91.0, 63.0, 29.0, 20.0, 17.0, 12.0, 8.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.85009765625, -0.8234100341796875, -0.796722412109375, -0.7700347900390625, -0.74334716796875, -0.7166595458984375, -0.689971923828125, -0.6632843017578125, -0.6365966796875, -0.6099090576171875, -0.583221435546875, -0.5565338134765625, -0.52984619140625, -0.5031585693359375, -0.476470947265625, -0.4497833251953125, -0.423095703125, -0.3964080810546875, -0.369720458984375, -0.3430328369140625, -0.31634521484375, -0.2896575927734375, -0.262969970703125, -0.2362823486328125, -0.2095947265625, -0.1829071044921875, -0.156219482421875, -0.1295318603515625, -0.10284423828125, -0.0761566162109375, -0.049468994140625, -0.0227813720703125, 0.00390625, 0.0305938720703125, 0.057281494140625, 0.0839691162109375, 0.11065673828125, 0.1373443603515625, 0.164031982421875, 0.1907196044921875, 0.2174072265625, 0.2440948486328125, 0.270782470703125, 0.2974700927734375, 0.32415771484375, 0.3508453369140625, 0.377532958984375, 0.4042205810546875, 0.430908203125, 0.4575958251953125, 0.484283447265625, 0.5109710693359375, 0.53765869140625, 0.5643463134765625, 0.591033935546875, 0.6177215576171875, 0.6444091796875, 0.6710968017578125, 0.697784423828125, 0.7244720458984375, 0.75115966796875, 0.7778472900390625, 0.804534912109375, 0.8312225341796875, 0.85791015625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 6.0, 7.0, 8.0, 8.0, 12.0, 10.0, 20.0, 17.0, 15.0, 24.0, 28.0, 47.0, 40.0, 51.0, 56.0, 74.0, 85.0, 73.0, 65.0, 54.0, 50.0, 41.0, 40.0, 28.0, 29.0, 24.0, 19.0, 11.0, 11.0, 13.0, 4.0, 6.0, 7.0, 3.0, 4.0, 6.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.40673828125, -0.39270782470703125, -0.3786773681640625, -0.36464691162109375, -0.350616455078125, -0.33658599853515625, -0.3225555419921875, -0.30852508544921875, -0.29449462890625, -0.28046417236328125, -0.2664337158203125, -0.25240325927734375, -0.238372802734375, -0.22434234619140625, -0.2103118896484375, -0.19628143310546875, -0.1822509765625, -0.16822052001953125, -0.1541900634765625, -0.14015960693359375, -0.126129150390625, -0.11209869384765625, -0.0980682373046875, -0.08403778076171875, -0.07000732421875, -0.05597686767578125, -0.0419464111328125, -0.02791595458984375, -0.013885498046875, 0.00014495849609375, 0.0141754150390625, 0.02820587158203125, 0.042236328125, 0.05626678466796875, 0.0702972412109375, 0.08432769775390625, 0.098358154296875, 0.11238861083984375, 0.1264190673828125, 0.14044952392578125, 0.15447998046875, 0.16851043701171875, 0.1825408935546875, 0.19657135009765625, 0.210601806640625, 0.22463226318359375, 0.2386627197265625, 0.25269317626953125, 0.2667236328125, 0.28075408935546875, 0.2947845458984375, 0.30881500244140625, 0.322845458984375, 0.33687591552734375, 0.3509063720703125, 0.36493682861328125, 0.37896728515625, 0.39299774169921875, 0.4070281982421875, 0.42105865478515625, 0.435089111328125, 0.44911956787109375, 0.4631500244140625, 0.47718048095703125, 0.4912109375]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 7.0, 1.0, 8.0, 13.0, 11.0, 15.0, 14.0, 14.0, 25.0, 29.0, 45.0, 44.0, 39.0, 50.0, 54.0, 60.0, 54.0, 53.0, 45.0, 50.0, 44.0, 42.0, 41.0, 41.0, 43.0, 28.0, 27.0, 20.0, 22.0, 15.0, 16.0, 13.0, 2.0, 6.0, 2.0, 6.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.737403869628906, -30.766916275024414, -29.796428680419922, -28.825939178466797, -27.855451583862305, -26.884963989257812, -25.91447639465332, -24.943988800048828, -23.973499298095703, -23.00301170349121, -22.03252410888672, -21.062034606933594, -20.0915470123291, -19.12105941772461, -18.150571823120117, -17.180084228515625, -16.209596633911133, -15.23910903930664, -14.268620491027832, -13.29813289642334, -12.327644348144531, -11.357156753540039, -10.386669158935547, -9.416181564331055, -8.445693016052246, -7.475204944610596, -6.504716873168945, -5.534229278564453, -4.563741207122803, -3.5932531356811523, -2.62276554107666, -1.6522774696350098, -0.6817913055419922, 0.28869664669036865, 1.2591845989227295, 2.229672431945801, 3.200160503387451, 4.170648574829102, 5.141136169433594, 6.111624240875244, 7.0821123123168945, 8.052599906921387, 9.023088455200195, 9.993576049804688, 10.96406364440918, 11.934552192687988, 12.90503978729248, 13.875528335571289, 14.846015930175781, 15.816503524780273, 16.786991119384766, 17.75748062133789, 18.727968215942383, 19.698455810546875, 20.668943405151367, 21.63943099975586, 22.609920501708984, 23.580408096313477, 24.55089569091797, 25.521385192871094, 26.491872787475586, 27.462360382080078, 28.43284797668457, 29.403335571289062, 30.373823165893555]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 4.0, 4.0, 2.0, 3.0, 7.0, 10.0, 15.0, 18.0, 17.0, 15.0, 29.0, 20.0, 32.0, 40.0, 32.0, 33.0, 42.0, 55.0, 49.0, 48.0, 45.0, 40.0, 49.0, 34.0, 35.0, 44.0, 44.0, 35.0, 24.0, 29.0, 37.0, 24.0, 18.0, 15.0, 15.0, 8.0, 11.0, 9.0, 6.0, 4.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-35.5777587890625, -34.55222702026367, -33.526695251464844, -32.50116729736328, -31.47563362121582, -30.450103759765625, -29.424571990966797, -28.39904022216797, -27.37350845336914, -26.347976684570312, -25.322446823120117, -24.29691505432129, -23.27138328552246, -22.245853424072266, -21.220321655273438, -20.19478988647461, -19.169260025024414, -18.143728256225586, -17.11819839477539, -16.092666625976562, -15.067134857177734, -14.041604042053223, -13.016073226928711, -11.990541458129883, -10.965010643005371, -9.93947982788086, -8.913948059082031, -7.8884172439575195, -6.86288595199585, -5.83735466003418, -4.811823844909668, -3.786292552947998, -2.760761260986328, -1.7352300882339478, -0.7096989154815674, 0.31583213806152344, 1.3413634300231934, 2.3668947219848633, 3.392425537109375, 4.417956829071045, 5.443488121032715, 6.469019412994385, 7.494550704956055, 8.520081520080566, 9.545612335205078, 10.571144104003906, 11.596674919128418, 12.62220573425293, 13.647737503051758, 14.67326831817627, 15.698800086975098, 16.72433090209961, 17.749862670898438, 18.775394439697266, 19.80092430114746, 20.82645606994629, 21.851985931396484, 22.877517700195312, 23.903047561645508, 24.928579330444336, 25.954111099243164, 26.97964096069336, 28.005172729492188, 29.030704498291016, 30.056236267089844]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 7.0, 3.0, 9.0, 16.0, 17.0, 37.0, 72.0, 86.0, 144.0, 235.0, 348.0, 611.0, 890.0, 1406.0, 2316.0, 3967.0, 6404.0, 10282.0, 16212.0, 25260.0, 37840.0, 54439.0, 73606.0, 93268.0, 108211.0, 115877.0, 113518.0, 101953.0, 84127.0, 64442.0, 46056.0, 31502.0, 20789.0, 13009.0, 8288.0, 5046.0, 3092.0, 1949.0, 1177.0, 752.0, 455.0, 340.0, 211.0, 106.0, 53.0, 47.0, 35.0, 25.0, 9.0, 9.0, 8.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.6875, -14.194091796875, -13.70068359375, -13.207275390625, -12.7138671875, -12.220458984375, -11.72705078125, -11.233642578125, -10.740234375, -10.246826171875, -9.75341796875, -9.260009765625, -8.7666015625, -8.273193359375, -7.77978515625, -7.286376953125, -6.79296875, -6.299560546875, -5.80615234375, -5.312744140625, -4.8193359375, -4.325927734375, -3.83251953125, -3.339111328125, -2.845703125, -2.352294921875, -1.85888671875, -1.365478515625, -0.8720703125, -0.378662109375, 0.11474609375, 0.608154296875, 1.1015625, 1.594970703125, 2.08837890625, 2.581787109375, 3.0751953125, 3.568603515625, 4.06201171875, 4.555419921875, 5.048828125, 5.542236328125, 6.03564453125, 6.529052734375, 7.0224609375, 7.515869140625, 8.00927734375, 8.502685546875, 8.99609375, 9.489501953125, 9.98291015625, 10.476318359375, 10.9697265625, 11.463134765625, 11.95654296875, 12.449951171875, 12.943359375, 13.436767578125, 13.93017578125, 14.423583984375, 14.9169921875, 15.410400390625, 15.90380859375, 16.397216796875, 16.890625]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 6.0, 5.0, 10.0, 13.0, 10.0, 15.0, 13.0, 27.0, 21.0, 29.0, 22.0, 27.0, 34.0, 37.0, 50.0, 31.0, 49.0, 45.0, 46.0, 40.0, 48.0, 34.0, 39.0, 36.0, 23.0, 45.0, 28.0, 25.0, 25.0, 35.0, 25.0, 26.0, 16.0, 13.0, 13.0, 6.0, 9.0, 7.0, 9.0, 5.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-33.6875, -32.759521484375, -31.83154296875, -30.903564453125, -29.9755859375, -29.047607421875, -28.11962890625, -27.191650390625, -26.263671875, -25.335693359375, -24.40771484375, -23.479736328125, -22.5517578125, -21.623779296875, -20.69580078125, -19.767822265625, -18.83984375, -17.911865234375, -16.98388671875, -16.055908203125, -15.1279296875, -14.199951171875, -13.27197265625, -12.343994140625, -11.416015625, -10.488037109375, -9.56005859375, -8.632080078125, -7.7041015625, -6.776123046875, -5.84814453125, -4.920166015625, -3.9921875, -3.064208984375, -2.13623046875, -1.208251953125, -0.2802734375, 0.647705078125, 1.57568359375, 2.503662109375, 3.431640625, 4.359619140625, 5.28759765625, 6.215576171875, 7.1435546875, 8.071533203125, 8.99951171875, 9.927490234375, 10.85546875, 11.783447265625, 12.71142578125, 13.639404296875, 14.5673828125, 15.495361328125, 16.42333984375, 17.351318359375, 18.279296875, 19.207275390625, 20.13525390625, 21.063232421875, 21.9912109375, 22.919189453125, 23.84716796875, 24.775146484375, 25.703125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 3.0, 6.0, 10.0, 19.0, 26.0, 38.0, 54.0, 79.0, 132.0, 180.0, 272.0, 429.0, 658.0, 986.0, 1484.0, 2427.0, 3548.0, 5500.0, 8165.0, 12807.0, 18966.0, 28582.0, 41661.0, 58031.0, 77487.0, 96325.0, 110454.0, 115579.0, 110348.0, 95247.0, 77111.0, 57439.0, 41106.0, 28159.0, 19113.0, 12538.0, 8278.0, 5275.0, 3478.0, 2293.0, 1397.0, 982.0, 635.0, 424.0, 308.0, 185.0, 110.0, 80.0, 61.0, 30.0, 27.0, 17.0, 8.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.5625, -16.986328125, -16.41015625, -15.833984375, -15.2578125, -14.681640625, -14.10546875, -13.529296875, -12.953125, -12.376953125, -11.80078125, -11.224609375, -10.6484375, -10.072265625, -9.49609375, -8.919921875, -8.34375, -7.767578125, -7.19140625, -6.615234375, -6.0390625, -5.462890625, -4.88671875, -4.310546875, -3.734375, -3.158203125, -2.58203125, -2.005859375, -1.4296875, -0.853515625, -0.27734375, 0.298828125, 0.875, 1.451171875, 2.02734375, 2.603515625, 3.1796875, 3.755859375, 4.33203125, 4.908203125, 5.484375, 6.060546875, 6.63671875, 7.212890625, 7.7890625, 8.365234375, 8.94140625, 9.517578125, 10.09375, 10.669921875, 11.24609375, 11.822265625, 12.3984375, 12.974609375, 13.55078125, 14.126953125, 14.703125, 15.279296875, 15.85546875, 16.431640625, 17.0078125, 17.583984375, 18.16015625, 18.736328125, 19.3125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 6.0, 4.0, 6.0, 10.0, 7.0, 10.0, 7.0, 21.0, 14.0, 19.0, 21.0, 25.0, 33.0, 34.0, 35.0, 31.0, 53.0, 45.0, 38.0, 51.0, 39.0, 47.0, 39.0, 47.0, 37.0, 44.0, 39.0, 29.0, 34.0, 32.0, 13.0, 16.0, 29.0, 17.0, 20.0, 13.0, 11.0, 9.0, 4.0, 5.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.703125, -20.07568359375, -19.4482421875, -18.82080078125, -18.193359375, -17.56591796875, -16.9384765625, -16.31103515625, -15.68359375, -15.05615234375, -14.4287109375, -13.80126953125, -13.173828125, -12.54638671875, -11.9189453125, -11.29150390625, -10.6640625, -10.03662109375, -9.4091796875, -8.78173828125, -8.154296875, -7.52685546875, -6.8994140625, -6.27197265625, -5.64453125, -5.01708984375, -4.3896484375, -3.76220703125, -3.134765625, -2.50732421875, -1.8798828125, -1.25244140625, -0.625, 0.00244140625, 0.6298828125, 1.25732421875, 1.884765625, 2.51220703125, 3.1396484375, 3.76708984375, 4.39453125, 5.02197265625, 5.6494140625, 6.27685546875, 6.904296875, 7.53173828125, 8.1591796875, 8.78662109375, 9.4140625, 10.04150390625, 10.6689453125, 11.29638671875, 11.923828125, 12.55126953125, 13.1787109375, 13.80615234375, 14.43359375, 15.06103515625, 15.6884765625, 16.31591796875, 16.943359375, 17.57080078125, 18.1982421875, 18.82568359375, 19.453125]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 4.0, 4.0, 5.0, 10.0, 14.0, 30.0, 50.0, 59.0, 100.0, 149.0, 241.0, 311.0, 514.0, 774.0, 1191.0, 1834.0, 2941.0, 4753.0, 7683.0, 12567.0, 20824.0, 33868.0, 52217.0, 75365.0, 100100.0, 120330.0, 130321.0, 125776.0, 108507.0, 83722.0, 59955.0, 39848.0, 24845.0, 15133.0, 9283.0, 5559.0, 3429.0, 2158.0, 1324.0, 914.0, 633.0, 403.0, 285.0, 189.0, 129.0, 65.0, 58.0, 44.0, 22.0, 7.0, 7.0, 7.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.83203125, -6.59381103515625, -6.3555908203125, -6.11737060546875, -5.879150390625, -5.64093017578125, -5.4027099609375, -5.16448974609375, -4.92626953125, -4.68804931640625, -4.4498291015625, -4.21160888671875, -3.973388671875, -3.73516845703125, -3.4969482421875, -3.25872802734375, -3.0205078125, -2.78228759765625, -2.5440673828125, -2.30584716796875, -2.067626953125, -1.82940673828125, -1.5911865234375, -1.35296630859375, -1.11474609375, -0.87652587890625, -0.6383056640625, -0.40008544921875, -0.161865234375, 0.07635498046875, 0.3145751953125, 0.55279541015625, 0.791015625, 1.02923583984375, 1.2674560546875, 1.50567626953125, 1.743896484375, 1.98211669921875, 2.2203369140625, 2.45855712890625, 2.69677734375, 2.93499755859375, 3.1732177734375, 3.41143798828125, 3.649658203125, 3.88787841796875, 4.1260986328125, 4.36431884765625, 4.6025390625, 4.84075927734375, 5.0789794921875, 5.31719970703125, 5.555419921875, 5.79364013671875, 6.0318603515625, 6.27008056640625, 6.50830078125, 6.74652099609375, 6.9847412109375, 7.22296142578125, 7.461181640625, 7.69940185546875, 7.9376220703125, 8.17584228515625, 8.4140625]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 3.0, 5.0, 2.0, 8.0, 7.0, 13.0, 20.0, 22.0, 34.0, 33.0, 21.0, 49.0, 60.0, 60.0, 56.0, 60.0, 43.0, 50.0, 76.0, 61.0, 60.0, 52.0, 43.0, 36.0, 33.0, 9.0, 18.0, 11.0, 11.0, 9.0, 6.0, 7.0, 4.0, 4.0, 2.0, 4.0, 2.0, 1.0, 6.0, 0.0, 1.0, 3.0, 0.0, 2.0], "bins": [-0.0012407302856445312, -0.0012067779898643494, -0.0011728256940841675, -0.0011388733983039856, -0.0011049211025238037, -0.0010709688067436218, -0.00103701651096344, -0.001003064215183258, -0.0009691119194030762, -0.0009351596236228943, -0.0009012073278427124, -0.0008672550320625305, -0.0008333027362823486, -0.0007993504405021667, -0.0007653981447219849, -0.000731445848941803, -0.0006974935531616211, -0.0006635412573814392, -0.0006295889616012573, -0.0005956366658210754, -0.0005616843700408936, -0.0005277320742607117, -0.0004937797784805298, -0.0004598274827003479, -0.000425875186920166, -0.00039192289113998413, -0.00035797059535980225, -0.00032401829957962036, -0.0002900660037994385, -0.0002561137080192566, -0.0002221614122390747, -0.00018820911645889282, -0.00015425682067871094, -0.00012030452489852905, -8.635222911834717e-05, -5.239993333816528e-05, -1.84476375579834e-05, 1.5504658222198486e-05, 4.945695400238037e-05, 8.340924978256226e-05, 0.00011736154556274414, 0.00015131384134292603, 0.0001852661371231079, 0.0002192184329032898, 0.0002531707286834717, 0.00028712302446365356, 0.00032107532024383545, 0.00035502761602401733, 0.0003889799118041992, 0.0004229322075843811, 0.000456884503364563, 0.0004908367991447449, 0.0005247890949249268, 0.0005587413907051086, 0.0005926936864852905, 0.0006266459822654724, 0.0006605982780456543, 0.0006945505738258362, 0.0007285028696060181, 0.0007624551653862, 0.0007964074611663818, 0.0008303597569465637, 0.0008643120527267456, 0.0008982643485069275, 0.0009322166442871094]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 7.0, 7.0, 13.0, 21.0, 26.0, 45.0, 70.0, 121.0, 170.0, 267.0, 389.0, 572.0, 924.0, 1455.0, 2220.0, 3321.0, 5400.0, 8698.0, 13982.0, 23333.0, 36404.0, 56039.0, 80368.0, 105203.0, 124706.0, 131365.0, 123217.0, 103041.0, 78399.0, 54456.0, 35536.0, 22143.0, 13700.0, 8415.0, 5304.0, 3269.0, 2091.0, 1350.0, 881.0, 574.0, 319.0, 265.0, 159.0, 117.0, 70.0, 43.0, 26.0, 22.0, 16.0, 8.0, 9.0, 5.0, 4.0, 0.0, 0.0, 3.0, 1.0, 1.0], "bins": [-7.91015625, -7.65875244140625, -7.4073486328125, -7.15594482421875, -6.904541015625, -6.65313720703125, -6.4017333984375, -6.15032958984375, -5.89892578125, -5.64752197265625, -5.3961181640625, -5.14471435546875, -4.893310546875, -4.64190673828125, -4.3905029296875, -4.13909912109375, -3.8876953125, -3.63629150390625, -3.3848876953125, -3.13348388671875, -2.882080078125, -2.63067626953125, -2.3792724609375, -2.12786865234375, -1.87646484375, -1.62506103515625, -1.3736572265625, -1.12225341796875, -0.870849609375, -0.61944580078125, -0.3680419921875, -0.11663818359375, 0.134765625, 0.38616943359375, 0.6375732421875, 0.88897705078125, 1.140380859375, 1.39178466796875, 1.6431884765625, 1.89459228515625, 2.14599609375, 2.39739990234375, 2.6488037109375, 2.90020751953125, 3.151611328125, 3.40301513671875, 3.6544189453125, 3.90582275390625, 4.1572265625, 4.40863037109375, 4.6600341796875, 4.91143798828125, 5.162841796875, 5.41424560546875, 5.6656494140625, 5.91705322265625, 6.16845703125, 6.41986083984375, 6.6712646484375, 6.92266845703125, 7.174072265625, 7.42547607421875, 7.6768798828125, 7.92828369140625, 8.1796875]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 3.0, 4.0, 3.0, 8.0, 15.0, 13.0, 17.0, 16.0, 20.0, 22.0, 38.0, 35.0, 37.0, 46.0, 42.0, 54.0, 58.0, 68.0, 65.0, 60.0, 47.0, 50.0, 40.0, 59.0, 37.0, 25.0, 20.0, 25.0, 12.0, 13.0, 11.0, 10.0, 8.0, 6.0, 3.0, 5.0, 1.0, 1.0, 8.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8046875, -2.68817138671875, -2.5716552734375, -2.45513916015625, -2.338623046875, -2.22210693359375, -2.1055908203125, -1.98907470703125, -1.87255859375, -1.75604248046875, -1.6395263671875, -1.52301025390625, -1.406494140625, -1.28997802734375, -1.1734619140625, -1.05694580078125, -0.9404296875, -0.82391357421875, -0.7073974609375, -0.59088134765625, -0.474365234375, -0.35784912109375, -0.2413330078125, -0.12481689453125, -0.00830078125, 0.10821533203125, 0.2247314453125, 0.34124755859375, 0.457763671875, 0.57427978515625, 0.6907958984375, 0.80731201171875, 0.923828125, 1.04034423828125, 1.1568603515625, 1.27337646484375, 1.389892578125, 1.50640869140625, 1.6229248046875, 1.73944091796875, 1.85595703125, 1.97247314453125, 2.0889892578125, 2.20550537109375, 2.322021484375, 2.43853759765625, 2.5550537109375, 2.67156982421875, 2.7880859375, 2.90460205078125, 3.0211181640625, 3.13763427734375, 3.254150390625, 3.37066650390625, 3.4871826171875, 3.60369873046875, 3.72021484375, 3.83673095703125, 3.9532470703125, 4.06976318359375, 4.186279296875, 4.30279541015625, 4.4193115234375, 4.53582763671875, 4.65234375]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 8.0, 3.0, 3.0, 8.0, 14.0, 7.0, 16.0, 22.0, 14.0, 16.0, 22.0, 31.0, 36.0, 41.0, 32.0, 58.0, 45.0, 57.0, 36.0, 56.0, 42.0, 45.0, 36.0, 50.0, 33.0, 42.0, 37.0, 36.0, 32.0, 23.0, 21.0, 18.0, 12.0, 13.0, 6.0, 10.0, 6.0, 7.0, 3.0, 4.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.74311637878418, -26.811674118041992, -25.880233764648438, -24.94879150390625, -24.017349243164062, -23.085908889770508, -22.15446662902832, -21.223026275634766, -20.291584014892578, -19.36014175415039, -18.428701400756836, -17.49725914001465, -16.56581687927246, -15.634376525878906, -14.702934265136719, -13.771492958068848, -12.84005069732666, -11.908609390258789, -10.977167129516602, -10.04572582244873, -9.11428451538086, -8.182842254638672, -7.251400947570801, -6.31995964050293, -5.3885178565979, -4.457076072692871, -3.525634765625, -2.5941929817199707, -1.6627514362335205, -0.7313098907470703, 0.20013189315795898, 1.13157320022583, 2.0630149841308594, 2.9944565296173096, 3.9258980751037598, 4.857339859008789, 5.78878116607666, 6.7202229499816895, 7.651664733886719, 8.58310604095459, 9.514547348022461, 10.445988655090332, 11.37743091583252, 12.30887222290039, 13.240313529968262, 14.171754837036133, 15.10319709777832, 16.034637451171875, 16.966079711914062, 17.89752197265625, 18.828962326049805, 19.760404586791992, 20.69184684753418, 21.623287200927734, 22.554729461669922, 23.48617172241211, 24.417613983154297, 25.349056243896484, 26.28049659729004, 27.211938858032227, 28.143381118774414, 29.07482147216797, 30.006263732910156, 30.937705993652344, 31.8691463470459]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 5.0, 2.0, 2.0, 5.0, 5.0, 7.0, 13.0, 9.0, 16.0, 18.0, 12.0, 15.0, 17.0, 35.0, 24.0, 33.0, 35.0, 31.0, 49.0, 43.0, 48.0, 50.0, 41.0, 44.0, 48.0, 41.0, 41.0, 34.0, 34.0, 25.0, 16.0, 34.0, 31.0, 19.0, 27.0, 17.0, 17.0, 13.0, 13.0, 14.0, 6.0, 1.0, 7.0, 3.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-39.94686508178711, -38.799678802490234, -37.652488708496094, -36.50530242919922, -35.358116149902344, -34.2109260559082, -33.06373977661133, -31.91655158996582, -30.769363403320312, -29.622175216674805, -28.474987030029297, -27.327800750732422, -26.180612564086914, -25.033424377441406, -23.88623809814453, -22.739049911499023, -21.591861724853516, -20.444673538208008, -19.2974853515625, -18.150299072265625, -17.003110885620117, -15.85592269897461, -14.708735466003418, -13.561548233032227, -12.414360046386719, -11.267171859741211, -10.11998462677002, -8.972797393798828, -7.82560920715332, -6.678421497344971, -5.531233787536621, -4.38404655456543, -3.2368621826171875, -2.089674472808838, -0.9424867630004883, 0.20470094680786133, 1.351888656616211, 2.4990763664245605, 3.64626407623291, 4.793451309204102, 5.940639495849609, 7.087827205657959, 8.235014915466309, 9.3822021484375, 10.529390335083008, 11.676578521728516, 12.823765754699707, 13.970952987670898, 15.118141174316406, 16.265329360961914, 17.412517547607422, 18.559703826904297, 19.706892013549805, 20.854080200195312, 22.001266479492188, 23.148454666137695, 24.295642852783203, 25.44283103942871, 26.59001922607422, 27.737205505371094, 28.8843936920166, 30.03158187866211, 31.178768157958984, 32.325958251953125, 33.47314453125]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 6.0, 3.0, 5.0, 10.0, 13.0, 12.0, 16.0, 24.0, 37.0, 53.0, 63.0, 106.0, 113.0, 173.0, 251.0, 337.0, 452.0, 654.0, 893.0, 1190.0, 1547.0, 1935.0, 2541.0, 3237.0, 4229.0, 5893.0, 997599.0, 7931.0, 5160.0, 3775.0, 2955.0, 2317.0, 1868.0, 1373.0, 1060.0, 762.0, 574.0, 407.0, 295.0, 228.0, 152.0, 96.0, 74.0, 47.0, 35.0, 34.0, 26.0, 15.0, 8.0, 9.0, 5.0, 6.0, 2.0, 3.0, 2.0, 3.0, 2.0], "bins": [-257.81195068359375, -250.18467712402344, -242.55738830566406, -234.93011474609375, -227.30282592773438, -219.67555236816406, -212.04827880859375, -204.42098999023438, -196.79371643066406, -189.16644287109375, -181.53915405273438, -173.91188049316406, -166.2845916748047, -158.65731811523438, -151.030029296875, -143.4027557373047, -135.77548217773438, -128.14820861816406, -120.52091979980469, -112.89364624023438, -105.26636505126953, -97.63908386230469, -90.01180267333984, -82.384521484375, -74.75723266601562, -67.12995147705078, -59.5026741027832, -51.87539291381836, -44.24811553955078, -36.62083435058594, -28.993553161621094, -21.366275787353516, -13.738998413085938, -6.111718654632568, 1.5155611038208008, 9.142841339111328, 16.77012062072754, 24.39739990234375, 32.024681091308594, 39.65195846557617, 47.279239654541016, 54.90652084350586, 62.53379821777344, 70.16107940673828, 77.78836059570312, 85.41563415527344, 93.04292297363281, 100.67019653320312, 108.29747772216797, 115.92475891113281, 123.55204010009766, 131.1793212890625, 138.8065948486328, 146.43386840820312, 154.0611572265625, 161.6884307861328, 169.3157196044922, 176.9429931640625, 184.57028198242188, 192.1975555419922, 199.82484436035156, 207.45211791992188, 215.07940673828125, 222.70668029785156, 230.33395385742188]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 3.0, 10.0, 17.0, 19.0, 28.0, 37.0, 35.0, 44.0, 65.0, 85.0, 132.0, 170.0, 218.0, 295.0, 412.0, 574.0, 896.0, 1311.0, 2061.0, 3273.0, 5378.0, 8518.0, 13349.0, 19840.0, 28639.0, 64402.0, 51195416.0, 47716.0, 26262.0, 18170.0, 12240.0, 7995.0, 4768.0, 3061.0, 1844.0, 1212.0, 805.0, 539.0, 393.0, 294.0, 207.0, 152.0, 131.0, 94.0, 70.0, 46.0, 34.0, 27.0, 15.0, 16.0, 7.0, 5.0, 5.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-271.0247802734375, -262.1094970703125, -253.19424438476562, -244.2789764404297, -235.36370849609375, -226.44842529296875, -217.5331573486328, -208.61788940429688, -199.70262145996094, -190.787353515625, -181.87208557128906, -172.95681762695312, -164.04153442382812, -155.12628173828125, -146.21099853515625, -137.2957305908203, -128.38046264648438, -119.46519470214844, -110.5499267578125, -101.63465118408203, -92.7193832397461, -83.80411529541016, -74.88883972167969, -65.97357177734375, -57.05830383300781, -48.143035888671875, -39.22776412963867, -30.3124942779541, -21.39722442626953, -12.481956481933594, -3.5666847229003906, 5.3485870361328125, 14.26385498046875, 23.17912483215332, 32.09439468383789, 41.009666442871094, 49.92493438720703, 58.84020233154297, 67.75547790527344, 76.67074584960938, 85.58601379394531, 94.50128173828125, 103.41654968261719, 112.33182525634766, 121.2470932006836, 130.162353515625, 139.07763671875, 147.99290466308594, 156.90817260742188, 165.8234405517578, 174.73870849609375, 183.6539764404297, 192.56924438476562, 201.48452758789062, 210.39979553222656, 219.3150634765625, 228.23033142089844, 237.14559936523438, 246.0608673095703, 254.97613525390625, 263.89141845703125, 272.8066711425781, 281.7219543457031, 290.63720703125, 299.552490234375]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 2.0, 7.0, 5.0, 10.0, 9.0, 31.0, 38.0, 51.0, 78.0, 133.0, 193.0, 284.0, 468.0, 716.0, 1103.0, 1790.0, 3057.0, 5101.0, 8824.0, 15114.0, 27621.0, 49058.0, 87531.0, 153575.0, 263976.0, 465697.0, 1303595.0, 2411586.0, 685559.0, 340396.0, 200253.0, 114439.0, 65571.0, 36856.0, 20479.0, 11645.0, 6715.0, 3800.0, 2232.0, 1455.0, 934.0, 563.0, 350.0, 182.0, 117.0, 94.0, 45.0, 24.0, 25.0, 22.0, 12.0, 9.0, 4.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0], "bins": [-6.1484375, -5.95166015625, -5.7548828125, -5.55810546875, -5.361328125, -5.16455078125, -4.9677734375, -4.77099609375, -4.57421875, -4.37744140625, -4.1806640625, -3.98388671875, -3.787109375, -3.59033203125, -3.3935546875, -3.19677734375, -3.0, -2.80322265625, -2.6064453125, -2.40966796875, -2.212890625, -2.01611328125, -1.8193359375, -1.62255859375, -1.42578125, -1.22900390625, -1.0322265625, -0.83544921875, -0.638671875, -0.44189453125, -0.2451171875, -0.04833984375, 0.1484375, 0.34521484375, 0.5419921875, 0.73876953125, 0.935546875, 1.13232421875, 1.3291015625, 1.52587890625, 1.72265625, 1.91943359375, 2.1162109375, 2.31298828125, 2.509765625, 2.70654296875, 2.9033203125, 3.10009765625, 3.296875, 3.49365234375, 3.6904296875, 3.88720703125, 4.083984375, 4.28076171875, 4.4775390625, 4.67431640625, 4.87109375, 5.06787109375, 5.2646484375, 5.46142578125, 5.658203125, 5.85498046875, 6.0517578125, 6.24853515625, 6.4453125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 6.0, 14.0, 4.0, 6.0, 8.0, 8.0, 8.0, 14.0, 14.0, 14.0, 23.0, 23.0, 26.0, 27.0, 31.0, 27.0, 35.0, 47.0, 33.0, 48.0, 105.0, 414.0, 485.0, 169.0, 55.0, 39.0, 40.0, 27.0, 34.0, 23.0, 26.0, 28.0, 21.0, 17.0, 19.0, 19.0, 12.0, 11.0, 12.0, 11.0, 8.0, 8.0, 6.0, 3.0, 5.0, 3.0, 1.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0], "bins": [-32.8125, -31.8203125, -30.828125, -29.8359375, -28.84375, -27.8515625, -26.859375, -25.8671875, -24.875, -23.8828125, -22.890625, -21.8984375, -20.90625, -19.9140625, -18.921875, -17.9296875, -16.9375, -15.9453125, -14.953125, -13.9609375, -12.96875, -11.9765625, -10.984375, -9.9921875, -9.0, -8.0078125, -7.015625, -6.0234375, -5.03125, -4.0390625, -3.046875, -2.0546875, -1.0625, -0.0703125, 0.921875, 1.9140625, 2.90625, 3.8984375, 4.890625, 5.8828125, 6.875, 7.8671875, 8.859375, 9.8515625, 10.84375, 11.8359375, 12.828125, 13.8203125, 14.8125, 15.8046875, 16.796875, 17.7890625, 18.78125, 19.7734375, 20.765625, 21.7578125, 22.75, 23.7421875, 24.734375, 25.7265625, 26.71875, 27.7109375, 28.703125, 29.6953125, 30.6875]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 7.0, 8.0, 11.0, 23.0, 25.0, 36.0, 46.0, 73.0, 92.0, 155.0, 225.0, 359.0, 625.0, 930.0, 1516.0, 2459.0, 4011.0, 6471.0, 10569.0, 17234.0, 28243.0, 46962.0, 76492.0, 124549.0, 197085.0, 302826.0, 509852.0, 2249613.0, 1527200.0, 441482.0, 275343.0, 178626.0, 112001.0, 69054.0, 41978.0, 25362.0, 15274.0, 9420.0, 5723.0, 3561.0, 2152.0, 1316.0, 894.0, 544.0, 354.0, 232.0, 162.0, 93.0, 64.0, 43.0, 28.0, 12.0, 16.0, 7.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-5.43359375, -5.26318359375, -5.0927734375, -4.92236328125, -4.751953125, -4.58154296875, -4.4111328125, -4.24072265625, -4.0703125, -3.89990234375, -3.7294921875, -3.55908203125, -3.388671875, -3.21826171875, -3.0478515625, -2.87744140625, -2.70703125, -2.53662109375, -2.3662109375, -2.19580078125, -2.025390625, -1.85498046875, -1.6845703125, -1.51416015625, -1.34375, -1.17333984375, -1.0029296875, -0.83251953125, -0.662109375, -0.49169921875, -0.3212890625, -0.15087890625, 0.01953125, 0.18994140625, 0.3603515625, 0.53076171875, 0.701171875, 0.87158203125, 1.0419921875, 1.21240234375, 1.3828125, 1.55322265625, 1.7236328125, 1.89404296875, 2.064453125, 2.23486328125, 2.4052734375, 2.57568359375, 2.74609375, 2.91650390625, 3.0869140625, 3.25732421875, 3.427734375, 3.59814453125, 3.7685546875, 3.93896484375, 4.109375, 4.27978515625, 4.4501953125, 4.62060546875, 4.791015625, 4.96142578125, 5.1318359375, 5.30224609375, 5.47265625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 8.0, 4.0, 9.0, 8.0, 4.0, 18.0, 6.0, 12.0, 14.0, 23.0, 14.0, 21.0, 20.0, 18.0, 26.0, 36.0, 23.0, 24.0, 29.0, 32.0, 33.0, 39.0, 43.0, 401.0, 584.0, 119.0, 40.0, 50.0, 34.0, 32.0, 33.0, 34.0, 24.0, 30.0, 17.0, 18.0, 16.0, 28.0, 12.0, 15.0, 5.0, 9.0, 9.0, 11.0, 9.0, 6.0, 7.0, 3.0, 6.0, 5.0, 3.0, 4.0, 2.0], "bins": [-44.0, -42.7470703125, -41.494140625, -40.2412109375, -38.98828125, -37.7353515625, -36.482421875, -35.2294921875, -33.9765625, -32.7236328125, -31.470703125, -30.2177734375, -28.96484375, -27.7119140625, -26.458984375, -25.2060546875, -23.953125, -22.7001953125, -21.447265625, -20.1943359375, -18.94140625, -17.6884765625, -16.435546875, -15.1826171875, -13.9296875, -12.6767578125, -11.423828125, -10.1708984375, -8.91796875, -7.6650390625, -6.412109375, -5.1591796875, -3.90625, -2.6533203125, -1.400390625, -0.1474609375, 1.10546875, 2.3583984375, 3.611328125, 4.8642578125, 6.1171875, 7.3701171875, 8.623046875, 9.8759765625, 11.12890625, 12.3818359375, 13.634765625, 14.8876953125, 16.140625, 17.3935546875, 18.646484375, 19.8994140625, 21.15234375, 22.4052734375, 23.658203125, 24.9111328125, 26.1640625, 27.4169921875, 28.669921875, 29.9228515625, 31.17578125, 32.4287109375, 33.681640625, 34.9345703125, 36.1875]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 6.0, 2.0, 5.0, 7.0, 9.0, 11.0, 13.0, 22.0, 29.0, 26.0, 49.0, 69.0, 97.0, 122.0, 172.0, 260.0, 345.0, 516.0, 759.0, 1212.0, 1890.0, 2868.0, 4297.0, 7188.0, 11303.0, 18631.0, 29892.0, 48980.0, 83750.0, 235822.0, 5541692.0, 130052.0, 66079.0, 40049.0, 24682.0, 14914.0, 9066.0, 5768.0, 3586.0, 2439.0, 1469.0, 1001.0, 697.0, 503.0, 295.0, 230.0, 160.0, 137.0, 97.0, 51.0, 46.0, 30.0, 13.0, 6.0, 9.0, 12.0, 5.0, 4.0, 3.0, 1.0, 3.0], "bins": [-19.890625, -19.29296875, -18.6953125, -18.09765625, -17.5, -16.90234375, -16.3046875, -15.70703125, -15.109375, -14.51171875, -13.9140625, -13.31640625, -12.71875, -12.12109375, -11.5234375, -10.92578125, -10.328125, -9.73046875, -9.1328125, -8.53515625, -7.9375, -7.33984375, -6.7421875, -6.14453125, -5.546875, -4.94921875, -4.3515625, -3.75390625, -3.15625, -2.55859375, -1.9609375, -1.36328125, -0.765625, -0.16796875, 0.4296875, 1.02734375, 1.625, 2.22265625, 2.8203125, 3.41796875, 4.015625, 4.61328125, 5.2109375, 5.80859375, 6.40625, 7.00390625, 7.6015625, 8.19921875, 8.796875, 9.39453125, 9.9921875, 10.58984375, 11.1875, 11.78515625, 12.3828125, 12.98046875, 13.578125, 14.17578125, 14.7734375, 15.37109375, 15.96875, 16.56640625, 17.1640625, 17.76171875, 18.359375]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 1.0, 2.0, 5.0, 0.0, 4.0, 8.0, 11.0, 8.0, 20.0, 17.0, 13.0, 19.0, 22.0, 22.0, 20.0, 22.0, 29.0, 41.0, 35.0, 36.0, 32.0, 28.0, 52.0, 181.0, 837.0, 108.0, 52.0, 48.0, 44.0, 32.0, 29.0, 35.0, 17.0, 38.0, 12.0, 20.0, 25.0, 13.0, 16.0, 14.0, 14.0, 12.0, 10.0, 6.0, 6.0, 4.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-64.1875, -62.20361328125, -60.2197265625, -58.23583984375, -56.251953125, -54.26806640625, -52.2841796875, -50.30029296875, -48.31640625, -46.33251953125, -44.3486328125, -42.36474609375, -40.380859375, -38.39697265625, -36.4130859375, -34.42919921875, -32.4453125, -30.46142578125, -28.4775390625, -26.49365234375, -24.509765625, -22.52587890625, -20.5419921875, -18.55810546875, -16.57421875, -14.59033203125, -12.6064453125, -10.62255859375, -8.638671875, -6.65478515625, -4.6708984375, -2.68701171875, -0.703125, 1.28076171875, 3.2646484375, 5.24853515625, 7.232421875, 9.21630859375, 11.2001953125, 13.18408203125, 15.16796875, 17.15185546875, 19.1357421875, 21.11962890625, 23.103515625, 25.08740234375, 27.0712890625, 29.05517578125, 31.0390625, 33.02294921875, 35.0068359375, 36.99072265625, 38.974609375, 40.95849609375, 42.9423828125, 44.92626953125, 46.91015625, 48.89404296875, 50.8779296875, 52.86181640625, 54.845703125, 56.82958984375, 58.8134765625, 60.79736328125, 62.78125]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 4.0, 2.0, 5.0, 9.0, 11.0, 17.0, 40.0, 71.0, 146.0, 460.0, 94.0, 55.0, 21.0, 15.0, 12.0, 13.0, 7.0, 4.0, 3.0, 2.0, 5.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-618.604736328125, -600.5810546875, -582.557373046875, -564.53369140625, -546.5100708007812, -528.4863891601562, -510.46270751953125, -492.43902587890625, -474.41534423828125, -456.39166259765625, -438.3680114746094, -420.3443298339844, -402.3206481933594, -384.2969970703125, -366.2733154296875, -348.2496337890625, -330.2259826660156, -312.2023010253906, -294.17864990234375, -276.15496826171875, -258.13128662109375, -240.1076202392578, -222.08395385742188, -204.06027221679688, -186.03660583496094, -168.012939453125, -149.9892578125, -131.96559143066406, -113.9419174194336, -95.91824340820312, -77.89457702636719, -59.87090301513672, -41.84722900390625, -23.823556900024414, -5.799884796142578, 12.223785400390625, 30.247459411621094, 48.27113342285156, 66.2947998046875, 84.31847381591797, 102.34214782714844, 120.3658218383789, 138.38949584960938, 156.4131622314453, 174.43682861328125, 192.46051025390625, 210.4841766357422, 228.50784301757812, 246.53152465820312, 264.5552062988281, 282.578857421875, 300.6025390625, 318.626220703125, 336.64990234375, 354.6735534667969, 372.6972351074219, 390.72088623046875, 408.74456787109375, 426.7682189941406, 444.7919006347656, 462.8155822753906, 480.8392333984375, 498.8629150390625, 516.8865966796875, 534.9102783203125]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 9.0, 6.0, 14.0, 8.0, 15.0, 25.0, 25.0, 51.0, 86.0, 192.0, 239.0, 74.0, 58.0, 49.0, 33.0, 11.0, 11.0, 13.0, 17.0, 11.0, 1.0, 7.0, 7.0, 2.0, 4.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1072.4566650390625, -1041.036865234375, -1009.6170654296875, -978.197265625, -946.7774658203125, -915.357666015625, -883.9378662109375, -852.51806640625, -821.0982666015625, -789.678466796875, -758.2586669921875, -726.8388671875, -695.4190673828125, -663.999267578125, -632.5794677734375, -601.15966796875, -569.7398681640625, -538.320068359375, -506.9002685546875, -475.48046875, -444.0606689453125, -412.640869140625, -381.2210693359375, -349.80126953125, -318.3814697265625, -286.961669921875, -255.5418701171875, -224.1220703125, -192.7022705078125, -161.282470703125, -129.8626708984375, -98.44287109375, -67.0230712890625, -35.603271484375, -4.1834716796875, 27.236328125, 58.6561279296875, 90.075927734375, 121.4957275390625, 152.91552734375, 184.3353271484375, 215.755126953125, 247.1749267578125, 278.5947265625, 310.0145263671875, 341.434326171875, 372.8541259765625, 404.27392578125, 435.6937255859375, 467.113525390625, 498.5333251953125, 529.953125, 561.3729248046875, 592.792724609375, 624.2125244140625, 655.63232421875, 687.0521240234375, 718.471923828125, 749.8917236328125, 781.3115234375, 812.7313232421875, 844.151123046875, 875.5709228515625, 906.99072265625, 938.4105224609375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 6.0, 7.0, 6.0, 12.0, 16.0, 11.0, 30.0, 34.0, 59.0, 77.0, 124.0, 198.0, 286.0, 444.0, 730.0, 1287.0, 2336.0, 4454.0, 9058.0, 19794.0, 51909.0, 225951.0, 3693177.0, 119359.0, 36696.0, 14487.0, 6460.0, 3077.0, 1724.0, 887.0, 571.0, 340.0, 194.0, 148.0, 96.0, 58.0, 47.0, 32.0, 28.0, 23.0, 17.0, 11.0, 7.0, 3.0, 3.0, 2.0, 5.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.7734375, -4.61053466796875, -4.4476318359375, -4.28472900390625, -4.121826171875, -3.95892333984375, -3.7960205078125, -3.63311767578125, -3.47021484375, -3.30731201171875, -3.1444091796875, -2.98150634765625, -2.818603515625, -2.65570068359375, -2.4927978515625, -2.32989501953125, -2.1669921875, -2.00408935546875, -1.8411865234375, -1.67828369140625, -1.515380859375, -1.35247802734375, -1.1895751953125, -1.02667236328125, -0.86376953125, -0.70086669921875, -0.5379638671875, -0.37506103515625, -0.212158203125, -0.04925537109375, 0.1136474609375, 0.27655029296875, 0.439453125, 0.60235595703125, 0.7652587890625, 0.92816162109375, 1.091064453125, 1.25396728515625, 1.4168701171875, 1.57977294921875, 1.74267578125, 1.90557861328125, 2.0684814453125, 2.23138427734375, 2.394287109375, 2.55718994140625, 2.7200927734375, 2.88299560546875, 3.0458984375, 3.20880126953125, 3.3717041015625, 3.53460693359375, 3.697509765625, 3.86041259765625, 4.0233154296875, 4.18621826171875, 4.34912109375, 4.51202392578125, 4.6749267578125, 4.83782958984375, 5.000732421875, 5.16363525390625, 5.3265380859375, 5.48944091796875, 5.65234375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 3.0, 3.0, 7.0, 4.0, 5.0, 3.0, 8.0, 11.0, 10.0, 19.0, 26.0, 34.0, 677.0, 78.0, 31.0, 16.0, 16.0, 4.0, 12.0, 7.0, 5.0, 8.0, 3.0, 6.0, 4.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0625, -1.99053955078125, -1.9185791015625, -1.84661865234375, -1.774658203125, -1.70269775390625, -1.6307373046875, -1.55877685546875, -1.48681640625, -1.41485595703125, -1.3428955078125, -1.27093505859375, -1.198974609375, -1.12701416015625, -1.0550537109375, -0.98309326171875, -0.9111328125, -0.83917236328125, -0.7672119140625, -0.69525146484375, -0.623291015625, -0.55133056640625, -0.4793701171875, -0.40740966796875, -0.33544921875, -0.26348876953125, -0.1915283203125, -0.11956787109375, -0.047607421875, 0.02435302734375, 0.0963134765625, 0.16827392578125, 0.240234375, 0.31219482421875, 0.3841552734375, 0.45611572265625, 0.528076171875, 0.60003662109375, 0.6719970703125, 0.74395751953125, 0.81591796875, 0.88787841796875, 0.9598388671875, 1.03179931640625, 1.103759765625, 1.17572021484375, 1.2476806640625, 1.31964111328125, 1.3916015625, 1.46356201171875, 1.5355224609375, 1.60748291015625, 1.679443359375, 1.75140380859375, 1.8233642578125, 1.89532470703125, 1.96728515625, 2.03924560546875, 2.1112060546875, 2.18316650390625, 2.255126953125, 2.32708740234375, 2.3990478515625, 2.47100830078125, 2.54296875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 3.0, 1.0, 3.0, 5.0, 10.0, 11.0, 9.0, 13.0, 26.0, 25.0, 46.0, 57.0, 102.0, 127.0, 170.0, 332.0, 529.0, 866.0, 1517.0, 2548.0, 4769.0, 9537.0, 19880.0, 45706.0, 119165.0, 381624.0, 1808265.0, 1342266.0, 294556.0, 93436.0, 36281.0, 15868.0, 7489.0, 3974.0, 2065.0, 1071.0, 691.0, 446.0, 239.0, 163.0, 109.0, 82.0, 65.0, 34.0, 22.0, 23.0, 13.0, 15.0, 10.0, 7.0, 7.0, 6.0, 6.0, 3.0, 0.0, 2.0, 2.0], "bins": [-2.443359375, -2.371307373046875, -2.29925537109375, -2.227203369140625, -2.1551513671875, -2.083099365234375, -2.01104736328125, -1.938995361328125, -1.866943359375, -1.794891357421875, -1.72283935546875, -1.650787353515625, -1.5787353515625, -1.506683349609375, -1.43463134765625, -1.362579345703125, -1.29052734375, -1.218475341796875, -1.14642333984375, -1.074371337890625, -1.0023193359375, -0.930267333984375, -0.85821533203125, -0.786163330078125, -0.714111328125, -0.642059326171875, -0.57000732421875, -0.497955322265625, -0.4259033203125, -0.353851318359375, -0.28179931640625, -0.209747314453125, -0.1376953125, -0.065643310546875, 0.00640869140625, 0.078460693359375, 0.1505126953125, 0.222564697265625, 0.29461669921875, 0.366668701171875, 0.438720703125, 0.510772705078125, 0.58282470703125, 0.654876708984375, 0.7269287109375, 0.798980712890625, 0.87103271484375, 0.943084716796875, 1.01513671875, 1.087188720703125, 1.15924072265625, 1.231292724609375, 1.3033447265625, 1.375396728515625, 1.44744873046875, 1.519500732421875, 1.591552734375, 1.663604736328125, 1.73565673828125, 1.807708740234375, 1.8797607421875, 1.951812744140625, 2.02386474609375, 2.095916748046875, 2.16796875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 9.0, 7.0, 18.0, 13.0, 17.0, 23.0, 35.0, 36.0, 48.0, 65.0, 77.0, 102.0, 128.0, 157.0, 237.0, 308.0, 420.0, 644.0, 500.0, 294.0, 248.0, 187.0, 116.0, 84.0, 64.0, 57.0, 34.0, 35.0, 19.0, 24.0, 17.0, 10.0, 7.0, 6.0, 9.0, 3.0, 1.0, 3.0, 0.0, 4.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-1.7177734375, -1.6681060791015625, -1.618438720703125, -1.5687713623046875, -1.51910400390625, -1.4694366455078125, -1.419769287109375, -1.3701019287109375, -1.3204345703125, -1.2707672119140625, -1.221099853515625, -1.1714324951171875, -1.12176513671875, -1.0720977783203125, -1.022430419921875, -0.9727630615234375, -0.923095703125, -0.8734283447265625, -0.823760986328125, -0.7740936279296875, -0.72442626953125, -0.6747589111328125, -0.625091552734375, -0.5754241943359375, -0.5257568359375, -0.4760894775390625, -0.426422119140625, -0.3767547607421875, -0.32708740234375, -0.2774200439453125, -0.227752685546875, -0.1780853271484375, -0.12841796875, -0.0787506103515625, -0.029083251953125, 0.0205841064453125, 0.07025146484375, 0.1199188232421875, 0.169586181640625, 0.2192535400390625, 0.2689208984375, 0.3185882568359375, 0.368255615234375, 0.4179229736328125, 0.46759033203125, 0.5172576904296875, 0.566925048828125, 0.6165924072265625, 0.666259765625, 0.7159271240234375, 0.765594482421875, 0.8152618408203125, 0.86492919921875, 0.9145965576171875, 0.964263916015625, 1.0139312744140625, 1.0635986328125, 1.1132659912109375, 1.162933349609375, 1.2126007080078125, 1.26226806640625, 1.3119354248046875, 1.361602783203125, 1.4112701416015625, 1.4609375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 1.0, 13.0, 26.0, 81.0, 222.0, 356.0, 197.0, 76.0, 22.0, 6.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.911849975585938, -31.19810676574707, -30.484363555908203, -29.770618438720703, -29.056875228881836, -28.34313201904297, -27.62938690185547, -26.9156436920166, -26.201900482177734, -25.488157272338867, -24.7744140625, -24.0606689453125, -23.346925735473633, -22.633182525634766, -21.919437408447266, -21.2056941986084, -20.49195098876953, -19.778207778930664, -19.064464569091797, -18.350719451904297, -17.63697624206543, -16.923233032226562, -16.209487915039062, -15.495744705200195, -14.782001495361328, -14.068258285522461, -13.354514122009277, -12.640769958496094, -11.927026748657227, -11.21328353881836, -10.499539375305176, -9.785795211791992, -9.072052955627441, -8.358308792114258, -7.644565582275391, -6.930821895599365, -6.21707820892334, -5.5033345222473145, -4.789590835571289, -4.075847148895264, -3.3621034622192383, -2.648359775543213, -1.9346160888671875, -1.220872402191162, -0.5071287155151367, 0.20661497116088867, 0.9203586578369141, 1.6341023445129395, 2.347846031188965, 3.0615897178649902, 3.7753334045410156, 4.489077091217041, 5.202820777893066, 5.916564464569092, 6.630308151245117, 7.344051837921143, 8.057795524597168, 8.771539688110352, 9.485282897949219, 10.199026107788086, 10.91277027130127, 11.626514434814453, 12.34025764465332, 13.054000854492188, 13.767745018005371]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 0.0, 1.0, 4.0, 2.0, 5.0, 2.0, 12.0, 11.0, 10.0, 22.0, 19.0, 19.0, 33.0, 24.0, 36.0, 37.0, 49.0, 40.0, 52.0, 48.0, 43.0, 67.0, 48.0, 60.0, 48.0, 49.0, 38.0, 39.0, 41.0, 24.0, 34.0, 21.0, 17.0, 11.0, 9.0, 12.0, 7.0, 8.0, 5.0, 4.0, 1.0, 2.0], "bins": [-12.806951522827148, -12.502330780029297, -12.197710037231445, -11.893089294433594, -11.588468551635742, -11.283846855163574, -10.979226112365723, -10.674605369567871, -10.36998462677002, -10.065363883972168, -9.760743141174316, -9.456122398376465, -9.151500701904297, -8.846879959106445, -8.542259216308594, -8.237638473510742, -7.933017730712891, -7.628396987915039, -7.3237762451171875, -7.019155025482178, -6.714534282684326, -6.409913539886475, -6.105292320251465, -5.800671577453613, -5.496050834655762, -5.19143009185791, -4.886809349060059, -4.582188129425049, -4.277567386627197, -3.9729466438293457, -3.668325662612915, -3.3637046813964844, -3.0590829849243164, -2.754462242126465, -2.449841260910034, -2.1452202796936035, -1.840599536895752, -1.5359786748886108, -1.2313578128814697, -0.9267368316650391, -0.6221160888671875, -0.3174952268600464, -0.012874364852905273, 0.29174649715423584, 0.596367359161377, 0.9009882211685181, 1.2056090831756592, 1.5102300643920898, 1.8148508071899414, 2.119471549987793, 2.4240925312042236, 2.7287135124206543, 3.033334255218506, 3.3379549980163574, 3.642575979232788, 3.9471969604492188, 4.25181770324707, 4.556438446044922, 4.861059188842773, 5.165680408477783, 5.470301151275635, 5.774921894073486, 6.079543113708496, 6.384163856506348, 6.688784599304199]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 7.0, 13.0, 8.0, 12.0, 13.0, 31.0, 27.0, 41.0, 59.0, 81.0, 118.0, 163.0, 273.0, 378.0, 646.0, 1144.0, 1949.0, 3530.0, 6987.0, 14735.0, 36794.0, 593255.0, 328210.0, 32142.0, 13408.0, 6503.0, 3371.0, 1882.0, 1039.0, 601.0, 377.0, 232.0, 129.0, 109.0, 74.0, 53.0, 36.0, 32.0, 28.0, 16.0, 7.0, 8.0, 11.0, 9.0, 1.0, 1.0, 9.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.08984375, -4.93048095703125, -4.7711181640625, -4.61175537109375, -4.452392578125, -4.29302978515625, -4.1336669921875, -3.97430419921875, -3.81494140625, -3.65557861328125, -3.4962158203125, -3.33685302734375, -3.177490234375, -3.01812744140625, -2.8587646484375, -2.69940185546875, -2.5400390625, -2.38067626953125, -2.2213134765625, -2.06195068359375, -1.902587890625, -1.74322509765625, -1.5838623046875, -1.42449951171875, -1.26513671875, -1.10577392578125, -0.9464111328125, -0.78704833984375, -0.627685546875, -0.46832275390625, -0.3089599609375, -0.14959716796875, 0.009765625, 0.16912841796875, 0.3284912109375, 0.48785400390625, 0.647216796875, 0.80657958984375, 0.9659423828125, 1.12530517578125, 1.28466796875, 1.44403076171875, 1.6033935546875, 1.76275634765625, 1.922119140625, 2.08148193359375, 2.2408447265625, 2.40020751953125, 2.5595703125, 2.71893310546875, 2.8782958984375, 3.03765869140625, 3.197021484375, 3.35638427734375, 3.5157470703125, 3.67510986328125, 3.83447265625, 3.99383544921875, 4.1531982421875, 4.31256103515625, 4.471923828125, 4.63128662109375, 4.7906494140625, 4.95001220703125, 5.109375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 7.0, 2.0, 3.0, 3.0, 5.0, 11.0, 6.0, 10.0, 14.0, 23.0, 43.0, 167.0, 406.0, 161.0, 53.0, 15.0, 17.0, 7.0, 11.0, 8.0, 10.0, 4.0, 5.0, 6.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0078125, -1.9398193359375, -1.871826171875, -1.8038330078125, -1.73583984375, -1.6678466796875, -1.599853515625, -1.5318603515625, -1.4638671875, -1.3958740234375, -1.327880859375, -1.2598876953125, -1.19189453125, -1.1239013671875, -1.055908203125, -0.9879150390625, -0.919921875, -0.8519287109375, -0.783935546875, -0.7159423828125, -0.64794921875, -0.5799560546875, -0.511962890625, -0.4439697265625, -0.3759765625, -0.3079833984375, -0.239990234375, -0.1719970703125, -0.10400390625, -0.0360107421875, 0.031982421875, 0.0999755859375, 0.16796875, 0.2359619140625, 0.303955078125, 0.3719482421875, 0.43994140625, 0.5079345703125, 0.575927734375, 0.6439208984375, 0.7119140625, 0.7799072265625, 0.847900390625, 0.9158935546875, 0.98388671875, 1.0518798828125, 1.119873046875, 1.1878662109375, 1.255859375, 1.3238525390625, 1.391845703125, 1.4598388671875, 1.52783203125, 1.5958251953125, 1.663818359375, 1.7318115234375, 1.7998046875, 1.8677978515625, 1.935791015625, 2.0037841796875, 2.07177734375, 2.1397705078125, 2.207763671875, 2.2757568359375, 2.34375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 3.0, 5.0, 9.0, 13.0, 12.0, 11.0, 9.0, 14.0, 26.0, 32.0, 49.0, 53.0, 96.0, 208.0, 384.0, 884.0, 2006.0, 4941.0, 13338.0, 41490.0, 151012.0, 502439.0, 238986.0, 61738.0, 19015.0, 6870.0, 2653.0, 1113.0, 470.0, 256.0, 150.0, 73.0, 45.0, 34.0, 32.0, 22.0, 12.0, 14.0, 12.0, 6.0, 3.0, 6.0, 4.0, 5.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-5.6796875, -5.50579833984375, -5.3319091796875, -5.15802001953125, -4.984130859375, -4.81024169921875, -4.6363525390625, -4.46246337890625, -4.28857421875, -4.11468505859375, -3.9407958984375, -3.76690673828125, -3.593017578125, -3.41912841796875, -3.2452392578125, -3.07135009765625, -2.8974609375, -2.72357177734375, -2.5496826171875, -2.37579345703125, -2.201904296875, -2.02801513671875, -1.8541259765625, -1.68023681640625, -1.50634765625, -1.33245849609375, -1.1585693359375, -0.98468017578125, -0.810791015625, -0.63690185546875, -0.4630126953125, -0.28912353515625, -0.115234375, 0.05865478515625, 0.2325439453125, 0.40643310546875, 0.580322265625, 0.75421142578125, 0.9281005859375, 1.10198974609375, 1.27587890625, 1.44976806640625, 1.6236572265625, 1.79754638671875, 1.971435546875, 2.14532470703125, 2.3192138671875, 2.49310302734375, 2.6669921875, 2.84088134765625, 3.0147705078125, 3.18865966796875, 3.362548828125, 3.53643798828125, 3.7103271484375, 3.88421630859375, 4.05810546875, 4.23199462890625, 4.4058837890625, 4.57977294921875, 4.753662109375, 4.92755126953125, 5.1014404296875, 5.27532958984375, 5.44921875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 3.0, 5.0, 6.0, 5.0, 12.0, 11.0, 18.0, 24.0, 28.0, 20.0, 28.0, 26.0, 32.0, 38.0, 32.0, 31.0, 38.0, 31.0, 39.0, 37.0, 45.0, 39.0, 37.0, 42.0, 27.0, 24.0, 46.0, 31.0, 22.0, 23.0, 25.0, 24.0, 19.0, 22.0, 18.0, 16.0, 14.0, 10.0, 17.0, 7.0, 8.0, 6.0, 3.0, 4.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-6.78515625, -6.58624267578125, -6.3873291015625, -6.18841552734375, -5.989501953125, -5.79058837890625, -5.5916748046875, -5.39276123046875, -5.19384765625, -4.99493408203125, -4.7960205078125, -4.59710693359375, -4.398193359375, -4.19927978515625, -4.0003662109375, -3.80145263671875, -3.6025390625, -3.40362548828125, -3.2047119140625, -3.00579833984375, -2.806884765625, -2.60797119140625, -2.4090576171875, -2.21014404296875, -2.01123046875, -1.81231689453125, -1.6134033203125, -1.41448974609375, -1.215576171875, -1.01666259765625, -0.8177490234375, -0.61883544921875, -0.419921875, -0.22100830078125, -0.0220947265625, 0.17681884765625, 0.375732421875, 0.57464599609375, 0.7735595703125, 0.97247314453125, 1.17138671875, 1.37030029296875, 1.5692138671875, 1.76812744140625, 1.967041015625, 2.16595458984375, 2.3648681640625, 2.56378173828125, 2.7626953125, 2.96160888671875, 3.1605224609375, 3.35943603515625, 3.558349609375, 3.75726318359375, 3.9561767578125, 4.15509033203125, 4.35400390625, 4.55291748046875, 4.7518310546875, 4.95074462890625, 5.149658203125, 5.34857177734375, 5.5474853515625, 5.74639892578125, 5.9453125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 7.0, 4.0, 9.0, 13.0, 17.0, 29.0, 35.0, 66.0, 94.0, 166.0, 275.0, 515.0, 1059.0, 2488.0, 7380.0, 35587.0, 784125.0, 192465.0, 16351.0, 4386.0, 1730.0, 771.0, 400.0, 212.0, 117.0, 93.0, 48.0, 29.0, 27.0, 13.0, 13.0, 8.0, 6.0, 9.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.09375, -5.89581298828125, -5.6978759765625, -5.49993896484375, -5.302001953125, -5.10406494140625, -4.9061279296875, -4.70819091796875, -4.51025390625, -4.31231689453125, -4.1143798828125, -3.91644287109375, -3.718505859375, -3.52056884765625, -3.3226318359375, -3.12469482421875, -2.9267578125, -2.72882080078125, -2.5308837890625, -2.33294677734375, -2.135009765625, -1.93707275390625, -1.7391357421875, -1.54119873046875, -1.34326171875, -1.14532470703125, -0.9473876953125, -0.74945068359375, -0.551513671875, -0.35357666015625, -0.1556396484375, 0.04229736328125, 0.240234375, 0.43817138671875, 0.6361083984375, 0.83404541015625, 1.031982421875, 1.22991943359375, 1.4278564453125, 1.62579345703125, 1.82373046875, 2.02166748046875, 2.2196044921875, 2.41754150390625, 2.615478515625, 2.81341552734375, 3.0113525390625, 3.20928955078125, 3.4072265625, 3.60516357421875, 3.8031005859375, 4.00103759765625, 4.198974609375, 4.39691162109375, 4.5948486328125, 4.79278564453125, 4.99072265625, 5.18865966796875, 5.3865966796875, 5.58453369140625, 5.782470703125, 5.98040771484375, 6.1783447265625, 6.37628173828125, 6.57421875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 2.0, 6.0, 11.0, 22.0, 27.0, 39.0, 58.0, 91.0, 113.0, 121.0, 144.0, 106.0, 85.0, 56.0, 34.0, 26.0, 17.0, 18.0, 8.0, 4.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00021696090698242188, -0.00021111220121383667, -0.00020526349544525146, -0.00019941478967666626, -0.00019356608390808105, -0.00018771737813949585, -0.00018186867237091064, -0.00017601996660232544, -0.00017017126083374023, -0.00016432255506515503, -0.00015847384929656982, -0.00015262514352798462, -0.00014677643775939941, -0.0001409277319908142, -0.000135079026222229, -0.0001292303204536438, -0.0001233816146850586, -0.00011753290891647339, -0.00011168420314788818, -0.00010583549737930298, -9.998679161071777e-05, -9.413808584213257e-05, -8.828938007354736e-05, -8.244067430496216e-05, -7.659196853637695e-05, -7.074326276779175e-05, -6.489455699920654e-05, -5.904585123062134e-05, -5.319714546203613e-05, -4.734843969345093e-05, -4.149973392486572e-05, -3.565102815628052e-05, -2.9802322387695312e-05, -2.3953616619110107e-05, -1.8104910850524902e-05, -1.2256205081939697e-05, -6.407499313354492e-06, -5.587935447692871e-07, 5.289912223815918e-06, 1.1138617992401123e-05, 1.6987323760986328e-05, 2.2836029529571533e-05, 2.8684735298156738e-05, 3.453344106674194e-05, 4.038214683532715e-05, 4.6230852603912354e-05, 5.207955837249756e-05, 5.7928264141082764e-05, 6.377696990966797e-05, 6.962567567825317e-05, 7.547438144683838e-05, 8.132308721542358e-05, 8.717179298400879e-05, 9.3020498752594e-05, 9.88692045211792e-05, 0.0001047179102897644, 0.00011056661605834961, 0.00011641532182693481, 0.00012226402759552002, 0.00012811273336410522, 0.00013396143913269043, 0.00013981014490127563, 0.00014565885066986084, 0.00015150755643844604, 0.00015735626220703125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 3.0, 4.0, 7.0, 8.0, 14.0, 17.0, 13.0, 37.0, 44.0, 84.0, 174.0, 267.0, 536.0, 1254.0, 3067.0, 9157.0, 37885.0, 320299.0, 596044.0, 59769.0, 12912.0, 3973.0, 1511.0, 683.0, 341.0, 193.0, 100.0, 50.0, 45.0, 26.0, 15.0, 12.0, 6.0, 10.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.255859375, -3.101776123046875, -2.94769287109375, -2.793609619140625, -2.6395263671875, -2.485443115234375, -2.33135986328125, -2.177276611328125, -2.023193359375, -1.869110107421875, -1.71502685546875, -1.560943603515625, -1.4068603515625, -1.252777099609375, -1.09869384765625, -0.944610595703125, -0.79052734375, -0.636444091796875, -0.48236083984375, -0.328277587890625, -0.1741943359375, -0.020111083984375, 0.13397216796875, 0.288055419921875, 0.442138671875, 0.596221923828125, 0.75030517578125, 0.904388427734375, 1.0584716796875, 1.212554931640625, 1.36663818359375, 1.520721435546875, 1.6748046875, 1.828887939453125, 1.98297119140625, 2.137054443359375, 2.2911376953125, 2.445220947265625, 2.59930419921875, 2.753387451171875, 2.907470703125, 3.061553955078125, 3.21563720703125, 3.369720458984375, 3.5238037109375, 3.677886962890625, 3.83197021484375, 3.986053466796875, 4.14013671875, 4.294219970703125, 4.44830322265625, 4.602386474609375, 4.7564697265625, 4.910552978515625, 5.06463623046875, 5.218719482421875, 5.372802734375, 5.526885986328125, 5.68096923828125, 5.835052490234375, 5.9891357421875, 6.143218994140625, 6.29730224609375, 6.451385498046875, 6.60546875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 1.0, 4.0, 5.0, 4.0, 3.0, 11.0, 5.0, 10.0, 13.0, 20.0, 18.0, 24.0, 23.0, 27.0, 58.0, 61.0, 70.0, 77.0, 100.0, 87.0, 63.0, 66.0, 43.0, 45.0, 40.0, 22.0, 23.0, 16.0, 15.0, 16.0, 7.0, 8.0, 4.0, 4.0, 1.0, 3.0, 3.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.27734375, -5.133209228515625, -4.98907470703125, -4.844940185546875, -4.7008056640625, -4.556671142578125, -4.41253662109375, -4.268402099609375, -4.124267578125, -3.980133056640625, -3.83599853515625, -3.691864013671875, -3.5477294921875, -3.403594970703125, -3.25946044921875, -3.115325927734375, -2.97119140625, -2.827056884765625, -2.68292236328125, -2.538787841796875, -2.3946533203125, -2.250518798828125, -2.10638427734375, -1.962249755859375, -1.818115234375, -1.673980712890625, -1.52984619140625, -1.385711669921875, -1.2415771484375, -1.097442626953125, -0.95330810546875, -0.809173583984375, -0.6650390625, -0.520904541015625, -0.37677001953125, -0.232635498046875, -0.0885009765625, 0.055633544921875, 0.19976806640625, 0.343902587890625, 0.488037109375, 0.632171630859375, 0.77630615234375, 0.920440673828125, 1.0645751953125, 1.208709716796875, 1.35284423828125, 1.496978759765625, 1.64111328125, 1.785247802734375, 1.92938232421875, 2.073516845703125, 2.2176513671875, 2.361785888671875, 2.50592041015625, 2.650054931640625, 2.794189453125, 2.938323974609375, 3.08245849609375, 3.226593017578125, 3.3707275390625, 3.514862060546875, 3.65899658203125, 3.803131103515625, 3.947265625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 8.0, 10.0, 12.0, 48.0, 180.0, 511.0, 166.0, 48.0, 13.0, 5.0, 6.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-103.89703369140625, -99.28172302246094, -94.6664047241211, -90.05109405517578, -85.43577575683594, -80.82046508789062, -76.20515441894531, -71.58984375, -66.97452545166016, -62.35921096801758, -57.743896484375, -53.12858581542969, -48.51327133178711, -43.89795684814453, -39.28264617919922, -34.66733169555664, -30.052017211914062, -25.436702728271484, -20.82139015197754, -16.206077575683594, -11.590763092041016, -6.9754486083984375, -2.360136032104492, 2.255176544189453, 6.870491027832031, 11.485804557800293, 16.101118087768555, 20.7164306640625, 25.331745147705078, 29.947059631347656, 34.56237030029297, 39.17768478393555, 43.79301452636719, 48.408329010009766, 53.023643493652344, 57.638954162597656, 62.254268646240234, 66.86958312988281, 71.48489379882812, 76.10020446777344, 80.71552276611328, 85.3308334350586, 89.94615173339844, 94.56146240234375, 99.17677307128906, 103.7920913696289, 108.40740203857422, 113.02272033691406, 117.63803100585938, 122.25334167480469, 126.86865997314453, 131.48397827148438, 136.0992889404297, 140.714599609375, 145.3299102783203, 149.94522094726562, 154.560546875, 159.1758575439453, 163.79116821289062, 168.406494140625, 173.0218048095703, 177.63711547851562, 182.25242614746094, 186.86773681640625, 191.48304748535156]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 0.0, 3.0, 5.0, 1.0, 3.0, 5.0, 6.0, 4.0, 8.0, 8.0, 7.0, 15.0, 28.0, 31.0, 49.0, 71.0, 92.0, 107.0, 116.0, 124.0, 101.0, 51.0, 44.0, 36.0, 23.0, 16.0, 11.0, 4.0, 11.0, 5.0, 3.0, 4.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-110.92841339111328, -107.02137756347656, -103.11434936523438, -99.20731353759766, -95.30028533935547, -91.39324951171875, -87.48622131347656, -83.57918548583984, -79.67214965820312, -75.7651138305664, -71.85808563232422, -67.9510498046875, -64.04402160644531, -60.136985778808594, -56.22995376586914, -52.32292175292969, -48.4158935546875, -44.50886154174805, -40.601829528808594, -36.694793701171875, -32.78776550292969, -28.8807315826416, -24.973697662353516, -21.066665649414062, -17.15963363647461, -13.252601623535156, -9.345568656921387, -5.438535690307617, -1.531503677368164, 2.375528335571289, 6.282562255859375, 10.189594268798828, 14.096633911132812, 18.003665924072266, 21.91069793701172, 25.817731857299805, 29.724763870239258, 33.631797790527344, 37.5388298034668, 41.44586181640625, 45.3528938293457, 49.259925842285156, 53.16695785522461, 57.07398986816406, 60.98102569580078, 64.88805389404297, 68.79508972167969, 72.70211791992188, 76.6091537475586, 80.51618957519531, 84.4232177734375, 88.33025360107422, 92.2372817993164, 96.14431762695312, 100.05134582519531, 103.95838165283203, 107.86541748046875, 111.77245330810547, 115.67948150634766, 119.58651733398438, 123.49354553222656, 127.40058135986328, 131.3076171875, 135.2146453857422, 139.12167358398438]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 7.0, 10.0, 9.0, 8.0, 15.0, 21.0, 35.0, 32.0, 57.0, 85.0, 87.0, 125.0, 183.0, 296.0, 453.0, 757.0, 1263.0, 2186.0, 4207.0, 9122.0, 26010.0, 143518.0, 3820257.0, 140125.0, 25593.0, 9219.0, 4205.0, 2312.0, 1357.0, 886.0, 551.0, 385.0, 260.0, 159.0, 132.0, 75.0, 76.0, 47.0, 38.0, 29.0, 24.0, 16.0, 15.0, 14.0, 7.0, 7.0, 2.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 4.0, 2.0], "bins": [-15.078125, -14.5994873046875, -14.120849609375, -13.6422119140625, -13.16357421875, -12.6849365234375, -12.206298828125, -11.7276611328125, -11.2490234375, -10.7703857421875, -10.291748046875, -9.8131103515625, -9.33447265625, -8.8558349609375, -8.377197265625, -7.8985595703125, -7.419921875, -6.9412841796875, -6.462646484375, -5.9840087890625, -5.50537109375, -5.0267333984375, -4.548095703125, -4.0694580078125, -3.5908203125, -3.1121826171875, -2.633544921875, -2.1549072265625, -1.67626953125, -1.1976318359375, -0.718994140625, -0.2403564453125, 0.23828125, 0.7169189453125, 1.195556640625, 1.6741943359375, 2.15283203125, 2.6314697265625, 3.110107421875, 3.5887451171875, 4.0673828125, 4.5460205078125, 5.024658203125, 5.5032958984375, 5.98193359375, 6.4605712890625, 6.939208984375, 7.4178466796875, 7.896484375, 8.3751220703125, 8.853759765625, 9.3323974609375, 9.81103515625, 10.2896728515625, 10.768310546875, 11.2469482421875, 11.7255859375, 12.2042236328125, 12.682861328125, 13.1614990234375, 13.64013671875, 14.1187744140625, 14.597412109375, 15.0760498046875, 15.5546875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 0.0, 4.0, 5.0, 6.0, 3.0, 5.0, 9.0, 8.0, 12.0, 18.0, 23.0, 37.0, 79.0, 94.0, 145.0, 165.0, 116.0, 84.0, 59.0, 27.0, 25.0, 12.0, 10.0, 5.0, 8.0, 2.0, 10.0, 1.0, 1.0, 3.0, 4.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.466796875, -1.4183349609375, -1.369873046875, -1.3214111328125, -1.27294921875, -1.2244873046875, -1.176025390625, -1.1275634765625, -1.0791015625, -1.0306396484375, -0.982177734375, -0.9337158203125, -0.88525390625, -0.8367919921875, -0.788330078125, -0.7398681640625, -0.69140625, -0.6429443359375, -0.594482421875, -0.5460205078125, -0.49755859375, -0.4490966796875, -0.400634765625, -0.3521728515625, -0.3037109375, -0.2552490234375, -0.206787109375, -0.1583251953125, -0.10986328125, -0.0614013671875, -0.012939453125, 0.0355224609375, 0.083984375, 0.1324462890625, 0.180908203125, 0.2293701171875, 0.27783203125, 0.3262939453125, 0.374755859375, 0.4232177734375, 0.4716796875, 0.5201416015625, 0.568603515625, 0.6170654296875, 0.66552734375, 0.7139892578125, 0.762451171875, 0.8109130859375, 0.859375, 0.9078369140625, 0.956298828125, 1.0047607421875, 1.05322265625, 1.1016845703125, 1.150146484375, 1.1986083984375, 1.2470703125, 1.2955322265625, 1.343994140625, 1.3924560546875, 1.44091796875, 1.4893798828125, 1.537841796875, 1.5863037109375, 1.634765625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 3.0, 4.0, 6.0, 8.0, 10.0, 22.0, 31.0, 37.0, 62.0, 69.0, 136.0, 185.0, 282.0, 514.0, 945.0, 1892.0, 4201.0, 12144.0, 57383.0, 2582382.0, 1466972.0, 49118.0, 10589.0, 3673.0, 1564.0, 856.0, 461.0, 268.0, 166.0, 106.0, 57.0, 44.0, 27.0, 19.0, 14.0, 10.0, 7.0, 6.0, 5.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-12.59375, -12.1734619140625, -11.753173828125, -11.3328857421875, -10.91259765625, -10.4923095703125, -10.072021484375, -9.6517333984375, -9.2314453125, -8.8111572265625, -8.390869140625, -7.9705810546875, -7.55029296875, -7.1300048828125, -6.709716796875, -6.2894287109375, -5.869140625, -5.4488525390625, -5.028564453125, -4.6082763671875, -4.18798828125, -3.7677001953125, -3.347412109375, -2.9271240234375, -2.5068359375, -2.0865478515625, -1.666259765625, -1.2459716796875, -0.82568359375, -0.4053955078125, 0.014892578125, 0.4351806640625, 0.85546875, 1.2757568359375, 1.696044921875, 2.1163330078125, 2.53662109375, 2.9569091796875, 3.377197265625, 3.7974853515625, 4.2177734375, 4.6380615234375, 5.058349609375, 5.4786376953125, 5.89892578125, 6.3192138671875, 6.739501953125, 7.1597900390625, 7.580078125, 8.0003662109375, 8.420654296875, 8.8409423828125, 9.26123046875, 9.6815185546875, 10.101806640625, 10.5220947265625, 10.9423828125, 11.3626708984375, 11.782958984375, 12.2032470703125, 12.62353515625, 13.0438232421875, 13.464111328125, 13.8843994140625, 14.3046875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 1.0, 3.0, 5.0, 3.0, 9.0, 10.0, 10.0, 19.0, 31.0, 49.0, 92.0, 230.0, 906.0, 1977.0, 410.0, 167.0, 57.0, 43.0, 22.0, 11.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.357421875, -3.242340087890625, -3.12725830078125, -3.012176513671875, -2.8970947265625, -2.782012939453125, -2.66693115234375, -2.551849365234375, -2.436767578125, -2.321685791015625, -2.20660400390625, -2.091522216796875, -1.9764404296875, -1.861358642578125, -1.74627685546875, -1.631195068359375, -1.51611328125, -1.401031494140625, -1.28594970703125, -1.170867919921875, -1.0557861328125, -0.940704345703125, -0.82562255859375, -0.710540771484375, -0.595458984375, -0.480377197265625, -0.36529541015625, -0.250213623046875, -0.1351318359375, -0.020050048828125, 0.09503173828125, 0.210113525390625, 0.3251953125, 0.440277099609375, 0.55535888671875, 0.670440673828125, 0.7855224609375, 0.900604248046875, 1.01568603515625, 1.130767822265625, 1.245849609375, 1.360931396484375, 1.47601318359375, 1.591094970703125, 1.7061767578125, 1.821258544921875, 1.93634033203125, 2.051422119140625, 2.16650390625, 2.281585693359375, 2.39666748046875, 2.511749267578125, 2.6268310546875, 2.741912841796875, 2.85699462890625, 2.972076416015625, 3.087158203125, 3.202239990234375, 3.31732177734375, 3.432403564453125, 3.5474853515625, 3.662567138671875, 3.77764892578125, 3.892730712890625, 4.0078125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 5.0, 3.0, 13.0, 16.0, 46.0, 75.0, 183.0, 255.0, 200.0, 98.0, 46.0, 20.0, 15.0, 10.0, 5.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.447733879089355, -14.952469825744629, -14.457205772399902, -13.96194076538086, -13.466676712036133, -12.971412658691406, -12.47614860534668, -11.980884552001953, -11.485620498657227, -10.9903564453125, -10.495092391967773, -9.999828338623047, -9.504563331604004, -9.009299278259277, -8.51403522491455, -8.018771171569824, -7.523506164550781, -7.028242111206055, -6.53297758102417, -6.037713527679443, -5.542448997497559, -5.047184944152832, -4.5519208908081055, -4.056656837463379, -3.561392307281494, -3.0661280155181885, -2.570863723754883, -2.0755996704101562, -1.5803353786468506, -1.085071086883545, -0.5898070335388184, -0.0945427417755127, 0.40072059631347656, 0.8959848284721375, 1.3912490606307983, 1.8865132331848145, 2.38177752494812, 2.877041816711426, 3.3723058700561523, 3.867570161819458, 4.362834453582764, 4.85809850692749, 5.353363037109375, 5.848627090454102, 6.343891143798828, 6.839155673980713, 7.3344197273254395, 7.829684257507324, 8.32494831085205, 8.820212364196777, 9.315476417541504, 9.810741424560547, 10.306005477905273, 10.80126953125, 11.296533584594727, 11.791797637939453, 12.28706169128418, 12.782325744628906, 13.277589797973633, 13.77285385131836, 14.268118858337402, 14.763382911682129, 15.258646965026855, 15.753911018371582, 16.249176025390625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 7.0, 4.0, 7.0, 13.0, 18.0, 41.0, 55.0, 80.0, 102.0, 101.0, 92.0, 92.0, 100.0, 80.0, 74.0, 46.0, 28.0, 15.0, 12.0, 9.0, 7.0, 6.0, 6.0, 1.0, 4.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.30668067932129, -16.71780014038086, -16.128921508789062, -15.540040969848633, -14.951160430908203, -14.36228084564209, -13.773401260375977, -13.184520721435547, -12.595641136169434, -12.00676155090332, -11.41788101196289, -10.829001426696777, -10.240121841430664, -9.651241302490234, -9.062361717224121, -8.473482131958008, -7.884601593017578, -7.295721530914307, -6.706841468811035, -6.117961883544922, -5.52908182144165, -4.940201759338379, -4.351322174072266, -3.762442111968994, -3.1735620498657227, -2.584681987762451, -1.9958021640777588, -1.4069222211837769, -0.8180422782897949, -0.22916221618652344, 0.35971760749816895, 0.9485974311828613, 1.5374755859375, 2.1263556480407715, 2.715235471725464, 3.3041152954101562, 3.8929953575134277, 4.481875419616699, 5.0707550048828125, 5.659635066986084, 6.2485151290893555, 6.837395191192627, 7.426275253295898, 8.015154838562012, 8.604034423828125, 9.192914962768555, 9.781794548034668, 10.370674133300781, 10.959554672241211, 11.548434257507324, 12.137314796447754, 12.726194381713867, 13.315074920654297, 13.90395450592041, 14.492834091186523, 15.081714630126953, 15.670594215393066, 16.25947380065918, 16.84835433959961, 17.43723487854004, 18.026113510131836, 18.614994049072266, 19.203874588012695, 19.792753219604492, 20.381633758544922]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 4.0, 5.0, 9.0, 14.0, 18.0, 21.0, 31.0, 27.0, 31.0, 47.0, 61.0, 116.0, 306.0, 1387.0, 11948.0, 682133.0, 341657.0, 9058.0, 1065.0, 253.0, 103.0, 67.0, 46.0, 28.0, 17.0, 24.0, 19.0, 11.0, 13.0, 17.0, 2.0, 3.0, 5.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.546875, -29.590576171875, -28.63427734375, -27.677978515625, -26.7216796875, -25.765380859375, -24.80908203125, -23.852783203125, -22.896484375, -21.940185546875, -20.98388671875, -20.027587890625, -19.0712890625, -18.114990234375, -17.15869140625, -16.202392578125, -15.24609375, -14.289794921875, -13.33349609375, -12.377197265625, -11.4208984375, -10.464599609375, -9.50830078125, -8.552001953125, -7.595703125, -6.639404296875, -5.68310546875, -4.726806640625, -3.7705078125, -2.814208984375, -1.85791015625, -0.901611328125, 0.0546875, 1.010986328125, 1.96728515625, 2.923583984375, 3.8798828125, 4.836181640625, 5.79248046875, 6.748779296875, 7.705078125, 8.661376953125, 9.61767578125, 10.573974609375, 11.5302734375, 12.486572265625, 13.44287109375, 14.399169921875, 15.35546875, 16.311767578125, 17.26806640625, 18.224365234375, 19.1806640625, 20.136962890625, 21.09326171875, 22.049560546875, 23.005859375, 23.962158203125, 24.91845703125, 25.874755859375, 26.8310546875, 27.787353515625, 28.74365234375, 29.699951171875, 30.65625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 8.0, 5.0, 3.0, 8.0, 20.0, 36.0, 80.0, 194.0, 256.0, 211.0, 108.0, 34.0, 21.0, 10.0, 10.0, 5.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.96435546875, -0.8649368286132812, -0.7655181884765625, -0.6660995483398438, -0.566680908203125, -0.46726226806640625, -0.3678436279296875, -0.26842498779296875, -0.16900634765625, -0.06958770751953125, 0.0298309326171875, 0.12924957275390625, 0.228668212890625, 0.32808685302734375, 0.4275054931640625, 0.5269241333007812, 0.6263427734375, 0.7257614135742188, 0.8251800537109375, 0.9245986938476562, 1.024017333984375, 1.1234359741210938, 1.2228546142578125, 1.3222732543945312, 1.42169189453125, 1.5211105346679688, 1.6205291748046875, 1.7199478149414062, 1.819366455078125, 1.9187850952148438, 2.0182037353515625, 2.1176223754882812, 2.217041015625, 2.3164596557617188, 2.4158782958984375, 2.5152969360351562, 2.614715576171875, 2.7141342163085938, 2.8135528564453125, 2.9129714965820312, 3.01239013671875, 3.1118087768554688, 3.2112274169921875, 3.3106460571289062, 3.410064697265625, 3.5094833374023438, 3.6089019775390625, 3.7083206176757812, 3.8077392578125, 3.9071578979492188, 4.0065765380859375, 4.105995178222656, 4.205413818359375, 4.304832458496094, 4.4042510986328125, 4.503669738769531, 4.60308837890625, 4.702507019042969, 4.8019256591796875, 4.901344299316406, 5.000762939453125, 5.100181579589844, 5.1996002197265625, 5.299018859863281, 5.3984375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 7.0, 10.0, 11.0, 17.0, 40.0, 92.0, 238.0, 641.0, 1852.0, 5803.0, 22220.0, 109586.0, 581594.0, 264681.0, 45640.0, 11100.0, 3209.0, 1062.0, 420.0, 161.0, 93.0, 36.0, 24.0, 6.0, 5.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.53515625, -7.27288818359375, -7.0106201171875, -6.74835205078125, -6.486083984375, -6.22381591796875, -5.9615478515625, -5.69927978515625, -5.43701171875, -5.17474365234375, -4.9124755859375, -4.65020751953125, -4.387939453125, -4.12567138671875, -3.8634033203125, -3.60113525390625, -3.3388671875, -3.07659912109375, -2.8143310546875, -2.55206298828125, -2.289794921875, -2.02752685546875, -1.7652587890625, -1.50299072265625, -1.24072265625, -0.97845458984375, -0.7161865234375, -0.45391845703125, -0.191650390625, 0.07061767578125, 0.3328857421875, 0.59515380859375, 0.857421875, 1.11968994140625, 1.3819580078125, 1.64422607421875, 1.906494140625, 2.16876220703125, 2.4310302734375, 2.69329833984375, 2.95556640625, 3.21783447265625, 3.4801025390625, 3.74237060546875, 4.004638671875, 4.26690673828125, 4.5291748046875, 4.79144287109375, 5.0537109375, 5.31597900390625, 5.5782470703125, 5.84051513671875, 6.102783203125, 6.36505126953125, 6.6273193359375, 6.88958740234375, 7.15185546875, 7.41412353515625, 7.6763916015625, 7.93865966796875, 8.200927734375, 8.46319580078125, 8.7254638671875, 8.98773193359375, 9.25]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 6.0, 2.0, 7.0, 4.0, 5.0, 11.0, 12.0, 12.0, 11.0, 15.0, 11.0, 20.0, 24.0, 18.0, 25.0, 24.0, 37.0, 40.0, 42.0, 27.0, 35.0, 39.0, 50.0, 35.0, 34.0, 37.0, 33.0, 34.0, 38.0, 35.0, 41.0, 27.0, 23.0, 25.0, 28.0, 24.0, 17.0, 22.0, 12.0, 9.0, 10.0, 11.0, 12.0, 10.0, 3.0, 1.0, 5.0, 2.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-4.0078125, -3.87786865234375, -3.7479248046875, -3.61798095703125, -3.488037109375, -3.35809326171875, -3.2281494140625, -3.09820556640625, -2.96826171875, -2.83831787109375, -2.7083740234375, -2.57843017578125, -2.448486328125, -2.31854248046875, -2.1885986328125, -2.05865478515625, -1.9287109375, -1.79876708984375, -1.6688232421875, -1.53887939453125, -1.408935546875, -1.27899169921875, -1.1490478515625, -1.01910400390625, -0.88916015625, -0.75921630859375, -0.6292724609375, -0.49932861328125, -0.369384765625, -0.23944091796875, -0.1094970703125, 0.02044677734375, 0.150390625, 0.28033447265625, 0.4102783203125, 0.54022216796875, 0.670166015625, 0.80010986328125, 0.9300537109375, 1.05999755859375, 1.18994140625, 1.31988525390625, 1.4498291015625, 1.57977294921875, 1.709716796875, 1.83966064453125, 1.9696044921875, 2.09954833984375, 2.2294921875, 2.35943603515625, 2.4893798828125, 2.61932373046875, 2.749267578125, 2.87921142578125, 3.0091552734375, 3.13909912109375, 3.26904296875, 3.39898681640625, 3.5289306640625, 3.65887451171875, 3.788818359375, 3.91876220703125, 4.0487060546875, 4.17864990234375, 4.30859375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 7.0, 4.0, 11.0, 12.0, 20.0, 29.0, 48.0, 71.0, 151.0, 347.0, 881.0, 2933.0, 13729.0, 297899.0, 708249.0, 18893.0, 3512.0, 1021.0, 371.0, 155.0, 73.0, 51.0, 27.0, 24.0, 16.0, 7.0, 5.0, 4.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.09375, -17.425537109375, -16.75732421875, -16.089111328125, -15.4208984375, -14.752685546875, -14.08447265625, -13.416259765625, -12.748046875, -12.079833984375, -11.41162109375, -10.743408203125, -10.0751953125, -9.406982421875, -8.73876953125, -8.070556640625, -7.40234375, -6.734130859375, -6.06591796875, -5.397705078125, -4.7294921875, -4.061279296875, -3.39306640625, -2.724853515625, -2.056640625, -1.388427734375, -0.72021484375, -0.052001953125, 0.6162109375, 1.284423828125, 1.95263671875, 2.620849609375, 3.2890625, 3.957275390625, 4.62548828125, 5.293701171875, 5.9619140625, 6.630126953125, 7.29833984375, 7.966552734375, 8.634765625, 9.302978515625, 9.97119140625, 10.639404296875, 11.3076171875, 11.975830078125, 12.64404296875, 13.312255859375, 13.98046875, 14.648681640625, 15.31689453125, 15.985107421875, 16.6533203125, 17.321533203125, 17.98974609375, 18.657958984375, 19.326171875, 19.994384765625, 20.66259765625, 21.330810546875, 21.9990234375, 22.667236328125, 23.33544921875, 24.003662109375, 24.671875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 9.0, 7.0, 9.0, 8.0, 16.0, 13.0, 41.0, 67.0, 155.0, 274.0, 187.0, 88.0, 38.0, 28.0, 15.0, 8.0, 4.0, 9.0, 2.0, 4.0, 8.0, 4.0, 2.0, 1.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007023811340332031, -0.0006793811917304993, -0.0006563812494277954, -0.0006333813071250916, -0.0006103813648223877, -0.0005873814225196838, -0.00056438148021698, -0.0005413815379142761, -0.0005183815956115723, -0.0004953816533088684, -0.00047238171100616455, -0.0004493817687034607, -0.00042638182640075684, -0.000403381884098053, -0.0003803819417953491, -0.00035738199949264526, -0.0003343820571899414, -0.00031138211488723755, -0.0002883821725845337, -0.00026538223028182983, -0.00024238228797912598, -0.00021938234567642212, -0.00019638240337371826, -0.0001733824610710144, -0.00015038251876831055, -0.0001273825764656067, -0.00010438263416290283, -8.138269186019897e-05, -5.838274955749512e-05, -3.538280725479126e-05, -1.2382864952087402e-05, 1.0617077350616455e-05, 3.361701965332031e-05, 5.661696195602417e-05, 7.961690425872803e-05, 0.00010261684656143188, 0.00012561678886413574, 0.0001486167311668396, 0.00017161667346954346, 0.00019461661577224731, 0.00021761655807495117, 0.00024061650037765503, 0.0002636164426803589, 0.00028661638498306274, 0.0003096163272857666, 0.00033261626958847046, 0.0003556162118911743, 0.0003786161541938782, 0.00040161609649658203, 0.0004246160387992859, 0.00044761598110198975, 0.0004706159234046936, 0.0004936158657073975, 0.0005166158080101013, 0.0005396157503128052, 0.000562615692615509, 0.0005856156349182129, 0.0006086155772209167, 0.0006316155195236206, 0.0006546154618263245, 0.0006776154041290283, 0.0007006153464317322, 0.000723615288734436, 0.0007466152310371399, 0.0007696151733398438]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 3.0, 5.0, 6.0, 8.0, 12.0, 9.0, 27.0, 25.0, 48.0, 67.0, 74.0, 140.0, 177.0, 265.0, 460.0, 758.0, 1190.0, 2088.0, 3501.0, 6686.0, 13485.0, 30253.0, 87500.0, 411030.0, 357607.0, 77099.0, 27788.0, 12601.0, 6508.0, 3477.0, 2096.0, 1271.0, 755.0, 539.0, 335.0, 227.0, 147.0, 83.0, 72.0, 34.0, 36.0, 23.0, 8.0, 8.0, 12.0, 4.0, 3.0, 4.0, 4.0, 3.0, 2.0], "bins": [-6.20703125, -6.0390625, -5.87109375, -5.703125, -5.53515625, -5.3671875, -5.19921875, -5.03125, -4.86328125, -4.6953125, -4.52734375, -4.359375, -4.19140625, -4.0234375, -3.85546875, -3.6875, -3.51953125, -3.3515625, -3.18359375, -3.015625, -2.84765625, -2.6796875, -2.51171875, -2.34375, -2.17578125, -2.0078125, -1.83984375, -1.671875, -1.50390625, -1.3359375, -1.16796875, -1.0, -0.83203125, -0.6640625, -0.49609375, -0.328125, -0.16015625, 0.0078125, 0.17578125, 0.34375, 0.51171875, 0.6796875, 0.84765625, 1.015625, 1.18359375, 1.3515625, 1.51953125, 1.6875, 1.85546875, 2.0234375, 2.19140625, 2.359375, 2.52734375, 2.6953125, 2.86328125, 3.03125, 3.19921875, 3.3671875, 3.53515625, 3.703125, 3.87109375, 4.0390625, 4.20703125, 4.375, 4.54296875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 8.0, 6.0, 7.0, 7.0, 14.0, 17.0, 21.0, 22.0, 31.0, 43.0, 52.0, 81.0, 108.0, 120.0, 99.0, 95.0, 78.0, 52.0, 31.0, 20.0, 11.0, 14.0, 16.0, 6.0, 3.0, 7.0, 4.0, 6.0, 4.0, 3.0, 4.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.09765625, -6.879638671875, -6.66162109375, -6.443603515625, -6.2255859375, -6.007568359375, -5.78955078125, -5.571533203125, -5.353515625, -5.135498046875, -4.91748046875, -4.699462890625, -4.4814453125, -4.263427734375, -4.04541015625, -3.827392578125, -3.609375, -3.391357421875, -3.17333984375, -2.955322265625, -2.7373046875, -2.519287109375, -2.30126953125, -2.083251953125, -1.865234375, -1.647216796875, -1.42919921875, -1.211181640625, -0.9931640625, -0.775146484375, -0.55712890625, -0.339111328125, -0.12109375, 0.096923828125, 0.31494140625, 0.532958984375, 0.7509765625, 0.968994140625, 1.18701171875, 1.405029296875, 1.623046875, 1.841064453125, 2.05908203125, 2.277099609375, 2.4951171875, 2.713134765625, 2.93115234375, 3.149169921875, 3.3671875, 3.585205078125, 3.80322265625, 4.021240234375, 4.2392578125, 4.457275390625, 4.67529296875, 4.893310546875, 5.111328125, 5.329345703125, 5.54736328125, 5.765380859375, 5.9833984375, 6.201416015625, 6.41943359375, 6.637451171875, 6.85546875]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 11.0, 55.0, 224.0, 373.0, 197.0, 82.0, 35.0, 9.0, 6.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-86.09200286865234, -82.81078338623047, -79.52957153320312, -76.24835205078125, -72.9671401977539, -69.68592071533203, -66.40470886230469, -63.12348937988281, -59.8422737121582, -56.561058044433594, -53.279842376708984, -49.998626708984375, -46.7174072265625, -43.436195373535156, -40.15497589111328, -36.87376022338867, -33.59254455566406, -30.311328887939453, -27.030113220214844, -23.7488956451416, -20.467679977416992, -17.186464309692383, -13.90524673461914, -10.624031066894531, -7.342815399169922, -4.061599254608154, -0.7803831100463867, 2.500833511352539, 5.782049179077148, 9.063264846801758, 12.344482421875, 15.62569808959961, 18.906906127929688, 22.188121795654297, 25.469337463378906, 28.75055503845215, 32.031768798828125, 35.31298828125, 38.59420394897461, 41.87541961669922, 45.15663528442383, 48.43785095214844, 51.71906661987305, 55.000282287597656, 58.28150177001953, 61.562713623046875, 64.84393310546875, 68.12515258789062, 71.40636444091797, 74.68758392333984, 77.96879577636719, 81.25001525878906, 84.5312271118164, 87.81244659423828, 91.09365844726562, 94.3748779296875, 97.65609741210938, 100.93731689453125, 104.2185287475586, 107.49974822998047, 110.78096008300781, 114.06217956542969, 117.34339904785156, 120.6246109008789, 123.90582275390625]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 1.0, 4.0, 1.0, 11.0, 6.0, 11.0, 9.0, 33.0, 31.0, 69.0, 93.0, 125.0, 157.0, 138.0, 127.0, 70.0, 59.0, 27.0, 11.0, 13.0, 6.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-146.91952514648438, -143.66024780273438, -140.40098571777344, -137.14170837402344, -133.8824462890625, -130.6231689453125, -127.36390686035156, -124.10462951660156, -120.8453598022461, -117.58609008789062, -114.32682037353516, -111.06755065917969, -107.80828094482422, -104.54901123046875, -101.28973388671875, -98.03046417236328, -94.77119445800781, -91.51192474365234, -88.25265502929688, -84.9933853149414, -81.73411560058594, -78.47483825683594, -75.215576171875, -71.956298828125, -68.69703674316406, -65.4377670288086, -62.178497314453125, -58.919227600097656, -55.65995407104492, -52.40068435668945, -49.141414642333984, -45.88214111328125, -42.622867584228516, -39.36359786987305, -36.10432815551758, -32.845054626464844, -29.585784912109375, -26.326515197753906, -23.067245483398438, -19.807973861694336, -16.548704147338867, -13.289433479309082, -10.030162811279297, -6.770893096923828, -3.511622428894043, -0.2523517608642578, 3.006917953491211, 6.2661895751953125, 9.525459289550781, 12.784729957580566, 16.04400062561035, 19.30327033996582, 22.562541961669922, 25.82181167602539, 29.08108139038086, 32.340354919433594, 35.59962463378906, 38.85889434814453, 42.1181640625, 45.37743377685547, 48.6367073059082, 51.89597702026367, 55.15524673461914, 58.414520263671875, 61.67378616333008]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 5.0, 4.0, 4.0, 10.0, 17.0, 11.0, 26.0, 27.0, 35.0, 60.0, 83.0, 101.0, 122.0, 202.0, 370.0, 476.0, 876.0, 1513.0, 3140.0, 7553.0, 26726.0, 330810.0, 3736626.0, 64427.0, 12515.0, 4300.0, 1824.0, 948.0, 506.0, 329.0, 202.0, 149.0, 83.0, 68.0, 38.0, 29.0, 19.0, 17.0, 11.0, 9.0, 7.0, 4.0, 4.0, 4.0, 0.0, 2.0, 1.0], "bins": [-27.703125, -26.9970703125, -26.291015625, -25.5849609375, -24.87890625, -24.1728515625, -23.466796875, -22.7607421875, -22.0546875, -21.3486328125, -20.642578125, -19.9365234375, -19.23046875, -18.5244140625, -17.818359375, -17.1123046875, -16.40625, -15.7001953125, -14.994140625, -14.2880859375, -13.58203125, -12.8759765625, -12.169921875, -11.4638671875, -10.7578125, -10.0517578125, -9.345703125, -8.6396484375, -7.93359375, -7.2275390625, -6.521484375, -5.8154296875, -5.109375, -4.4033203125, -3.697265625, -2.9912109375, -2.28515625, -1.5791015625, -0.873046875, -0.1669921875, 0.5390625, 1.2451171875, 1.951171875, 2.6572265625, 3.36328125, 4.0693359375, 4.775390625, 5.4814453125, 6.1875, 6.8935546875, 7.599609375, 8.3056640625, 9.01171875, 9.7177734375, 10.423828125, 11.1298828125, 11.8359375, 12.5419921875, 13.248046875, 13.9541015625, 14.66015625, 15.3662109375, 16.072265625, 16.7783203125, 17.484375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 2.0, 4.0, 6.0, 6.0, 10.0, 11.0, 22.0, 24.0, 23.0, 30.0, 53.0, 66.0, 78.0, 109.0, 103.0, 89.0, 87.0, 72.0, 52.0, 44.0, 27.0, 28.0, 19.0, 4.0, 8.0, 4.0, 7.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3671875, -1.32855224609375, -1.2899169921875, -1.25128173828125, -1.212646484375, -1.17401123046875, -1.1353759765625, -1.09674072265625, -1.05810546875, -1.01947021484375, -0.9808349609375, -0.94219970703125, -0.903564453125, -0.86492919921875, -0.8262939453125, -0.78765869140625, -0.7490234375, -0.71038818359375, -0.6717529296875, -0.63311767578125, -0.594482421875, -0.55584716796875, -0.5172119140625, -0.47857666015625, -0.43994140625, -0.40130615234375, -0.3626708984375, -0.32403564453125, -0.285400390625, -0.24676513671875, -0.2081298828125, -0.16949462890625, -0.130859375, -0.09222412109375, -0.0535888671875, -0.01495361328125, 0.023681640625, 0.06231689453125, 0.1009521484375, 0.13958740234375, 0.17822265625, 0.21685791015625, 0.2554931640625, 0.29412841796875, 0.332763671875, 0.37139892578125, 0.4100341796875, 0.44866943359375, 0.4873046875, 0.52593994140625, 0.5645751953125, 0.60321044921875, 0.641845703125, 0.68048095703125, 0.7191162109375, 0.75775146484375, 0.79638671875, 0.83502197265625, 0.8736572265625, 0.91229248046875, 0.950927734375, 0.98956298828125, 1.0281982421875, 1.06683349609375, 1.10546875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 5.0, 4.0, 5.0, 11.0, 7.0, 13.0, 11.0, 19.0, 21.0, 26.0, 55.0, 74.0, 115.0, 322.0, 1849.0, 42058.0, 4120392.0, 27128.0, 1508.0, 295.0, 124.0, 67.0, 42.0, 38.0, 19.0, 17.0, 9.0, 9.0, 6.0, 8.0, 4.0, 6.0, 5.0, 0.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.78125, -41.462890625, -40.14453125, -38.826171875, -37.5078125, -36.189453125, -34.87109375, -33.552734375, -32.234375, -30.916015625, -29.59765625, -28.279296875, -26.9609375, -25.642578125, -24.32421875, -23.005859375, -21.6875, -20.369140625, -19.05078125, -17.732421875, -16.4140625, -15.095703125, -13.77734375, -12.458984375, -11.140625, -9.822265625, -8.50390625, -7.185546875, -5.8671875, -4.548828125, -3.23046875, -1.912109375, -0.59375, 0.724609375, 2.04296875, 3.361328125, 4.6796875, 5.998046875, 7.31640625, 8.634765625, 9.953125, 11.271484375, 12.58984375, 13.908203125, 15.2265625, 16.544921875, 17.86328125, 19.181640625, 20.5, 21.818359375, 23.13671875, 24.455078125, 25.7734375, 27.091796875, 28.41015625, 29.728515625, 31.046875, 32.365234375, 33.68359375, 35.001953125, 36.3203125, 37.638671875, 38.95703125, 40.275390625, 41.59375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 7.0, 4.0, 7.0, 7.0, 4.0, 10.0, 9.0, 13.0, 35.0, 35.0, 49.0, 76.0, 140.0, 215.0, 421.0, 1052.0, 950.0, 379.0, 218.0, 134.0, 92.0, 61.0, 43.0, 30.0, 19.0, 14.0, 11.0, 12.0, 1.0, 8.0, 3.0, 3.0, 3.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9541015625, -1.8910675048828125, -1.828033447265625, -1.7649993896484375, -1.70196533203125, -1.6389312744140625, -1.575897216796875, -1.5128631591796875, -1.4498291015625, -1.3867950439453125, -1.323760986328125, -1.2607269287109375, -1.19769287109375, -1.1346588134765625, -1.071624755859375, -1.0085906982421875, -0.945556640625, -0.8825225830078125, -0.819488525390625, -0.7564544677734375, -0.69342041015625, -0.6303863525390625, -0.567352294921875, -0.5043182373046875, -0.4412841796875, -0.3782501220703125, -0.315216064453125, -0.2521820068359375, -0.18914794921875, -0.1261138916015625, -0.063079833984375, -4.57763671875e-05, 0.06298828125, 0.1260223388671875, 0.189056396484375, 0.2520904541015625, 0.31512451171875, 0.3781585693359375, 0.441192626953125, 0.5042266845703125, 0.5672607421875, 0.6302947998046875, 0.693328857421875, 0.7563629150390625, 0.81939697265625, 0.8824310302734375, 0.945465087890625, 1.0084991455078125, 1.071533203125, 1.1345672607421875, 1.197601318359375, 1.2606353759765625, 1.32366943359375, 1.3867034912109375, 1.449737548828125, 1.5127716064453125, 1.5758056640625, 1.6388397216796875, 1.701873779296875, 1.7649078369140625, 1.82794189453125, 1.8909759521484375, 1.954010009765625, 2.0170440673828125, 2.080078125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 1.0, 7.0, 8.0, 25.0, 33.0, 61.0, 122.0, 201.0, 234.0, 143.0, 82.0, 37.0, 25.0, 5.0, 13.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-22.572629928588867, -22.10427474975586, -21.635921478271484, -21.167566299438477, -20.6992130279541, -20.230857849121094, -19.76250457763672, -19.29414939880371, -18.825794219970703, -18.357439041137695, -17.88908576965332, -17.420730590820312, -16.952377319335938, -16.48402214050293, -16.015668869018555, -15.547313690185547, -15.078960418701172, -14.61060619354248, -14.142251968383789, -13.673897743225098, -13.205543518066406, -12.737188339233398, -12.268834114074707, -11.800479888916016, -11.332125663757324, -10.863771438598633, -10.395417213439941, -9.92706298828125, -9.458707809448242, -8.990354537963867, -8.52199935913086, -8.053645133972168, -7.585291862487793, -7.116937637329102, -6.64858341217041, -6.1802287101745605, -5.711874485015869, -5.243520259857178, -4.775165557861328, -4.306811332702637, -3.8384571075439453, -3.370102882385254, -2.9017484188079834, -2.433393955230713, -1.9650397300720215, -1.49668550491333, -1.0283310413360596, -0.5599765777587891, -0.09162235260009766, 0.3767319917678833, 0.8450863361358643, 1.3134406805038452, 1.7817950248718262, 2.2501492500305176, 2.718503713607788, 3.1868581771850586, 3.65521240234375, 4.123566627502441, 4.591920852661133, 5.060275554656982, 5.528629779815674, 5.996984004974365, 6.465338706970215, 6.933692932128906, 7.402047157287598]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 7.0, 6.0, 4.0, 8.0, 6.0, 17.0, 14.0, 19.0, 18.0, 21.0, 34.0, 29.0, 33.0, 49.0, 50.0, 40.0, 49.0, 47.0, 46.0, 59.0, 67.0, 37.0, 37.0, 54.0, 26.0, 39.0, 29.0, 30.0, 24.0, 16.0, 20.0, 14.0, 11.0, 9.0, 4.0, 5.0, 5.0, 7.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.331695556640625, -7.072372913360596, -6.813050270080566, -6.553727626800537, -6.294404983520508, -6.035082817077637, -5.775760173797607, -5.516437530517578, -5.257114887237549, -4.9977922439575195, -4.73846960067749, -4.479146957397461, -4.21982479095459, -3.9605019092559814, -3.7011795043945312, -3.441856861114502, -3.1825342178344727, -2.9232115745544434, -2.663888931274414, -2.404566526412964, -2.1452438831329346, -1.8859212398529053, -1.6265987157821655, -1.3672761917114258, -1.1079535484313965, -0.848630964756012, -0.5893083810806274, -0.3299857974052429, -0.0706632137298584, 0.1886594295501709, 0.44798195362091064, 0.7073044776916504, 0.9666271209716797, 1.225949764251709, 1.4852722883224487, 1.7445948123931885, 2.0039174556732178, 2.263240098953247, 2.5225625038146973, 2.7818851470947266, 3.041207790374756, 3.300530433654785, 3.5598530769348145, 3.8191754817962646, 4.078497886657715, 4.337821006774902, 4.597143173217773, 4.856465816497803, 5.115788459777832, 5.375111103057861, 5.634433746337891, 5.89375638961792, 6.153079032897949, 6.41240119934082, 6.67172384262085, 6.931046485900879, 7.190369129180908, 7.4496917724609375, 7.709014415740967, 7.968337059020996, 8.227659225463867, 8.486982345581055, 8.746304512023926, 9.005626678466797, 9.264949798583984]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 5.0, 8.0, 6.0, 17.0, 17.0, 26.0, 27.0, 29.0, 49.0, 70.0, 112.0, 137.0, 220.0, 391.0, 671.0, 1205.0, 2312.0, 5060.0, 12634.0, 38962.0, 155308.0, 485195.0, 253752.0, 61041.0, 17917.0, 6690.0, 3040.0, 1518.0, 795.0, 463.0, 304.0, 182.0, 112.0, 93.0, 50.0, 37.0, 25.0, 16.0, 14.0, 10.0, 12.0, 8.0, 5.0, 13.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.74609375, -6.5330810546875, -6.320068359375, -6.1070556640625, -5.89404296875, -5.6810302734375, -5.468017578125, -5.2550048828125, -5.0419921875, -4.8289794921875, -4.615966796875, -4.4029541015625, -4.18994140625, -3.9769287109375, -3.763916015625, -3.5509033203125, -3.337890625, -3.1248779296875, -2.911865234375, -2.6988525390625, -2.48583984375, -2.2728271484375, -2.059814453125, -1.8468017578125, -1.6337890625, -1.4207763671875, -1.207763671875, -0.9947509765625, -0.78173828125, -0.5687255859375, -0.355712890625, -0.1427001953125, 0.0703125, 0.2833251953125, 0.496337890625, 0.7093505859375, 0.92236328125, 1.1353759765625, 1.348388671875, 1.5614013671875, 1.7744140625, 1.9874267578125, 2.200439453125, 2.4134521484375, 2.62646484375, 2.8394775390625, 3.052490234375, 3.2655029296875, 3.478515625, 3.6915283203125, 3.904541015625, 4.1175537109375, 4.33056640625, 4.5435791015625, 4.756591796875, 4.9696044921875, 5.1826171875, 5.3956298828125, 5.608642578125, 5.8216552734375, 6.03466796875, 6.2476806640625, 6.460693359375, 6.6737060546875, 6.88671875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 7.0, 3.0, 11.0, 11.0, 18.0, 22.0, 41.0, 65.0, 53.0, 75.0, 81.0, 85.0, 101.0, 90.0, 74.0, 54.0, 56.0, 41.0, 36.0, 19.0, 15.0, 8.0, 18.0, 5.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.177734375, -1.1412353515625, -1.104736328125, -1.0682373046875, -1.03173828125, -0.9952392578125, -0.958740234375, -0.9222412109375, -0.8857421875, -0.8492431640625, -0.812744140625, -0.7762451171875, -0.73974609375, -0.7032470703125, -0.666748046875, -0.6302490234375, -0.59375, -0.5572509765625, -0.520751953125, -0.4842529296875, -0.44775390625, -0.4112548828125, -0.374755859375, -0.3382568359375, -0.3017578125, -0.2652587890625, -0.228759765625, -0.1922607421875, -0.15576171875, -0.1192626953125, -0.082763671875, -0.0462646484375, -0.009765625, 0.0267333984375, 0.063232421875, 0.0997314453125, 0.13623046875, 0.1727294921875, 0.209228515625, 0.2457275390625, 0.2822265625, 0.3187255859375, 0.355224609375, 0.3917236328125, 0.42822265625, 0.4647216796875, 0.501220703125, 0.5377197265625, 0.57421875, 0.6107177734375, 0.647216796875, 0.6837158203125, 0.72021484375, 0.7567138671875, 0.793212890625, 0.8297119140625, 0.8662109375, 0.9027099609375, 0.939208984375, 0.9757080078125, 1.01220703125, 1.0487060546875, 1.085205078125, 1.1217041015625, 1.158203125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 5.0, 6.0, 8.0, 7.0, 17.0, 27.0, 34.0, 49.0, 68.0, 97.0, 132.0, 226.0, 314.0, 457.0, 729.0, 1193.0, 2172.0, 4060.0, 8327.0, 18467.0, 45531.0, 121040.0, 300873.0, 320023.0, 134604.0, 49943.0, 20462.0, 9251.0, 4485.0, 2295.0, 1288.0, 802.0, 525.0, 315.0, 224.0, 161.0, 102.0, 76.0, 52.0, 37.0, 24.0, 17.0, 14.0, 13.0, 3.0, 5.0, 0.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.09765625, -4.9334716796875, -4.769287109375, -4.6051025390625, -4.44091796875, -4.2767333984375, -4.112548828125, -3.9483642578125, -3.7841796875, -3.6199951171875, -3.455810546875, -3.2916259765625, -3.12744140625, -2.9632568359375, -2.799072265625, -2.6348876953125, -2.470703125, -2.3065185546875, -2.142333984375, -1.9781494140625, -1.81396484375, -1.6497802734375, -1.485595703125, -1.3214111328125, -1.1572265625, -0.9930419921875, -0.828857421875, -0.6646728515625, -0.50048828125, -0.3363037109375, -0.172119140625, -0.0079345703125, 0.15625, 0.3204345703125, 0.484619140625, 0.6488037109375, 0.81298828125, 0.9771728515625, 1.141357421875, 1.3055419921875, 1.4697265625, 1.6339111328125, 1.798095703125, 1.9622802734375, 2.12646484375, 2.2906494140625, 2.454833984375, 2.6190185546875, 2.783203125, 2.9473876953125, 3.111572265625, 3.2757568359375, 3.43994140625, 3.6041259765625, 3.768310546875, 3.9324951171875, 4.0966796875, 4.2608642578125, 4.425048828125, 4.5892333984375, 4.75341796875, 4.9176025390625, 5.081787109375, 5.2459716796875, 5.41015625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 3.0, 6.0, 3.0, 9.0, 8.0, 13.0, 18.0, 17.0, 29.0, 17.0, 29.0, 28.0, 29.0, 25.0, 29.0, 33.0, 35.0, 41.0, 46.0, 32.0, 44.0, 51.0, 46.0, 42.0, 46.0, 38.0, 31.0, 28.0, 27.0, 30.0, 34.0, 19.0, 20.0, 12.0, 16.0, 11.0, 14.0, 14.0, 9.0, 3.0, 6.0, 3.0, 6.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.40234375, -4.25836181640625, -4.1143798828125, -3.97039794921875, -3.826416015625, -3.68243408203125, -3.5384521484375, -3.39447021484375, -3.25048828125, -3.10650634765625, -2.9625244140625, -2.81854248046875, -2.674560546875, -2.53057861328125, -2.3865966796875, -2.24261474609375, -2.0986328125, -1.95465087890625, -1.8106689453125, -1.66668701171875, -1.522705078125, -1.37872314453125, -1.2347412109375, -1.09075927734375, -0.94677734375, -0.80279541015625, -0.6588134765625, -0.51483154296875, -0.370849609375, -0.22686767578125, -0.0828857421875, 0.06109619140625, 0.205078125, 0.34906005859375, 0.4930419921875, 0.63702392578125, 0.781005859375, 0.92498779296875, 1.0689697265625, 1.21295166015625, 1.35693359375, 1.50091552734375, 1.6448974609375, 1.78887939453125, 1.932861328125, 2.07684326171875, 2.2208251953125, 2.36480712890625, 2.5087890625, 2.65277099609375, 2.7967529296875, 2.94073486328125, 3.084716796875, 3.22869873046875, 3.3726806640625, 3.51666259765625, 3.66064453125, 3.80462646484375, 3.9486083984375, 4.09259033203125, 4.236572265625, 4.38055419921875, 4.5245361328125, 4.66851806640625, 4.8125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 4.0, 7.0, 13.0, 13.0, 20.0, 47.0, 61.0, 128.0, 196.0, 414.0, 831.0, 1995.0, 5977.0, 25434.0, 194822.0, 685341.0, 108895.0, 16926.0, 4436.0, 1558.0, 674.0, 328.0, 162.0, 102.0, 58.0, 37.0, 20.0, 19.0, 10.0, 8.0, 5.0, 4.0, 4.0, 6.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1484375, -8.8658447265625, -8.583251953125, -8.3006591796875, -8.01806640625, -7.7354736328125, -7.452880859375, -7.1702880859375, -6.8876953125, -6.6051025390625, -6.322509765625, -6.0399169921875, -5.75732421875, -5.4747314453125, -5.192138671875, -4.9095458984375, -4.626953125, -4.3443603515625, -4.061767578125, -3.7791748046875, -3.49658203125, -3.2139892578125, -2.931396484375, -2.6488037109375, -2.3662109375, -2.0836181640625, -1.801025390625, -1.5184326171875, -1.23583984375, -0.9532470703125, -0.670654296875, -0.3880615234375, -0.10546875, 0.1771240234375, 0.459716796875, 0.7423095703125, 1.02490234375, 1.3074951171875, 1.590087890625, 1.8726806640625, 2.1552734375, 2.4378662109375, 2.720458984375, 3.0030517578125, 3.28564453125, 3.5682373046875, 3.850830078125, 4.1334228515625, 4.416015625, 4.6986083984375, 4.981201171875, 5.2637939453125, 5.54638671875, 5.8289794921875, 6.111572265625, 6.3941650390625, 6.6767578125, 6.9593505859375, 7.241943359375, 7.5245361328125, 7.80712890625, 8.0897216796875, 8.372314453125, 8.6549072265625, 8.9375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 4.0, 3.0, 6.0, 7.0, 3.0, 14.0, 10.0, 8.0, 18.0, 23.0, 22.0, 29.0, 31.0, 46.0, 55.0, 59.0, 77.0, 78.0, 78.0, 78.0, 68.0, 50.0, 34.0, 47.0, 30.0, 22.0, 15.0, 17.0, 14.0, 14.0, 11.0, 7.0, 7.0, 5.0, 1.0, 3.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0005249977111816406, -0.0005104541778564453, -0.00049591064453125, -0.0004813671112060547, -0.0004668235778808594, -0.00045228004455566406, -0.00043773651123046875, -0.00042319297790527344, -0.0004086494445800781, -0.0003941059112548828, -0.0003795623779296875, -0.0003650188446044922, -0.0003504753112792969, -0.00033593177795410156, -0.00032138824462890625, -0.00030684471130371094, -0.0002923011779785156, -0.0002777576446533203, -0.000263214111328125, -0.0002486705780029297, -0.00023412704467773438, -0.00021958351135253906, -0.00020503997802734375, -0.00019049644470214844, -0.00017595291137695312, -0.0001614093780517578, -0.0001468658447265625, -0.0001323223114013672, -0.00011777877807617188, -0.00010323524475097656, -8.869171142578125e-05, -7.414817810058594e-05, -5.9604644775390625e-05, -4.506111145019531e-05, -3.0517578125e-05, -1.5974044799804688e-05, -1.430511474609375e-06, 1.3113021850585938e-05, 2.765655517578125e-05, 4.220008850097656e-05, 5.6743621826171875e-05, 7.128715515136719e-05, 8.58306884765625e-05, 0.00010037422180175781, 0.00011491775512695312, 0.00012946128845214844, 0.00014400482177734375, 0.00015854835510253906, 0.00017309188842773438, 0.0001876354217529297, 0.000202178955078125, 0.0002167224884033203, 0.00023126602172851562, 0.00024580955505371094, 0.00026035308837890625, 0.00027489662170410156, 0.0002894401550292969, 0.0003039836883544922, 0.0003185272216796875, 0.0003330707550048828, 0.0003476142883300781, 0.00036215782165527344, 0.00037670135498046875, 0.00039124488830566406, 0.0004057884216308594]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 7.0, 9.0, 21.0, 17.0, 32.0, 46.0, 65.0, 79.0, 142.0, 217.0, 262.0, 484.0, 922.0, 1747.0, 3388.0, 7869.0, 19226.0, 55955.0, 192765.0, 468078.0, 203753.0, 58059.0, 19659.0, 7865.0, 3669.0, 1766.0, 939.0, 563.0, 346.0, 186.0, 112.0, 81.0, 64.0, 41.0, 36.0, 21.0, 18.0, 12.0, 11.0, 8.0, 8.0, 1.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-4.88671875, -4.7364501953125, -4.586181640625, -4.4359130859375, -4.28564453125, -4.1353759765625, -3.985107421875, -3.8348388671875, -3.6845703125, -3.5343017578125, -3.384033203125, -3.2337646484375, -3.08349609375, -2.9332275390625, -2.782958984375, -2.6326904296875, -2.482421875, -2.3321533203125, -2.181884765625, -2.0316162109375, -1.88134765625, -1.7310791015625, -1.580810546875, -1.4305419921875, -1.2802734375, -1.1300048828125, -0.979736328125, -0.8294677734375, -0.67919921875, -0.5289306640625, -0.378662109375, -0.2283935546875, -0.078125, 0.0721435546875, 0.222412109375, 0.3726806640625, 0.52294921875, 0.6732177734375, 0.823486328125, 0.9737548828125, 1.1240234375, 1.2742919921875, 1.424560546875, 1.5748291015625, 1.72509765625, 1.8753662109375, 2.025634765625, 2.1759033203125, 2.326171875, 2.4764404296875, 2.626708984375, 2.7769775390625, 2.92724609375, 3.0775146484375, 3.227783203125, 3.3780517578125, 3.5283203125, 3.6785888671875, 3.828857421875, 3.9791259765625, 4.12939453125, 4.2796630859375, 4.429931640625, 4.5802001953125, 4.73046875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 6.0, 8.0, 7.0, 6.0, 9.0, 10.0, 9.0, 14.0, 19.0, 15.0, 15.0, 24.0, 34.0, 48.0, 57.0, 64.0, 62.0, 85.0, 73.0, 75.0, 68.0, 53.0, 43.0, 46.0, 24.0, 28.0, 12.0, 22.0, 18.0, 11.0, 6.0, 5.0, 7.0, 5.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-3.51953125, -3.4129638671875, -3.306396484375, -3.1998291015625, -3.09326171875, -2.9866943359375, -2.880126953125, -2.7735595703125, -2.6669921875, -2.5604248046875, -2.453857421875, -2.3472900390625, -2.24072265625, -2.1341552734375, -2.027587890625, -1.9210205078125, -1.814453125, -1.7078857421875, -1.601318359375, -1.4947509765625, -1.38818359375, -1.2816162109375, -1.175048828125, -1.0684814453125, -0.9619140625, -0.8553466796875, -0.748779296875, -0.6422119140625, -0.53564453125, -0.4290771484375, -0.322509765625, -0.2159423828125, -0.109375, -0.0028076171875, 0.103759765625, 0.2103271484375, 0.31689453125, 0.4234619140625, 0.530029296875, 0.6365966796875, 0.7431640625, 0.8497314453125, 0.956298828125, 1.0628662109375, 1.16943359375, 1.2760009765625, 1.382568359375, 1.4891357421875, 1.595703125, 1.7022705078125, 1.808837890625, 1.9154052734375, 2.02197265625, 2.1285400390625, 2.235107421875, 2.3416748046875, 2.4482421875, 2.5548095703125, 2.661376953125, 2.7679443359375, 2.87451171875, 2.9810791015625, 3.087646484375, 3.1942138671875, 3.30078125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 9.0, 21.0, 44.0, 104.0, 221.0, 285.0, 154.0, 84.0, 31.0, 24.0, 8.0, 5.0, 9.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.89102172851562, -80.39715576171875, -77.9032974243164, -75.40943145751953, -72.91557312011719, -70.42170715332031, -67.92784118652344, -65.43397521972656, -62.94011688232422, -60.44625473022461, -57.952392578125, -55.458526611328125, -52.964664459228516, -50.470802307128906, -47.97693634033203, -45.48307418823242, -42.98921203613281, -40.4953498840332, -38.001487731933594, -35.50762176513672, -33.01375961303711, -30.5198974609375, -28.026033401489258, -25.532169342041016, -23.038307189941406, -20.544445037841797, -18.050580978393555, -15.556717872619629, -13.062854766845703, -10.568991661071777, -8.075128555297852, -5.581264495849609, -3.08740234375, -0.5935392379760742, 1.9003238677978516, 4.394186973571777, 6.888050079345703, 9.381913185119629, 11.875776290893555, 14.369640350341797, 16.863502502441406, 19.357364654541016, 21.851228713989258, 24.3450927734375, 26.83895492553711, 29.33281707763672, 31.82668113708496, 34.3205451965332, 36.81440734863281, 39.30826950073242, 41.80213165283203, 44.295997619628906, 46.789859771728516, 49.283721923828125, 51.777587890625, 54.27145004272461, 56.76531219482422, 59.25917434692383, 61.75303649902344, 64.24690246582031, 66.74076843261719, 69.23462677001953, 71.7284927368164, 74.22235107421875, 76.71621704101562]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 8.0, 5.0, 4.0, 10.0, 17.0, 19.0, 34.0, 48.0, 45.0, 42.0, 71.0, 71.0, 92.0, 84.0, 81.0, 80.0, 73.0, 55.0, 51.0, 27.0, 32.0, 26.0, 17.0, 12.0, 3.0, 0.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.71028137207031, -71.56988525390625, -69.42948913574219, -67.28909301757812, -65.14869689941406, -63.008296966552734, -60.86790084838867, -58.72750473022461, -56.58710479736328, -54.44670867919922, -52.306312561035156, -50.165916442871094, -48.025516510009766, -45.8851203918457, -43.74472427368164, -41.60432815551758, -39.463932037353516, -37.32353591918945, -35.18313980102539, -33.04273986816406, -30.90234375, -28.761947631835938, -26.621551513671875, -24.481155395507812, -22.340757369995117, -20.200361251831055, -18.05996322631836, -15.919567108154297, -13.779170036315918, -11.638772964477539, -9.498376846313477, -7.357979774475098, -5.217578887939453, -3.0771820545196533, -0.9367852210998535, 1.2036113739013672, 3.344008445739746, 5.484405517578125, 7.6248016357421875, 9.765198707580566, 11.905595779418945, 14.045992851257324, 16.186389923095703, 18.326786041259766, 20.467182159423828, 22.607580184936523, 24.747976303100586, 26.88837432861328, 29.028770446777344, 31.169166564941406, 33.30956268310547, 35.44995880126953, 37.59035873413086, 39.73075485229492, 41.871150970458984, 44.01154708862305, 46.151947021484375, 48.29234313964844, 50.4327392578125, 52.57313537597656, 54.71353530883789, 56.85393142700195, 58.994327545166016, 61.13472366333008, 63.27511978149414]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 7.0, 8.0, 11.0, 22.0, 28.0, 52.0, 74.0, 188.0, 423.0, 1182.0, 5581.0, 83519.0, 4070554.0, 28111.0, 3096.0, 798.0, 320.0, 128.0, 70.0, 44.0, 17.0, 15.0, 9.0, 7.0, 8.0, 3.0, 6.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.09375, -46.56005859375, -45.0263671875, -43.49267578125, -41.958984375, -40.42529296875, -38.8916015625, -37.35791015625, -35.82421875, -34.29052734375, -32.7568359375, -31.22314453125, -29.689453125, -28.15576171875, -26.6220703125, -25.08837890625, -23.5546875, -22.02099609375, -20.4873046875, -18.95361328125, -17.419921875, -15.88623046875, -14.3525390625, -12.81884765625, -11.28515625, -9.75146484375, -8.2177734375, -6.68408203125, -5.150390625, -3.61669921875, -2.0830078125, -0.54931640625, 0.984375, 2.51806640625, 4.0517578125, 5.58544921875, 7.119140625, 8.65283203125, 10.1865234375, 11.72021484375, 13.25390625, 14.78759765625, 16.3212890625, 17.85498046875, 19.388671875, 20.92236328125, 22.4560546875, 23.98974609375, 25.5234375, 27.05712890625, 28.5908203125, 30.12451171875, 31.658203125, 33.19189453125, 34.7255859375, 36.25927734375, 37.79296875, 39.32666015625, 40.8603515625, 42.39404296875, 43.927734375, 45.46142578125, 46.9951171875, 48.52880859375, 50.0625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 7.0, 9.0, 13.0, 18.0, 25.0, 55.0, 81.0, 88.0, 107.0, 128.0, 135.0, 101.0, 75.0, 57.0, 40.0, 25.0, 15.0, 10.0, 4.0, 5.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.216796875, -2.14447021484375, -2.0721435546875, -1.99981689453125, -1.927490234375, -1.85516357421875, -1.7828369140625, -1.71051025390625, -1.63818359375, -1.56585693359375, -1.4935302734375, -1.42120361328125, -1.348876953125, -1.27655029296875, -1.2042236328125, -1.13189697265625, -1.0595703125, -0.98724365234375, -0.9149169921875, -0.84259033203125, -0.770263671875, -0.69793701171875, -0.6256103515625, -0.55328369140625, -0.48095703125, -0.40863037109375, -0.3363037109375, -0.26397705078125, -0.191650390625, -0.11932373046875, -0.0469970703125, 0.02532958984375, 0.09765625, 0.16998291015625, 0.2423095703125, 0.31463623046875, 0.386962890625, 0.45928955078125, 0.5316162109375, 0.60394287109375, 0.67626953125, 0.74859619140625, 0.8209228515625, 0.89324951171875, 0.965576171875, 1.03790283203125, 1.1102294921875, 1.18255615234375, 1.2548828125, 1.32720947265625, 1.3995361328125, 1.47186279296875, 1.544189453125, 1.61651611328125, 1.6888427734375, 1.76116943359375, 1.83349609375, 1.90582275390625, 1.9781494140625, 2.05047607421875, 2.122802734375, 2.19512939453125, 2.2674560546875, 2.33978271484375, 2.412109375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 12.0, 19.0, 17.0, 53.0, 84.0, 173.0, 475.0, 1422.0, 6001.0, 38081.0, 918811.0, 3150955.0, 65417.0, 9265.0, 2202.0, 714.0, 265.0, 156.0, 67.0, 36.0, 23.0, 18.0, 7.0, 6.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-16.875, -16.349609375, -15.82421875, -15.298828125, -14.7734375, -14.248046875, -13.72265625, -13.197265625, -12.671875, -12.146484375, -11.62109375, -11.095703125, -10.5703125, -10.044921875, -9.51953125, -8.994140625, -8.46875, -7.943359375, -7.41796875, -6.892578125, -6.3671875, -5.841796875, -5.31640625, -4.791015625, -4.265625, -3.740234375, -3.21484375, -2.689453125, -2.1640625, -1.638671875, -1.11328125, -0.587890625, -0.0625, 0.462890625, 0.98828125, 1.513671875, 2.0390625, 2.564453125, 3.08984375, 3.615234375, 4.140625, 4.666015625, 5.19140625, 5.716796875, 6.2421875, 6.767578125, 7.29296875, 7.818359375, 8.34375, 8.869140625, 9.39453125, 9.919921875, 10.4453125, 10.970703125, 11.49609375, 12.021484375, 12.546875, 13.072265625, 13.59765625, 14.123046875, 14.6484375, 15.173828125, 15.69921875, 16.224609375, 16.75]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 5.0, 10.0, 9.0, 6.0, 8.0, 13.0, 13.0, 28.0, 42.0, 45.0, 73.0, 77.0, 149.0, 194.0, 409.0, 850.0, 970.0, 430.0, 232.0, 163.0, 89.0, 64.0, 39.0, 31.0, 28.0, 16.0, 11.0, 17.0, 15.0, 10.0, 2.0, 3.0, 5.0, 2.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.943359375, -1.874114990234375, -1.80487060546875, -1.735626220703125, -1.6663818359375, -1.597137451171875, -1.52789306640625, -1.458648681640625, -1.389404296875, -1.320159912109375, -1.25091552734375, -1.181671142578125, -1.1124267578125, -1.043182373046875, -0.97393798828125, -0.904693603515625, -0.83544921875, -0.766204833984375, -0.69696044921875, -0.627716064453125, -0.5584716796875, -0.489227294921875, -0.41998291015625, -0.350738525390625, -0.281494140625, -0.212249755859375, -0.14300537109375, -0.073760986328125, -0.0045166015625, 0.064727783203125, 0.13397216796875, 0.203216552734375, 0.2724609375, 0.341705322265625, 0.41094970703125, 0.480194091796875, 0.5494384765625, 0.618682861328125, 0.68792724609375, 0.757171630859375, 0.826416015625, 0.895660400390625, 0.96490478515625, 1.034149169921875, 1.1033935546875, 1.172637939453125, 1.24188232421875, 1.311126708984375, 1.38037109375, 1.449615478515625, 1.51885986328125, 1.588104248046875, 1.6573486328125, 1.726593017578125, 1.79583740234375, 1.865081787109375, 1.934326171875, 2.003570556640625, 2.07281494140625, 2.142059326171875, 2.2113037109375, 2.280548095703125, 2.34979248046875, 2.419036865234375, 2.48828125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 10.0, 24.0, 81.0, 262.0, 384.0, 187.0, 50.0, 10.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.276119232177734, -47.077842712402344, -45.87956619262695, -44.68128967285156, -43.48301696777344, -42.28474044799805, -41.086463928222656, -39.888187408447266, -38.689910888671875, -37.491634368896484, -36.293357849121094, -35.0950813293457, -33.89680480957031, -32.69853210449219, -31.500255584716797, -30.301979064941406, -29.103702545166016, -27.905426025390625, -26.707149505615234, -25.508874893188477, -24.310598373413086, -23.112321853637695, -21.914047241210938, -20.715770721435547, -19.517494201660156, -18.319217681884766, -17.120941162109375, -15.922666549682617, -14.724390029907227, -13.526113510131836, -12.327837944030762, -11.129562377929688, -9.931282043457031, -8.73300552368164, -7.534729957580566, -6.336453914642334, -5.138177871704102, -3.939901828765869, -2.7416257858276367, -1.5433502197265625, -0.3450736999511719, 0.8532023429870605, 2.051478385925293, 3.2497544288635254, 4.448030471801758, 5.64630651473999, 6.844582557678223, 8.042858123779297, 9.241134643554688, 10.439411163330078, 11.637686729431152, 12.835962295532227, 14.034238815307617, 15.232515335083008, 16.430789947509766, 17.629066467285156, 18.827342987060547, 20.025619506835938, 21.223896026611328, 22.422170639038086, 23.620447158813477, 24.818723678588867, 26.016998291015625, 27.215274810791016, 28.413551330566406]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 1.0, 5.0, 8.0, 15.0, 18.0, 18.0, 19.0, 27.0, 37.0, 44.0, 54.0, 56.0, 47.0, 62.0, 53.0, 55.0, 53.0, 56.0, 56.0, 53.0, 43.0, 34.0, 36.0, 31.0, 23.0, 27.0, 14.0, 15.0, 8.0, 6.0, 7.0, 6.0, 5.0, 6.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-12.976312637329102, -12.615527153015137, -12.254741668701172, -11.893956184387207, -11.533170700073242, -11.172384262084961, -10.811599731445312, -10.450813293457031, -10.090027809143066, -9.729242324829102, -9.368456840515137, -9.007671356201172, -8.646885871887207, -8.286100387573242, -7.925314426422119, -7.564528465270996, -7.2037434577941895, -6.842957973480225, -6.48217248916626, -6.121386528015137, -5.760601043701172, -5.399815559387207, -5.039030075073242, -4.678244590759277, -4.3174591064453125, -3.9566736221313477, -3.5958878993988037, -3.235102415084839, -2.874316692352295, -2.51353120803833, -2.1527457237243652, -1.7919600009918213, -1.4311742782592773, -1.070388674736023, -0.7096031308174133, -0.3488175868988037, 0.011968016624450684, 0.3727536201477051, 0.7335391044616699, 1.0943248271942139, 1.4551103115081787, 1.815895915031433, 2.1766815185546875, 2.5374670028686523, 2.898252487182617, 3.259038209915161, 3.619823694229126, 3.98060941696167, 4.341394901275635, 4.7021803855896, 5.0629658699035645, 5.4237518310546875, 5.784537315368652, 6.145322799682617, 6.506108283996582, 6.866893768310547, 7.227679252624512, 7.588464736938477, 7.949250221252441, 8.310035705566406, 8.670821189880371, 9.031606674194336, 9.392393112182617, 9.753178596496582, 10.113964080810547]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 10.0, 4.0, 13.0, 14.0, 21.0, 29.0, 46.0, 82.0, 87.0, 177.0, 306.0, 652.0, 1694.0, 6262.0, 46950.0, 603299.0, 356699.0, 25432.0, 4257.0, 1281.0, 524.0, 256.0, 172.0, 96.0, 69.0, 37.0, 18.0, 16.0, 19.0, 15.0, 8.0, 7.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-15.4453125, -14.960693359375, -14.47607421875, -13.991455078125, -13.5068359375, -13.022216796875, -12.53759765625, -12.052978515625, -11.568359375, -11.083740234375, -10.59912109375, -10.114501953125, -9.6298828125, -9.145263671875, -8.66064453125, -8.176025390625, -7.69140625, -7.206787109375, -6.72216796875, -6.237548828125, -5.7529296875, -5.268310546875, -4.78369140625, -4.299072265625, -3.814453125, -3.329833984375, -2.84521484375, -2.360595703125, -1.8759765625, -1.391357421875, -0.90673828125, -0.422119140625, 0.0625, 0.547119140625, 1.03173828125, 1.516357421875, 2.0009765625, 2.485595703125, 2.97021484375, 3.454833984375, 3.939453125, 4.424072265625, 4.90869140625, 5.393310546875, 5.8779296875, 6.362548828125, 6.84716796875, 7.331787109375, 7.81640625, 8.301025390625, 8.78564453125, 9.270263671875, 9.7548828125, 10.239501953125, 10.72412109375, 11.208740234375, 11.693359375, 12.177978515625, 12.66259765625, 13.147216796875, 13.6318359375, 14.116455078125, 14.60107421875, 15.085693359375, 15.5703125]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 7.0, 10.0, 33.0, 60.0, 91.0, 132.0, 156.0, 173.0, 119.0, 95.0, 57.0, 35.0, 17.0, 7.0, 8.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8984375, -2.804931640625, -2.71142578125, -2.617919921875, -2.5244140625, -2.430908203125, -2.33740234375, -2.243896484375, -2.150390625, -2.056884765625, -1.96337890625, -1.869873046875, -1.7763671875, -1.682861328125, -1.58935546875, -1.495849609375, -1.40234375, -1.308837890625, -1.21533203125, -1.121826171875, -1.0283203125, -0.934814453125, -0.84130859375, -0.747802734375, -0.654296875, -0.560791015625, -0.46728515625, -0.373779296875, -0.2802734375, -0.186767578125, -0.09326171875, 0.000244140625, 0.09375, 0.187255859375, 0.28076171875, 0.374267578125, 0.4677734375, 0.561279296875, 0.65478515625, 0.748291015625, 0.841796875, 0.935302734375, 1.02880859375, 1.122314453125, 1.2158203125, 1.309326171875, 1.40283203125, 1.496337890625, 1.58984375, 1.683349609375, 1.77685546875, 1.870361328125, 1.9638671875, 2.057373046875, 2.15087890625, 2.244384765625, 2.337890625, 2.431396484375, 2.52490234375, 2.618408203125, 2.7119140625, 2.805419921875, 2.89892578125, 2.992431640625, 3.0859375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 6.0, 1.0, 2.0, 9.0, 6.0, 8.0, 11.0, 13.0, 16.0, 30.0, 49.0, 52.0, 135.0, 196.0, 272.0, 442.0, 835.0, 1452.0, 2852.0, 6432.0, 17113.0, 54339.0, 202848.0, 448302.0, 221524.0, 59793.0, 18346.0, 6988.0, 3036.0, 1435.0, 815.0, 458.0, 270.0, 170.0, 123.0, 79.0, 36.0, 22.0, 15.0, 15.0, 6.0, 6.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.7265625, -6.50628662109375, -6.2860107421875, -6.06573486328125, -5.845458984375, -5.62518310546875, -5.4049072265625, -5.18463134765625, -4.96435546875, -4.74407958984375, -4.5238037109375, -4.30352783203125, -4.083251953125, -3.86297607421875, -3.6427001953125, -3.42242431640625, -3.2021484375, -2.98187255859375, -2.7615966796875, -2.54132080078125, -2.321044921875, -2.10076904296875, -1.8804931640625, -1.66021728515625, -1.43994140625, -1.21966552734375, -0.9993896484375, -0.77911376953125, -0.558837890625, -0.33856201171875, -0.1182861328125, 0.10198974609375, 0.322265625, 0.54254150390625, 0.7628173828125, 0.98309326171875, 1.203369140625, 1.42364501953125, 1.6439208984375, 1.86419677734375, 2.08447265625, 2.30474853515625, 2.5250244140625, 2.74530029296875, 2.965576171875, 3.18585205078125, 3.4061279296875, 3.62640380859375, 3.8466796875, 4.06695556640625, 4.2872314453125, 4.50750732421875, 4.727783203125, 4.94805908203125, 5.1683349609375, 5.38861083984375, 5.60888671875, 5.82916259765625, 6.0494384765625, 6.26971435546875, 6.489990234375, 6.71026611328125, 6.9305419921875, 7.15081787109375, 7.37109375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 0.0, 2.0, 6.0, 5.0, 12.0, 14.0, 20.0, 19.0, 24.0, 34.0, 41.0, 38.0, 53.0, 55.0, 59.0, 58.0, 51.0, 70.0, 57.0, 48.0, 50.0, 58.0, 38.0, 43.0, 24.0, 24.0, 25.0, 20.0, 12.0, 15.0, 5.0, 10.0, 4.0, 4.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.70703125, -7.46697998046875, -7.2269287109375, -6.98687744140625, -6.746826171875, -6.50677490234375, -6.2667236328125, -6.02667236328125, -5.78662109375, -5.54656982421875, -5.3065185546875, -5.06646728515625, -4.826416015625, -4.58636474609375, -4.3463134765625, -4.10626220703125, -3.8662109375, -3.62615966796875, -3.3861083984375, -3.14605712890625, -2.906005859375, -2.66595458984375, -2.4259033203125, -2.18585205078125, -1.94580078125, -1.70574951171875, -1.4656982421875, -1.22564697265625, -0.985595703125, -0.74554443359375, -0.5054931640625, -0.26544189453125, -0.025390625, 0.21466064453125, 0.4547119140625, 0.69476318359375, 0.934814453125, 1.17486572265625, 1.4149169921875, 1.65496826171875, 1.89501953125, 2.13507080078125, 2.3751220703125, 2.61517333984375, 2.855224609375, 3.09527587890625, 3.3353271484375, 3.57537841796875, 3.8154296875, 4.05548095703125, 4.2955322265625, 4.53558349609375, 4.775634765625, 5.01568603515625, 5.2557373046875, 5.49578857421875, 5.73583984375, 5.97589111328125, 6.2159423828125, 6.45599365234375, 6.696044921875, 6.93609619140625, 7.1761474609375, 7.41619873046875, 7.65625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 6.0, 9.0, 10.0, 15.0, 23.0, 44.0, 75.0, 184.0, 495.0, 1993.0, 20477.0, 536480.0, 468695.0, 17345.0, 1844.0, 481.0, 173.0, 88.0, 51.0, 24.0, 18.0, 12.0, 5.0, 3.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.71875, -12.374755859375, -12.03076171875, -11.686767578125, -11.3427734375, -10.998779296875, -10.65478515625, -10.310791015625, -9.966796875, -9.622802734375, -9.27880859375, -8.934814453125, -8.5908203125, -8.246826171875, -7.90283203125, -7.558837890625, -7.21484375, -6.870849609375, -6.52685546875, -6.182861328125, -5.8388671875, -5.494873046875, -5.15087890625, -4.806884765625, -4.462890625, -4.118896484375, -3.77490234375, -3.430908203125, -3.0869140625, -2.742919921875, -2.39892578125, -2.054931640625, -1.7109375, -1.366943359375, -1.02294921875, -0.678955078125, -0.3349609375, 0.009033203125, 0.35302734375, 0.697021484375, 1.041015625, 1.385009765625, 1.72900390625, 2.072998046875, 2.4169921875, 2.760986328125, 3.10498046875, 3.448974609375, 3.79296875, 4.136962890625, 4.48095703125, 4.824951171875, 5.1689453125, 5.512939453125, 5.85693359375, 6.200927734375, 6.544921875, 6.888916015625, 7.23291015625, 7.576904296875, 7.9208984375, 8.264892578125, 8.60888671875, 8.952880859375, 9.296875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 2.0, 5.0, 7.0, 11.0, 12.0, 13.0, 13.0, 26.0, 26.0, 27.0, 36.0, 40.0, 51.0, 66.0, 90.0, 76.0, 88.0, 78.0, 57.0, 57.0, 33.0, 32.0, 22.0, 32.0, 22.0, 11.0, 11.0, 12.0, 3.0, 5.0, 6.0, 3.0, 3.0, 3.0, 2.0, 3.0, 3.0, 5.0, 2.0, 3.0, 1.0], "bins": [-0.0005407333374023438, -0.0005267411470413208, -0.0005127489566802979, -0.0004987567663192749, -0.00048476457595825195, -0.000470772385597229, -0.00045678019523620605, -0.0004427880048751831, -0.00042879581451416016, -0.0004148036241531372, -0.00040081143379211426, -0.0003868192434310913, -0.00037282705307006836, -0.0003588348627090454, -0.00034484267234802246, -0.0003308504819869995, -0.00031685829162597656, -0.0003028661012649536, -0.00028887391090393066, -0.0002748817205429077, -0.00026088953018188477, -0.0002468973398208618, -0.00023290514945983887, -0.00021891295909881592, -0.00020492076873779297, -0.00019092857837677002, -0.00017693638801574707, -0.00016294419765472412, -0.00014895200729370117, -0.00013495981693267822, -0.00012096762657165527, -0.00010697543621063232, -9.298324584960938e-05, -7.899105548858643e-05, -6.499886512756348e-05, -5.100667476654053e-05, -3.701448440551758e-05, -2.302229404449463e-05, -9.03010368347168e-06, 4.9620866775512695e-06, 1.895427703857422e-05, 3.294646739959717e-05, 4.693865776062012e-05, 6.0930848121643066e-05, 7.492303848266602e-05, 8.891522884368896e-05, 0.00010290741920471191, 0.00011689960956573486, 0.0001308917999267578, 0.00014488399028778076, 0.0001588761806488037, 0.00017286837100982666, 0.0001868605613708496, 0.00020085275173187256, 0.0002148449420928955, 0.00022883713245391846, 0.0002428293228149414, 0.00025682151317596436, 0.0002708137035369873, 0.00028480589389801025, 0.0002987980842590332, 0.00031279027462005615, 0.0003267824649810791, 0.00034077465534210205, 0.000354766845703125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 1.0, 4.0, 8.0, 7.0, 25.0, 38.0, 64.0, 113.0, 178.0, 344.0, 700.0, 1466.0, 3996.0, 13530.0, 60314.0, 314376.0, 505742.0, 112700.0, 23884.0, 6510.0, 2367.0, 1015.0, 503.0, 290.0, 131.0, 86.0, 57.0, 35.0, 28.0, 13.0, 13.0, 5.0, 6.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9140625, -4.7264404296875, -4.538818359375, -4.3511962890625, -4.16357421875, -3.9759521484375, -3.788330078125, -3.6007080078125, -3.4130859375, -3.2254638671875, -3.037841796875, -2.8502197265625, -2.66259765625, -2.4749755859375, -2.287353515625, -2.0997314453125, -1.912109375, -1.7244873046875, -1.536865234375, -1.3492431640625, -1.16162109375, -0.9739990234375, -0.786376953125, -0.5987548828125, -0.4111328125, -0.2235107421875, -0.035888671875, 0.1517333984375, 0.33935546875, 0.5269775390625, 0.714599609375, 0.9022216796875, 1.08984375, 1.2774658203125, 1.465087890625, 1.6527099609375, 1.84033203125, 2.0279541015625, 2.215576171875, 2.4031982421875, 2.5908203125, 2.7784423828125, 2.966064453125, 3.1536865234375, 3.34130859375, 3.5289306640625, 3.716552734375, 3.9041748046875, 4.091796875, 4.2794189453125, 4.467041015625, 4.6546630859375, 4.84228515625, 5.0299072265625, 5.217529296875, 5.4051513671875, 5.5927734375, 5.7803955078125, 5.968017578125, 6.1556396484375, 6.34326171875, 6.5308837890625, 6.718505859375, 6.9061279296875, 7.09375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 1.0, 2.0, 7.0, 17.0, 15.0, 22.0, 23.0, 33.0, 63.0, 82.0, 113.0, 94.0, 125.0, 101.0, 85.0, 62.0, 49.0, 32.0, 27.0, 13.0, 9.0, 8.0, 6.0, 4.0, 3.0, 2.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.640625, -4.47491455078125, -4.3092041015625, -4.14349365234375, -3.977783203125, -3.81207275390625, -3.6463623046875, -3.48065185546875, -3.31494140625, -3.14923095703125, -2.9835205078125, -2.81781005859375, -2.652099609375, -2.48638916015625, -2.3206787109375, -2.15496826171875, -1.9892578125, -1.82354736328125, -1.6578369140625, -1.49212646484375, -1.326416015625, -1.16070556640625, -0.9949951171875, -0.82928466796875, -0.66357421875, -0.49786376953125, -0.3321533203125, -0.16644287109375, -0.000732421875, 0.16497802734375, 0.3306884765625, 0.49639892578125, 0.662109375, 0.82781982421875, 0.9935302734375, 1.15924072265625, 1.324951171875, 1.49066162109375, 1.6563720703125, 1.82208251953125, 1.98779296875, 2.15350341796875, 2.3192138671875, 2.48492431640625, 2.650634765625, 2.81634521484375, 2.9820556640625, 3.14776611328125, 3.3134765625, 3.47918701171875, 3.6448974609375, 3.81060791015625, 3.976318359375, 4.14202880859375, 4.3077392578125, 4.47344970703125, 4.63916015625, 4.80487060546875, 4.9705810546875, 5.13629150390625, 5.302001953125, 5.46771240234375, 5.6334228515625, 5.79913330078125, 5.96484375]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 6.0, 10.0, 9.0, 22.0, 47.0, 94.0, 193.0, 249.0, 177.0, 85.0, 51.0, 25.0, 12.0, 7.0, 9.0, 3.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.75575256347656, -69.32864379882812, -66.90152740478516, -64.47441864013672, -62.04730224609375, -59.62018966674805, -57.193077087402344, -54.765968322753906, -52.33885192871094, -49.911739349365234, -47.48462677001953, -45.05751419067383, -42.630401611328125, -40.20328903198242, -37.77617645263672, -35.34906768798828, -32.92195510864258, -30.494842529296875, -28.067729949951172, -25.64061737060547, -23.213504791259766, -20.786392211914062, -18.359281539916992, -15.932168960571289, -13.505056381225586, -11.077943801879883, -8.65083122253418, -6.223719596862793, -3.79660701751709, -1.3694944381713867, 1.0576171875, 3.484729766845703, 5.911842346191406, 8.33895492553711, 10.766067504882812, 13.1931791305542, 15.620291709899902, 18.047405242919922, 20.474515914916992, 22.901628494262695, 25.3287410736084, 27.7558536529541, 30.182966232299805, 32.610076904296875, 35.03718948364258, 37.46430206298828, 39.891414642333984, 42.31852722167969, 44.74563980102539, 47.172752380371094, 49.5998649597168, 52.0269775390625, 54.4540901184082, 56.881202697753906, 59.308311462402344, 61.73542785644531, 64.16253662109375, 66.58964538574219, 69.01676177978516, 71.4438705444336, 73.87098693847656, 76.298095703125, 78.72521209716797, 81.1523208618164, 83.57943725585938]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 4.0, 5.0, 9.0, 19.0, 7.0, 8.0, 18.0, 25.0, 40.0, 35.0, 50.0, 58.0, 60.0, 59.0, 62.0, 64.0, 77.0, 67.0, 58.0, 56.0, 58.0, 47.0, 29.0, 14.0, 27.0, 13.0, 13.0, 8.0, 7.0, 7.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.577125549316406, -58.30147171020508, -56.025821685791016, -53.75016784667969, -51.47451400756836, -49.19886016845703, -46.92321014404297, -44.64755630493164, -42.37190246582031, -40.096248626708984, -37.82059860229492, -35.544944763183594, -33.269290924072266, -30.99363899230957, -28.717987060546875, -26.442333221435547, -24.166683197021484, -21.89103126525879, -19.61537742614746, -17.339725494384766, -15.064072608947754, -12.788419723510742, -10.512767791748047, -8.237114906311035, -5.961462020874023, -3.685809373855591, -1.4101567268371582, 0.8654956817626953, 3.141148567199707, 5.416801452636719, 7.692453384399414, 9.968106269836426, 12.243759155273438, 14.51941204071045, 16.79506492614746, 19.070716857910156, 21.346370697021484, 23.62202262878418, 25.897674560546875, 28.173328399658203, 30.4489803314209, 32.724632263183594, 35.00028610229492, 37.27593994140625, 39.55158996582031, 41.82724380493164, 44.10289764404297, 46.37854766845703, 48.65420150756836, 50.92985534667969, 53.20550537109375, 55.48115921020508, 57.756813049316406, 60.03246307373047, 62.3081169128418, 64.58377075195312, 66.85942077636719, 69.13507080078125, 71.41072845458984, 73.6863784790039, 75.96202850341797, 78.23768615722656, 80.51333618164062, 82.78898620605469, 85.06464385986328]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 6.0, 7.0, 6.0, 10.0, 5.0, 13.0, 22.0, 22.0, 28.0, 51.0, 69.0, 148.0, 180.0, 318.0, 604.0, 1243.0, 2755.0, 7757.0, 29156.0, 258841.0, 3742478.0, 120877.0, 19736.0, 5713.0, 2036.0, 941.0, 467.0, 284.0, 166.0, 105.0, 66.0, 52.0, 29.0, 26.0, 19.0, 10.0, 12.0, 9.0, 8.0, 6.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0], "bins": [-16.78125, -16.29296875, -15.8046875, -15.31640625, -14.828125, -14.33984375, -13.8515625, -13.36328125, -12.875, -12.38671875, -11.8984375, -11.41015625, -10.921875, -10.43359375, -9.9453125, -9.45703125, -8.96875, -8.48046875, -7.9921875, -7.50390625, -7.015625, -6.52734375, -6.0390625, -5.55078125, -5.0625, -4.57421875, -4.0859375, -3.59765625, -3.109375, -2.62109375, -2.1328125, -1.64453125, -1.15625, -0.66796875, -0.1796875, 0.30859375, 0.796875, 1.28515625, 1.7734375, 2.26171875, 2.75, 3.23828125, 3.7265625, 4.21484375, 4.703125, 5.19140625, 5.6796875, 6.16796875, 6.65625, 7.14453125, 7.6328125, 8.12109375, 8.609375, 9.09765625, 9.5859375, 10.07421875, 10.5625, 11.05078125, 11.5390625, 12.02734375, 12.515625, 13.00390625, 13.4921875, 13.98046875, 14.46875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 5.0, 2.0, 4.0, 8.0, 10.0, 5.0, 7.0, 13.0, 9.0, 11.0, 28.0, 39.0, 37.0, 42.0, 56.0, 55.0, 59.0, 61.0, 57.0, 65.0, 62.0, 56.0, 46.0, 56.0, 37.0, 37.0, 24.0, 28.0, 17.0, 19.0, 17.0, 8.0, 9.0, 7.0, 2.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7431640625, -1.691741943359375, -1.64031982421875, -1.588897705078125, -1.5374755859375, -1.486053466796875, -1.43463134765625, -1.383209228515625, -1.331787109375, -1.280364990234375, -1.22894287109375, -1.177520751953125, -1.1260986328125, -1.074676513671875, -1.02325439453125, -0.971832275390625, -0.92041015625, -0.868988037109375, -0.81756591796875, -0.766143798828125, -0.7147216796875, -0.663299560546875, -0.61187744140625, -0.560455322265625, -0.509033203125, -0.457611083984375, -0.40618896484375, -0.354766845703125, -0.3033447265625, -0.251922607421875, -0.20050048828125, -0.149078369140625, -0.09765625, -0.046234130859375, 0.00518798828125, 0.056610107421875, 0.1080322265625, 0.159454345703125, 0.21087646484375, 0.262298583984375, 0.313720703125, 0.365142822265625, 0.41656494140625, 0.467987060546875, 0.5194091796875, 0.570831298828125, 0.62225341796875, 0.673675537109375, 0.72509765625, 0.776519775390625, 0.82794189453125, 0.879364013671875, 0.9307861328125, 0.982208251953125, 1.03363037109375, 1.085052490234375, 1.136474609375, 1.187896728515625, 1.23931884765625, 1.290740966796875, 1.3421630859375, 1.393585205078125, 1.44500732421875, 1.496429443359375, 1.5478515625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 5.0, 8.0, 17.0, 30.0, 41.0, 108.0, 209.0, 438.0, 950.0, 2906.0, 13343.0, 162529.0, 3807024.0, 188491.0, 14094.0, 2731.0, 778.0, 286.0, 150.0, 80.0, 39.0, 16.0, 7.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.8984375, -10.4539794921875, -10.009521484375, -9.5650634765625, -9.12060546875, -8.6761474609375, -8.231689453125, -7.7872314453125, -7.3427734375, -6.8983154296875, -6.453857421875, -6.0093994140625, -5.56494140625, -5.1204833984375, -4.676025390625, -4.2315673828125, -3.787109375, -3.3426513671875, -2.898193359375, -2.4537353515625, -2.00927734375, -1.5648193359375, -1.120361328125, -0.6759033203125, -0.2314453125, 0.2130126953125, 0.657470703125, 1.1019287109375, 1.54638671875, 1.9908447265625, 2.435302734375, 2.8797607421875, 3.32421875, 3.7686767578125, 4.213134765625, 4.6575927734375, 5.10205078125, 5.5465087890625, 5.990966796875, 6.4354248046875, 6.8798828125, 7.3243408203125, 7.768798828125, 8.2132568359375, 8.65771484375, 9.1021728515625, 9.546630859375, 9.9910888671875, 10.435546875, 10.8800048828125, 11.324462890625, 11.7689208984375, 12.21337890625, 12.6578369140625, 13.102294921875, 13.5467529296875, 13.9912109375, 14.4356689453125, 14.880126953125, 15.3245849609375, 15.76904296875, 16.2135009765625, 16.657958984375, 17.1024169921875, 17.546875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 4.0, 6.0, 5.0, 10.0, 14.0, 21.0, 22.0, 35.0, 54.0, 84.0, 128.0, 303.0, 786.0, 1400.0, 600.0, 239.0, 128.0, 83.0, 57.0, 27.0, 14.0, 17.0, 8.0, 5.0, 11.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.43359375, -3.341583251953125, -3.24957275390625, -3.157562255859375, -3.0655517578125, -2.973541259765625, -2.88153076171875, -2.789520263671875, -2.697509765625, -2.605499267578125, -2.51348876953125, -2.421478271484375, -2.3294677734375, -2.237457275390625, -2.14544677734375, -2.053436279296875, -1.96142578125, -1.869415283203125, -1.77740478515625, -1.685394287109375, -1.5933837890625, -1.501373291015625, -1.40936279296875, -1.317352294921875, -1.225341796875, -1.133331298828125, -1.04132080078125, -0.949310302734375, -0.8572998046875, -0.765289306640625, -0.67327880859375, -0.581268310546875, -0.4892578125, -0.397247314453125, -0.30523681640625, -0.213226318359375, -0.1212158203125, -0.029205322265625, 0.06280517578125, 0.154815673828125, 0.246826171875, 0.338836669921875, 0.43084716796875, 0.522857666015625, 0.6148681640625, 0.706878662109375, 0.79888916015625, 0.890899658203125, 0.98291015625, 1.074920654296875, 1.16693115234375, 1.258941650390625, 1.3509521484375, 1.442962646484375, 1.53497314453125, 1.626983642578125, 1.718994140625, 1.811004638671875, 1.90301513671875, 1.995025634765625, 2.0870361328125, 2.179046630859375, 2.27105712890625, 2.363067626953125, 2.455078125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 6.0, 6.0, 9.0, 25.0, 37.0, 59.0, 97.0, 148.0, 178.0, 162.0, 140.0, 67.0, 34.0, 13.0, 10.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.280060768127441, -9.776605606079102, -9.273150444030762, -8.769695281982422, -8.266240119934082, -7.762784957885742, -7.2593302726745605, -6.755875110626221, -6.252419948577881, -5.748964786529541, -5.245509624481201, -4.7420549392700195, -4.23859977722168, -3.7351443767547607, -3.231689453125, -2.72823429107666, -2.2247791290283203, -1.7213239669799805, -1.2178689241409302, -0.7144138813018799, -0.21095871925354004, 0.2924964427947998, 0.7959513664245605, 1.2994065284729004, 1.8028616905212402, 2.30631685256958, 2.80977201461792, 3.3132269382476807, 3.8166821002960205, 4.320137023925781, 4.823592185974121, 5.327047348022461, 5.830501556396484, 6.333956718444824, 6.837411880493164, 7.340867042541504, 7.844322204589844, 8.347777366638184, 8.851232528686523, 9.354686737060547, 9.858142852783203, 10.361598014831543, 10.865053176879883, 11.368508338928223, 11.871963500976562, 12.375418663024902, 12.878873825073242, 13.382328033447266, 13.885783195495605, 14.389238357543945, 14.892693519592285, 15.396148681640625, 15.899603843688965, 16.403059005737305, 16.906513214111328, 17.409969329833984, 17.913423538208008, 18.41687774658203, 18.920333862304688, 19.42378807067871, 19.927244186401367, 20.43069839477539, 20.934154510498047, 21.43760871887207, 21.941064834594727]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 4.0, 6.0, 8.0, 11.0, 11.0, 17.0, 19.0, 23.0, 27.0, 29.0, 37.0, 51.0, 47.0, 47.0, 50.0, 55.0, 60.0, 47.0, 66.0, 51.0, 58.0, 50.0, 35.0, 31.0, 28.0, 26.0, 24.0, 13.0, 21.0, 9.0, 9.0, 12.0, 5.0, 5.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.051424026489258, -8.704498291015625, -8.357573509216309, -8.010648727416992, -7.663722991943359, -7.316797733306885, -6.96987247467041, -6.6229472160339355, -6.276021957397461, -5.929096698760986, -5.582171440124512, -5.235246181488037, -4.8883209228515625, -4.541395664215088, -4.194470405578613, -3.8475451469421387, -3.500619888305664, -3.1536946296691895, -2.806769371032715, -2.4598441123962402, -2.1129188537597656, -1.765993595123291, -1.4190683364868164, -1.0721430778503418, -0.7252178192138672, -0.3782925605773926, -0.03136730194091797, 0.31555795669555664, 0.6624832153320312, 1.0094084739685059, 1.3563337326049805, 1.703258991241455, 2.0501842498779297, 2.3971095085144043, 2.744034767150879, 3.0909600257873535, 3.437885284423828, 3.7848105430603027, 4.131735801696777, 4.478661060333252, 4.825586318969727, 5.172511577606201, 5.519436836242676, 5.86636209487915, 6.213287353515625, 6.5602126121521, 6.907137870788574, 7.254063129425049, 7.600988388061523, 7.947913646697998, 8.294838905334473, 8.641763687133789, 8.988689422607422, 9.335615158081055, 9.682539939880371, 10.029464721679688, 10.37639045715332, 10.723316192626953, 11.07024097442627, 11.417165756225586, 11.764091491699219, 12.111017227172852, 12.457942008972168, 12.804866790771484, 13.151792526245117]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 8.0, 8.0, 19.0, 28.0, 34.0, 56.0, 95.0, 139.0, 209.0, 314.0, 605.0, 1031.0, 1927.0, 3617.0, 7211.0, 15460.0, 35983.0, 95376.0, 267143.0, 359980.0, 159155.0, 56161.0, 22844.0, 10347.0, 5024.0, 2500.0, 1407.0, 733.0, 414.0, 246.0, 171.0, 107.0, 65.0, 49.0, 34.0, 22.0, 12.0, 11.0, 10.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.38671875, -6.2152099609375, -6.043701171875, -5.8721923828125, -5.70068359375, -5.5291748046875, -5.357666015625, -5.1861572265625, -5.0146484375, -4.8431396484375, -4.671630859375, -4.5001220703125, -4.32861328125, -4.1571044921875, -3.985595703125, -3.8140869140625, -3.642578125, -3.4710693359375, -3.299560546875, -3.1280517578125, -2.95654296875, -2.7850341796875, -2.613525390625, -2.4420166015625, -2.2705078125, -2.0989990234375, -1.927490234375, -1.7559814453125, -1.58447265625, -1.4129638671875, -1.241455078125, -1.0699462890625, -0.8984375, -0.7269287109375, -0.555419921875, -0.3839111328125, -0.21240234375, -0.0408935546875, 0.130615234375, 0.3021240234375, 0.4736328125, 0.6451416015625, 0.816650390625, 0.9881591796875, 1.15966796875, 1.3311767578125, 1.502685546875, 1.6741943359375, 1.845703125, 2.0172119140625, 2.188720703125, 2.3602294921875, 2.53173828125, 2.7032470703125, 2.874755859375, 3.0462646484375, 3.2177734375, 3.3892822265625, 3.560791015625, 3.7322998046875, 3.90380859375, 4.0753173828125, 4.246826171875, 4.4183349609375, 4.58984375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 7.0, 5.0, 8.0, 6.0, 5.0, 9.0, 11.0, 19.0, 18.0, 32.0, 37.0, 49.0, 55.0, 58.0, 67.0, 68.0, 70.0, 67.0, 57.0, 54.0, 60.0, 40.0, 35.0, 32.0, 29.0, 22.0, 24.0, 18.0, 12.0, 5.0, 10.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9033203125, -1.8485870361328125, -1.793853759765625, -1.7391204833984375, -1.68438720703125, -1.6296539306640625, -1.574920654296875, -1.5201873779296875, -1.4654541015625, -1.4107208251953125, -1.355987548828125, -1.3012542724609375, -1.24652099609375, -1.1917877197265625, -1.137054443359375, -1.0823211669921875, -1.027587890625, -0.9728546142578125, -0.918121337890625, -0.8633880615234375, -0.80865478515625, -0.7539215087890625, -0.699188232421875, -0.6444549560546875, -0.5897216796875, -0.5349884033203125, -0.480255126953125, -0.4255218505859375, -0.37078857421875, -0.3160552978515625, -0.261322021484375, -0.2065887451171875, -0.15185546875, -0.0971221923828125, -0.042388916015625, 0.0123443603515625, 0.06707763671875, 0.1218109130859375, 0.176544189453125, 0.2312774658203125, 0.2860107421875, 0.3407440185546875, 0.395477294921875, 0.4502105712890625, 0.50494384765625, 0.5596771240234375, 0.614410400390625, 0.6691436767578125, 0.723876953125, 0.7786102294921875, 0.833343505859375, 0.8880767822265625, 0.94281005859375, 0.9975433349609375, 1.052276611328125, 1.1070098876953125, 1.1617431640625, 1.2164764404296875, 1.271209716796875, 1.3259429931640625, 1.38067626953125, 1.4354095458984375, 1.490142822265625, 1.5448760986328125, 1.599609375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 8.0, 17.0, 22.0, 21.0, 23.0, 24.0, 52.0, 80.0, 130.0, 172.0, 297.0, 533.0, 898.0, 1763.0, 3264.0, 6570.0, 15107.0, 39041.0, 126720.0, 371539.0, 323598.0, 100820.0, 32600.0, 12902.0, 5869.0, 2845.0, 1526.0, 820.0, 511.0, 284.0, 166.0, 104.0, 69.0, 37.0, 27.0, 31.0, 17.0, 9.0, 11.0, 10.0, 5.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.1484375, -5.96160888671875, -5.7747802734375, -5.58795166015625, -5.401123046875, -5.21429443359375, -5.0274658203125, -4.84063720703125, -4.65380859375, -4.46697998046875, -4.2801513671875, -4.09332275390625, -3.906494140625, -3.71966552734375, -3.5328369140625, -3.34600830078125, -3.1591796875, -2.97235107421875, -2.7855224609375, -2.59869384765625, -2.411865234375, -2.22503662109375, -2.0382080078125, -1.85137939453125, -1.66455078125, -1.47772216796875, -1.2908935546875, -1.10406494140625, -0.917236328125, -0.73040771484375, -0.5435791015625, -0.35675048828125, -0.169921875, 0.01690673828125, 0.2037353515625, 0.39056396484375, 0.577392578125, 0.76422119140625, 0.9510498046875, 1.13787841796875, 1.32470703125, 1.51153564453125, 1.6983642578125, 1.88519287109375, 2.072021484375, 2.25885009765625, 2.4456787109375, 2.63250732421875, 2.8193359375, 3.00616455078125, 3.1929931640625, 3.37982177734375, 3.566650390625, 3.75347900390625, 3.9403076171875, 4.12713623046875, 4.31396484375, 4.50079345703125, 4.6876220703125, 4.87445068359375, 5.061279296875, 5.24810791015625, 5.4349365234375, 5.62176513671875, 5.80859375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 2.0, 4.0, 4.0, 9.0, 1.0, 1.0, 5.0, 3.0, 5.0, 5.0, 8.0, 2.0, 8.0, 16.0, 15.0, 24.0, 28.0, 35.0, 27.0, 34.0, 25.0, 37.0, 56.0, 58.0, 59.0, 50.0, 56.0, 42.0, 48.0, 51.0, 42.0, 31.0, 37.0, 24.0, 30.0, 20.0, 20.0, 17.0, 13.0, 10.0, 9.0, 4.0, 6.0, 5.0, 7.0, 6.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.51171875, -6.285400390625, -6.05908203125, -5.832763671875, -5.6064453125, -5.380126953125, -5.15380859375, -4.927490234375, -4.701171875, -4.474853515625, -4.24853515625, -4.022216796875, -3.7958984375, -3.569580078125, -3.34326171875, -3.116943359375, -2.890625, -2.664306640625, -2.43798828125, -2.211669921875, -1.9853515625, -1.759033203125, -1.53271484375, -1.306396484375, -1.080078125, -0.853759765625, -0.62744140625, -0.401123046875, -0.1748046875, 0.051513671875, 0.27783203125, 0.504150390625, 0.73046875, 0.956787109375, 1.18310546875, 1.409423828125, 1.6357421875, 1.862060546875, 2.08837890625, 2.314697265625, 2.541015625, 2.767333984375, 2.99365234375, 3.219970703125, 3.4462890625, 3.672607421875, 3.89892578125, 4.125244140625, 4.3515625, 4.577880859375, 4.80419921875, 5.030517578125, 5.2568359375, 5.483154296875, 5.70947265625, 5.935791015625, 6.162109375, 6.388427734375, 6.61474609375, 6.841064453125, 7.0673828125, 7.293701171875, 7.52001953125, 7.746337890625, 7.97265625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 7.0, 7.0, 13.0, 11.0, 24.0, 34.0, 49.0, 87.0, 152.0, 336.0, 711.0, 1985.0, 6638.0, 27845.0, 139660.0, 493827.0, 297390.0, 60753.0, 13207.0, 3630.0, 1175.0, 447.0, 236.0, 125.0, 68.0, 30.0, 31.0, 19.0, 14.0, 10.0, 3.0, 6.0, 4.0, 2.0, 1.0, 4.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.849609375, -2.753814697265625, -2.65802001953125, -2.562225341796875, -2.4664306640625, -2.370635986328125, -2.27484130859375, -2.179046630859375, -2.083251953125, -1.987457275390625, -1.89166259765625, -1.795867919921875, -1.7000732421875, -1.604278564453125, -1.50848388671875, -1.412689208984375, -1.31689453125, -1.221099853515625, -1.12530517578125, -1.029510498046875, -0.9337158203125, -0.837921142578125, -0.74212646484375, -0.646331787109375, -0.550537109375, -0.454742431640625, -0.35894775390625, -0.263153076171875, -0.1673583984375, -0.071563720703125, 0.02423095703125, 0.120025634765625, 0.2158203125, 0.311614990234375, 0.40740966796875, 0.503204345703125, 0.5989990234375, 0.694793701171875, 0.79058837890625, 0.886383056640625, 0.982177734375, 1.077972412109375, 1.17376708984375, 1.269561767578125, 1.3653564453125, 1.461151123046875, 1.55694580078125, 1.652740478515625, 1.74853515625, 1.844329833984375, 1.94012451171875, 2.035919189453125, 2.1317138671875, 2.227508544921875, 2.32330322265625, 2.419097900390625, 2.514892578125, 2.610687255859375, 2.70648193359375, 2.802276611328125, 2.8980712890625, 2.993865966796875, 3.08966064453125, 3.185455322265625, 3.28125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 7.0, 7.0, 5.0, 13.0, 18.0, 21.0, 21.0, 18.0, 42.0, 47.0, 49.0, 72.0, 94.0, 111.0, 96.0, 83.0, 59.0, 44.0, 41.0, 32.0, 23.0, 24.0, 23.0, 19.0, 11.0, 4.0, 3.0, 5.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0004715919494628906, -0.0004580691456794739, -0.00044454634189605713, -0.0004310235381126404, -0.00041750073432922363, -0.0004039779305458069, -0.00039045512676239014, -0.0003769323229789734, -0.00036340951919555664, -0.0003498867154121399, -0.00033636391162872314, -0.0003228411078453064, -0.00030931830406188965, -0.0002957955002784729, -0.00028227269649505615, -0.0002687498927116394, -0.00025522708892822266, -0.0002417042851448059, -0.00022818148136138916, -0.0002146586775779724, -0.00020113587379455566, -0.00018761307001113892, -0.00017409026622772217, -0.00016056746244430542, -0.00014704465866088867, -0.00013352185487747192, -0.00011999905109405518, -0.00010647624731063843, -9.295344352722168e-05, -7.943063974380493e-05, -6.590783596038818e-05, -5.2385032176971436e-05, -3.886222839355469e-05, -2.533942461013794e-05, -1.1816620826721191e-05, 1.7061829566955566e-06, 1.5228986740112305e-05, 2.8751790523529053e-05, 4.22745943069458e-05, 5.579739809036255e-05, 6.93202018737793e-05, 8.284300565719604e-05, 9.636580944061279e-05, 0.00010988861322402954, 0.0001234114170074463, 0.00013693422079086304, 0.00015045702457427979, 0.00016397982835769653, 0.00017750263214111328, 0.00019102543592453003, 0.00020454823970794678, 0.00021807104349136353, 0.00023159384727478027, 0.000245116651058197, 0.00025863945484161377, 0.0002721622586250305, 0.00028568506240844727, 0.000299207866191864, 0.00031273066997528076, 0.0003262534737586975, 0.00033977627754211426, 0.000353299081325531, 0.00036682188510894775, 0.0003803446888923645, 0.00039386749267578125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 10.0, 10.0, 9.0, 12.0, 12.0, 34.0, 30.0, 50.0, 59.0, 100.0, 130.0, 247.0, 343.0, 614.0, 1011.0, 1905.0, 3568.0, 7388.0, 16133.0, 38410.0, 93903.0, 226083.0, 337679.0, 186131.0, 76321.0, 31409.0, 13490.0, 6297.0, 3108.0, 1596.0, 1005.0, 501.0, 315.0, 220.0, 133.0, 85.0, 58.0, 47.0, 34.0, 15.0, 20.0, 11.0, 6.0, 5.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.85546875, -1.794403076171875, -1.73333740234375, -1.672271728515625, -1.6112060546875, -1.550140380859375, -1.48907470703125, -1.428009033203125, -1.366943359375, -1.305877685546875, -1.24481201171875, -1.183746337890625, -1.1226806640625, -1.061614990234375, -1.00054931640625, -0.939483642578125, -0.87841796875, -0.817352294921875, -0.75628662109375, -0.695220947265625, -0.6341552734375, -0.573089599609375, -0.51202392578125, -0.450958251953125, -0.389892578125, -0.328826904296875, -0.26776123046875, -0.206695556640625, -0.1456298828125, -0.084564208984375, -0.02349853515625, 0.037567138671875, 0.0986328125, 0.159698486328125, 0.22076416015625, 0.281829833984375, 0.3428955078125, 0.403961181640625, 0.46502685546875, 0.526092529296875, 0.587158203125, 0.648223876953125, 0.70928955078125, 0.770355224609375, 0.8314208984375, 0.892486572265625, 0.95355224609375, 1.014617919921875, 1.07568359375, 1.136749267578125, 1.19781494140625, 1.258880615234375, 1.3199462890625, 1.381011962890625, 1.44207763671875, 1.503143310546875, 1.564208984375, 1.625274658203125, 1.68634033203125, 1.747406005859375, 1.8084716796875, 1.869537353515625, 1.93060302734375, 1.991668701171875, 2.052734375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 6.0, 1.0, 3.0, 4.0, 11.0, 17.0, 25.0, 21.0, 26.0, 32.0, 46.0, 63.0, 75.0, 87.0, 73.0, 75.0, 72.0, 69.0, 58.0, 42.0, 41.0, 42.0, 30.0, 20.0, 17.0, 18.0, 8.0, 4.0, 4.0, 2.0, 4.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.541015625, -2.46221923828125, -2.3834228515625, -2.30462646484375, -2.225830078125, -2.14703369140625, -2.0682373046875, -1.98944091796875, -1.91064453125, -1.83184814453125, -1.7530517578125, -1.67425537109375, -1.595458984375, -1.51666259765625, -1.4378662109375, -1.35906982421875, -1.2802734375, -1.20147705078125, -1.1226806640625, -1.04388427734375, -0.965087890625, -0.88629150390625, -0.8074951171875, -0.72869873046875, -0.64990234375, -0.57110595703125, -0.4923095703125, -0.41351318359375, -0.334716796875, -0.25592041015625, -0.1771240234375, -0.09832763671875, -0.01953125, 0.05926513671875, 0.1380615234375, 0.21685791015625, 0.295654296875, 0.37445068359375, 0.4532470703125, 0.53204345703125, 0.61083984375, 0.68963623046875, 0.7684326171875, 0.84722900390625, 0.926025390625, 1.00482177734375, 1.0836181640625, 1.16241455078125, 1.2412109375, 1.32000732421875, 1.3988037109375, 1.47760009765625, 1.556396484375, 1.63519287109375, 1.7139892578125, 1.79278564453125, 1.87158203125, 1.95037841796875, 2.0291748046875, 2.10797119140625, 2.186767578125, 2.26556396484375, 2.3443603515625, 2.42315673828125, 2.501953125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 7.0, 4.0, 8.0, 11.0, 23.0, 28.0, 59.0, 103.0, 151.0, 186.0, 160.0, 103.0, 68.0, 37.0, 28.0, 8.0, 9.0, 5.0, 5.0, 3.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.593894958496094, -59.95233154296875, -58.31076431274414, -56.6692008972168, -55.02763366699219, -53.386070251464844, -51.7445068359375, -50.10293960571289, -48.46137619018555, -46.8198127746582, -45.178245544433594, -43.53668212890625, -41.89511489868164, -40.2535514831543, -38.61198425292969, -36.970420837402344, -35.328857421875, -33.687294006347656, -32.04572677612305, -30.404163360595703, -28.762598037719727, -27.12103271484375, -25.479467391967773, -23.837902069091797, -22.196334838867188, -20.55476951599121, -18.913204193115234, -17.27164077758789, -15.630075454711914, -13.988510131835938, -12.346944808959961, -10.7053804397583, -9.06381607055664, -7.422251224517822, -5.780686378479004, -4.139121055603027, -2.497556209564209, -0.8559913635253906, 0.7855739593505859, 2.427138328552246, 4.068703651428223, 5.710268497467041, 7.351833343505859, 8.993398666381836, 10.634963989257812, 12.276528358459473, 13.91809368133545, 15.55965805053711, 17.201223373413086, 18.842788696289062, 20.48435401916504, 22.125919342041016, 23.76748275756836, 25.409048080444336, 27.050613403320312, 28.692176818847656, 30.333744049072266, 31.975309371948242, 33.61687469482422, 35.25843811035156, 36.90000534057617, 38.541568756103516, 40.183135986328125, 41.82469940185547, 43.46626281738281]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 4.0, 2.0, 12.0, 15.0, 27.0, 25.0, 28.0, 37.0, 45.0, 43.0, 63.0, 69.0, 57.0, 75.0, 81.0, 55.0, 52.0, 47.0, 46.0, 41.0, 40.0, 37.0, 25.0, 19.0, 25.0, 10.0, 11.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-69.49290466308594, -67.4550552368164, -65.41720581054688, -63.37936019897461, -61.34151077270508, -59.30366134643555, -57.26581573486328, -55.22796630859375, -53.19011688232422, -51.15226745605469, -49.114418029785156, -47.07657241821289, -45.03872299194336, -43.00087356567383, -40.96302795410156, -38.92517852783203, -36.8873291015625, -34.84947967529297, -32.81163024902344, -30.773784637451172, -28.73593521118164, -26.69808578491211, -24.66023826599121, -22.622390747070312, -20.58454132080078, -18.54669189453125, -16.50884437561035, -14.470995903015137, -12.433147430419922, -10.395298957824707, -8.357450485229492, -6.319602012634277, -4.281749725341797, -2.243901252746582, -0.2060527801513672, 1.8317956924438477, 3.8696441650390625, 5.907492637634277, 7.945341110229492, 9.983189582824707, 12.021038055419922, 14.058886528015137, 16.09673500061035, 18.13458251953125, 20.17243194580078, 22.210281372070312, 24.24812889099121, 26.28597640991211, 28.32382583618164, 30.361675262451172, 32.39952087402344, 34.43737030029297, 36.4752197265625, 38.51306915283203, 40.55091857910156, 42.58876419067383, 44.62661361694336, 46.66446304321289, 48.702308654785156, 50.74015808105469, 52.77800750732422, 54.81585693359375, 56.85370635986328, 58.89155197143555, 60.92940139770508]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 1.0, 5.0, 5.0, 7.0, 11.0, 14.0, 16.0, 31.0, 37.0, 49.0, 72.0, 101.0, 163.0, 266.0, 467.0, 836.0, 1698.0, 3869.0, 10114.0, 39717.0, 485025.0, 3525638.0, 97343.0, 17981.0, 5628.0, 2418.0, 1201.0, 615.0, 343.0, 202.0, 130.0, 79.0, 65.0, 44.0, 27.0, 24.0, 13.0, 10.0, 6.0, 6.0, 3.0, 1.0, 2.0, 3.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0625, -8.7813720703125, -8.500244140625, -8.2191162109375, -7.93798828125, -7.6568603515625, -7.375732421875, -7.0946044921875, -6.8134765625, -6.5323486328125, -6.251220703125, -5.9700927734375, -5.68896484375, -5.4078369140625, -5.126708984375, -4.8455810546875, -4.564453125, -4.2833251953125, -4.002197265625, -3.7210693359375, -3.43994140625, -3.1588134765625, -2.877685546875, -2.5965576171875, -2.3154296875, -2.0343017578125, -1.753173828125, -1.4720458984375, -1.19091796875, -0.9097900390625, -0.628662109375, -0.3475341796875, -0.06640625, 0.2147216796875, 0.495849609375, 0.7769775390625, 1.05810546875, 1.3392333984375, 1.620361328125, 1.9014892578125, 2.1826171875, 2.4637451171875, 2.744873046875, 3.0260009765625, 3.30712890625, 3.5882568359375, 3.869384765625, 4.1505126953125, 4.431640625, 4.7127685546875, 4.993896484375, 5.2750244140625, 5.55615234375, 5.8372802734375, 6.118408203125, 6.3995361328125, 6.6806640625, 6.9617919921875, 7.242919921875, 7.5240478515625, 7.80517578125, 8.0863037109375, 8.367431640625, 8.6485595703125, 8.9296875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 6.0, 7.0, 8.0, 7.0, 12.0, 20.0, 29.0, 27.0, 27.0, 48.0, 35.0, 42.0, 63.0, 61.0, 70.0, 65.0, 62.0, 63.0, 49.0, 50.0, 54.0, 40.0, 30.0, 26.0, 20.0, 18.0, 14.0, 17.0, 7.0, 4.0, 5.0, 4.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7802734375, -1.7254638671875, -1.670654296875, -1.6158447265625, -1.56103515625, -1.5062255859375, -1.451416015625, -1.3966064453125, -1.341796875, -1.2869873046875, -1.232177734375, -1.1773681640625, -1.12255859375, -1.0677490234375, -1.012939453125, -0.9581298828125, -0.9033203125, -0.8485107421875, -0.793701171875, -0.7388916015625, -0.68408203125, -0.6292724609375, -0.574462890625, -0.5196533203125, -0.46484375, -0.4100341796875, -0.355224609375, -0.3004150390625, -0.24560546875, -0.1907958984375, -0.135986328125, -0.0811767578125, -0.0263671875, 0.0284423828125, 0.083251953125, 0.1380615234375, 0.19287109375, 0.2476806640625, 0.302490234375, 0.3572998046875, 0.412109375, 0.4669189453125, 0.521728515625, 0.5765380859375, 0.63134765625, 0.6861572265625, 0.740966796875, 0.7957763671875, 0.8505859375, 0.9053955078125, 0.960205078125, 1.0150146484375, 1.06982421875, 1.1246337890625, 1.179443359375, 1.2342529296875, 1.2890625, 1.3438720703125, 1.398681640625, 1.4534912109375, 1.50830078125, 1.5631103515625, 1.617919921875, 1.6727294921875, 1.7275390625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 4.0, 9.0, 20.0, 36.0, 84.0, 129.0, 300.0, 767.0, 2975.0, 26419.0, 2361640.0, 1773366.0, 24282.0, 2994.0, 742.0, 251.0, 115.0, 63.0, 41.0, 23.0, 11.0, 6.0, 5.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.625, -12.230224609375, -11.83544921875, -11.440673828125, -11.0458984375, -10.651123046875, -10.25634765625, -9.861572265625, -9.466796875, -9.072021484375, -8.67724609375, -8.282470703125, -7.8876953125, -7.492919921875, -7.09814453125, -6.703369140625, -6.30859375, -5.913818359375, -5.51904296875, -5.124267578125, -4.7294921875, -4.334716796875, -3.93994140625, -3.545166015625, -3.150390625, -2.755615234375, -2.36083984375, -1.966064453125, -1.5712890625, -1.176513671875, -0.78173828125, -0.386962890625, 0.0078125, 0.402587890625, 0.79736328125, 1.192138671875, 1.5869140625, 1.981689453125, 2.37646484375, 2.771240234375, 3.166015625, 3.560791015625, 3.95556640625, 4.350341796875, 4.7451171875, 5.139892578125, 5.53466796875, 5.929443359375, 6.32421875, 6.718994140625, 7.11376953125, 7.508544921875, 7.9033203125, 8.298095703125, 8.69287109375, 9.087646484375, 9.482421875, 9.877197265625, 10.27197265625, 10.666748046875, 11.0615234375, 11.456298828125, 11.85107421875, 12.245849609375, 12.640625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 15.0, 19.0, 35.0, 51.0, 95.0, 216.0, 458.0, 1504.0, 1013.0, 322.0, 152.0, 69.0, 55.0, 23.0, 14.0, 9.0, 6.0, 9.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.515625, -2.42828369140625, -2.3409423828125, -2.25360107421875, -2.166259765625, -2.07891845703125, -1.9915771484375, -1.90423583984375, -1.81689453125, -1.72955322265625, -1.6422119140625, -1.55487060546875, -1.467529296875, -1.38018798828125, -1.2928466796875, -1.20550537109375, -1.1181640625, -1.03082275390625, -0.9434814453125, -0.85614013671875, -0.768798828125, -0.68145751953125, -0.5941162109375, -0.50677490234375, -0.41943359375, -0.33209228515625, -0.2447509765625, -0.15740966796875, -0.070068359375, 0.01727294921875, 0.1046142578125, 0.19195556640625, 0.279296875, 0.36663818359375, 0.4539794921875, 0.54132080078125, 0.628662109375, 0.71600341796875, 0.8033447265625, 0.89068603515625, 0.97802734375, 1.06536865234375, 1.1527099609375, 1.24005126953125, 1.327392578125, 1.41473388671875, 1.5020751953125, 1.58941650390625, 1.6767578125, 1.76409912109375, 1.8514404296875, 1.93878173828125, 2.026123046875, 2.11346435546875, 2.2008056640625, 2.28814697265625, 2.37548828125, 2.46282958984375, 2.5501708984375, 2.63751220703125, 2.724853515625, 2.81219482421875, 2.8995361328125, 2.98687744140625, 3.07421875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 10.0, 9.0, 36.0, 50.0, 127.0, 165.0, 205.0, 153.0, 116.0, 75.0, 24.0, 15.0, 8.0, 6.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.854011535644531, -9.370630264282227, -8.887248992919922, -8.403867721557617, -7.9204864501953125, -7.437105178833008, -6.953723430633545, -6.47034215927124, -5.9869608879089355, -5.503579616546631, -5.020198345184326, -4.536816596984863, -4.053435325622559, -3.570054292678833, -3.086672782897949, -2.6032915115356445, -2.11991024017334, -1.6365289688110352, -1.153147578239441, -0.6697661876678467, -0.186384916305542, 0.2969963550567627, 0.7803778648376465, 1.2637591361999512, 1.7471404075622559, 2.2305216789245605, 2.7139029502868652, 3.197284460067749, 3.6806657314300537, 4.1640472412109375, 4.647428512573242, 5.130809783935547, 5.614191055297852, 6.097572326660156, 6.580953598022461, 7.064334869384766, 7.54771614074707, 8.031097412109375, 8.51447868347168, 8.997859954833984, 9.481241226196289, 9.964622497558594, 10.448003768920898, 10.931385040283203, 11.414766311645508, 11.898147583007812, 12.381528854370117, 12.864910125732422, 13.348292350769043, 13.831673622131348, 14.315054893493652, 14.798436164855957, 15.281817436218262, 15.765198707580566, 16.248580932617188, 16.731962203979492, 17.215343475341797, 17.6987247467041, 18.182106018066406, 18.66548728942871, 19.148868560791016, 19.63224983215332, 20.115631103515625, 20.59901237487793, 21.082393646240234]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 9.0, 6.0, 18.0, 11.0, 18.0, 36.0, 24.0, 30.0, 21.0, 40.0, 47.0, 56.0, 45.0, 54.0, 61.0, 70.0, 57.0, 61.0, 53.0, 52.0, 34.0, 36.0, 36.0, 24.0, 23.0, 18.0, 28.0, 14.0, 5.0, 4.0, 6.0, 1.0, 6.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.16443157196045, -8.89543342590332, -8.626435279846191, -8.357437133789062, -8.08843994140625, -7.819441318511963, -7.550443649291992, -7.281445503234863, -7.012447357177734, -6.7434492111206055, -6.474451065063477, -6.205453395843506, -5.936455249786377, -5.667457103729248, -5.398459434509277, -5.129461288452148, -4.8604631423950195, -4.591464996337891, -4.322466850280762, -4.053469181060791, -3.784471035003662, -3.515472888946533, -3.2464749813079834, -2.9774770736694336, -2.7084789276123047, -2.439480781555176, -2.170482873916626, -1.9014848470687866, -1.6324868202209473, -1.363488793373108, -1.0944907665252686, -0.8254927396774292, -0.5564937591552734, -0.2874957323074341, -0.018497705459594727, 0.25050032138824463, 0.519498348236084, 0.7884963750839233, 1.0574944019317627, 1.326492428779602, 1.5954904556274414, 1.8644884824752808, 2.13348650932312, 2.40248441696167, 2.671482563018799, 2.9404807090759277, 3.2094786167144775, 3.4784765243530273, 3.7474746704101562, 4.016472816467285, 4.285470962524414, 4.554468631744385, 4.823466777801514, 5.092464923858643, 5.361462593078613, 5.630460739135742, 5.899458885192871, 6.16845703125, 6.437455177307129, 6.7064528465271, 6.9754509925842285, 7.244449138641357, 7.513446807861328, 7.782444953918457, 8.051443099975586]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 5.0, 4.0, 8.0, 15.0, 23.0, 19.0, 37.0, 45.0, 63.0, 97.0, 153.0, 265.0, 442.0, 683.0, 1183.0, 2291.0, 4251.0, 8584.0, 18208.0, 39923.0, 96758.0, 229141.0, 325032.0, 184050.0, 75089.0, 32139.0, 14618.0, 7185.0, 3607.0, 1952.0, 1040.0, 587.0, 392.0, 222.0, 140.0, 103.0, 68.0, 46.0, 32.0, 15.0, 18.0, 8.0, 4.0, 4.0, 2.0, 1.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.23828125, -4.09869384765625, -3.9591064453125, -3.81951904296875, -3.679931640625, -3.54034423828125, -3.4007568359375, -3.26116943359375, -3.12158203125, -2.98199462890625, -2.8424072265625, -2.70281982421875, -2.563232421875, -2.42364501953125, -2.2840576171875, -2.14447021484375, -2.0048828125, -1.86529541015625, -1.7257080078125, -1.58612060546875, -1.446533203125, -1.30694580078125, -1.1673583984375, -1.02777099609375, -0.88818359375, -0.74859619140625, -0.6090087890625, -0.46942138671875, -0.329833984375, -0.19024658203125, -0.0506591796875, 0.08892822265625, 0.228515625, 0.36810302734375, 0.5076904296875, 0.64727783203125, 0.786865234375, 0.92645263671875, 1.0660400390625, 1.20562744140625, 1.34521484375, 1.48480224609375, 1.6243896484375, 1.76397705078125, 1.903564453125, 2.04315185546875, 2.1827392578125, 2.32232666015625, 2.4619140625, 2.60150146484375, 2.7410888671875, 2.88067626953125, 3.020263671875, 3.15985107421875, 3.2994384765625, 3.43902587890625, 3.57861328125, 3.71820068359375, 3.8577880859375, 3.99737548828125, 4.136962890625, 4.27655029296875, 4.4161376953125, 4.55572509765625, 4.6953125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 5.0, 4.0, 13.0, 8.0, 10.0, 21.0, 20.0, 36.0, 32.0, 34.0, 45.0, 54.0, 48.0, 55.0, 76.0, 55.0, 53.0, 77.0, 54.0, 57.0, 39.0, 36.0, 33.0, 21.0, 28.0, 25.0, 15.0, 10.0, 13.0, 9.0, 4.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.015625, -1.9605560302734375, -1.905487060546875, -1.8504180908203125, -1.79534912109375, -1.7402801513671875, -1.685211181640625, -1.6301422119140625, -1.5750732421875, -1.5200042724609375, -1.464935302734375, -1.4098663330078125, -1.35479736328125, -1.2997283935546875, -1.244659423828125, -1.1895904541015625, -1.134521484375, -1.0794525146484375, -1.024383544921875, -0.9693145751953125, -0.91424560546875, -0.8591766357421875, -0.804107666015625, -0.7490386962890625, -0.6939697265625, -0.6389007568359375, -0.583831787109375, -0.5287628173828125, -0.47369384765625, -0.4186248779296875, -0.363555908203125, -0.3084869384765625, -0.25341796875, -0.1983489990234375, -0.143280029296875, -0.0882110595703125, -0.03314208984375, 0.0219268798828125, 0.076995849609375, 0.1320648193359375, 0.1871337890625, 0.2422027587890625, 0.297271728515625, 0.3523406982421875, 0.40740966796875, 0.4624786376953125, 0.517547607421875, 0.5726165771484375, 0.627685546875, 0.6827545166015625, 0.737823486328125, 0.7928924560546875, 0.84796142578125, 0.9030303955078125, 0.958099365234375, 1.0131683349609375, 1.0682373046875, 1.1233062744140625, 1.178375244140625, 1.2334442138671875, 1.28851318359375, 1.3435821533203125, 1.398651123046875, 1.4537200927734375, 1.5087890625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 16.0, 10.0, 13.0, 16.0, 17.0, 29.0, 56.0, 55.0, 78.0, 117.0, 187.0, 274.0, 527.0, 896.0, 1703.0, 3590.0, 8272.0, 21191.0, 61576.0, 207698.0, 418782.0, 219740.0, 65217.0, 22184.0, 8558.0, 3617.0, 1763.0, 868.0, 546.0, 325.0, 218.0, 108.0, 91.0, 54.0, 36.0, 26.0, 21.0, 18.0, 15.0, 17.0, 5.0, 4.0, 11.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-5.30078125, -5.13262939453125, -4.9644775390625, -4.79632568359375, -4.628173828125, -4.46002197265625, -4.2918701171875, -4.12371826171875, -3.95556640625, -3.78741455078125, -3.6192626953125, -3.45111083984375, -3.282958984375, -3.11480712890625, -2.9466552734375, -2.77850341796875, -2.6103515625, -2.44219970703125, -2.2740478515625, -2.10589599609375, -1.937744140625, -1.76959228515625, -1.6014404296875, -1.43328857421875, -1.26513671875, -1.09698486328125, -0.9288330078125, -0.76068115234375, -0.592529296875, -0.42437744140625, -0.2562255859375, -0.08807373046875, 0.080078125, 0.24822998046875, 0.4163818359375, 0.58453369140625, 0.752685546875, 0.92083740234375, 1.0889892578125, 1.25714111328125, 1.42529296875, 1.59344482421875, 1.7615966796875, 1.92974853515625, 2.097900390625, 2.26605224609375, 2.4342041015625, 2.60235595703125, 2.7705078125, 2.93865966796875, 3.1068115234375, 3.27496337890625, 3.443115234375, 3.61126708984375, 3.7794189453125, 3.94757080078125, 4.11572265625, 4.28387451171875, 4.4520263671875, 4.62017822265625, 4.788330078125, 4.95648193359375, 5.1246337890625, 5.29278564453125, 5.4609375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 9.0, 12.0, 7.0, 12.0, 15.0, 19.0, 23.0, 24.0, 31.0, 31.0, 43.0, 40.0, 42.0, 52.0, 54.0, 50.0, 56.0, 54.0, 50.0, 49.0, 47.0, 35.0, 49.0, 27.0, 39.0, 14.0, 22.0, 23.0, 14.0, 10.0, 13.0, 10.0, 4.0, 8.0, 3.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.765625, -6.5382080078125, -6.310791015625, -6.0833740234375, -5.85595703125, -5.6285400390625, -5.401123046875, -5.1737060546875, -4.9462890625, -4.7188720703125, -4.491455078125, -4.2640380859375, -4.03662109375, -3.8092041015625, -3.581787109375, -3.3543701171875, -3.126953125, -2.8995361328125, -2.672119140625, -2.4447021484375, -2.21728515625, -1.9898681640625, -1.762451171875, -1.5350341796875, -1.3076171875, -1.0802001953125, -0.852783203125, -0.6253662109375, -0.39794921875, -0.1705322265625, 0.056884765625, 0.2843017578125, 0.51171875, 0.7391357421875, 0.966552734375, 1.1939697265625, 1.42138671875, 1.6488037109375, 1.876220703125, 2.1036376953125, 2.3310546875, 2.5584716796875, 2.785888671875, 3.0133056640625, 3.24072265625, 3.4681396484375, 3.695556640625, 3.9229736328125, 4.150390625, 4.3778076171875, 4.605224609375, 4.8326416015625, 5.06005859375, 5.2874755859375, 5.514892578125, 5.7423095703125, 5.9697265625, 6.1971435546875, 6.424560546875, 6.6519775390625, 6.87939453125, 7.1068115234375, 7.334228515625, 7.5616455078125, 7.7890625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 3.0, 7.0, 16.0, 18.0, 22.0, 45.0, 53.0, 94.0, 127.0, 268.0, 541.0, 1228.0, 2917.0, 8367.0, 27119.0, 100605.0, 344890.0, 389959.0, 123354.0, 32816.0, 9778.0, 3522.0, 1438.0, 601.0, 331.0, 160.0, 100.0, 70.0, 30.0, 23.0, 13.0, 10.0, 6.0, 2.0, 5.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9619140625, -1.8966827392578125, -1.831451416015625, -1.7662200927734375, -1.70098876953125, -1.6357574462890625, -1.570526123046875, -1.5052947998046875, -1.4400634765625, -1.3748321533203125, -1.309600830078125, -1.2443695068359375, -1.17913818359375, -1.1139068603515625, -1.048675537109375, -0.9834442138671875, -0.918212890625, -0.8529815673828125, -0.787750244140625, -0.7225189208984375, -0.65728759765625, -0.5920562744140625, -0.526824951171875, -0.4615936279296875, -0.3963623046875, -0.3311309814453125, -0.265899658203125, -0.2006683349609375, -0.13543701171875, -0.0702056884765625, -0.004974365234375, 0.0602569580078125, 0.12548828125, 0.1907196044921875, 0.255950927734375, 0.3211822509765625, 0.38641357421875, 0.4516448974609375, 0.516876220703125, 0.5821075439453125, 0.6473388671875, 0.7125701904296875, 0.777801513671875, 0.8430328369140625, 0.90826416015625, 0.9734954833984375, 1.038726806640625, 1.1039581298828125, 1.169189453125, 1.2344207763671875, 1.299652099609375, 1.3648834228515625, 1.43011474609375, 1.4953460693359375, 1.560577392578125, 1.6258087158203125, 1.6910400390625, 1.7562713623046875, 1.821502685546875, 1.8867340087890625, 1.95196533203125, 2.0171966552734375, 2.082427978515625, 2.1476593017578125, 2.212890625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 10.0, 2.0, 4.0, 12.0, 21.0, 9.0, 18.0, 17.0, 24.0, 28.0, 42.0, 36.0, 55.0, 59.0, 54.0, 68.0, 75.0, 72.0, 60.0, 41.0, 40.0, 37.0, 44.0, 30.0, 27.0, 11.0, 10.0, 13.0, 8.0, 14.0, 11.0, 8.0, 5.0, 5.0, 6.0, 3.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0002741813659667969, -0.0002656318247318268, -0.0002570822834968567, -0.0002485327422618866, -0.0002399832010269165, -0.0002314336597919464, -0.00022288411855697632, -0.00021433457732200623, -0.00020578503608703613, -0.00019723549485206604, -0.00018868595361709595, -0.00018013641238212585, -0.00017158687114715576, -0.00016303732991218567, -0.00015448778867721558, -0.00014593824744224548, -0.0001373887062072754, -0.0001288391649723053, -0.0001202896237373352, -0.00011174008250236511, -0.00010319054126739502, -9.464100003242493e-05, -8.609145879745483e-05, -7.754191756248474e-05, -6.899237632751465e-05, -6.0442835092544556e-05, -5.189329385757446e-05, -4.334375262260437e-05, -3.479421138763428e-05, -2.6244670152664185e-05, -1.7695128917694092e-05, -9.145587682723999e-06, -5.960464477539062e-07, 7.953494787216187e-06, 1.650303602218628e-05, 2.5052577257156372e-05, 3.3602118492126465e-05, 4.215165972709656e-05, 5.070120096206665e-05, 5.925074219703674e-05, 6.780028343200684e-05, 7.634982466697693e-05, 8.489936590194702e-05, 9.344890713691711e-05, 0.00010199844837188721, 0.0001105479896068573, 0.00011909753084182739, 0.00012764707207679749, 0.00013619661331176758, 0.00014474615454673767, 0.00015329569578170776, 0.00016184523701667786, 0.00017039477825164795, 0.00017894431948661804, 0.00018749386072158813, 0.00019604340195655823, 0.00020459294319152832, 0.0002131424844264984, 0.0002216920256614685, 0.0002302415668964386, 0.0002387911081314087, 0.0002473406493663788, 0.0002558901906013489, 0.00026443973183631897, 0.00027298927307128906]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 1.0, 4.0, 2.0, 0.0, 3.0, 5.0, 5.0, 7.0, 9.0, 30.0, 30.0, 42.0, 80.0, 123.0, 228.0, 404.0, 748.0, 1576.0, 3698.0, 10076.0, 30341.0, 104126.0, 351967.0, 376234.0, 116383.0, 33702.0, 11027.0, 4154.0, 1720.0, 830.0, 411.0, 228.0, 122.0, 86.0, 53.0, 29.0, 31.0, 12.0, 14.0, 9.0, 6.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.779296875, -1.7135009765625, -1.647705078125, -1.5819091796875, -1.51611328125, -1.4503173828125, -1.384521484375, -1.3187255859375, -1.2529296875, -1.1871337890625, -1.121337890625, -1.0555419921875, -0.98974609375, -0.9239501953125, -0.858154296875, -0.7923583984375, -0.7265625, -0.6607666015625, -0.594970703125, -0.5291748046875, -0.46337890625, -0.3975830078125, -0.331787109375, -0.2659912109375, -0.2001953125, -0.1343994140625, -0.068603515625, -0.0028076171875, 0.06298828125, 0.1287841796875, 0.194580078125, 0.2603759765625, 0.326171875, 0.3919677734375, 0.457763671875, 0.5235595703125, 0.58935546875, 0.6551513671875, 0.720947265625, 0.7867431640625, 0.8525390625, 0.9183349609375, 0.984130859375, 1.0499267578125, 1.11572265625, 1.1815185546875, 1.247314453125, 1.3131103515625, 1.37890625, 1.4447021484375, 1.510498046875, 1.5762939453125, 1.64208984375, 1.7078857421875, 1.773681640625, 1.8394775390625, 1.9052734375, 1.9710693359375, 2.036865234375, 2.1026611328125, 2.16845703125, 2.2342529296875, 2.300048828125, 2.3658447265625, 2.431640625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 2.0, 0.0, 3.0, 3.0, 4.0, 10.0, 8.0, 6.0, 9.0, 22.0, 25.0, 19.0, 32.0, 35.0, 49.0, 50.0, 76.0, 64.0, 61.0, 79.0, 67.0, 64.0, 51.0, 50.0, 42.0, 23.0, 36.0, 18.0, 18.0, 14.0, 12.0, 3.0, 11.0, 8.0, 13.0, 5.0, 7.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.01953125, -1.9635009765625, -1.907470703125, -1.8514404296875, -1.79541015625, -1.7393798828125, -1.683349609375, -1.6273193359375, -1.5712890625, -1.5152587890625, -1.459228515625, -1.4031982421875, -1.34716796875, -1.2911376953125, -1.235107421875, -1.1790771484375, -1.123046875, -1.0670166015625, -1.010986328125, -0.9549560546875, -0.89892578125, -0.8428955078125, -0.786865234375, -0.7308349609375, -0.6748046875, -0.6187744140625, -0.562744140625, -0.5067138671875, -0.45068359375, -0.3946533203125, -0.338623046875, -0.2825927734375, -0.2265625, -0.1705322265625, -0.114501953125, -0.0584716796875, -0.00244140625, 0.0535888671875, 0.109619140625, 0.1656494140625, 0.2216796875, 0.2777099609375, 0.333740234375, 0.3897705078125, 0.44580078125, 0.5018310546875, 0.557861328125, 0.6138916015625, 0.669921875, 0.7259521484375, 0.781982421875, 0.8380126953125, 0.89404296875, 0.9500732421875, 1.006103515625, 1.0621337890625, 1.1181640625, 1.1741943359375, 1.230224609375, 1.2862548828125, 1.34228515625, 1.3983154296875, 1.454345703125, 1.5103759765625, 1.56640625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 17.0, 18.0, 37.0, 62.0, 95.0, 165.0, 185.0, 134.0, 107.0, 82.0, 32.0, 30.0, 14.0, 8.0, 6.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.86506271362305, -47.368404388427734, -45.871742248535156, -44.375083923339844, -42.87842559814453, -41.38176727294922, -39.88510513305664, -38.38844680786133, -36.89178466796875, -35.39512634277344, -33.89846420288086, -32.40180587768555, -30.905147552490234, -29.40848731994629, -27.911827087402344, -26.41516876220703, -24.91851043701172, -23.421850204467773, -21.92519187927246, -20.428531646728516, -18.931873321533203, -17.435213088989258, -15.938552856445312, -14.441893577575684, -12.945234298706055, -11.448575019836426, -9.951915740966797, -8.455255508422852, -6.958596229553223, -5.461936950683594, -3.9652767181396484, -2.4686174392700195, -0.9719619750976562, 0.5246975421905518, 2.0213570594787598, 3.518016815185547, 5.014676094055176, 6.511335372924805, 8.00799560546875, 9.504654884338379, 11.001314163208008, 12.497973442077637, 13.994632720947266, 15.491292953491211, 16.987953186035156, 18.48461151123047, 19.981271743774414, 21.47793197631836, 22.974590301513672, 24.471250534057617, 25.96790885925293, 27.464569091796875, 28.961227416992188, 30.457887649536133, 31.954547882080078, 33.45120620727539, 34.94786834716797, 36.44452667236328, 37.94118881225586, 39.43784713745117, 40.934505462646484, 42.43116760253906, 43.927825927734375, 45.42448425292969, 46.921142578125]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 2.0, 3.0, 11.0, 12.0, 13.0, 7.0, 24.0, 31.0, 31.0, 42.0, 49.0, 47.0, 62.0, 70.0, 63.0, 73.0, 75.0, 60.0, 58.0, 48.0, 52.0, 29.0, 32.0, 32.0, 26.0, 9.0, 17.0, 9.0, 6.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.17780303955078, -53.426483154296875, -51.67516326904297, -49.92384338378906, -48.17251968383789, -46.421199798583984, -44.66987991333008, -42.91856002807617, -41.167236328125, -39.415916442871094, -37.66459655761719, -35.91327667236328, -34.16195297241211, -32.4106330871582, -30.659313201904297, -28.90799331665039, -27.156673431396484, -25.405353546142578, -23.65403175354004, -21.902711868286133, -20.151390075683594, -18.400070190429688, -16.64875030517578, -14.897429466247559, -13.146108627319336, -11.394787788391113, -9.64346694946289, -7.892147064208984, -6.140826225280762, -4.389505386352539, -2.638185501098633, -0.8868646621704102, 0.8644561767578125, 2.615776777267456, 4.3670973777771, 6.118417739868164, 7.869738578796387, 9.62105941772461, 11.372379302978516, 13.123700141906738, 14.875020980834961, 16.626340866088867, 18.377662658691406, 20.128982543945312, 21.88030242919922, 23.631624221801758, 25.382944107055664, 27.134265899658203, 28.88558578491211, 30.636905670166016, 32.38822555541992, 34.139549255371094, 35.890869140625, 37.642189025878906, 39.39350891113281, 41.14482879638672, 42.896148681640625, 44.64746856689453, 46.39878845214844, 48.150108337402344, 49.901432037353516, 51.65275192260742, 53.40407180786133, 55.155391693115234, 56.906715393066406]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 7.0, 11.0, 12.0, 11.0, 29.0, 35.0, 42.0, 57.0, 97.0, 119.0, 208.0, 353.0, 584.0, 1004.0, 2001.0, 4070.0, 10403.0, 32414.0, 167025.0, 3304588.0, 580365.0, 62875.0, 16456.0, 5816.0, 2564.0, 1330.0, 696.0, 359.0, 267.0, 163.0, 107.0, 73.0, 48.0, 32.0, 16.0, 12.0, 14.0, 6.0, 6.0, 7.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.9375, -7.6873779296875, -7.437255859375, -7.1871337890625, -6.93701171875, -6.6868896484375, -6.436767578125, -6.1866455078125, -5.9365234375, -5.6864013671875, -5.436279296875, -5.1861572265625, -4.93603515625, -4.6859130859375, -4.435791015625, -4.1856689453125, -3.935546875, -3.6854248046875, -3.435302734375, -3.1851806640625, -2.93505859375, -2.6849365234375, -2.434814453125, -2.1846923828125, -1.9345703125, -1.6844482421875, -1.434326171875, -1.1842041015625, -0.93408203125, -0.6839599609375, -0.433837890625, -0.1837158203125, 0.06640625, 0.3165283203125, 0.566650390625, 0.8167724609375, 1.06689453125, 1.3170166015625, 1.567138671875, 1.8172607421875, 2.0673828125, 2.3175048828125, 2.567626953125, 2.8177490234375, 3.06787109375, 3.3179931640625, 3.568115234375, 3.8182373046875, 4.068359375, 4.3184814453125, 4.568603515625, 4.8187255859375, 5.06884765625, 5.3189697265625, 5.569091796875, 5.8192138671875, 6.0693359375, 6.3194580078125, 6.569580078125, 6.8197021484375, 7.06982421875, 7.3199462890625, 7.570068359375, 7.8201904296875, 8.0703125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 4.0, 4.0, 3.0, 4.0, 10.0, 10.0, 10.0, 14.0, 19.0, 24.0, 16.0, 30.0, 41.0, 37.0, 47.0, 62.0, 55.0, 74.0, 50.0, 60.0, 56.0, 64.0, 45.0, 49.0, 35.0, 37.0, 32.0, 25.0, 19.0, 17.0, 16.0, 9.0, 7.0, 5.0, 5.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.8271484375, -1.7728424072265625, -1.718536376953125, -1.6642303466796875, -1.60992431640625, -1.5556182861328125, -1.501312255859375, -1.4470062255859375, -1.3927001953125, -1.3383941650390625, -1.284088134765625, -1.2297821044921875, -1.17547607421875, -1.1211700439453125, -1.066864013671875, -1.0125579833984375, -0.958251953125, -0.9039459228515625, -0.849639892578125, -0.7953338623046875, -0.74102783203125, -0.6867218017578125, -0.632415771484375, -0.5781097412109375, -0.5238037109375, -0.4694976806640625, -0.415191650390625, -0.3608856201171875, -0.30657958984375, -0.2522735595703125, -0.197967529296875, -0.1436614990234375, -0.08935546875, -0.0350494384765625, 0.019256591796875, 0.0735626220703125, 0.12786865234375, 0.1821746826171875, 0.236480712890625, 0.2907867431640625, 0.3450927734375, 0.3993988037109375, 0.453704833984375, 0.5080108642578125, 0.56231689453125, 0.6166229248046875, 0.670928955078125, 0.7252349853515625, 0.779541015625, 0.8338470458984375, 0.888153076171875, 0.9424591064453125, 0.99676513671875, 1.0510711669921875, 1.105377197265625, 1.1596832275390625, 1.2139892578125, 1.2682952880859375, 1.322601318359375, 1.3769073486328125, 1.43121337890625, 1.4855194091796875, 1.539825439453125, 1.5941314697265625, 1.6484375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 8.0, 3.0, 14.0, 21.0, 41.0, 67.0, 112.0, 272.0, 752.0, 3854.0, 114591.0, 4044471.0, 27093.0, 2124.0, 530.0, 184.0, 70.0, 40.0, 31.0, 11.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.890625, -27.216064453125, -26.54150390625, -25.866943359375, -25.1923828125, -24.517822265625, -23.84326171875, -23.168701171875, -22.494140625, -21.819580078125, -21.14501953125, -20.470458984375, -19.7958984375, -19.121337890625, -18.44677734375, -17.772216796875, -17.09765625, -16.423095703125, -15.74853515625, -15.073974609375, -14.3994140625, -13.724853515625, -13.05029296875, -12.375732421875, -11.701171875, -11.026611328125, -10.35205078125, -9.677490234375, -9.0029296875, -8.328369140625, -7.65380859375, -6.979248046875, -6.3046875, -5.630126953125, -4.95556640625, -4.281005859375, -3.6064453125, -2.931884765625, -2.25732421875, -1.582763671875, -0.908203125, -0.233642578125, 0.44091796875, 1.115478515625, 1.7900390625, 2.464599609375, 3.13916015625, 3.813720703125, 4.48828125, 5.162841796875, 5.83740234375, 6.511962890625, 7.1865234375, 7.861083984375, 8.53564453125, 9.210205078125, 9.884765625, 10.559326171875, 11.23388671875, 11.908447265625, 12.5830078125, 13.257568359375, 13.93212890625, 14.606689453125, 15.28125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 4.0, 8.0, 14.0, 21.0, 45.0, 83.0, 168.0, 463.0, 1630.0, 1128.0, 279.0, 103.0, 54.0, 31.0, 18.0, 9.0, 5.0, 8.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.40234375, -7.2254638671875, -7.048583984375, -6.8717041015625, -6.69482421875, -6.5179443359375, -6.341064453125, -6.1641845703125, -5.9873046875, -5.8104248046875, -5.633544921875, -5.4566650390625, -5.27978515625, -5.1029052734375, -4.926025390625, -4.7491455078125, -4.572265625, -4.3953857421875, -4.218505859375, -4.0416259765625, -3.86474609375, -3.6878662109375, -3.510986328125, -3.3341064453125, -3.1572265625, -2.9803466796875, -2.803466796875, -2.6265869140625, -2.44970703125, -2.2728271484375, -2.095947265625, -1.9190673828125, -1.7421875, -1.5653076171875, -1.388427734375, -1.2115478515625, -1.03466796875, -0.8577880859375, -0.680908203125, -0.5040283203125, -0.3271484375, -0.1502685546875, 0.026611328125, 0.2034912109375, 0.38037109375, 0.5572509765625, 0.734130859375, 0.9110107421875, 1.087890625, 1.2647705078125, 1.441650390625, 1.6185302734375, 1.79541015625, 1.9722900390625, 2.149169921875, 2.3260498046875, 2.5029296875, 2.6798095703125, 2.856689453125, 3.0335693359375, 3.21044921875, 3.3873291015625, 3.564208984375, 3.7410888671875, 3.91796875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 26.0, 63.0, 238.0, 382.0, 210.0, 61.0, 15.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.1904067993164, -69.59600830078125, -68.0016098022461, -66.40721130371094, -64.81281280517578, -63.218414306640625, -61.62401580810547, -60.02961730957031, -58.435218811035156, -56.8408203125, -55.246421813964844, -53.65202331542969, -52.05762481689453, -50.463226318359375, -48.86882781982422, -47.27442932128906, -45.680030822753906, -44.08563232421875, -42.491233825683594, -40.89683532714844, -39.30243682861328, -37.708038330078125, -36.11363983154297, -34.51924133300781, -32.92483901977539, -31.330440521240234, -29.736042022705078, -28.141643524169922, -26.547245025634766, -24.95284652709961, -23.358448028564453, -21.764049530029297, -20.169649124145508, -18.57525062561035, -16.980852127075195, -15.386453628540039, -13.792055130004883, -12.197656631469727, -10.603257179260254, -9.008858680725098, -7.414460182189941, -5.820061683654785, -4.225663185119629, -2.6312642097473145, -1.0368657112121582, 0.557532787322998, 2.1519317626953125, 3.7463302612304688, 5.340728759765625, 6.935127258300781, 8.529525756835938, 10.123924255371094, 11.71832275390625, 13.312721252441406, 14.907120704650879, 16.50151824951172, 18.095916748046875, 19.69031524658203, 21.284713745117188, 22.879112243652344, 24.4735107421875, 26.067909240722656, 27.662307739257812, 29.25670623779297, 30.851106643676758]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 2.0, 5.0, 8.0, 4.0, 12.0, 14.0, 23.0, 19.0, 27.0, 36.0, 50.0, 48.0, 49.0, 44.0, 74.0, 59.0, 59.0, 63.0, 54.0, 57.0, 41.0, 49.0, 40.0, 47.0, 31.0, 25.0, 17.0, 10.0, 12.0, 7.0, 5.0, 4.0, 3.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-19.38701057434082, -18.855302810668945, -18.32359504699707, -17.791887283325195, -17.26017951965332, -16.728471755981445, -16.19676399230957, -15.665056228637695, -15.13334846496582, -14.601640701293945, -14.06993293762207, -13.538225173950195, -13.00651741027832, -12.474809646606445, -11.94310188293457, -11.411394119262695, -10.87968635559082, -10.347978591918945, -9.81627082824707, -9.284563064575195, -8.75285530090332, -8.221147537231445, -7.68943977355957, -7.157732009887695, -6.62602424621582, -6.094316482543945, -5.56260871887207, -5.030900955200195, -4.49919319152832, -3.9674854278564453, -3.4357776641845703, -2.9040699005126953, -2.372361183166504, -1.840653419494629, -1.308945655822754, -0.7772378921508789, -0.2455301284790039, 0.2861776351928711, 0.8178853988647461, 1.349593162536621, 1.881300926208496, 2.413008689880371, 2.944716453552246, 3.476424217224121, 4.008131980895996, 4.539839744567871, 5.071547508239746, 5.603255271911621, 6.134963035583496, 6.666670799255371, 7.198378562927246, 7.730086326599121, 8.261794090270996, 8.793501853942871, 9.325209617614746, 9.856917381286621, 10.388625144958496, 10.920332908630371, 11.452040672302246, 11.983748435974121, 12.515456199645996, 13.047163963317871, 13.578871726989746, 14.110579490661621, 14.642287254333496]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 3.0, 4.0, 2.0, 5.0, 3.0, 9.0, 9.0, 24.0, 27.0, 36.0, 50.0, 88.0, 155.0, 204.0, 338.0, 494.0, 832.0, 1535.0, 2878.0, 6287.0, 14477.0, 40192.0, 132380.0, 395572.0, 309727.0, 92525.0, 29441.0, 10971.0, 4821.0, 2279.0, 1255.0, 653.0, 423.0, 309.0, 208.0, 117.0, 73.0, 50.0, 36.0, 18.0, 13.0, 7.0, 6.0, 10.0, 2.0, 6.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.27734375, -7.06854248046875, -6.8597412109375, -6.65093994140625, -6.442138671875, -6.23333740234375, -6.0245361328125, -5.81573486328125, -5.60693359375, -5.39813232421875, -5.1893310546875, -4.98052978515625, -4.771728515625, -4.56292724609375, -4.3541259765625, -4.14532470703125, -3.9365234375, -3.72772216796875, -3.5189208984375, -3.31011962890625, -3.101318359375, -2.89251708984375, -2.6837158203125, -2.47491455078125, -2.26611328125, -2.05731201171875, -1.8485107421875, -1.63970947265625, -1.430908203125, -1.22210693359375, -1.0133056640625, -0.80450439453125, -0.595703125, -0.38690185546875, -0.1781005859375, 0.03070068359375, 0.239501953125, 0.44830322265625, 0.6571044921875, 0.86590576171875, 1.07470703125, 1.28350830078125, 1.4923095703125, 1.70111083984375, 1.909912109375, 2.11871337890625, 2.3275146484375, 2.53631591796875, 2.7451171875, 2.95391845703125, 3.1627197265625, 3.37152099609375, 3.580322265625, 3.78912353515625, 3.9979248046875, 4.20672607421875, 4.41552734375, 4.62432861328125, 4.8331298828125, 5.04193115234375, 5.250732421875, 5.45953369140625, 5.6683349609375, 5.87713623046875, 6.0859375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 8.0, 9.0, 12.0, 13.0, 7.0, 28.0, 21.0, 35.0, 46.0, 51.0, 51.0, 61.0, 63.0, 77.0, 82.0, 67.0, 55.0, 60.0, 57.0, 38.0, 41.0, 32.0, 25.0, 23.0, 7.0, 12.0, 2.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.193359375, -2.1304168701171875, -2.067474365234375, -2.0045318603515625, -1.94158935546875, -1.8786468505859375, -1.815704345703125, -1.7527618408203125, -1.6898193359375, -1.6268768310546875, -1.563934326171875, -1.5009918212890625, -1.43804931640625, -1.3751068115234375, -1.312164306640625, -1.2492218017578125, -1.186279296875, -1.1233367919921875, -1.060394287109375, -0.9974517822265625, -0.93450927734375, -0.8715667724609375, -0.808624267578125, -0.7456817626953125, -0.6827392578125, -0.6197967529296875, -0.556854248046875, -0.4939117431640625, -0.43096923828125, -0.3680267333984375, -0.305084228515625, -0.2421417236328125, -0.17919921875, -0.1162567138671875, -0.053314208984375, 0.0096282958984375, 0.07257080078125, 0.1355133056640625, 0.198455810546875, 0.2613983154296875, 0.3243408203125, 0.3872833251953125, 0.450225830078125, 0.5131683349609375, 0.57611083984375, 0.6390533447265625, 0.701995849609375, 0.7649383544921875, 0.827880859375, 0.8908233642578125, 0.953765869140625, 1.0167083740234375, 1.07965087890625, 1.1425933837890625, 1.205535888671875, 1.2684783935546875, 1.3314208984375, 1.3943634033203125, 1.457305908203125, 1.5202484130859375, 1.58319091796875, 1.6461334228515625, 1.709075927734375, 1.7720184326171875, 1.8349609375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 3.0, 5.0, 16.0, 19.0, 28.0, 21.0, 32.0, 52.0, 75.0, 75.0, 107.0, 165.0, 274.0, 448.0, 736.0, 1294.0, 2267.0, 3997.0, 7376.0, 14387.0, 28845.0, 63616.0, 142922.0, 265582.0, 260735.0, 136784.0, 60299.0, 28172.0, 13785.0, 7100.0, 3869.0, 2165.0, 1267.0, 741.0, 443.0, 259.0, 165.0, 112.0, 69.0, 62.0, 57.0, 35.0, 25.0, 23.0, 14.0, 8.0, 12.0, 3.0, 7.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.66015625, -3.549163818359375, -3.43817138671875, -3.327178955078125, -3.2161865234375, -3.105194091796875, -2.99420166015625, -2.883209228515625, -2.772216796875, -2.661224365234375, -2.55023193359375, -2.439239501953125, -2.3282470703125, -2.217254638671875, -2.10626220703125, -1.995269775390625, -1.88427734375, -1.773284912109375, -1.66229248046875, -1.551300048828125, -1.4403076171875, -1.329315185546875, -1.21832275390625, -1.107330322265625, -0.996337890625, -0.885345458984375, -0.77435302734375, -0.663360595703125, -0.5523681640625, -0.441375732421875, -0.33038330078125, -0.219390869140625, -0.1083984375, 0.002593994140625, 0.11358642578125, 0.224578857421875, 0.3355712890625, 0.446563720703125, 0.55755615234375, 0.668548583984375, 0.779541015625, 0.890533447265625, 1.00152587890625, 1.112518310546875, 1.2235107421875, 1.334503173828125, 1.44549560546875, 1.556488037109375, 1.66748046875, 1.778472900390625, 1.88946533203125, 2.000457763671875, 2.1114501953125, 2.222442626953125, 2.33343505859375, 2.444427490234375, 2.555419921875, 2.666412353515625, 2.77740478515625, 2.888397216796875, 2.9993896484375, 3.110382080078125, 3.22137451171875, 3.332366943359375, 3.443359375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 7.0, 8.0, 4.0, 7.0, 8.0, 14.0, 14.0, 8.0, 11.0, 17.0, 21.0, 23.0, 24.0, 33.0, 38.0, 42.0, 26.0, 33.0, 34.0, 40.0, 38.0, 41.0, 35.0, 44.0, 37.0, 45.0, 44.0, 42.0, 32.0, 32.0, 23.0, 33.0, 17.0, 23.0, 17.0, 22.0, 13.0, 7.0, 8.0, 4.0, 8.0, 7.0, 7.0, 3.0, 1.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.5078125, -5.33367919921875, -5.1595458984375, -4.98541259765625, -4.811279296875, -4.63714599609375, -4.4630126953125, -4.28887939453125, -4.11474609375, -3.94061279296875, -3.7664794921875, -3.59234619140625, -3.418212890625, -3.24407958984375, -3.0699462890625, -2.89581298828125, -2.7216796875, -2.54754638671875, -2.3734130859375, -2.19927978515625, -2.025146484375, -1.85101318359375, -1.6768798828125, -1.50274658203125, -1.32861328125, -1.15447998046875, -0.9803466796875, -0.80621337890625, -0.632080078125, -0.45794677734375, -0.2838134765625, -0.10968017578125, 0.064453125, 0.23858642578125, 0.4127197265625, 0.58685302734375, 0.760986328125, 0.93511962890625, 1.1092529296875, 1.28338623046875, 1.45751953125, 1.63165283203125, 1.8057861328125, 1.97991943359375, 2.154052734375, 2.32818603515625, 2.5023193359375, 2.67645263671875, 2.8505859375, 3.02471923828125, 3.1988525390625, 3.37298583984375, 3.547119140625, 3.72125244140625, 3.8953857421875, 4.06951904296875, 4.24365234375, 4.41778564453125, 4.5919189453125, 4.76605224609375, 4.940185546875, 5.11431884765625, 5.2884521484375, 5.46258544921875, 5.63671875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 2.0, 3.0, 5.0, 7.0, 15.0, 13.0, 22.0, 31.0, 48.0, 64.0, 113.0, 217.0, 343.0, 611.0, 1341.0, 3052.0, 7894.0, 23482.0, 80277.0, 286341.0, 431725.0, 149520.0, 41663.0, 13075.0, 4768.0, 1940.0, 865.0, 449.0, 252.0, 145.0, 83.0, 56.0, 39.0, 18.0, 13.0, 16.0, 14.0, 9.0, 6.0, 3.0, 5.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.24609375, -2.1741943359375, -2.102294921875, -2.0303955078125, -1.95849609375, -1.8865966796875, -1.814697265625, -1.7427978515625, -1.6708984375, -1.5989990234375, -1.527099609375, -1.4552001953125, -1.38330078125, -1.3114013671875, -1.239501953125, -1.1676025390625, -1.095703125, -1.0238037109375, -0.951904296875, -0.8800048828125, -0.80810546875, -0.7362060546875, -0.664306640625, -0.5924072265625, -0.5205078125, -0.4486083984375, -0.376708984375, -0.3048095703125, -0.23291015625, -0.1610107421875, -0.089111328125, -0.0172119140625, 0.0546875, 0.1265869140625, 0.198486328125, 0.2703857421875, 0.34228515625, 0.4141845703125, 0.486083984375, 0.5579833984375, 0.6298828125, 0.7017822265625, 0.773681640625, 0.8455810546875, 0.91748046875, 0.9893798828125, 1.061279296875, 1.1331787109375, 1.205078125, 1.2769775390625, 1.348876953125, 1.4207763671875, 1.49267578125, 1.5645751953125, 1.636474609375, 1.7083740234375, 1.7802734375, 1.8521728515625, 1.924072265625, 1.9959716796875, 2.06787109375, 2.1397705078125, 2.211669921875, 2.2835693359375, 2.35546875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 4.0, 5.0, 6.0, 8.0, 6.0, 12.0, 12.0, 23.0, 21.0, 41.0, 46.0, 65.0, 81.0, 97.0, 108.0, 118.0, 56.0, 51.0, 52.0, 33.0, 31.0, 31.0, 18.0, 17.0, 10.0, 9.0, 5.0, 5.0, 6.0, 6.0, 7.0, 2.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.00042629241943359375, -0.0004149340093135834, -0.000403575599193573, -0.0003922171890735626, -0.00038085877895355225, -0.00036950036883354187, -0.0003581419587135315, -0.0003467835485935211, -0.00033542513847351074, -0.00032406672835350037, -0.00031270831823349, -0.0003013499081134796, -0.00028999149799346924, -0.00027863308787345886, -0.0002672746777534485, -0.0002559162676334381, -0.00024455785751342773, -0.00023319944739341736, -0.00022184103727340698, -0.0002104826271533966, -0.00019912421703338623, -0.00018776580691337585, -0.00017640739679336548, -0.0001650489866733551, -0.00015369057655334473, -0.00014233216643333435, -0.00013097375631332397, -0.0001196153461933136, -0.00010825693607330322, -9.689852595329285e-05, -8.554011583328247e-05, -7.41817057132721e-05, -6.282329559326172e-05, -5.146488547325134e-05, -4.010647535324097e-05, -2.874806523323059e-05, -1.7389655113220215e-05, -6.031244993209839e-06, 5.327165126800537e-06, 1.6685575246810913e-05, 2.804398536682129e-05, 3.9402395486831665e-05, 5.076080560684204e-05, 6.211921572685242e-05, 7.347762584686279e-05, 8.483603596687317e-05, 9.619444608688354e-05, 0.00010755285620689392, 0.0001189112663269043, 0.00013026967644691467, 0.00014162808656692505, 0.00015298649668693542, 0.0001643449068069458, 0.00017570331692695618, 0.00018706172704696655, 0.00019842013716697693, 0.0002097785472869873, 0.00022113695740699768, 0.00023249536752700806, 0.00024385377764701843, 0.0002552121877670288, 0.0002665705978870392, 0.00027792900800704956, 0.00028928741812705994, 0.0003006458282470703]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 1.0, 4.0, 3.0, 6.0, 12.0, 14.0, 23.0, 23.0, 48.0, 64.0, 114.0, 194.0, 411.0, 825.0, 1877.0, 4817.0, 14341.0, 50950.0, 218170.0, 530001.0, 166793.0, 40841.0, 11773.0, 4086.0, 1601.0, 761.0, 333.0, 192.0, 93.0, 52.0, 43.0, 25.0, 26.0, 13.0, 5.0, 9.0, 5.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.5625, -2.478240966796875, -2.39398193359375, -2.309722900390625, -2.2254638671875, -2.141204833984375, -2.05694580078125, -1.972686767578125, -1.888427734375, -1.804168701171875, -1.71990966796875, -1.635650634765625, -1.5513916015625, -1.467132568359375, -1.38287353515625, -1.298614501953125, -1.21435546875, -1.130096435546875, -1.04583740234375, -0.961578369140625, -0.8773193359375, -0.793060302734375, -0.70880126953125, -0.624542236328125, -0.540283203125, -0.456024169921875, -0.37176513671875, -0.287506103515625, -0.2032470703125, -0.118988037109375, -0.03472900390625, 0.049530029296875, 0.1337890625, 0.218048095703125, 0.30230712890625, 0.386566162109375, 0.4708251953125, 0.555084228515625, 0.63934326171875, 0.723602294921875, 0.807861328125, 0.892120361328125, 0.97637939453125, 1.060638427734375, 1.1448974609375, 1.229156494140625, 1.31341552734375, 1.397674560546875, 1.48193359375, 1.566192626953125, 1.65045166015625, 1.734710693359375, 1.8189697265625, 1.903228759765625, 1.98748779296875, 2.071746826171875, 2.156005859375, 2.240264892578125, 2.32452392578125, 2.408782958984375, 2.4930419921875, 2.577301025390625, 2.66156005859375, 2.745819091796875, 2.830078125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 8.0, 5.0, 9.0, 3.0, 12.0, 13.0, 15.0, 30.0, 38.0, 38.0, 63.0, 79.0, 67.0, 100.0, 95.0, 83.0, 69.0, 59.0, 35.0, 46.0, 44.0, 22.0, 18.0, 12.0, 12.0, 4.0, 7.0, 4.0, 3.0, 4.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8603515625, -1.7845306396484375, -1.708709716796875, -1.6328887939453125, -1.55706787109375, -1.4812469482421875, -1.405426025390625, -1.3296051025390625, -1.2537841796875, -1.1779632568359375, -1.102142333984375, -1.0263214111328125, -0.95050048828125, -0.8746795654296875, -0.798858642578125, -0.7230377197265625, -0.647216796875, -0.5713958740234375, -0.495574951171875, -0.4197540283203125, -0.34393310546875, -0.2681121826171875, -0.192291259765625, -0.1164703369140625, -0.0406494140625, 0.0351715087890625, 0.110992431640625, 0.1868133544921875, 0.26263427734375, 0.3384552001953125, 0.414276123046875, 0.4900970458984375, 0.56591796875, 0.6417388916015625, 0.717559814453125, 0.7933807373046875, 0.86920166015625, 0.9450225830078125, 1.020843505859375, 1.0966644287109375, 1.1724853515625, 1.2483062744140625, 1.324127197265625, 1.3999481201171875, 1.47576904296875, 1.5515899658203125, 1.627410888671875, 1.7032318115234375, 1.779052734375, 1.8548736572265625, 1.930694580078125, 2.0065155029296875, 2.08233642578125, 2.1581573486328125, 2.233978271484375, 2.3097991943359375, 2.3856201171875, 2.4614410400390625, 2.537261962890625, 2.6130828857421875, 2.68890380859375, 2.7647247314453125, 2.840545654296875, 2.9163665771484375, 2.9921875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 10.0, 24.0, 40.0, 39.0, 97.0, 161.0, 202.0, 195.0, 99.0, 56.0, 34.0, 19.0, 9.0, 5.0, 5.0, 4.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.545568466186523, -21.862661361694336, -20.17975425720215, -18.49684715270996, -16.813940048217773, -15.131033897399902, -13.448126792907715, -11.765219688415527, -10.08231258392334, -8.399405479431152, -6.716498374938965, -5.0335917472839355, -3.350684642791748, -1.6677780151367188, 0.01512908935546875, 1.6980361938476562, 3.3809432983398438, 5.063850402832031, 6.746757507324219, 8.429664611816406, 10.112571716308594, 11.795477867126465, 13.478384971618652, 15.16129207611084, 16.844200134277344, 18.52710723876953, 20.21001434326172, 21.892921447753906, 23.575828552246094, 25.25873565673828, 26.94164276123047, 28.624549865722656, 30.307453155517578, 31.990360260009766, 33.67326736450195, 35.35617446899414, 37.03908157348633, 38.721988677978516, 40.4048957824707, 42.08780288696289, 43.77070999145508, 45.453617095947266, 47.13652420043945, 48.81943130493164, 50.50233840942383, 52.185245513916016, 53.8681526184082, 55.55105972290039, 57.23396301269531, 58.9168701171875, 60.59977722167969, 62.282684326171875, 63.96559143066406, 65.64849853515625, 67.33140563964844, 69.01431274414062, 70.69721984863281, 72.380126953125, 74.06303405761719, 75.74594116210938, 77.42884826660156, 79.11175537109375, 80.79466247558594, 82.47756958007812, 84.16047668457031]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 4.0, 5.0, 5.0, 3.0, 6.0, 9.0, 11.0, 11.0, 17.0, 19.0, 23.0, 23.0, 25.0, 19.0, 34.0, 32.0, 35.0, 46.0, 51.0, 51.0, 34.0, 43.0, 53.0, 62.0, 46.0, 36.0, 45.0, 30.0, 36.0, 28.0, 24.0, 25.0, 20.0, 18.0, 18.0, 20.0, 7.0, 7.0, 14.0, 4.0, 2.0, 4.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-34.64718246459961, -33.43120193481445, -32.2152214050293, -30.999238967895508, -29.78325843811035, -28.567277908325195, -27.351295471191406, -26.13531494140625, -24.919334411621094, -23.703353881835938, -22.48737335205078, -21.271390914916992, -20.055410385131836, -18.83942985534668, -17.62344741821289, -16.407466888427734, -15.191486358642578, -13.975505828857422, -12.75952434539795, -11.543542861938477, -10.32756233215332, -9.111581802368164, -7.895600318908691, -6.679618835449219, -5.4636383056640625, -4.247657299041748, -3.0316762924194336, -1.8156952857971191, -0.5997142791748047, 0.6162667274475098, 1.8322477340698242, 3.048229217529297, 4.264213562011719, 5.480194568634033, 6.696175575256348, 7.912156581878662, 9.128137588500977, 10.344118118286133, 11.560099601745605, 12.776081085205078, 13.992061614990234, 15.20804214477539, 16.424022674560547, 17.640005111694336, 18.855985641479492, 20.07196617126465, 21.287948608398438, 22.503929138183594, 23.71990966796875, 24.935890197753906, 26.151870727539062, 27.36785316467285, 28.583833694458008, 29.799814224243164, 31.015796661376953, 32.23177719116211, 33.447757720947266, 34.66373825073242, 35.87971878051758, 37.095699310302734, 38.311683654785156, 39.52766418457031, 40.74364471435547, 41.959625244140625, 43.17560577392578]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 1.0, 3.0, 5.0, 4.0, 12.0, 8.0, 10.0, 13.0, 17.0, 24.0, 50.0, 61.0, 75.0, 125.0, 217.0, 331.0, 578.0, 1009.0, 1878.0, 4160.0, 10891.0, 38706.0, 507142.0, 3526531.0, 74888.0, 16606.0, 5733.0, 2395.0, 1239.0, 614.0, 329.0, 232.0, 144.0, 88.0, 50.0, 32.0, 33.0, 15.0, 7.0, 8.0, 9.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-9.53125, -9.27490234375, -9.0185546875, -8.76220703125, -8.505859375, -8.24951171875, -7.9931640625, -7.73681640625, -7.48046875, -7.22412109375, -6.9677734375, -6.71142578125, -6.455078125, -6.19873046875, -5.9423828125, -5.68603515625, -5.4296875, -5.17333984375, -4.9169921875, -4.66064453125, -4.404296875, -4.14794921875, -3.8916015625, -3.63525390625, -3.37890625, -3.12255859375, -2.8662109375, -2.60986328125, -2.353515625, -2.09716796875, -1.8408203125, -1.58447265625, -1.328125, -1.07177734375, -0.8154296875, -0.55908203125, -0.302734375, -0.04638671875, 0.2099609375, 0.46630859375, 0.72265625, 0.97900390625, 1.2353515625, 1.49169921875, 1.748046875, 2.00439453125, 2.2607421875, 2.51708984375, 2.7734375, 3.02978515625, 3.2861328125, 3.54248046875, 3.798828125, 4.05517578125, 4.3115234375, 4.56787109375, 4.82421875, 5.08056640625, 5.3369140625, 5.59326171875, 5.849609375, 6.10595703125, 6.3623046875, 6.61865234375, 6.875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 2.0, 9.0, 1.0, 12.0, 16.0, 18.0, 21.0, 18.0, 35.0, 49.0, 39.0, 52.0, 61.0, 72.0, 65.0, 81.0, 68.0, 49.0, 49.0, 52.0, 57.0, 36.0, 33.0, 28.0, 23.0, 16.0, 10.0, 9.0, 6.0, 4.0, 5.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.35546875, -2.28863525390625, -2.2218017578125, -2.15496826171875, -2.088134765625, -2.02130126953125, -1.9544677734375, -1.88763427734375, -1.82080078125, -1.75396728515625, -1.6871337890625, -1.62030029296875, -1.553466796875, -1.48663330078125, -1.4197998046875, -1.35296630859375, -1.2861328125, -1.21929931640625, -1.1524658203125, -1.08563232421875, -1.018798828125, -0.95196533203125, -0.8851318359375, -0.81829833984375, -0.75146484375, -0.68463134765625, -0.6177978515625, -0.55096435546875, -0.484130859375, -0.41729736328125, -0.3504638671875, -0.28363037109375, -0.216796875, -0.14996337890625, -0.0831298828125, -0.01629638671875, 0.050537109375, 0.11737060546875, 0.1842041015625, 0.25103759765625, 0.31787109375, 0.38470458984375, 0.4515380859375, 0.51837158203125, 0.585205078125, 0.65203857421875, 0.7188720703125, 0.78570556640625, 0.8525390625, 0.91937255859375, 0.9862060546875, 1.05303955078125, 1.119873046875, 1.18670654296875, 1.2535400390625, 1.32037353515625, 1.38720703125, 1.45404052734375, 1.5208740234375, 1.58770751953125, 1.654541015625, 1.72137451171875, 1.7882080078125, 1.85504150390625, 1.921875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 5.0, 3.0, 8.0, 9.0, 15.0, 27.0, 26.0, 49.0, 70.0, 96.0, 150.0, 305.0, 516.0, 1242.0, 3550.0, 12083.0, 66014.0, 1867701.0, 2157029.0, 68074.0, 11731.0, 3268.0, 1169.0, 513.0, 273.0, 148.0, 61.0, 49.0, 33.0, 24.0, 16.0, 12.0, 3.0, 3.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.26171875, -7.0482177734375, -6.834716796875, -6.6212158203125, -6.40771484375, -6.1942138671875, -5.980712890625, -5.7672119140625, -5.5537109375, -5.3402099609375, -5.126708984375, -4.9132080078125, -4.69970703125, -4.4862060546875, -4.272705078125, -4.0592041015625, -3.845703125, -3.6322021484375, -3.418701171875, -3.2052001953125, -2.99169921875, -2.7781982421875, -2.564697265625, -2.3511962890625, -2.1376953125, -1.9241943359375, -1.710693359375, -1.4971923828125, -1.28369140625, -1.0701904296875, -0.856689453125, -0.6431884765625, -0.4296875, -0.2161865234375, -0.002685546875, 0.2108154296875, 0.42431640625, 0.6378173828125, 0.851318359375, 1.0648193359375, 1.2783203125, 1.4918212890625, 1.705322265625, 1.9188232421875, 2.13232421875, 2.3458251953125, 2.559326171875, 2.7728271484375, 2.986328125, 3.1998291015625, 3.413330078125, 3.6268310546875, 3.84033203125, 4.0538330078125, 4.267333984375, 4.4808349609375, 4.6943359375, 4.9078369140625, 5.121337890625, 5.3348388671875, 5.54833984375, 5.7618408203125, 5.975341796875, 6.1888427734375, 6.40234375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 1.0, 4.0, 6.0, 9.0, 11.0, 14.0, 26.0, 29.0, 62.0, 125.0, 296.0, 1000.0, 1730.0, 459.0, 156.0, 65.0, 39.0, 13.0, 11.0, 6.0, 7.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.986328125, -3.884674072265625, -3.78302001953125, -3.681365966796875, -3.5797119140625, -3.478057861328125, -3.37640380859375, -3.274749755859375, -3.173095703125, -3.071441650390625, -2.96978759765625, -2.868133544921875, -2.7664794921875, -2.664825439453125, -2.56317138671875, -2.461517333984375, -2.35986328125, -2.258209228515625, -2.15655517578125, -2.054901123046875, -1.9532470703125, -1.851593017578125, -1.74993896484375, -1.648284912109375, -1.546630859375, -1.444976806640625, -1.34332275390625, -1.241668701171875, -1.1400146484375, -1.038360595703125, -0.93670654296875, -0.835052490234375, -0.7333984375, -0.631744384765625, -0.53009033203125, -0.428436279296875, -0.3267822265625, -0.225128173828125, -0.12347412109375, -0.021820068359375, 0.079833984375, 0.181488037109375, 0.28314208984375, 0.384796142578125, 0.4864501953125, 0.588104248046875, 0.68975830078125, 0.791412353515625, 0.89306640625, 0.994720458984375, 1.09637451171875, 1.198028564453125, 1.2996826171875, 1.401336669921875, 1.50299072265625, 1.604644775390625, 1.706298828125, 1.807952880859375, 1.90960693359375, 2.011260986328125, 2.1129150390625, 2.214569091796875, 2.31622314453125, 2.417877197265625, 2.51953125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 7.0, 13.0, 11.0, 25.0, 28.0, 53.0, 80.0, 102.0, 108.0, 148.0, 134.0, 97.0, 69.0, 59.0, 27.0, 15.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-15.840119361877441, -15.464123725891113, -15.088129043579102, -14.712133407592773, -14.336138725280762, -13.960143089294434, -13.584148406982422, -13.208152770996094, -12.832158088684082, -12.456162452697754, -12.080167770385742, -11.704172134399414, -11.328177452087402, -10.952181816101074, -10.576187133789062, -10.200191497802734, -9.824195861816406, -9.448200225830078, -9.072205543518066, -8.696209907531738, -8.320215225219727, -7.944220066070557, -7.568224906921387, -7.192229270935059, -6.816234588623047, -6.440239429473877, -6.064244270324707, -5.688249111175537, -5.312253952026367, -4.936258792877197, -4.560263633728027, -4.184267997741699, -3.8082733154296875, -3.4322781562805176, -3.0562829971313477, -2.6802878379821777, -2.304292678833008, -1.9282974004745483, -1.5523021221160889, -1.176306962966919, -0.800311803817749, -0.4243166148662567, -0.048321425914764404, 0.3276737928390503, 0.7036689519882202, 1.0796641111373901, 1.4556593894958496, 1.8316545486450195, 2.2076497077941895, 2.5836448669433594, 2.9596400260925293, 3.335635185241699, 3.711630344390869, 4.087625503540039, 4.463621139526367, 4.839615821838379, 5.215611457824707, 5.591606616973877, 5.967601776123047, 6.343596935272217, 6.719592094421387, 7.095587253570557, 7.471582412719727, 7.847578048706055, 8.223572731018066]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 6.0, 3.0, 8.0, 7.0, 15.0, 18.0, 26.0, 30.0, 44.0, 58.0, 55.0, 56.0, 66.0, 64.0, 76.0, 69.0, 71.0, 70.0, 58.0, 48.0, 31.0, 32.0, 27.0, 25.0, 18.0, 5.0, 10.0, 6.0, 6.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.930217742919922, -9.551583290100098, -9.172948837280273, -8.794315338134766, -8.415680885314941, -8.037046432495117, -7.658412456512451, -7.279778480529785, -6.901144027709961, -6.522509574890137, -6.143875598907471, -5.765241622924805, -5.3866071701049805, -5.007972717285156, -4.62933874130249, -4.250704765319824, -3.8720703125, -3.493436098098755, -3.1148018836975098, -2.7361676692962646, -2.3575334548950195, -1.9788992404937744, -1.6002650260925293, -1.2216308116912842, -0.8429965972900391, -0.46436238288879395, -0.08572816848754883, 0.2929060459136963, 0.6715402603149414, 1.0501744747161865, 1.4288086891174316, 1.8074429035186768, 2.186077117919922, 2.564711332321167, 2.943345546722412, 3.3219797611236572, 3.7006139755249023, 4.079248428344727, 4.457882404327393, 4.836516380310059, 5.215150833129883, 5.593785285949707, 5.972419261932373, 6.351053237915039, 6.729687690734863, 7.1083221435546875, 7.4869561195373535, 7.8655900955200195, 8.244224548339844, 8.622859001159668, 9.001493453979492, 9.380126953125, 9.758761405944824, 10.137395858764648, 10.516029357910156, 10.89466381072998, 11.273298263549805, 11.651932716369629, 12.030567169189453, 12.409200668334961, 12.787835121154785, 13.16646957397461, 13.545103073120117, 13.923737525939941, 14.302371978759766]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 1.0, 7.0, 13.0, 8.0, 21.0, 26.0, 39.0, 55.0, 73.0, 127.0, 199.0, 260.0, 417.0, 625.0, 1104.0, 1968.0, 3774.0, 7562.0, 15938.0, 37399.0, 96100.0, 252980.0, 354030.0, 166116.0, 61603.0, 24817.0, 11085.0, 5343.0, 2860.0, 1509.0, 893.0, 534.0, 361.0, 235.0, 136.0, 103.0, 76.0, 47.0, 33.0, 16.0, 22.0, 12.0, 10.0, 9.0, 2.0, 2.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.453125, -5.27874755859375, -5.1043701171875, -4.92999267578125, -4.755615234375, -4.58123779296875, -4.4068603515625, -4.23248291015625, -4.05810546875, -3.88372802734375, -3.7093505859375, -3.53497314453125, -3.360595703125, -3.18621826171875, -3.0118408203125, -2.83746337890625, -2.6630859375, -2.48870849609375, -2.3143310546875, -2.13995361328125, -1.965576171875, -1.79119873046875, -1.6168212890625, -1.44244384765625, -1.26806640625, -1.09368896484375, -0.9193115234375, -0.74493408203125, -0.570556640625, -0.39617919921875, -0.2218017578125, -0.04742431640625, 0.126953125, 0.30133056640625, 0.4757080078125, 0.65008544921875, 0.824462890625, 0.99884033203125, 1.1732177734375, 1.34759521484375, 1.52197265625, 1.69635009765625, 1.8707275390625, 2.04510498046875, 2.219482421875, 2.39385986328125, 2.5682373046875, 2.74261474609375, 2.9169921875, 3.09136962890625, 3.2657470703125, 3.44012451171875, 3.614501953125, 3.78887939453125, 3.9632568359375, 4.13763427734375, 4.31201171875, 4.48638916015625, 4.6607666015625, 4.83514404296875, 5.009521484375, 5.18389892578125, 5.3582763671875, 5.53265380859375, 5.70703125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 3.0, 6.0, 6.0, 5.0, 15.0, 11.0, 16.0, 28.0, 23.0, 33.0, 35.0, 51.0, 51.0, 62.0, 65.0, 63.0, 72.0, 56.0, 45.0, 69.0, 54.0, 41.0, 38.0, 32.0, 34.0, 31.0, 10.0, 13.0, 8.0, 12.0, 5.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.2890625, -2.2258148193359375, -2.162567138671875, -2.0993194580078125, -2.03607177734375, -1.9728240966796875, -1.909576416015625, -1.8463287353515625, -1.7830810546875, -1.7198333740234375, -1.656585693359375, -1.5933380126953125, -1.53009033203125, -1.4668426513671875, -1.403594970703125, -1.3403472900390625, -1.277099609375, -1.2138519287109375, -1.150604248046875, -1.0873565673828125, -1.02410888671875, -0.9608612060546875, -0.897613525390625, -0.8343658447265625, -0.7711181640625, -0.7078704833984375, -0.644622802734375, -0.5813751220703125, -0.51812744140625, -0.4548797607421875, -0.391632080078125, -0.3283843994140625, -0.26513671875, -0.2018890380859375, -0.138641357421875, -0.0753936767578125, -0.01214599609375, 0.0511016845703125, 0.114349365234375, 0.1775970458984375, 0.2408447265625, 0.3040924072265625, 0.367340087890625, 0.4305877685546875, 0.49383544921875, 0.5570831298828125, 0.620330810546875, 0.6835784912109375, 0.746826171875, 0.8100738525390625, 0.873321533203125, 0.9365692138671875, 0.99981689453125, 1.0630645751953125, 1.126312255859375, 1.1895599365234375, 1.2528076171875, 1.3160552978515625, 1.379302978515625, 1.4425506591796875, 1.50579833984375, 1.5690460205078125, 1.632293701171875, 1.6955413818359375, 1.7587890625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 2.0, 9.0, 14.0, 14.0, 21.0, 24.0, 52.0, 69.0, 80.0, 122.0, 174.0, 235.0, 400.0, 606.0, 1035.0, 1870.0, 3605.0, 7631.0, 17562.0, 45713.0, 122110.0, 281510.0, 316204.0, 151916.0, 56993.0, 21868.0, 9302.0, 4154.0, 2124.0, 1113.0, 672.0, 417.0, 285.0, 184.0, 126.0, 105.0, 62.0, 49.0, 46.0, 24.0, 15.0, 8.0, 2.0, 9.0, 8.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0], "bins": [-4.22265625, -4.098876953125, -3.97509765625, -3.851318359375, -3.7275390625, -3.603759765625, -3.47998046875, -3.356201171875, -3.232421875, -3.108642578125, -2.98486328125, -2.861083984375, -2.7373046875, -2.613525390625, -2.48974609375, -2.365966796875, -2.2421875, -2.118408203125, -1.99462890625, -1.870849609375, -1.7470703125, -1.623291015625, -1.49951171875, -1.375732421875, -1.251953125, -1.128173828125, -1.00439453125, -0.880615234375, -0.7568359375, -0.633056640625, -0.50927734375, -0.385498046875, -0.26171875, -0.137939453125, -0.01416015625, 0.109619140625, 0.2333984375, 0.357177734375, 0.48095703125, 0.604736328125, 0.728515625, 0.852294921875, 0.97607421875, 1.099853515625, 1.2236328125, 1.347412109375, 1.47119140625, 1.594970703125, 1.71875, 1.842529296875, 1.96630859375, 2.090087890625, 2.2138671875, 2.337646484375, 2.46142578125, 2.585205078125, 2.708984375, 2.832763671875, 2.95654296875, 3.080322265625, 3.2041015625, 3.327880859375, 3.45166015625, 3.575439453125, 3.69921875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 6.0, 7.0, 7.0, 6.0, 10.0, 10.0, 12.0, 26.0, 31.0, 26.0, 29.0, 27.0, 29.0, 34.0, 31.0, 34.0, 47.0, 48.0, 47.0, 35.0, 40.0, 44.0, 41.0, 51.0, 34.0, 40.0, 35.0, 28.0, 28.0, 34.0, 25.0, 19.0, 9.0, 20.0, 12.0, 9.0, 7.0, 3.0, 8.0, 6.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.62890625, -5.43878173828125, -5.2486572265625, -5.05853271484375, -4.868408203125, -4.67828369140625, -4.4881591796875, -4.29803466796875, -4.10791015625, -3.91778564453125, -3.7276611328125, -3.53753662109375, -3.347412109375, -3.15728759765625, -2.9671630859375, -2.77703857421875, -2.5869140625, -2.39678955078125, -2.2066650390625, -2.01654052734375, -1.826416015625, -1.63629150390625, -1.4461669921875, -1.25604248046875, -1.06591796875, -0.87579345703125, -0.6856689453125, -0.49554443359375, -0.305419921875, -0.11529541015625, 0.0748291015625, 0.26495361328125, 0.455078125, 0.64520263671875, 0.8353271484375, 1.02545166015625, 1.215576171875, 1.40570068359375, 1.5958251953125, 1.78594970703125, 1.97607421875, 2.16619873046875, 2.3563232421875, 2.54644775390625, 2.736572265625, 2.92669677734375, 3.1168212890625, 3.30694580078125, 3.4970703125, 3.68719482421875, 3.8773193359375, 4.06744384765625, 4.257568359375, 4.44769287109375, 4.6378173828125, 4.82794189453125, 5.01806640625, 5.20819091796875, 5.3983154296875, 5.58843994140625, 5.778564453125, 5.96868896484375, 6.1588134765625, 6.34893798828125, 6.5390625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 7.0, 7.0, 18.0, 34.0, 43.0, 73.0, 156.0, 301.0, 691.0, 1509.0, 3927.0, 11632.0, 38310.0, 168405.0, 527110.0, 224924.0, 49225.0, 13972.0, 4859.0, 1833.0, 774.0, 363.0, 181.0, 94.0, 47.0, 23.0, 15.0, 7.0, 2.0, 6.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0], "bins": [-3.3203125, -3.2385101318359375, -3.156707763671875, -3.0749053955078125, -2.99310302734375, -2.9113006591796875, -2.829498291015625, -2.7476959228515625, -2.6658935546875, -2.5840911865234375, -2.502288818359375, -2.4204864501953125, -2.33868408203125, -2.2568817138671875, -2.175079345703125, -2.0932769775390625, -2.011474609375, -1.9296722412109375, -1.847869873046875, -1.7660675048828125, -1.68426513671875, -1.6024627685546875, -1.520660400390625, -1.4388580322265625, -1.3570556640625, -1.2752532958984375, -1.193450927734375, -1.1116485595703125, -1.02984619140625, -0.9480438232421875, -0.866241455078125, -0.7844390869140625, -0.70263671875, -0.6208343505859375, -0.539031982421875, -0.4572296142578125, -0.37542724609375, -0.2936248779296875, -0.211822509765625, -0.1300201416015625, -0.0482177734375, 0.0335845947265625, 0.115386962890625, 0.1971893310546875, 0.27899169921875, 0.3607940673828125, 0.442596435546875, 0.5243988037109375, 0.606201171875, 0.6880035400390625, 0.769805908203125, 0.8516082763671875, 0.93341064453125, 1.0152130126953125, 1.097015380859375, 1.1788177490234375, 1.2606201171875, 1.3424224853515625, 1.424224853515625, 1.5060272216796875, 1.58782958984375, 1.6696319580078125, 1.751434326171875, 1.8332366943359375, 1.9150390625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 4.0, 1.0, 3.0, 5.0, 11.0, 11.0, 11.0, 14.0, 16.0, 15.0, 27.0, 28.0, 37.0, 58.0, 60.0, 80.0, 76.0, 108.0, 100.0, 75.0, 51.0, 33.0, 24.0, 31.0, 26.0, 23.0, 19.0, 21.0, 11.0, 11.0, 5.0, 5.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00036144256591796875, -0.00034914538264274597, -0.0003368481993675232, -0.0003245510160923004, -0.00031225383281707764, -0.00029995664954185486, -0.0002876594662666321, -0.0002753622829914093, -0.0002630650997161865, -0.00025076791644096375, -0.00023847073316574097, -0.0002261735498905182, -0.0002138763666152954, -0.00020157918334007263, -0.00018928200006484985, -0.00017698481678962708, -0.0001646876335144043, -0.00015239045023918152, -0.00014009326696395874, -0.00012779608368873596, -0.00011549890041351318, -0.0001032017171382904, -9.090453386306763e-05, -7.860735058784485e-05, -6.631016731262207e-05, -5.401298403739929e-05, -4.1715800762176514e-05, -2.9418617486953735e-05, -1.7121434211730957e-05, -4.824250936508179e-06, 7.4729323387146e-06, 1.9770115613937378e-05, 3.2067298889160156e-05, 4.4364482164382935e-05, 5.666166543960571e-05, 6.895884871482849e-05, 8.125603199005127e-05, 9.355321526527405e-05, 0.00010585039854049683, 0.0001181475818157196, 0.00013044476509094238, 0.00014274194836616516, 0.00015503913164138794, 0.00016733631491661072, 0.0001796334981918335, 0.00019193068146705627, 0.00020422786474227905, 0.00021652504801750183, 0.0002288222312927246, 0.0002411194145679474, 0.00025341659784317017, 0.00026571378111839294, 0.0002780109643936157, 0.0002903081476688385, 0.0003026053309440613, 0.00031490251421928406, 0.00032719969749450684, 0.0003394968807697296, 0.0003517940640449524, 0.00036409124732017517, 0.00037638843059539795, 0.00038868561387062073, 0.0004009827971458435, 0.0004132799804210663, 0.00042557716369628906]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 7.0, 5.0, 4.0, 8.0, 9.0, 16.0, 31.0, 35.0, 83.0, 105.0, 164.0, 282.0, 493.0, 941.0, 1901.0, 4013.0, 9735.0, 25404.0, 86266.0, 411044.0, 386180.0, 80480.0, 24288.0, 9276.0, 3874.0, 1783.0, 906.0, 471.0, 291.0, 176.0, 84.0, 67.0, 37.0, 25.0, 27.0, 18.0, 9.0, 5.0, 6.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.673828125, -2.592742919921875, -2.51165771484375, -2.430572509765625, -2.3494873046875, -2.268402099609375, -2.18731689453125, -2.106231689453125, -2.025146484375, -1.944061279296875, -1.86297607421875, -1.781890869140625, -1.7008056640625, -1.619720458984375, -1.53863525390625, -1.457550048828125, -1.37646484375, -1.295379638671875, -1.21429443359375, -1.133209228515625, -1.0521240234375, -0.971038818359375, -0.88995361328125, -0.808868408203125, -0.727783203125, -0.646697998046875, -0.56561279296875, -0.484527587890625, -0.4034423828125, -0.322357177734375, -0.24127197265625, -0.160186767578125, -0.0791015625, 0.001983642578125, 0.08306884765625, 0.164154052734375, 0.2452392578125, 0.326324462890625, 0.40740966796875, 0.488494873046875, 0.569580078125, 0.650665283203125, 0.73175048828125, 0.812835693359375, 0.8939208984375, 0.975006103515625, 1.05609130859375, 1.137176513671875, 1.21826171875, 1.299346923828125, 1.38043212890625, 1.461517333984375, 1.5426025390625, 1.623687744140625, 1.70477294921875, 1.785858154296875, 1.866943359375, 1.948028564453125, 2.02911376953125, 2.110198974609375, 2.1912841796875, 2.272369384765625, 2.35345458984375, 2.434539794921875, 2.515625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 7.0, 7.0, 8.0, 8.0, 11.0, 16.0, 18.0, 25.0, 41.0, 53.0, 59.0, 81.0, 119.0, 98.0, 109.0, 82.0, 59.0, 55.0, 36.0, 20.0, 16.0, 19.0, 7.0, 13.0, 11.0, 4.0, 6.0, 3.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-2.650390625, -2.5714111328125, -2.492431640625, -2.4134521484375, -2.33447265625, -2.2554931640625, -2.176513671875, -2.0975341796875, -2.0185546875, -1.9395751953125, -1.860595703125, -1.7816162109375, -1.70263671875, -1.6236572265625, -1.544677734375, -1.4656982421875, -1.38671875, -1.3077392578125, -1.228759765625, -1.1497802734375, -1.07080078125, -0.9918212890625, -0.912841796875, -0.8338623046875, -0.7548828125, -0.6759033203125, -0.596923828125, -0.5179443359375, -0.43896484375, -0.3599853515625, -0.281005859375, -0.2020263671875, -0.123046875, -0.0440673828125, 0.034912109375, 0.1138916015625, 0.19287109375, 0.2718505859375, 0.350830078125, 0.4298095703125, 0.5087890625, 0.5877685546875, 0.666748046875, 0.7457275390625, 0.82470703125, 0.9036865234375, 0.982666015625, 1.0616455078125, 1.140625, 1.2196044921875, 1.298583984375, 1.3775634765625, 1.45654296875, 1.5355224609375, 1.614501953125, 1.6934814453125, 1.7724609375, 1.8514404296875, 1.930419921875, 2.0093994140625, 2.08837890625, 2.1673583984375, 2.246337890625, 2.3253173828125, 2.404296875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 4.0, 4.0, 9.0, 21.0, 32.0, 69.0, 93.0, 140.0, 162.0, 157.0, 122.0, 72.0, 48.0, 28.0, 17.0, 11.0, 10.0, 7.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.831026077270508, -24.46232795715332, -23.0936279296875, -21.724929809570312, -20.356229782104492, -18.987531661987305, -17.618831634521484, -16.250133514404297, -14.881434440612793, -13.512735366821289, -12.144036293029785, -10.775337219238281, -9.406639099121094, -8.037939071655273, -6.669240951538086, -5.300541877746582, -3.931842803955078, -2.563143730163574, -1.1944448947906494, 0.1742539405822754, 1.5429530143737793, 2.911652088165283, 4.280350685119629, 5.649049758911133, 7.017748832702637, 8.38644790649414, 9.755146980285645, 11.123846054077148, 12.492544174194336, 13.861244201660156, 15.229942321777344, 16.59864044189453, 17.96733856201172, 19.336036682128906, 20.704736709594727, 22.073434829711914, 23.442134857177734, 24.810832977294922, 26.17953109741211, 27.54823112487793, 28.91693115234375, 30.285629272460938, 31.654329299926758, 33.02302932739258, 34.391727447509766, 35.76042556762695, 37.12912368774414, 38.497825622558594, 39.86652374267578, 41.23522186279297, 42.603919982910156, 43.97262191772461, 45.3413200378418, 46.710018157958984, 48.07871627807617, 49.447418212890625, 50.81611251831055, 52.184810638427734, 53.55350875854492, 54.922210693359375, 56.29090881347656, 57.65960693359375, 59.02830505371094, 60.397003173828125, 61.76570510864258]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 1.0, 14.0, 9.0, 8.0, 17.0, 20.0, 19.0, 14.0, 33.0, 26.0, 27.0, 33.0, 32.0, 35.0, 46.0, 44.0, 40.0, 43.0, 53.0, 48.0, 45.0, 47.0, 43.0, 43.0, 25.0, 31.0, 21.0, 24.0, 25.0, 24.0, 13.0, 20.0, 18.0, 16.0, 8.0, 11.0, 6.0, 5.0, 3.0, 2.0, 2.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-32.673675537109375, -31.614837646484375, -30.555999755859375, -29.497161865234375, -28.438323974609375, -27.379486083984375, -26.320650100708008, -25.261812210083008, -24.202974319458008, -23.144136428833008, -22.085298538208008, -21.026460647583008, -19.96762466430664, -18.90878677368164, -17.84994888305664, -16.79111099243164, -15.73227310180664, -14.67343521118164, -13.61459732055664, -12.555760383605957, -11.496922492980957, -10.438084602355957, -9.379247665405273, -8.320409774780273, -7.261571884155273, -6.202733993530273, -5.143896579742432, -4.08505916595459, -3.02622127532959, -1.9673833847045898, -0.908545970916748, 0.15029144287109375, 1.2091331481933594, 2.2679708003997803, 3.326808452606201, 4.385645866394043, 5.444483757019043, 6.503321647644043, 7.562159061431885, 8.620996475219727, 9.679834365844727, 10.738672256469727, 11.797510147094727, 12.85634708404541, 13.91518497467041, 14.97402286529541, 16.032859802246094, 17.091697692871094, 18.150535583496094, 19.209373474121094, 20.268211364746094, 21.327049255371094, 22.385887145996094, 23.444725036621094, 24.50356101989746, 25.56239891052246, 26.62123680114746, 27.68007469177246, 28.73891258239746, 29.79775047302246, 30.856586456298828, 31.915424346923828, 32.97426223754883, 34.03310012817383, 35.09193801879883]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 7.0, 1.0, 3.0, 16.0, 8.0, 7.0, 22.0, 28.0, 41.0, 65.0, 104.0, 175.0, 250.0, 418.0, 721.0, 1378.0, 2966.0, 7252.0, 22370.0, 117006.0, 3573442.0, 408697.0, 40813.0, 10976.0, 3966.0, 1653.0, 806.0, 435.0, 263.0, 164.0, 79.0, 44.0, 31.0, 24.0, 23.0, 11.0, 7.0, 6.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.296875, -8.04327392578125, -7.7896728515625, -7.53607177734375, -7.282470703125, -7.02886962890625, -6.7752685546875, -6.52166748046875, -6.26806640625, -6.01446533203125, -5.7608642578125, -5.50726318359375, -5.253662109375, -5.00006103515625, -4.7464599609375, -4.49285888671875, -4.2392578125, -3.98565673828125, -3.7320556640625, -3.47845458984375, -3.224853515625, -2.97125244140625, -2.7176513671875, -2.46405029296875, -2.21044921875, -1.95684814453125, -1.7032470703125, -1.44964599609375, -1.196044921875, -0.94244384765625, -0.6888427734375, -0.43524169921875, -0.181640625, 0.07196044921875, 0.3255615234375, 0.57916259765625, 0.832763671875, 1.08636474609375, 1.3399658203125, 1.59356689453125, 1.84716796875, 2.10076904296875, 2.3543701171875, 2.60797119140625, 2.861572265625, 3.11517333984375, 3.3687744140625, 3.62237548828125, 3.8759765625, 4.12957763671875, 4.3831787109375, 4.63677978515625, 4.890380859375, 5.14398193359375, 5.3975830078125, 5.65118408203125, 5.90478515625, 6.15838623046875, 6.4119873046875, 6.66558837890625, 6.919189453125, 7.17279052734375, 7.4263916015625, 7.67999267578125, 7.93359375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 4.0, 3.0, 5.0, 9.0, 6.0, 17.0, 18.0, 17.0, 31.0, 28.0, 41.0, 41.0, 52.0, 60.0, 59.0, 59.0, 63.0, 77.0, 53.0, 49.0, 58.0, 49.0, 45.0, 31.0, 38.0, 20.0, 20.0, 14.0, 12.0, 3.0, 6.0, 7.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.275390625, -2.20745849609375, -2.1395263671875, -2.07159423828125, -2.003662109375, -1.93572998046875, -1.8677978515625, -1.79986572265625, -1.73193359375, -1.66400146484375, -1.5960693359375, -1.52813720703125, -1.460205078125, -1.39227294921875, -1.3243408203125, -1.25640869140625, -1.1884765625, -1.12054443359375, -1.0526123046875, -0.98468017578125, -0.916748046875, -0.84881591796875, -0.7808837890625, -0.71295166015625, -0.64501953125, -0.57708740234375, -0.5091552734375, -0.44122314453125, -0.373291015625, -0.30535888671875, -0.2374267578125, -0.16949462890625, -0.1015625, -0.03363037109375, 0.0343017578125, 0.10223388671875, 0.170166015625, 0.23809814453125, 0.3060302734375, 0.37396240234375, 0.44189453125, 0.50982666015625, 0.5777587890625, 0.64569091796875, 0.713623046875, 0.78155517578125, 0.8494873046875, 0.91741943359375, 0.9853515625, 1.05328369140625, 1.1212158203125, 1.18914794921875, 1.257080078125, 1.32501220703125, 1.3929443359375, 1.46087646484375, 1.52880859375, 1.59674072265625, 1.6646728515625, 1.73260498046875, 1.800537109375, 1.86846923828125, 1.9364013671875, 2.00433349609375, 2.072265625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 13.0, 11.0, 14.0, 16.0, 33.0, 60.0, 102.0, 116.0, 224.0, 392.0, 804.0, 1883.0, 5342.0, 21015.0, 145889.0, 3416514.0, 545648.0, 42261.0, 9000.0, 2742.0, 1048.0, 503.0, 226.0, 147.0, 118.0, 64.0, 33.0, 17.0, 9.0, 10.0, 9.0, 4.0, 5.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-6.69140625, -6.48040771484375, -6.2694091796875, -6.05841064453125, -5.847412109375, -5.63641357421875, -5.4254150390625, -5.21441650390625, -5.00341796875, -4.79241943359375, -4.5814208984375, -4.37042236328125, -4.159423828125, -3.94842529296875, -3.7374267578125, -3.52642822265625, -3.3154296875, -3.10443115234375, -2.8934326171875, -2.68243408203125, -2.471435546875, -2.26043701171875, -2.0494384765625, -1.83843994140625, -1.62744140625, -1.41644287109375, -1.2054443359375, -0.99444580078125, -0.783447265625, -0.57244873046875, -0.3614501953125, -0.15045166015625, 0.060546875, 0.27154541015625, 0.4825439453125, 0.69354248046875, 0.904541015625, 1.11553955078125, 1.3265380859375, 1.53753662109375, 1.74853515625, 1.95953369140625, 2.1705322265625, 2.38153076171875, 2.592529296875, 2.80352783203125, 3.0145263671875, 3.22552490234375, 3.4365234375, 3.64752197265625, 3.8585205078125, 4.06951904296875, 4.280517578125, 4.49151611328125, 4.7025146484375, 4.91351318359375, 5.12451171875, 5.33551025390625, 5.5465087890625, 5.75750732421875, 5.968505859375, 6.17950439453125, 6.3905029296875, 6.60150146484375, 6.8125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 4.0, 3.0, 3.0, 11.0, 8.0, 22.0, 20.0, 23.0, 63.0, 127.0, 348.0, 1320.0, 1474.0, 353.0, 151.0, 66.0, 28.0, 22.0, 16.0, 7.0, 5.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7890625, -4.656097412109375, -4.52313232421875, -4.390167236328125, -4.2572021484375, -4.124237060546875, -3.99127197265625, -3.858306884765625, -3.725341796875, -3.592376708984375, -3.45941162109375, -3.326446533203125, -3.1934814453125, -3.060516357421875, -2.92755126953125, -2.794586181640625, -2.66162109375, -2.528656005859375, -2.39569091796875, -2.262725830078125, -2.1297607421875, -1.996795654296875, -1.86383056640625, -1.730865478515625, -1.597900390625, -1.464935302734375, -1.33197021484375, -1.199005126953125, -1.0660400390625, -0.933074951171875, -0.80010986328125, -0.667144775390625, -0.5341796875, -0.401214599609375, -0.26824951171875, -0.135284423828125, -0.0023193359375, 0.130645751953125, 0.26361083984375, 0.396575927734375, 0.529541015625, 0.662506103515625, 0.79547119140625, 0.928436279296875, 1.0614013671875, 1.194366455078125, 1.32733154296875, 1.460296630859375, 1.59326171875, 1.726226806640625, 1.85919189453125, 1.992156982421875, 2.1251220703125, 2.258087158203125, 2.39105224609375, 2.524017333984375, 2.656982421875, 2.789947509765625, 2.92291259765625, 3.055877685546875, 3.1888427734375, 3.321807861328125, 3.45477294921875, 3.587738037109375, 3.720703125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 11.0, 21.0, 58.0, 132.0, 282.0, 278.0, 145.0, 54.0, 18.0, 7.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.2313232421875, -41.24857711791992, -40.265830993652344, -39.283084869384766, -38.30033493041992, -37.317588806152344, -36.334842681884766, -35.35209655761719, -34.36935043334961, -33.38660430908203, -32.40385818481445, -31.421110153198242, -30.438364028930664, -29.455615997314453, -28.472869873046875, -27.490123748779297, -26.50737762451172, -25.52463150024414, -24.54188346862793, -23.55913734436035, -22.576391220092773, -21.593643188476562, -20.610897064208984, -19.628150939941406, -18.645402908325195, -17.662656784057617, -16.679908752441406, -15.697162628173828, -14.71441650390625, -13.731669425964355, -12.748922348022461, -11.766176223754883, -10.783430099487305, -9.80068302154541, -8.817936897277832, -7.8351898193359375, -6.852443695068359, -5.869696617126465, -4.8869500160217285, -3.904203414916992, -2.921456813812256, -1.9387102127075195, -0.9559634923934937, 0.026783227920532227, 1.0095298290252686, 1.992276668548584, 2.9750232696533203, 3.9577698707580566, 4.940516471862793, 5.923263072967529, 6.906009674072266, 7.88875675201416, 8.871502876281738, 9.854249954223633, 10.836996078491211, 11.819743156433105, 12.802490234375, 13.785237312316895, 14.767983436584473, 15.750730514526367, 16.733476638793945, 17.716224670410156, 18.698970794677734, 19.681716918945312, 20.66446304321289]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 11.0, 12.0, 12.0, 21.0, 26.0, 32.0, 36.0, 48.0, 46.0, 61.0, 56.0, 51.0, 72.0, 65.0, 67.0, 58.0, 52.0, 44.0, 42.0, 38.0, 45.0, 24.0, 28.0, 16.0, 12.0, 5.0, 4.0, 3.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.574504852294922, -13.1665678024292, -12.758630752563477, -12.350693702697754, -11.942756652832031, -11.534820556640625, -11.126882553100586, -10.71894645690918, -10.311009407043457, -9.903072357177734, -9.495135307312012, -9.087198257446289, -8.679261207580566, -8.271324157714844, -7.863387584686279, -7.455451011657715, -7.047513484954834, -6.639576435089111, -6.231639385223389, -5.823702812194824, -5.415765762329102, -5.007828712463379, -4.599891662597656, -4.191954612731934, -3.78401780128479, -3.3760807514190674, -2.968143939971924, -2.560206890106201, -2.1522698402404785, -1.744333028793335, -1.3363959789276123, -0.9284591674804688, -0.5205221176147461, -0.1125851571559906, 0.2953518033027649, 0.7032887935638428, 1.1112257242202759, 1.519162654876709, 1.9270997047424316, 2.335036516189575, 2.742973566055298, 3.1509106159210205, 3.558847427368164, 3.9667844772338867, 4.374721527099609, 4.782658576965332, 5.190595626831055, 5.598532199859619, 6.006469249725342, 6.4144062995910645, 6.822343349456787, 7.230279922485352, 7.638216972351074, 8.046154022216797, 8.45409107208252, 8.862028121948242, 9.269965171813965, 9.677902221679688, 10.08583927154541, 10.493776321411133, 10.901713371276855, 11.309650421142578, 11.717586517333984, 12.125523567199707, 12.53346061706543]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 2.0, 3.0, 12.0, 18.0, 17.0, 22.0, 30.0, 41.0, 77.0, 121.0, 206.0, 315.0, 520.0, 916.0, 1765.0, 3649.0, 8391.0, 22328.0, 66893.0, 232637.0, 463233.0, 166488.0, 50314.0, 17284.0, 6730.0, 3065.0, 1456.0, 810.0, 465.0, 260.0, 158.0, 102.0, 62.0, 48.0, 40.0, 23.0, 18.0, 9.0, 5.0, 8.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0], "bins": [-7.47265625, -7.272705078125, -7.07275390625, -6.872802734375, -6.6728515625, -6.472900390625, -6.27294921875, -6.072998046875, -5.873046875, -5.673095703125, -5.47314453125, -5.273193359375, -5.0732421875, -4.873291015625, -4.67333984375, -4.473388671875, -4.2734375, -4.073486328125, -3.87353515625, -3.673583984375, -3.4736328125, -3.273681640625, -3.07373046875, -2.873779296875, -2.673828125, -2.473876953125, -2.27392578125, -2.073974609375, -1.8740234375, -1.674072265625, -1.47412109375, -1.274169921875, -1.07421875, -0.874267578125, -0.67431640625, -0.474365234375, -0.2744140625, -0.074462890625, 0.12548828125, 0.325439453125, 0.525390625, 0.725341796875, 0.92529296875, 1.125244140625, 1.3251953125, 1.525146484375, 1.72509765625, 1.925048828125, 2.125, 2.324951171875, 2.52490234375, 2.724853515625, 2.9248046875, 3.124755859375, 3.32470703125, 3.524658203125, 3.724609375, 3.924560546875, 4.12451171875, 4.324462890625, 4.5244140625, 4.724365234375, 4.92431640625, 5.124267578125, 5.32421875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 6.0, 6.0, 11.0, 10.0, 15.0, 17.0, 23.0, 33.0, 26.0, 43.0, 45.0, 66.0, 48.0, 51.0, 68.0, 64.0, 66.0, 61.0, 40.0, 55.0, 41.0, 42.0, 43.0, 33.0, 25.0, 10.0, 18.0, 5.0, 4.0, 8.0, 8.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.37109375, -2.305511474609375, -2.23992919921875, -2.174346923828125, -2.1087646484375, -2.043182373046875, -1.97760009765625, -1.912017822265625, -1.846435546875, -1.780853271484375, -1.71527099609375, -1.649688720703125, -1.5841064453125, -1.518524169921875, -1.45294189453125, -1.387359619140625, -1.32177734375, -1.256195068359375, -1.19061279296875, -1.125030517578125, -1.0594482421875, -0.993865966796875, -0.92828369140625, -0.862701416015625, -0.797119140625, -0.731536865234375, -0.66595458984375, -0.600372314453125, -0.5347900390625, -0.469207763671875, -0.40362548828125, -0.338043212890625, -0.2724609375, -0.206878662109375, -0.14129638671875, -0.075714111328125, -0.0101318359375, 0.055450439453125, 0.12103271484375, 0.186614990234375, 0.252197265625, 0.317779541015625, 0.38336181640625, 0.448944091796875, 0.5145263671875, 0.580108642578125, 0.64569091796875, 0.711273193359375, 0.77685546875, 0.842437744140625, 0.90802001953125, 0.973602294921875, 1.0391845703125, 1.104766845703125, 1.17034912109375, 1.235931396484375, 1.301513671875, 1.367095947265625, 1.43267822265625, 1.498260498046875, 1.5638427734375, 1.629425048828125, 1.69500732421875, 1.760589599609375, 1.826171875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 5.0, 5.0, 5.0, 3.0, 7.0, 18.0, 15.0, 24.0, 26.0, 40.0, 66.0, 89.0, 144.0, 213.0, 353.0, 563.0, 946.0, 1825.0, 4139.0, 9964.0, 28068.0, 87995.0, 301775.0, 412486.0, 134369.0, 40561.0, 14036.0, 5520.0, 2314.0, 1191.0, 665.0, 368.0, 248.0, 165.0, 123.0, 87.0, 44.0, 29.0, 24.0, 19.0, 11.0, 5.0, 5.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.58984375, -5.430908203125, -5.27197265625, -5.113037109375, -4.9541015625, -4.795166015625, -4.63623046875, -4.477294921875, -4.318359375, -4.159423828125, -4.00048828125, -3.841552734375, -3.6826171875, -3.523681640625, -3.36474609375, -3.205810546875, -3.046875, -2.887939453125, -2.72900390625, -2.570068359375, -2.4111328125, -2.252197265625, -2.09326171875, -1.934326171875, -1.775390625, -1.616455078125, -1.45751953125, -1.298583984375, -1.1396484375, -0.980712890625, -0.82177734375, -0.662841796875, -0.50390625, -0.344970703125, -0.18603515625, -0.027099609375, 0.1318359375, 0.290771484375, 0.44970703125, 0.608642578125, 0.767578125, 0.926513671875, 1.08544921875, 1.244384765625, 1.4033203125, 1.562255859375, 1.72119140625, 1.880126953125, 2.0390625, 2.197998046875, 2.35693359375, 2.515869140625, 2.6748046875, 2.833740234375, 2.99267578125, 3.151611328125, 3.310546875, 3.469482421875, 3.62841796875, 3.787353515625, 3.9462890625, 4.105224609375, 4.26416015625, 4.423095703125, 4.58203125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 4.0, 8.0, 5.0, 9.0, 12.0, 15.0, 15.0, 13.0, 29.0, 24.0, 24.0, 33.0, 39.0, 43.0, 28.0, 53.0, 57.0, 59.0, 51.0, 68.0, 54.0, 59.0, 43.0, 35.0, 29.0, 30.0, 31.0, 28.0, 21.0, 19.0, 15.0, 13.0, 8.0, 6.0, 7.0, 5.0, 7.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.125, -8.89300537109375, -8.6610107421875, -8.42901611328125, -8.197021484375, -7.96502685546875, -7.7330322265625, -7.50103759765625, -7.26904296875, -7.03704833984375, -6.8050537109375, -6.57305908203125, -6.341064453125, -6.10906982421875, -5.8770751953125, -5.64508056640625, -5.4130859375, -5.18109130859375, -4.9490966796875, -4.71710205078125, -4.485107421875, -4.25311279296875, -4.0211181640625, -3.78912353515625, -3.55712890625, -3.32513427734375, -3.0931396484375, -2.86114501953125, -2.629150390625, -2.39715576171875, -2.1651611328125, -1.93316650390625, -1.701171875, -1.46917724609375, -1.2371826171875, -1.00518798828125, -0.773193359375, -0.54119873046875, -0.3092041015625, -0.07720947265625, 0.15478515625, 0.38677978515625, 0.6187744140625, 0.85076904296875, 1.082763671875, 1.31475830078125, 1.5467529296875, 1.77874755859375, 2.0107421875, 2.24273681640625, 2.4747314453125, 2.70672607421875, 2.938720703125, 3.17071533203125, 3.4027099609375, 3.63470458984375, 3.86669921875, 4.09869384765625, 4.3306884765625, 4.56268310546875, 4.794677734375, 5.02667236328125, 5.2586669921875, 5.49066162109375, 5.72265625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 10.0, 6.0, 16.0, 34.0, 77.0, 191.0, 741.0, 4570.0, 60069.0, 867809.0, 106629.0, 7075.0, 943.0, 241.0, 79.0, 46.0, 11.0, 7.0, 3.0, 6.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.45703125, -6.28057861328125, -6.1041259765625, -5.92767333984375, -5.751220703125, -5.57476806640625, -5.3983154296875, -5.22186279296875, -5.04541015625, -4.86895751953125, -4.6925048828125, -4.51605224609375, -4.339599609375, -4.16314697265625, -3.9866943359375, -3.81024169921875, -3.6337890625, -3.45733642578125, -3.2808837890625, -3.10443115234375, -2.927978515625, -2.75152587890625, -2.5750732421875, -2.39862060546875, -2.22216796875, -2.04571533203125, -1.8692626953125, -1.69281005859375, -1.516357421875, -1.33990478515625, -1.1634521484375, -0.98699951171875, -0.810546875, -0.63409423828125, -0.4576416015625, -0.28118896484375, -0.104736328125, 0.07171630859375, 0.2481689453125, 0.42462158203125, 0.60107421875, 0.77752685546875, 0.9539794921875, 1.13043212890625, 1.306884765625, 1.48333740234375, 1.6597900390625, 1.83624267578125, 2.0126953125, 2.18914794921875, 2.3656005859375, 2.54205322265625, 2.718505859375, 2.89495849609375, 3.0714111328125, 3.24786376953125, 3.42431640625, 3.60076904296875, 3.7772216796875, 3.95367431640625, 4.130126953125, 4.30657958984375, 4.4830322265625, 4.65948486328125, 4.8359375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 1.0, 4.0, 6.0, 12.0, 9.0, 17.0, 24.0, 24.0, 53.0, 118.0, 267.0, 238.0, 111.0, 43.0, 31.0, 18.0, 14.0, 2.0, 3.0, 5.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0012483596801757812, -0.0012205541133880615, -0.0011927485466003418, -0.001164942979812622, -0.0011371374130249023, -0.0011093318462371826, -0.0010815262794494629, -0.0010537207126617432, -0.0010259151458740234, -0.0009981095790863037, -0.000970304012298584, -0.0009424984455108643, -0.0009146928787231445, -0.0008868873119354248, -0.0008590817451477051, -0.0008312761783599854, -0.0008034706115722656, -0.0007756650447845459, -0.0007478594779968262, -0.0007200539112091064, -0.0006922483444213867, -0.000664442777633667, -0.0006366372108459473, -0.0006088316440582275, -0.0005810260772705078, -0.0005532205104827881, -0.0005254149436950684, -0.0004976093769073486, -0.0004698038101196289, -0.0004419982433319092, -0.00041419267654418945, -0.0003863871097564697, -0.00035858154296875, -0.0003307759761810303, -0.00030297040939331055, -0.0002751648426055908, -0.0002473592758178711, -0.00021955370903015137, -0.00019174814224243164, -0.00016394257545471191, -0.0001361370086669922, -0.00010833144187927246, -8.052587509155273e-05, -5.272030830383301e-05, -2.491474151611328e-05, 2.8908252716064453e-06, 3.069639205932617e-05, 5.85019588470459e-05, 8.630752563476562e-05, 0.00011411309242248535, 0.00014191865921020508, 0.0001697242259979248, 0.00019752979278564453, 0.00022533535957336426, 0.000253140926361084, 0.0002809464931488037, 0.00030875205993652344, 0.00033655762672424316, 0.0003643631935119629, 0.0003921687602996826, 0.00041997432708740234, 0.00044777989387512207, 0.0004755854606628418, 0.0005033910274505615, 0.0005311965942382812]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 3.0, 7.0, 5.0, 7.0, 16.0, 31.0, 40.0, 54.0, 105.0, 196.0, 382.0, 790.0, 2050.0, 6139.0, 23173.0, 116370.0, 728699.0, 134486.0, 25458.0, 6587.0, 2160.0, 892.0, 420.0, 202.0, 107.0, 70.0, 38.0, 20.0, 12.0, 10.0, 5.0, 5.0, 9.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2421875, -3.139373779296875, -3.03656005859375, -2.933746337890625, -2.8309326171875, -2.728118896484375, -2.62530517578125, -2.522491455078125, -2.419677734375, -2.316864013671875, -2.21405029296875, -2.111236572265625, -2.0084228515625, -1.905609130859375, -1.80279541015625, -1.699981689453125, -1.59716796875, -1.494354248046875, -1.39154052734375, -1.288726806640625, -1.1859130859375, -1.083099365234375, -0.98028564453125, -0.877471923828125, -0.774658203125, -0.671844482421875, -0.56903076171875, -0.466217041015625, -0.3634033203125, -0.260589599609375, -0.15777587890625, -0.054962158203125, 0.0478515625, 0.150665283203125, 0.25347900390625, 0.356292724609375, 0.4591064453125, 0.561920166015625, 0.66473388671875, 0.767547607421875, 0.870361328125, 0.973175048828125, 1.07598876953125, 1.178802490234375, 1.2816162109375, 1.384429931640625, 1.48724365234375, 1.590057373046875, 1.69287109375, 1.795684814453125, 1.89849853515625, 2.001312255859375, 2.1041259765625, 2.206939697265625, 2.30975341796875, 2.412567138671875, 2.515380859375, 2.618194580078125, 2.72100830078125, 2.823822021484375, 2.9266357421875, 3.029449462890625, 3.13226318359375, 3.235076904296875, 3.337890625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 6.0, 6.0, 9.0, 13.0, 17.0, 23.0, 35.0, 50.0, 80.0, 131.0, 156.0, 143.0, 120.0, 71.0, 43.0, 32.0, 22.0, 13.0, 13.0, 4.0, 6.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.482421875, -3.365386962890625, -3.24835205078125, -3.131317138671875, -3.0142822265625, -2.897247314453125, -2.78021240234375, -2.663177490234375, -2.546142578125, -2.429107666015625, -2.31207275390625, -2.195037841796875, -2.0780029296875, -1.960968017578125, -1.84393310546875, -1.726898193359375, -1.60986328125, -1.492828369140625, -1.37579345703125, -1.258758544921875, -1.1417236328125, -1.024688720703125, -0.90765380859375, -0.790618896484375, -0.673583984375, -0.556549072265625, -0.43951416015625, -0.322479248046875, -0.2054443359375, -0.088409423828125, 0.02862548828125, 0.145660400390625, 0.2626953125, 0.379730224609375, 0.49676513671875, 0.613800048828125, 0.7308349609375, 0.847869873046875, 0.96490478515625, 1.081939697265625, 1.198974609375, 1.316009521484375, 1.43304443359375, 1.550079345703125, 1.6671142578125, 1.784149169921875, 1.90118408203125, 2.018218994140625, 2.13525390625, 2.252288818359375, 2.36932373046875, 2.486358642578125, 2.6033935546875, 2.720428466796875, 2.83746337890625, 2.954498291015625, 3.071533203125, 3.188568115234375, 3.30560302734375, 3.422637939453125, 3.5396728515625, 3.656707763671875, 3.77374267578125, 3.890777587890625, 4.0078125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 3.0, 5.0, 2.0, 6.0, 13.0, 16.0, 21.0, 33.0, 35.0, 67.0, 93.0, 111.0, 93.0, 122.0, 106.0, 68.0, 80.0, 49.0, 23.0, 22.0, 12.0, 9.0, 2.0, 7.0, 4.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.47974395751953, -35.41631317138672, -34.35288619995117, -33.289459228515625, -32.22602844238281, -31.162599563598633, -30.099170684814453, -29.035741806030273, -27.972312927246094, -26.908884048461914, -25.845455169677734, -24.782026290893555, -23.718597412109375, -22.655168533325195, -21.591739654541016, -20.528310775756836, -19.464881896972656, -18.401453018188477, -17.338024139404297, -16.274595260620117, -15.211166381835938, -14.147737503051758, -13.084308624267578, -12.020879745483398, -10.957450866699219, -9.894021987915039, -8.83059310913086, -7.76716423034668, -6.7037353515625, -5.64030647277832, -4.576877593994141, -3.513448715209961, -2.4500160217285156, -1.386587142944336, -0.32315826416015625, 0.7402706146240234, 1.8036994934082031, 2.867128372192383, 3.9305572509765625, 4.993986129760742, 6.057415008544922, 7.120843887329102, 8.184272766113281, 9.247701644897461, 10.31113052368164, 11.37455940246582, 12.43798828125, 13.50141716003418, 14.56484603881836, 15.628274917602539, 16.69170379638672, 17.7551326751709, 18.818561553955078, 19.881990432739258, 20.945419311523438, 22.008848190307617, 23.072277069091797, 24.135705947875977, 25.199134826660156, 26.262563705444336, 27.325992584228516, 28.389421463012695, 29.452850341796875, 30.516279220581055, 31.579708099365234]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 6.0, 7.0, 8.0, 11.0, 10.0, 15.0, 17.0, 17.0, 23.0, 22.0, 18.0, 30.0, 22.0, 38.0, 25.0, 39.0, 22.0, 41.0, 48.0, 27.0, 40.0, 43.0, 32.0, 32.0, 40.0, 45.0, 28.0, 34.0, 29.0, 32.0, 21.0, 21.0, 29.0, 12.0, 24.0, 16.0, 16.0, 12.0, 9.0, 8.0, 10.0, 8.0, 4.0, 2.0, 4.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.645950317382812, -26.70466423034668, -25.763378143310547, -24.822093963623047, -23.880807876586914, -22.93952178955078, -21.99823570251465, -21.056949615478516, -20.115665435791016, -19.174379348754883, -18.23309326171875, -17.29180908203125, -16.350522994995117, -15.409236907958984, -14.467950820922852, -13.526664733886719, -12.585378646850586, -11.644092559814453, -10.702807426452637, -9.761521339416504, -8.820236206054688, -7.878950119018555, -6.937664031982422, -5.996378421783447, -5.055092811584473, -4.113807201385498, -3.1725213527679443, -2.2312355041503906, -1.289949893951416, -0.3486642837524414, 0.5926218032836914, 1.533907413482666, 2.4751930236816406, 3.4164786338806152, 4.35776424407959, 5.299050331115723, 6.240335941314697, 7.181621551513672, 8.122907638549805, 9.064193725585938, 10.005478858947754, 10.946764945983887, 11.888050079345703, 12.829336166381836, 13.770622253417969, 14.711907386779785, 15.653193473815918, 16.594478607177734, 17.535764694213867, 18.47705078125, 19.418336868286133, 20.359622955322266, 21.300907135009766, 22.2421932220459, 23.18347930908203, 24.124765396118164, 25.066051483154297, 26.00733757019043, 26.948623657226562, 27.889907836914062, 28.831193923950195, 29.772480010986328, 30.71376609802246, 31.655052185058594, 32.596336364746094]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 5.0, 7.0, 9.0, 14.0, 14.0, 19.0, 26.0, 31.0, 54.0, 57.0, 88.0, 143.0, 157.0, 269.0, 401.0, 584.0, 1033.0, 1776.0, 3392.0, 6477.0, 15118.0, 47308.0, 328796.0, 3576877.0, 155656.0, 32728.0, 11760.0, 5040.0, 2672.0, 1471.0, 854.0, 500.0, 295.0, 201.0, 160.0, 86.0, 60.0, 32.0, 25.0, 33.0, 14.0, 14.0, 7.0, 6.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-6.67578125, -6.4814453125, -6.287109375, -6.0927734375, -5.8984375, -5.7041015625, -5.509765625, -5.3154296875, -5.12109375, -4.9267578125, -4.732421875, -4.5380859375, -4.34375, -4.1494140625, -3.955078125, -3.7607421875, -3.56640625, -3.3720703125, -3.177734375, -2.9833984375, -2.7890625, -2.5947265625, -2.400390625, -2.2060546875, -2.01171875, -1.8173828125, -1.623046875, -1.4287109375, -1.234375, -1.0400390625, -0.845703125, -0.6513671875, -0.45703125, -0.2626953125, -0.068359375, 0.1259765625, 0.3203125, 0.5146484375, 0.708984375, 0.9033203125, 1.09765625, 1.2919921875, 1.486328125, 1.6806640625, 1.875, 2.0693359375, 2.263671875, 2.4580078125, 2.65234375, 2.8466796875, 3.041015625, 3.2353515625, 3.4296875, 3.6240234375, 3.818359375, 4.0126953125, 4.20703125, 4.4013671875, 4.595703125, 4.7900390625, 4.984375, 5.1787109375, 5.373046875, 5.5673828125, 5.76171875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 8.0, 3.0, 9.0, 5.0, 7.0, 11.0, 21.0, 12.0, 17.0, 36.0, 32.0, 30.0, 40.0, 47.0, 41.0, 66.0, 58.0, 67.0, 51.0, 55.0, 60.0, 46.0, 47.0, 53.0, 34.0, 33.0, 22.0, 17.0, 18.0, 18.0, 14.0, 8.0, 2.0, 5.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.18359375, -2.116851806640625, -2.05010986328125, -1.983367919921875, -1.9166259765625, -1.849884033203125, -1.78314208984375, -1.716400146484375, -1.649658203125, -1.582916259765625, -1.51617431640625, -1.449432373046875, -1.3826904296875, -1.315948486328125, -1.24920654296875, -1.182464599609375, -1.11572265625, -1.048980712890625, -0.98223876953125, -0.915496826171875, -0.8487548828125, -0.782012939453125, -0.71527099609375, -0.648529052734375, -0.581787109375, -0.515045166015625, -0.44830322265625, -0.381561279296875, -0.3148193359375, -0.248077392578125, -0.18133544921875, -0.114593505859375, -0.0478515625, 0.018890380859375, 0.08563232421875, 0.152374267578125, 0.2191162109375, 0.285858154296875, 0.35260009765625, 0.419342041015625, 0.486083984375, 0.552825927734375, 0.61956787109375, 0.686309814453125, 0.7530517578125, 0.819793701171875, 0.88653564453125, 0.953277587890625, 1.02001953125, 1.086761474609375, 1.15350341796875, 1.220245361328125, 1.2869873046875, 1.353729248046875, 1.42047119140625, 1.487213134765625, 1.553955078125, 1.620697021484375, 1.68743896484375, 1.754180908203125, 1.8209228515625, 1.887664794921875, 1.95440673828125, 2.021148681640625, 2.087890625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 9.0, 13.0, 11.0, 35.0, 57.0, 93.0, 157.0, 285.0, 615.0, 1402.0, 3947.0, 15756.0, 152667.0, 3812713.0, 182984.0, 16902.0, 3972.0, 1418.0, 571.0, 303.0, 171.0, 85.0, 50.0, 30.0, 18.0, 10.0, 8.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.1796875, -5.927734375, -5.67578125, -5.423828125, -5.171875, -4.919921875, -4.66796875, -4.416015625, -4.1640625, -3.912109375, -3.66015625, -3.408203125, -3.15625, -2.904296875, -2.65234375, -2.400390625, -2.1484375, -1.896484375, -1.64453125, -1.392578125, -1.140625, -0.888671875, -0.63671875, -0.384765625, -0.1328125, 0.119140625, 0.37109375, 0.623046875, 0.875, 1.126953125, 1.37890625, 1.630859375, 1.8828125, 2.134765625, 2.38671875, 2.638671875, 2.890625, 3.142578125, 3.39453125, 3.646484375, 3.8984375, 4.150390625, 4.40234375, 4.654296875, 4.90625, 5.158203125, 5.41015625, 5.662109375, 5.9140625, 6.166015625, 6.41796875, 6.669921875, 6.921875, 7.173828125, 7.42578125, 7.677734375, 7.9296875, 8.181640625, 8.43359375, 8.685546875, 8.9375, 9.189453125, 9.44140625, 9.693359375, 9.9453125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 7.0, 8.0, 8.0, 11.0, 18.0, 31.0, 58.0, 115.0, 300.0, 1704.0, 1274.0, 294.0, 115.0, 58.0, 29.0, 18.0, 5.0, 4.0, 4.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.326171875, -3.2186279296875, -3.111083984375, -3.0035400390625, -2.89599609375, -2.7884521484375, -2.680908203125, -2.5733642578125, -2.4658203125, -2.3582763671875, -2.250732421875, -2.1431884765625, -2.03564453125, -1.9281005859375, -1.820556640625, -1.7130126953125, -1.60546875, -1.4979248046875, -1.390380859375, -1.2828369140625, -1.17529296875, -1.0677490234375, -0.960205078125, -0.8526611328125, -0.7451171875, -0.6375732421875, -0.530029296875, -0.4224853515625, -0.31494140625, -0.2073974609375, -0.099853515625, 0.0076904296875, 0.115234375, 0.2227783203125, 0.330322265625, 0.4378662109375, 0.54541015625, 0.6529541015625, 0.760498046875, 0.8680419921875, 0.9755859375, 1.0831298828125, 1.190673828125, 1.2982177734375, 1.40576171875, 1.5133056640625, 1.620849609375, 1.7283935546875, 1.8359375, 1.9434814453125, 2.051025390625, 2.1585693359375, 2.26611328125, 2.3736572265625, 2.481201171875, 2.5887451171875, 2.6962890625, 2.8038330078125, 2.911376953125, 3.0189208984375, 3.12646484375, 3.2340087890625, 3.341552734375, 3.4490966796875, 3.556640625]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 18.0, 26.0, 66.0, 124.0, 168.0, 183.0, 169.0, 113.0, 68.0, 24.0, 20.0, 10.0, 6.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-26.105419158935547, -25.56537437438965, -25.02532958984375, -24.48528480529785, -23.945240020751953, -23.405195236206055, -22.865150451660156, -22.32510757446289, -21.78506088256836, -21.24501609802246, -20.704971313476562, -20.164926528930664, -19.624881744384766, -19.084836959838867, -18.54479217529297, -18.004749298095703, -17.464704513549805, -16.924659729003906, -16.384614944458008, -15.84457015991211, -15.304525375366211, -14.764480590820312, -14.22443675994873, -13.684391975402832, -13.144347190856934, -12.604302406311035, -12.064257621765137, -11.524212837219238, -10.984169006347656, -10.444124221801758, -9.90407943725586, -9.364034652709961, -8.823991775512695, -8.283946990966797, -7.743902206420898, -7.203857898712158, -6.66381311416626, -6.123768329620361, -5.583724021911621, -5.043679237365723, -4.503634452819824, -3.963589668273926, -3.4235451221466064, -2.883500576019287, -2.3434557914733887, -1.8034110069274902, -1.263366460800171, -0.7233219146728516, -0.18327713012695312, 0.35676753520965576, 0.8968122005462646, 1.4368568658828735, 1.9769015312194824, 2.516946315765381, 3.0569908618927, 3.5970354080200195, 4.137080192565918, 4.677124977111816, 5.217169761657715, 5.757214069366455, 6.2972588539123535, 6.837303638458252, 7.377347946166992, 7.917392730712891, 8.457437515258789]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 5.0, 6.0, 7.0, 13.0, 10.0, 16.0, 21.0, 25.0, 30.0, 19.0, 56.0, 38.0, 54.0, 52.0, 49.0, 59.0, 53.0, 63.0, 67.0, 60.0, 46.0, 24.0, 43.0, 40.0, 33.0, 30.0, 24.0, 19.0, 14.0, 5.0, 7.0, 4.0, 8.0, 2.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.014872550964355, -8.690292358398438, -8.36571216583252, -8.041132926940918, -7.716552734375, -7.391972541809082, -7.067392349243164, -6.742812156677246, -6.418232440948486, -6.093652248382568, -5.769072532653809, -5.444492340087891, -5.119912147521973, -4.795332431793213, -4.470752239227295, -4.146172523498535, -3.821592330932617, -3.4970123767852783, -3.1724324226379395, -2.8478522300720215, -2.5232722759246826, -2.1986923217773438, -1.8741122484207153, -1.549532175064087, -1.224952220916748, -0.9003722071647644, -0.5757921934127808, -0.2512121796607971, 0.07336783409118652, 0.3979477882385254, 0.7225278615951538, 1.0471079349517822, 1.3716888427734375, 1.6962687969207764, 2.0208487510681152, 2.345428943634033, 2.670008897781372, 2.994588851928711, 3.319169044494629, 3.6437489986419678, 3.9683289527893066, 4.292909145355225, 4.617488861083984, 4.942069053649902, 5.26664924621582, 5.59122896194458, 5.915809154510498, 6.240388870239258, 6.564969062805176, 6.889549255371094, 7.2141289710998535, 7.5387091636657715, 7.863288879394531, 8.18786907196045, 8.512449264526367, 8.837029457092285, 9.161609649658203, 9.486189842224121, 9.810770034790039, 10.13534927368164, 10.459929466247559, 10.784509658813477, 11.109089851379395, 11.433670043945312, 11.758249282836914]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 3.0, 3.0, 5.0, 8.0, 16.0, 20.0, 32.0, 43.0, 80.0, 150.0, 224.0, 428.0, 989.0, 2532.0, 7878.0, 29398.0, 141391.0, 565348.0, 236185.0, 46437.0, 11300.0, 3539.0, 1336.0, 558.0, 238.0, 171.0, 81.0, 49.0, 36.0, 23.0, 15.0, 6.0, 11.0, 7.0, 4.0, 7.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.3828125, -10.1070556640625, -9.831298828125, -9.5555419921875, -9.27978515625, -9.0040283203125, -8.728271484375, -8.4525146484375, -8.1767578125, -7.9010009765625, -7.625244140625, -7.3494873046875, -7.07373046875, -6.7979736328125, -6.522216796875, -6.2464599609375, -5.970703125, -5.6949462890625, -5.419189453125, -5.1434326171875, -4.86767578125, -4.5919189453125, -4.316162109375, -4.0404052734375, -3.7646484375, -3.4888916015625, -3.213134765625, -2.9373779296875, -2.66162109375, -2.3858642578125, -2.110107421875, -1.8343505859375, -1.55859375, -1.2828369140625, -1.007080078125, -0.7313232421875, -0.45556640625, -0.1798095703125, 0.095947265625, 0.3717041015625, 0.6474609375, 0.9232177734375, 1.198974609375, 1.4747314453125, 1.75048828125, 2.0262451171875, 2.302001953125, 2.5777587890625, 2.853515625, 3.1292724609375, 3.405029296875, 3.6807861328125, 3.95654296875, 4.2322998046875, 4.508056640625, 4.7838134765625, 5.0595703125, 5.3353271484375, 5.611083984375, 5.8868408203125, 6.16259765625, 6.4383544921875, 6.714111328125, 6.9898681640625, 7.265625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 5.0, 0.0, 3.0, 5.0, 4.0, 7.0, 9.0, 8.0, 10.0, 14.0, 28.0, 34.0, 24.0, 28.0, 44.0, 42.0, 46.0, 46.0, 68.0, 56.0, 57.0, 54.0, 57.0, 44.0, 56.0, 53.0, 42.0, 44.0, 23.0, 15.0, 20.0, 18.0, 11.0, 10.0, 7.0, 7.0, 1.0, 3.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.443359375, -2.3759613037109375, -2.308563232421875, -2.2411651611328125, -2.17376708984375, -2.1063690185546875, -2.038970947265625, -1.9715728759765625, -1.9041748046875, -1.8367767333984375, -1.769378662109375, -1.7019805908203125, -1.63458251953125, -1.5671844482421875, -1.499786376953125, -1.4323883056640625, -1.364990234375, -1.2975921630859375, -1.230194091796875, -1.1627960205078125, -1.09539794921875, -1.0279998779296875, -0.960601806640625, -0.8932037353515625, -0.8258056640625, -0.7584075927734375, -0.691009521484375, -0.6236114501953125, -0.55621337890625, -0.4888153076171875, -0.421417236328125, -0.3540191650390625, -0.28662109375, -0.2192230224609375, -0.151824951171875, -0.0844268798828125, -0.01702880859375, 0.0503692626953125, 0.117767333984375, 0.1851654052734375, 0.2525634765625, 0.3199615478515625, 0.387359619140625, 0.4547576904296875, 0.52215576171875, 0.5895538330078125, 0.656951904296875, 0.7243499755859375, 0.791748046875, 0.8591461181640625, 0.926544189453125, 0.9939422607421875, 1.06134033203125, 1.1287384033203125, 1.196136474609375, 1.2635345458984375, 1.3309326171875, 1.3983306884765625, 1.465728759765625, 1.5331268310546875, 1.60052490234375, 1.6679229736328125, 1.735321044921875, 1.8027191162109375, 1.8701171875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 1.0, 4.0, 7.0, 11.0, 14.0, 19.0, 21.0, 37.0, 51.0, 50.0, 67.0, 100.0, 164.0, 200.0, 352.0, 609.0, 1059.0, 2428.0, 5564.0, 14414.0, 42164.0, 134124.0, 423427.0, 291972.0, 85748.0, 27744.0, 10007.0, 4055.0, 1838.0, 884.0, 509.0, 286.0, 169.0, 125.0, 104.0, 54.0, 42.0, 35.0, 23.0, 20.0, 15.0, 8.0, 3.0, 11.0, 6.0, 5.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.64453125, -4.48333740234375, -4.3221435546875, -4.16094970703125, -3.999755859375, -3.83856201171875, -3.6773681640625, -3.51617431640625, -3.35498046875, -3.19378662109375, -3.0325927734375, -2.87139892578125, -2.710205078125, -2.54901123046875, -2.3878173828125, -2.22662353515625, -2.0654296875, -1.90423583984375, -1.7430419921875, -1.58184814453125, -1.420654296875, -1.25946044921875, -1.0982666015625, -0.93707275390625, -0.77587890625, -0.61468505859375, -0.4534912109375, -0.29229736328125, -0.131103515625, 0.03009033203125, 0.1912841796875, 0.35247802734375, 0.513671875, 0.67486572265625, 0.8360595703125, 0.99725341796875, 1.158447265625, 1.31964111328125, 1.4808349609375, 1.64202880859375, 1.80322265625, 1.96441650390625, 2.1256103515625, 2.28680419921875, 2.447998046875, 2.60919189453125, 2.7703857421875, 2.93157958984375, 3.0927734375, 3.25396728515625, 3.4151611328125, 3.57635498046875, 3.737548828125, 3.89874267578125, 4.0599365234375, 4.22113037109375, 4.38232421875, 4.54351806640625, 4.7047119140625, 4.86590576171875, 5.027099609375, 5.18829345703125, 5.3494873046875, 5.51068115234375, 5.671875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 8.0, 4.0, 7.0, 4.0, 8.0, 9.0, 9.0, 14.0, 15.0, 26.0, 24.0, 24.0, 30.0, 31.0, 27.0, 38.0, 35.0, 41.0, 36.0, 45.0, 59.0, 38.0, 46.0, 38.0, 32.0, 41.0, 23.0, 35.0, 35.0, 34.0, 22.0, 26.0, 23.0, 24.0, 16.0, 13.0, 7.0, 10.0, 10.0, 11.0, 3.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-5.96875, -5.77081298828125, -5.5728759765625, -5.37493896484375, -5.177001953125, -4.97906494140625, -4.7811279296875, -4.58319091796875, -4.38525390625, -4.18731689453125, -3.9893798828125, -3.79144287109375, -3.593505859375, -3.39556884765625, -3.1976318359375, -2.99969482421875, -2.8017578125, -2.60382080078125, -2.4058837890625, -2.20794677734375, -2.010009765625, -1.81207275390625, -1.6141357421875, -1.41619873046875, -1.21826171875, -1.02032470703125, -0.8223876953125, -0.62445068359375, -0.426513671875, -0.22857666015625, -0.0306396484375, 0.16729736328125, 0.365234375, 0.56317138671875, 0.7611083984375, 0.95904541015625, 1.156982421875, 1.35491943359375, 1.5528564453125, 1.75079345703125, 1.94873046875, 2.14666748046875, 2.3446044921875, 2.54254150390625, 2.740478515625, 2.93841552734375, 3.1363525390625, 3.33428955078125, 3.5322265625, 3.73016357421875, 3.9281005859375, 4.12603759765625, 4.323974609375, 4.52191162109375, 4.7198486328125, 4.91778564453125, 5.11572265625, 5.31365966796875, 5.5115966796875, 5.70953369140625, 5.907470703125, 6.10540771484375, 6.3033447265625, 6.50128173828125, 6.69921875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 1.0, 13.0, 15.0, 28.0, 68.0, 165.0, 443.0, 1498.0, 7210.0, 58765.0, 829071.0, 134954.0, 13036.0, 2245.0, 641.0, 227.0, 93.0, 39.0, 20.0, 8.0, 7.0, 4.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6328125, -4.481689453125, -4.33056640625, -4.179443359375, -4.0283203125, -3.877197265625, -3.72607421875, -3.574951171875, -3.423828125, -3.272705078125, -3.12158203125, -2.970458984375, -2.8193359375, -2.668212890625, -2.51708984375, -2.365966796875, -2.21484375, -2.063720703125, -1.91259765625, -1.761474609375, -1.6103515625, -1.459228515625, -1.30810546875, -1.156982421875, -1.005859375, -0.854736328125, -0.70361328125, -0.552490234375, -0.4013671875, -0.250244140625, -0.09912109375, 0.052001953125, 0.203125, 0.354248046875, 0.50537109375, 0.656494140625, 0.8076171875, 0.958740234375, 1.10986328125, 1.260986328125, 1.412109375, 1.563232421875, 1.71435546875, 1.865478515625, 2.0166015625, 2.167724609375, 2.31884765625, 2.469970703125, 2.62109375, 2.772216796875, 2.92333984375, 3.074462890625, 3.2255859375, 3.376708984375, 3.52783203125, 3.678955078125, 3.830078125, 3.981201171875, 4.13232421875, 4.283447265625, 4.4345703125, 4.585693359375, 4.73681640625, 4.887939453125, 5.0390625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 6.0, 5.0, 12.0, 4.0, 17.0, 23.0, 22.0, 27.0, 63.0, 113.0, 199.0, 210.0, 105.0, 58.0, 37.0, 21.0, 19.0, 16.0, 14.0, 8.0, 3.0, 4.0, 6.0, 2.0, 0.0, 5.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004558563232421875, -0.00043683499097824097, -0.00041781365871429443, -0.0003987923264503479, -0.00037977099418640137, -0.00036074966192245483, -0.0003417283296585083, -0.00032270699739456177, -0.00030368566513061523, -0.0002846643328666687, -0.00026564300060272217, -0.00024662166833877563, -0.0002276003360748291, -0.00020857900381088257, -0.00018955767154693604, -0.0001705363392829895, -0.00015151500701904297, -0.00013249367475509644, -0.0001134723424911499, -9.445101022720337e-05, -7.542967796325684e-05, -5.64083456993103e-05, -3.738701343536377e-05, -1.8365681171417236e-05, 6.556510925292969e-07, 1.967698335647583e-05, 3.869831562042236e-05, 5.7719647884368896e-05, 7.674098014831543e-05, 9.576231241226196e-05, 0.0001147836446762085, 0.00013380497694015503, 0.00015282630920410156, 0.0001718476414680481, 0.00019086897373199463, 0.00020989030599594116, 0.0002289116382598877, 0.00024793297052383423, 0.00026695430278778076, 0.0002859756350517273, 0.00030499696731567383, 0.00032401829957962036, 0.0003430396318435669, 0.00036206096410751343, 0.00038108229637145996, 0.0004001036286354065, 0.00041912496089935303, 0.00043814629316329956, 0.0004571676254272461, 0.0004761889576911926, 0.0004952102899551392, 0.0005142316222190857, 0.0005332529544830322, 0.0005522742867469788, 0.0005712956190109253, 0.0005903169512748718, 0.0006093382835388184, 0.0006283596158027649, 0.0006473809480667114, 0.000666402280330658, 0.0006854236125946045, 0.000704444944858551, 0.0007234662771224976, 0.0007424876093864441, 0.0007615089416503906]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 10.0, 17.0, 27.0, 55.0, 76.0, 256.0, 910.0, 5416.0, 57465.0, 921528.0, 56178.0, 5283.0, 872.0, 251.0, 95.0, 59.0, 25.0, 20.0, 7.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.07421875, -3.87542724609375, -3.6766357421875, -3.47784423828125, -3.279052734375, -3.08026123046875, -2.8814697265625, -2.68267822265625, -2.48388671875, -2.28509521484375, -2.0863037109375, -1.88751220703125, -1.688720703125, -1.48992919921875, -1.2911376953125, -1.09234619140625, -0.8935546875, -0.69476318359375, -0.4959716796875, -0.29718017578125, -0.098388671875, 0.10040283203125, 0.2991943359375, 0.49798583984375, 0.69677734375, 0.89556884765625, 1.0943603515625, 1.29315185546875, 1.491943359375, 1.69073486328125, 1.8895263671875, 2.08831787109375, 2.287109375, 2.48590087890625, 2.6846923828125, 2.88348388671875, 3.082275390625, 3.28106689453125, 3.4798583984375, 3.67864990234375, 3.87744140625, 4.07623291015625, 4.2750244140625, 4.47381591796875, 4.672607421875, 4.87139892578125, 5.0701904296875, 5.26898193359375, 5.4677734375, 5.66656494140625, 5.8653564453125, 6.06414794921875, 6.262939453125, 6.46173095703125, 6.6605224609375, 6.85931396484375, 7.05810546875, 7.25689697265625, 7.4556884765625, 7.65447998046875, 7.853271484375, 8.05206298828125, 8.2508544921875, 8.44964599609375, 8.6484375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 2.0, 7.0, 11.0, 16.0, 35.0, 42.0, 89.0, 135.0, 228.0, 197.0, 105.0, 48.0, 26.0, 23.0, 19.0, 6.0, 7.0, 1.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.134765625, -1.998992919921875, -1.86322021484375, -1.727447509765625, -1.5916748046875, -1.455902099609375, -1.32012939453125, -1.184356689453125, -1.048583984375, -0.912811279296875, -0.77703857421875, -0.641265869140625, -0.5054931640625, -0.369720458984375, -0.23394775390625, -0.098175048828125, 0.03759765625, 0.173370361328125, 0.30914306640625, 0.444915771484375, 0.5806884765625, 0.716461181640625, 0.85223388671875, 0.988006591796875, 1.123779296875, 1.259552001953125, 1.39532470703125, 1.531097412109375, 1.6668701171875, 1.802642822265625, 1.93841552734375, 2.074188232421875, 2.2099609375, 2.345733642578125, 2.48150634765625, 2.617279052734375, 2.7530517578125, 2.888824462890625, 3.02459716796875, 3.160369873046875, 3.296142578125, 3.431915283203125, 3.56768798828125, 3.703460693359375, 3.8392333984375, 3.975006103515625, 4.11077880859375, 4.246551513671875, 4.38232421875, 4.518096923828125, 4.65386962890625, 4.789642333984375, 4.9254150390625, 5.061187744140625, 5.19696044921875, 5.332733154296875, 5.468505859375, 5.604278564453125, 5.74005126953125, 5.875823974609375, 6.0115966796875, 6.147369384765625, 6.28314208984375, 6.418914794921875, 6.5546875]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 12.0, 24.0, 52.0, 79.0, 145.0, 186.0, 192.0, 144.0, 81.0, 38.0, 24.0, 6.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-62.9426155090332, -61.23741912841797, -59.5322265625, -57.827030181884766, -56.12183380126953, -54.41664123535156, -52.71144485473633, -51.006248474121094, -49.301055908203125, -47.59585952758789, -45.89066696166992, -44.18547058105469, -42.48027801513672, -40.775081634521484, -39.06988525390625, -37.36469268798828, -35.65949630737305, -33.95429992675781, -32.249107360839844, -30.54391098022461, -28.838716506958008, -27.133522033691406, -25.428325653076172, -23.72313117980957, -22.01793670654297, -20.312742233276367, -18.607547760009766, -16.90235137939453, -15.19715690612793, -13.491962432861328, -11.78676700592041, -10.081571578979492, -8.376380920410156, -6.6711859703063965, -4.965991020202637, -3.260796070098877, -1.5556011199951172, 0.14959335327148438, 1.8547887802124023, 3.5599842071533203, 5.265178680419922, 6.970373630523682, 8.675568580627441, 10.38076400756836, 12.085958480834961, 13.791152954101562, 15.49634838104248, 17.2015438079834, 18.90673828125, 20.6119327545166, 22.317127227783203, 24.022323608398438, 25.72751808166504, 27.43271255493164, 29.137908935546875, 30.843103408813477, 32.54829788208008, 34.25349426269531, 35.95868682861328, 37.663883209228516, 39.36907958984375, 41.07427215576172, 42.77946853637695, 44.48466491699219, 46.189857482910156]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 3.0, 6.0, 6.0, 8.0, 8.0, 6.0, 9.0, 23.0, 16.0, 31.0, 28.0, 25.0, 36.0, 34.0, 37.0, 38.0, 44.0, 41.0, 43.0, 40.0, 41.0, 47.0, 42.0, 50.0, 41.0, 44.0, 27.0, 38.0, 17.0, 30.0, 22.0, 20.0, 23.0, 10.0, 16.0, 13.0, 10.0, 12.0, 6.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.53301239013672, -28.52191162109375, -27.510812759399414, -26.499711990356445, -25.48861312866211, -24.47751235961914, -23.466411590576172, -22.455310821533203, -21.444211959838867, -20.4331111907959, -19.422012329101562, -18.410911560058594, -17.399810791015625, -16.38871192932129, -15.37761116027832, -14.366511344909668, -13.355411529541016, -12.344311714172363, -11.333211898803711, -10.322111129760742, -9.31101131439209, -8.299911499023438, -7.288811206817627, -6.277710914611816, -5.266611099243164, -4.255511283874512, -3.244410991668701, -2.2333109378814697, -1.2222108840942383, -0.21111106872558594, 0.7999892234802246, 1.8110895156860352, 2.822193145751953, 3.8332931995391846, 4.844393253326416, 5.855493545532227, 6.866593360900879, 7.877693176269531, 8.8887939453125, 9.899893760681152, 10.910993576049805, 11.922093391418457, 12.93319320678711, 13.944293975830078, 14.95539379119873, 15.966493606567383, 16.97759437561035, 17.988693237304688, 18.999794006347656, 20.010894775390625, 21.02199363708496, 22.03309440612793, 23.044193267822266, 24.055294036865234, 25.066394805908203, 26.077495574951172, 27.088594436645508, 28.099695205688477, 29.110794067382812, 30.12189483642578, 31.13299560546875, 32.14409637451172, 33.15519332885742, 34.16629409790039, 35.17739486694336]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 6.0, 1.0, 2.0, 2.0, 10.0, 10.0, 11.0, 14.0, 19.0, 21.0, 27.0, 40.0, 41.0, 63.0, 130.0, 179.0, 212.0, 327.0, 482.0, 887.0, 1435.0, 2384.0, 4778.0, 10022.0, 26493.0, 128386.0, 3752016.0, 208590.0, 34040.0, 11834.0, 5153.0, 2729.0, 1498.0, 845.0, 540.0, 366.0, 232.0, 126.0, 89.0, 72.0, 46.0, 49.0, 23.0, 17.0, 19.0, 6.0, 8.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-9.8515625, -9.58233642578125, -9.3131103515625, -9.04388427734375, -8.774658203125, -8.50543212890625, -8.2362060546875, -7.96697998046875, -7.69775390625, -7.42852783203125, -7.1593017578125, -6.89007568359375, -6.620849609375, -6.35162353515625, -6.0823974609375, -5.81317138671875, -5.5439453125, -5.27471923828125, -5.0054931640625, -4.73626708984375, -4.467041015625, -4.19781494140625, -3.9285888671875, -3.65936279296875, -3.39013671875, -3.12091064453125, -2.8516845703125, -2.58245849609375, -2.313232421875, -2.04400634765625, -1.7747802734375, -1.50555419921875, -1.236328125, -0.96710205078125, -0.6978759765625, -0.42864990234375, -0.159423828125, 0.10980224609375, 0.3790283203125, 0.64825439453125, 0.91748046875, 1.18670654296875, 1.4559326171875, 1.72515869140625, 1.994384765625, 2.26361083984375, 2.5328369140625, 2.80206298828125, 3.0712890625, 3.34051513671875, 3.6097412109375, 3.87896728515625, 4.148193359375, 4.41741943359375, 4.6866455078125, 4.95587158203125, 5.22509765625, 5.49432373046875, 5.7635498046875, 6.03277587890625, 6.302001953125, 6.57122802734375, 6.8404541015625, 7.10968017578125, 7.37890625]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 4.0, 2.0, 5.0, 13.0, 6.0, 8.0, 11.0, 14.0, 22.0, 18.0, 35.0, 34.0, 33.0, 47.0, 45.0, 51.0, 53.0, 57.0, 58.0, 55.0, 56.0, 62.0, 48.0, 43.0, 39.0, 34.0, 30.0, 30.0, 27.0, 13.0, 12.0, 13.0, 9.0, 6.0, 6.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.478515625, -2.4086151123046875, -2.338714599609375, -2.2688140869140625, -2.19891357421875, -2.1290130615234375, -2.059112548828125, -1.9892120361328125, -1.9193115234375, -1.8494110107421875, -1.779510498046875, -1.7096099853515625, -1.63970947265625, -1.5698089599609375, -1.499908447265625, -1.4300079345703125, -1.360107421875, -1.2902069091796875, -1.220306396484375, -1.1504058837890625, -1.08050537109375, -1.0106048583984375, -0.940704345703125, -0.8708038330078125, -0.8009033203125, -0.7310028076171875, -0.661102294921875, -0.5912017822265625, -0.52130126953125, -0.4514007568359375, -0.381500244140625, -0.3115997314453125, -0.24169921875, -0.1717987060546875, -0.101898193359375, -0.0319976806640625, 0.03790283203125, 0.1078033447265625, 0.177703857421875, 0.2476043701171875, 0.3175048828125, 0.3874053955078125, 0.457305908203125, 0.5272064208984375, 0.59710693359375, 0.6670074462890625, 0.736907958984375, 0.8068084716796875, 0.876708984375, 0.9466094970703125, 1.016510009765625, 1.0864105224609375, 1.15631103515625, 1.2262115478515625, 1.296112060546875, 1.3660125732421875, 1.4359130859375, 1.5058135986328125, 1.575714111328125, 1.6456146240234375, 1.71551513671875, 1.7854156494140625, 1.855316162109375, 1.9252166748046875, 1.9951171875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 5.0, 7.0, 15.0, 17.0, 30.0, 64.0, 127.0, 301.0, 819.0, 2811.0, 13490.0, 214716.0, 3902110.0, 50846.0, 6429.0, 1550.0, 530.0, 202.0, 90.0, 53.0, 33.0, 17.0, 19.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0703125, -7.6519775390625, -7.233642578125, -6.8153076171875, -6.39697265625, -5.9786376953125, -5.560302734375, -5.1419677734375, -4.7236328125, -4.3052978515625, -3.886962890625, -3.4686279296875, -3.05029296875, -2.6319580078125, -2.213623046875, -1.7952880859375, -1.376953125, -0.9586181640625, -0.540283203125, -0.1219482421875, 0.29638671875, 0.7147216796875, 1.133056640625, 1.5513916015625, 1.9697265625, 2.3880615234375, 2.806396484375, 3.2247314453125, 3.64306640625, 4.0614013671875, 4.479736328125, 4.8980712890625, 5.31640625, 5.7347412109375, 6.153076171875, 6.5714111328125, 6.98974609375, 7.4080810546875, 7.826416015625, 8.2447509765625, 8.6630859375, 9.0814208984375, 9.499755859375, 9.9180908203125, 10.33642578125, 10.7547607421875, 11.173095703125, 11.5914306640625, 12.009765625, 12.4281005859375, 12.846435546875, 13.2647705078125, 13.68310546875, 14.1014404296875, 14.519775390625, 14.9381103515625, 15.3564453125, 15.7747802734375, 16.193115234375, 16.6114501953125, 17.02978515625, 17.4481201171875, 17.866455078125, 18.2847900390625, 18.703125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 5.0, 10.0, 8.0, 19.0, 29.0, 41.0, 68.0, 190.0, 813.0, 2384.0, 276.0, 105.0, 44.0, 23.0, 19.0, 7.0, 5.0, 9.0, 7.0, 3.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6640625, -3.53424072265625, -3.4044189453125, -3.27459716796875, -3.144775390625, -3.01495361328125, -2.8851318359375, -2.75531005859375, -2.62548828125, -2.49566650390625, -2.3658447265625, -2.23602294921875, -2.106201171875, -1.97637939453125, -1.8465576171875, -1.71673583984375, -1.5869140625, -1.45709228515625, -1.3272705078125, -1.19744873046875, -1.067626953125, -0.93780517578125, -0.8079833984375, -0.67816162109375, -0.54833984375, -0.41851806640625, -0.2886962890625, -0.15887451171875, -0.029052734375, 0.10076904296875, 0.2305908203125, 0.36041259765625, 0.490234375, 0.62005615234375, 0.7498779296875, 0.87969970703125, 1.009521484375, 1.13934326171875, 1.2691650390625, 1.39898681640625, 1.52880859375, 1.65863037109375, 1.7884521484375, 1.91827392578125, 2.048095703125, 2.17791748046875, 2.3077392578125, 2.43756103515625, 2.5673828125, 2.69720458984375, 2.8270263671875, 2.95684814453125, 3.086669921875, 3.21649169921875, 3.3463134765625, 3.47613525390625, 3.60595703125, 3.73577880859375, 3.8656005859375, 3.99542236328125, 4.125244140625, 4.25506591796875, 4.3848876953125, 4.51470947265625, 4.64453125]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 6.0, 5.0, 9.0, 15.0, 22.0, 41.0, 88.0, 99.0, 139.0, 157.0, 133.0, 103.0, 70.0, 54.0, 34.0, 14.0, 5.0, 9.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.901444435119629, -15.409701347351074, -14.91795825958252, -14.426216125488281, -13.934473037719727, -13.442729949951172, -12.950986862182617, -12.459243774414062, -11.967500686645508, -11.475757598876953, -10.984014511108398, -10.492271423339844, -10.000529289245605, -9.50878620147705, -9.017043113708496, -8.525300025939941, -8.033557891845703, -7.541814804077148, -7.050072193145752, -6.558329105377197, -6.066586494445801, -5.574843406677246, -5.083100318908691, -4.591357231140137, -4.09961462020874, -3.6078717708587646, -3.116128921508789, -2.6243858337402344, -2.132642984390259, -1.6409001350402832, -1.1491570472717285, -0.6574141979217529, -0.16567039489746094, 0.3260725140571594, 0.8178154230117798, 1.309558391571045, 1.8013012409210205, 2.293044090270996, 2.784787178039551, 3.2765300273895264, 3.768272876739502, 4.260015964508057, 4.751758575439453, 5.243501663208008, 5.7352447509765625, 6.226987361907959, 6.718730449676514, 7.21047306060791, 7.702216148376465, 8.19395923614502, 8.685702323913574, 9.177444458007812, 9.669187545776367, 10.160930633544922, 10.652673721313477, 11.144416809082031, 11.636159896850586, 12.12790298461914, 12.619646072387695, 13.11138916015625, 13.603131294250488, 14.094874382019043, 14.586617469787598, 15.078360557556152, 15.57010269165039]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 5.0, 5.0, 3.0, 8.0, 3.0, 12.0, 12.0, 15.0, 16.0, 16.0, 19.0, 26.0, 41.0, 24.0, 25.0, 36.0, 49.0, 37.0, 35.0, 63.0, 35.0, 39.0, 39.0, 41.0, 42.0, 34.0, 36.0, 24.0, 40.0, 32.0, 31.0, 32.0, 22.0, 19.0, 11.0, 17.0, 17.0, 15.0, 4.0, 9.0, 5.0, 2.0, 3.0, 1.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.623503684997559, -7.3664326667785645, -7.10936164855957, -6.852290630340576, -6.595219612121582, -6.338148593902588, -6.081077575683594, -5.8240065574646, -5.5669355392456055, -5.309864521026611, -5.052793502807617, -4.795722484588623, -4.538651466369629, -4.281580448150635, -4.024509429931641, -3.7674384117126465, -3.5103673934936523, -3.253296375274658, -2.996225357055664, -2.73915433883667, -2.482083320617676, -2.2250123023986816, -1.9679412841796875, -1.7108702659606934, -1.4537992477416992, -1.196728229522705, -0.9396572113037109, -0.6825861930847168, -0.42551517486572266, -0.16844415664672852, 0.08862686157226562, 0.34569787979125977, 0.6027679443359375, 0.8598389625549316, 1.1169099807739258, 1.37398099899292, 1.631052017211914, 1.8881230354309082, 2.1451940536499023, 2.4022650718688965, 2.6593360900878906, 2.9164071083068848, 3.173478126525879, 3.430549144744873, 3.687620162963867, 3.9446911811828613, 4.2017621994018555, 4.45883321762085, 4.715904235839844, 4.972975254058838, 5.230046272277832, 5.487117290496826, 5.74418830871582, 6.0012593269348145, 6.258330345153809, 6.515401363372803, 6.772472381591797, 7.029543399810791, 7.286614418029785, 7.543685436248779, 7.800756454467773, 8.05782699584961, 8.314898490905762, 8.571969985961914, 8.82904052734375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 7.0, 6.0, 5.0, 13.0, 27.0, 23.0, 31.0, 51.0, 71.0, 129.0, 194.0, 315.0, 550.0, 914.0, 1786.0, 3472.0, 7911.0, 18732.0, 48743.0, 143655.0, 388832.0, 281372.0, 93930.0, 32946.0, 13123.0, 5659.0, 2803.0, 1435.0, 754.0, 412.0, 241.0, 132.0, 100.0, 67.0, 47.0, 14.0, 13.0, 14.0, 8.0, 3.0, 7.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.09765625, -5.87835693359375, -5.6590576171875, -5.43975830078125, -5.220458984375, -5.00115966796875, -4.7818603515625, -4.56256103515625, -4.34326171875, -4.12396240234375, -3.9046630859375, -3.68536376953125, -3.466064453125, -3.24676513671875, -3.0274658203125, -2.80816650390625, -2.5888671875, -2.36956787109375, -2.1502685546875, -1.93096923828125, -1.711669921875, -1.49237060546875, -1.2730712890625, -1.05377197265625, -0.83447265625, -0.61517333984375, -0.3958740234375, -0.17657470703125, 0.042724609375, 0.26202392578125, 0.4813232421875, 0.70062255859375, 0.919921875, 1.13922119140625, 1.3585205078125, 1.57781982421875, 1.797119140625, 2.01641845703125, 2.2357177734375, 2.45501708984375, 2.67431640625, 2.89361572265625, 3.1129150390625, 3.33221435546875, 3.551513671875, 3.77081298828125, 3.9901123046875, 4.20941162109375, 4.4287109375, 4.64801025390625, 4.8673095703125, 5.08660888671875, 5.305908203125, 5.52520751953125, 5.7445068359375, 5.96380615234375, 6.18310546875, 6.40240478515625, 6.6217041015625, 6.84100341796875, 7.060302734375, 7.27960205078125, 7.4989013671875, 7.71820068359375, 7.9375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 3.0, 5.0, 4.0, 11.0, 15.0, 22.0, 16.0, 21.0, 21.0, 37.0, 32.0, 52.0, 59.0, 51.0, 50.0, 54.0, 65.0, 54.0, 49.0, 58.0, 43.0, 49.0, 37.0, 38.0, 33.0, 26.0, 25.0, 15.0, 15.0, 9.0, 10.0, 3.0, 4.0, 7.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.578125, -2.5057373046875, -2.433349609375, -2.3609619140625, -2.28857421875, -2.2161865234375, -2.143798828125, -2.0714111328125, -1.9990234375, -1.9266357421875, -1.854248046875, -1.7818603515625, -1.70947265625, -1.6370849609375, -1.564697265625, -1.4923095703125, -1.419921875, -1.3475341796875, -1.275146484375, -1.2027587890625, -1.13037109375, -1.0579833984375, -0.985595703125, -0.9132080078125, -0.8408203125, -0.7684326171875, -0.696044921875, -0.6236572265625, -0.55126953125, -0.4788818359375, -0.406494140625, -0.3341064453125, -0.26171875, -0.1893310546875, -0.116943359375, -0.0445556640625, 0.02783203125, 0.1002197265625, 0.172607421875, 0.2449951171875, 0.3173828125, 0.3897705078125, 0.462158203125, 0.5345458984375, 0.60693359375, 0.6793212890625, 0.751708984375, 0.8240966796875, 0.896484375, 0.9688720703125, 1.041259765625, 1.1136474609375, 1.18603515625, 1.2584228515625, 1.330810546875, 1.4031982421875, 1.4755859375, 1.5479736328125, 1.620361328125, 1.6927490234375, 1.76513671875, 1.8375244140625, 1.909912109375, 1.9822998046875, 2.0546875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 0.0, 4.0, 10.0, 5.0, 11.0, 12.0, 11.0, 33.0, 37.0, 63.0, 122.0, 170.0, 319.0, 519.0, 1022.0, 2259.0, 6118.0, 20942.0, 91578.0, 477488.0, 357374.0, 65688.0, 15839.0, 4922.0, 1928.0, 891.0, 458.0, 278.0, 171.0, 106.0, 55.0, 44.0, 27.0, 16.0, 8.0, 6.0, 7.0, 4.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-9.046875, -8.79486083984375, -8.5428466796875, -8.29083251953125, -8.038818359375, -7.78680419921875, -7.5347900390625, -7.28277587890625, -7.03076171875, -6.77874755859375, -6.5267333984375, -6.27471923828125, -6.022705078125, -5.77069091796875, -5.5186767578125, -5.26666259765625, -5.0146484375, -4.76263427734375, -4.5106201171875, -4.25860595703125, -4.006591796875, -3.75457763671875, -3.5025634765625, -3.25054931640625, -2.99853515625, -2.74652099609375, -2.4945068359375, -2.24249267578125, -1.990478515625, -1.73846435546875, -1.4864501953125, -1.23443603515625, -0.982421875, -0.73040771484375, -0.4783935546875, -0.22637939453125, 0.025634765625, 0.27764892578125, 0.5296630859375, 0.78167724609375, 1.03369140625, 1.28570556640625, 1.5377197265625, 1.78973388671875, 2.041748046875, 2.29376220703125, 2.5457763671875, 2.79779052734375, 3.0498046875, 3.30181884765625, 3.5538330078125, 3.80584716796875, 4.057861328125, 4.30987548828125, 4.5618896484375, 4.81390380859375, 5.06591796875, 5.31793212890625, 5.5699462890625, 5.82196044921875, 6.073974609375, 6.32598876953125, 6.5780029296875, 6.83001708984375, 7.08203125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 4.0, 2.0, 6.0, 8.0, 14.0, 13.0, 17.0, 31.0, 30.0, 49.0, 33.0, 45.0, 54.0, 63.0, 77.0, 73.0, 71.0, 70.0, 43.0, 64.0, 56.0, 37.0, 24.0, 23.0, 31.0, 12.0, 18.0, 14.0, 5.0, 7.0, 6.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0390625, -11.6494140625, -11.259765625, -10.8701171875, -10.48046875, -10.0908203125, -9.701171875, -9.3115234375, -8.921875, -8.5322265625, -8.142578125, -7.7529296875, -7.36328125, -6.9736328125, -6.583984375, -6.1943359375, -5.8046875, -5.4150390625, -5.025390625, -4.6357421875, -4.24609375, -3.8564453125, -3.466796875, -3.0771484375, -2.6875, -2.2978515625, -1.908203125, -1.5185546875, -1.12890625, -0.7392578125, -0.349609375, 0.0400390625, 0.4296875, 0.8193359375, 1.208984375, 1.5986328125, 1.98828125, 2.3779296875, 2.767578125, 3.1572265625, 3.546875, 3.9365234375, 4.326171875, 4.7158203125, 5.10546875, 5.4951171875, 5.884765625, 6.2744140625, 6.6640625, 7.0537109375, 7.443359375, 7.8330078125, 8.22265625, 8.6123046875, 9.001953125, 9.3916015625, 9.78125, 10.1708984375, 10.560546875, 10.9501953125, 11.33984375, 11.7294921875, 12.119140625, 12.5087890625, 12.8984375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 7.0, 2.0, 5.0, 4.0, 7.0, 16.0, 26.0, 45.0, 48.0, 76.0, 116.0, 233.0, 431.0, 814.0, 1705.0, 3847.0, 11067.0, 87060.0, 865442.0, 61189.0, 9759.0, 3416.0, 1504.0, 766.0, 401.0, 219.0, 131.0, 77.0, 47.0, 32.0, 18.0, 17.0, 13.0, 5.0, 7.0, 1.0, 2.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.03125, -9.739990234375, -9.44873046875, -9.157470703125, -8.8662109375, -8.574951171875, -8.28369140625, -7.992431640625, -7.701171875, -7.409912109375, -7.11865234375, -6.827392578125, -6.5361328125, -6.244873046875, -5.95361328125, -5.662353515625, -5.37109375, -5.079833984375, -4.78857421875, -4.497314453125, -4.2060546875, -3.914794921875, -3.62353515625, -3.332275390625, -3.041015625, -2.749755859375, -2.45849609375, -2.167236328125, -1.8759765625, -1.584716796875, -1.29345703125, -1.002197265625, -0.7109375, -0.419677734375, -0.12841796875, 0.162841796875, 0.4541015625, 0.745361328125, 1.03662109375, 1.327880859375, 1.619140625, 1.910400390625, 2.20166015625, 2.492919921875, 2.7841796875, 3.075439453125, 3.36669921875, 3.657958984375, 3.94921875, 4.240478515625, 4.53173828125, 4.822998046875, 5.1142578125, 5.405517578125, 5.69677734375, 5.988037109375, 6.279296875, 6.570556640625, 6.86181640625, 7.153076171875, 7.4443359375, 7.735595703125, 8.02685546875, 8.318115234375, 8.609375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 12.0, 20.0, 25.0, 51.0, 52.0, 133.0, 365.0, 144.0, 93.0, 55.0, 25.0, 13.0, 8.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011434555053710938, -0.001095101237297058, -0.0010467469692230225, -0.0009983927011489868, -0.0009500384330749512, -0.0009016841650009155, -0.0008533298969268799, -0.0008049756288528442, -0.0007566213607788086, -0.000708267092704773, -0.0006599128246307373, -0.0006115585565567017, -0.000563204288482666, -0.0005148500204086304, -0.0004664957523345947, -0.0004181414842605591, -0.00036978721618652344, -0.0003214329481124878, -0.00027307868003845215, -0.0002247244119644165, -0.00017637014389038086, -0.00012801587581634521, -7.966160774230957e-05, -3.1307339668273926e-05, 1.704692840576172e-05, 6.540119647979736e-05, 0.00011375546455383301, 0.00016210973262786865, 0.0002104640007019043, 0.00025881826877593994, 0.0003071725368499756, 0.00035552680492401123, 0.0004038810729980469, 0.0004522353410720825, 0.0005005896091461182, 0.0005489438772201538, 0.0005972981452941895, 0.0006456524133682251, 0.0006940066814422607, 0.0007423609495162964, 0.000790715217590332, 0.0008390694856643677, 0.0008874237537384033, 0.000935778021812439, 0.0009841322898864746, 0.0010324865579605103, 0.001080840826034546, 0.0011291950941085815, 0.0011775493621826172, 0.0012259036302566528, 0.0012742578983306885, 0.0013226121664047241, 0.0013709664344787598, 0.0014193207025527954, 0.001467674970626831, 0.0015160292387008667, 0.0015643835067749023, 0.001612737774848938, 0.0016610920429229736, 0.0017094463109970093, 0.001757800579071045, 0.0018061548471450806, 0.0018545091152191162, 0.0019028633832931519, 0.0019512176513671875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 4.0, 2.0, 8.0, 7.0, 25.0, 27.0, 61.0, 126.0, 322.0, 836.0, 2961.0, 18848.0, 867112.0, 147655.0, 7825.0, 1773.0, 561.0, 195.0, 94.0, 44.0, 32.0, 10.0, 10.0, 6.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.75, -10.2783203125, -9.806640625, -9.3349609375, -8.86328125, -8.3916015625, -7.919921875, -7.4482421875, -6.9765625, -6.5048828125, -6.033203125, -5.5615234375, -5.08984375, -4.6181640625, -4.146484375, -3.6748046875, -3.203125, -2.7314453125, -2.259765625, -1.7880859375, -1.31640625, -0.8447265625, -0.373046875, 0.0986328125, 0.5703125, 1.0419921875, 1.513671875, 1.9853515625, 2.45703125, 2.9287109375, 3.400390625, 3.8720703125, 4.34375, 4.8154296875, 5.287109375, 5.7587890625, 6.23046875, 6.7021484375, 7.173828125, 7.6455078125, 8.1171875, 8.5888671875, 9.060546875, 9.5322265625, 10.00390625, 10.4755859375, 10.947265625, 11.4189453125, 11.890625, 12.3623046875, 12.833984375, 13.3056640625, 13.77734375, 14.2490234375, 14.720703125, 15.1923828125, 15.6640625, 16.1357421875, 16.607421875, 17.0791015625, 17.55078125, 18.0224609375, 18.494140625, 18.9658203125, 19.4375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 4.0, 4.0, 4.0, 4.0, 7.0, 9.0, 11.0, 32.0, 42.0, 76.0, 180.0, 317.0, 140.0, 77.0, 41.0, 19.0, 12.0, 3.0, 3.0, 4.0, 4.0, 2.0, 4.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.640625, -9.2879638671875, -8.935302734375, -8.5826416015625, -8.22998046875, -7.8773193359375, -7.524658203125, -7.1719970703125, -6.8193359375, -6.4666748046875, -6.114013671875, -5.7613525390625, -5.40869140625, -5.0560302734375, -4.703369140625, -4.3507080078125, -3.998046875, -3.6453857421875, -3.292724609375, -2.9400634765625, -2.58740234375, -2.2347412109375, -1.882080078125, -1.5294189453125, -1.1767578125, -0.8240966796875, -0.471435546875, -0.1187744140625, 0.23388671875, 0.5865478515625, 0.939208984375, 1.2918701171875, 1.64453125, 1.9971923828125, 2.349853515625, 2.7025146484375, 3.05517578125, 3.4078369140625, 3.760498046875, 4.1131591796875, 4.4658203125, 4.8184814453125, 5.171142578125, 5.5238037109375, 5.87646484375, 6.2291259765625, 6.581787109375, 6.9344482421875, 7.287109375, 7.6397705078125, 7.992431640625, 8.3450927734375, 8.69775390625, 9.0504150390625, 9.403076171875, 9.7557373046875, 10.1083984375, 10.4610595703125, 10.813720703125, 11.1663818359375, 11.51904296875, 11.8717041015625, 12.224365234375, 12.5770263671875, 12.9296875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 6.0, 8.0, 21.0, 34.0, 67.0, 114.0, 193.0, 198.0, 158.0, 94.0, 50.0, 28.0, 18.0, 7.0, 7.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.35716247558594, -71.17179870605469, -67.98644256591797, -64.80107879638672, -61.615718841552734, -58.43035888671875, -55.2449951171875, -52.059635162353516, -48.87427520751953, -45.68891525268555, -42.50355529785156, -39.31819152832031, -36.13283157348633, -32.947471618652344, -29.762109756469727, -26.57674789428711, -23.391387939453125, -20.20602798461914, -17.020666122436523, -13.835305213928223, -10.649944305419922, -7.464583396911621, -4.27922248840332, -1.0938606262207031, 2.0914993286132812, 5.276860237121582, 8.462221145629883, 11.647582054138184, 14.832942962646484, 18.01830291748047, 21.203664779663086, 24.389026641845703, 27.574386596679688, 30.759746551513672, 33.945106506347656, 37.130470275878906, 40.31583023071289, 43.501190185546875, 46.686553955078125, 49.87191390991211, 53.057273864746094, 56.24263381958008, 59.42799377441406, 62.61335754394531, 65.79872131347656, 68.98407745361328, 72.16944122314453, 75.35479736328125, 78.5401611328125, 81.72552490234375, 84.91088104248047, 88.09624481201172, 91.28160095214844, 94.46696472167969, 97.65232849121094, 100.83769226074219, 104.0230484008789, 107.20841217041016, 110.39376831054688, 113.57913208007812, 116.76449584960938, 119.9498519897461, 123.13521575927734, 126.32057189941406, 129.5059356689453]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 7.0, 8.0, 6.0, 5.0, 7.0, 11.0, 15.0, 14.0, 15.0, 15.0, 16.0, 29.0, 20.0, 43.0, 35.0, 54.0, 45.0, 55.0, 40.0, 60.0, 51.0, 42.0, 57.0, 50.0, 48.0, 39.0, 36.0, 26.0, 28.0, 28.0, 24.0, 20.0, 8.0, 15.0, 11.0, 5.0, 7.0, 5.0, 4.0, 0.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-54.42919921875, -52.488861083984375, -50.54852294921875, -48.60818099975586, -46.667842864990234, -44.72750473022461, -42.78716278076172, -40.846824645996094, -38.90648651123047, -36.966148376464844, -35.02581024169922, -33.08546829223633, -31.145130157470703, -29.204792022705078, -27.26445198059082, -25.324111938476562, -23.383773803710938, -21.443435668945312, -19.503095626831055, -17.562755584716797, -15.622417449951172, -13.68207836151123, -11.741739273071289, -9.801400184631348, -7.861061096191406, -5.920722007751465, -3.9803829193115234, -2.040043830871582, -0.09970474243164062, 1.8406343460083008, 3.780973434448242, 5.721312522888184, 7.661651611328125, 9.601990699768066, 11.542329788208008, 13.48266887664795, 15.42300796508789, 17.363346099853516, 19.303686141967773, 21.24402618408203, 23.184364318847656, 25.12470245361328, 27.06504249572754, 29.005382537841797, 30.945720672607422, 32.88605880737305, 34.82640075683594, 36.76673889160156, 38.70707702636719, 40.64741516113281, 42.58775329589844, 44.52809524536133, 46.46843338012695, 48.40877151489258, 50.34911346435547, 52.289451599121094, 54.22978973388672, 56.170127868652344, 58.11046600341797, 60.05080795288086, 61.991146087646484, 63.93148422241211, 65.871826171875, 67.81216430664062, 69.75250244140625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 3.0, 9.0, 0.0, 8.0, 9.0, 10.0, 18.0, 24.0, 32.0, 46.0, 66.0, 124.0, 186.0, 279.0, 520.0, 1051.0, 2066.0, 5417.0, 15865.0, 72571.0, 3311046.0, 718130.0, 47210.0, 12030.0, 4006.0, 1668.0, 812.0, 436.0, 209.0, 134.0, 95.0, 60.0, 46.0, 30.0, 26.0, 15.0, 8.0, 10.0, 6.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.359375, -9.023681640625, -8.68798828125, -8.352294921875, -8.0166015625, -7.680908203125, -7.34521484375, -7.009521484375, -6.673828125, -6.338134765625, -6.00244140625, -5.666748046875, -5.3310546875, -4.995361328125, -4.65966796875, -4.323974609375, -3.98828125, -3.652587890625, -3.31689453125, -2.981201171875, -2.6455078125, -2.309814453125, -1.97412109375, -1.638427734375, -1.302734375, -0.967041015625, -0.63134765625, -0.295654296875, 0.0400390625, 0.375732421875, 0.71142578125, 1.047119140625, 1.3828125, 1.718505859375, 2.05419921875, 2.389892578125, 2.7255859375, 3.061279296875, 3.39697265625, 3.732666015625, 4.068359375, 4.404052734375, 4.73974609375, 5.075439453125, 5.4111328125, 5.746826171875, 6.08251953125, 6.418212890625, 6.75390625, 7.089599609375, 7.42529296875, 7.760986328125, 8.0966796875, 8.432373046875, 8.76806640625, 9.103759765625, 9.439453125, 9.775146484375, 10.11083984375, 10.446533203125, 10.7822265625, 11.117919921875, 11.45361328125, 11.789306640625, 12.125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 12.0, 7.0, 4.0, 15.0, 16.0, 11.0, 20.0, 30.0, 26.0, 32.0, 21.0, 38.0, 46.0, 56.0, 50.0, 51.0, 51.0, 52.0, 59.0, 46.0, 52.0, 48.0, 39.0, 43.0, 26.0, 29.0, 26.0, 20.0, 16.0, 16.0, 11.0, 8.0, 10.0, 6.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.435546875, -2.354461669921875, -2.27337646484375, -2.192291259765625, -2.1112060546875, -2.030120849609375, -1.94903564453125, -1.867950439453125, -1.786865234375, -1.705780029296875, -1.62469482421875, -1.543609619140625, -1.4625244140625, -1.381439208984375, -1.30035400390625, -1.219268798828125, -1.13818359375, -1.057098388671875, -0.97601318359375, -0.894927978515625, -0.8138427734375, -0.732757568359375, -0.65167236328125, -0.570587158203125, -0.489501953125, -0.408416748046875, -0.32733154296875, -0.246246337890625, -0.1651611328125, -0.084075927734375, -0.00299072265625, 0.078094482421875, 0.1591796875, 0.240264892578125, 0.32135009765625, 0.402435302734375, 0.4835205078125, 0.564605712890625, 0.64569091796875, 0.726776123046875, 0.807861328125, 0.888946533203125, 0.97003173828125, 1.051116943359375, 1.1322021484375, 1.213287353515625, 1.29437255859375, 1.375457763671875, 1.45654296875, 1.537628173828125, 1.61871337890625, 1.699798583984375, 1.7808837890625, 1.861968994140625, 1.94305419921875, 2.024139404296875, 2.105224609375, 2.186309814453125, 2.26739501953125, 2.348480224609375, 2.4295654296875, 2.510650634765625, 2.59173583984375, 2.672821044921875, 2.75390625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 3.0, 5.0, 0.0, 8.0, 17.0, 22.0, 32.0, 35.0, 46.0, 88.0, 120.0, 237.0, 409.0, 958.0, 2386.0, 9952.0, 103256.0, 3937501.0, 123785.0, 10727.0, 2685.0, 956.0, 422.0, 233.0, 142.0, 79.0, 56.0, 35.0, 30.0, 18.0, 19.0, 9.0, 5.0, 4.0, 4.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.59375, -15.09912109375, -14.6044921875, -14.10986328125, -13.615234375, -13.12060546875, -12.6259765625, -12.13134765625, -11.63671875, -11.14208984375, -10.6474609375, -10.15283203125, -9.658203125, -9.16357421875, -8.6689453125, -8.17431640625, -7.6796875, -7.18505859375, -6.6904296875, -6.19580078125, -5.701171875, -5.20654296875, -4.7119140625, -4.21728515625, -3.72265625, -3.22802734375, -2.7333984375, -2.23876953125, -1.744140625, -1.24951171875, -0.7548828125, -0.26025390625, 0.234375, 0.72900390625, 1.2236328125, 1.71826171875, 2.212890625, 2.70751953125, 3.2021484375, 3.69677734375, 4.19140625, 4.68603515625, 5.1806640625, 5.67529296875, 6.169921875, 6.66455078125, 7.1591796875, 7.65380859375, 8.1484375, 8.64306640625, 9.1376953125, 9.63232421875, 10.126953125, 10.62158203125, 11.1162109375, 11.61083984375, 12.10546875, 12.60009765625, 13.0947265625, 13.58935546875, 14.083984375, 14.57861328125, 15.0732421875, 15.56787109375, 16.0625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 5.0, 9.0, 11.0, 22.0, 47.0, 82.0, 389.0, 2925.0, 413.0, 103.0, 39.0, 18.0, 7.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.890625, -8.5421142578125, -8.193603515625, -7.8450927734375, -7.49658203125, -7.1480712890625, -6.799560546875, -6.4510498046875, -6.1025390625, -5.7540283203125, -5.405517578125, -5.0570068359375, -4.70849609375, -4.3599853515625, -4.011474609375, -3.6629638671875, -3.314453125, -2.9659423828125, -2.617431640625, -2.2689208984375, -1.92041015625, -1.5718994140625, -1.223388671875, -0.8748779296875, -0.5263671875, -0.1778564453125, 0.170654296875, 0.5191650390625, 0.86767578125, 1.2161865234375, 1.564697265625, 1.9132080078125, 2.26171875, 2.6102294921875, 2.958740234375, 3.3072509765625, 3.65576171875, 4.0042724609375, 4.352783203125, 4.7012939453125, 5.0498046875, 5.3983154296875, 5.746826171875, 6.0953369140625, 6.44384765625, 6.7923583984375, 7.140869140625, 7.4893798828125, 7.837890625, 8.1864013671875, 8.534912109375, 8.8834228515625, 9.23193359375, 9.5804443359375, 9.928955078125, 10.2774658203125, 10.6259765625, 10.9744873046875, 11.322998046875, 11.6715087890625, 12.02001953125, 12.3685302734375, 12.717041015625, 13.0655517578125, 13.4140625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 4.0, 5.0, 6.0, 7.0, 13.0, 20.0, 44.0, 39.0, 69.0, 104.0, 118.0, 129.0, 119.0, 93.0, 69.0, 43.0, 39.0, 25.0, 15.0, 7.0, 9.0, 6.0, 6.0, 4.0, 1.0, 2.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.337881088256836, -12.686314582824707, -12.034748077392578, -11.38318157196045, -10.73161506652832, -10.080049514770508, -9.428483009338379, -8.77691650390625, -8.125349998474121, -7.473783493041992, -6.822216987609863, -6.170650959014893, -5.519084453582764, -4.867517948150635, -4.215951919555664, -3.564385414123535, -2.9128189086914062, -2.2612524032592773, -1.6096861362457275, -0.9581197500228882, -0.30655336380004883, 0.3450131416320801, 0.9965794086456299, 1.6481456756591797, 2.2997121810913086, 2.9512786865234375, 3.6028449535369873, 4.254411220550537, 4.905977725982666, 5.557544231414795, 6.209110260009766, 6.8606767654418945, 7.512243270874023, 8.163809776306152, 8.815376281738281, 9.46694278717041, 10.118509292602539, 10.770074844360352, 11.42164134979248, 12.07320785522461, 12.724774360656738, 13.376340866088867, 14.027907371520996, 14.679473876953125, 15.331039428710938, 15.982606887817383, 16.634172439575195, 17.28573989868164, 17.937305450439453, 18.588871002197266, 19.24043846130371, 19.892004013061523, 20.54357147216797, 21.19513702392578, 21.846704483032227, 22.49827003479004, 23.149837493896484, 23.801403045654297, 24.452970504760742, 25.104536056518555, 25.756103515625, 26.407669067382812, 27.059236526489258, 27.71080207824707, 28.362367630004883]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 6.0, 1.0, 2.0, 4.0, 6.0, 5.0, 3.0, 8.0, 10.0, 12.0, 10.0, 19.0, 20.0, 26.0, 22.0, 33.0, 33.0, 35.0, 25.0, 39.0, 29.0, 40.0, 47.0, 42.0, 38.0, 41.0, 49.0, 28.0, 35.0, 29.0, 33.0, 34.0, 35.0, 34.0, 24.0, 21.0, 28.0, 18.0, 16.0, 11.0, 12.0, 10.0, 8.0, 7.0, 9.0, 4.0, 6.0, 0.0, 5.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-16.175437927246094, -15.715279579162598, -15.255121231079102, -14.794962882995605, -14.33480453491211, -13.874646186828613, -13.414487838745117, -12.954328536987305, -12.494171142578125, -12.034012794494629, -11.573854446411133, -11.113696098327637, -10.65353775024414, -10.193379402160645, -9.733221054077148, -9.273061752319336, -8.81290340423584, -8.352745056152344, -7.892586708068848, -7.432428359985352, -6.9722700119018555, -6.512111663818359, -6.051952838897705, -5.591794490814209, -5.131636142730713, -4.671477794647217, -4.211319446563721, -3.7511608600616455, -3.2910025119781494, -2.8308441638946533, -2.370685577392578, -1.910527229309082, -1.4503679275512695, -0.9902095198631287, -0.5300511121749878, -0.06989264488220215, 0.39026570320129395, 0.85042405128479, 1.3105826377868652, 1.7707409858703613, 2.2308993339538574, 2.6910576820373535, 3.1512160301208496, 3.611374616622925, 4.071533203125, 4.531691551208496, 4.991849899291992, 5.452008247375488, 5.912166595458984, 6.3723249435424805, 6.832483291625977, 7.292641639709473, 7.752799987792969, 8.212958335876465, 8.673116683959961, 9.133275985717773, 9.593433380126953, 10.05359172821045, 10.513750076293945, 10.973908424377441, 11.434066772460938, 11.894225120544434, 12.35438346862793, 12.814542770385742, 13.274701118469238]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 4.0, 10.0, 11.0, 10.0, 19.0, 27.0, 40.0, 55.0, 84.0, 139.0, 205.0, 291.0, 504.0, 691.0, 1169.0, 2009.0, 3325.0, 5885.0, 10305.0, 19569.0, 38027.0, 79786.0, 165158.0, 263119.0, 224439.0, 117599.0, 55320.0, 27624.0, 14355.0, 7745.0, 4435.0, 2491.0, 1514.0, 899.0, 607.0, 378.0, 256.0, 143.0, 94.0, 68.0, 59.0, 29.0, 19.0, 20.0, 8.0, 9.0, 3.0, 1.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.97265625, -4.82086181640625, -4.6690673828125, -4.51727294921875, -4.365478515625, -4.21368408203125, -4.0618896484375, -3.91009521484375, -3.75830078125, -3.60650634765625, -3.4547119140625, -3.30291748046875, -3.151123046875, -2.99932861328125, -2.8475341796875, -2.69573974609375, -2.5439453125, -2.39215087890625, -2.2403564453125, -2.08856201171875, -1.936767578125, -1.78497314453125, -1.6331787109375, -1.48138427734375, -1.32958984375, -1.17779541015625, -1.0260009765625, -0.87420654296875, -0.722412109375, -0.57061767578125, -0.4188232421875, -0.26702880859375, -0.115234375, 0.03656005859375, 0.1883544921875, 0.34014892578125, 0.491943359375, 0.64373779296875, 0.7955322265625, 0.94732666015625, 1.09912109375, 1.25091552734375, 1.4027099609375, 1.55450439453125, 1.706298828125, 1.85809326171875, 2.0098876953125, 2.16168212890625, 2.3134765625, 2.46527099609375, 2.6170654296875, 2.76885986328125, 2.920654296875, 3.07244873046875, 3.2242431640625, 3.37603759765625, 3.52783203125, 3.67962646484375, 3.8314208984375, 3.98321533203125, 4.135009765625, 4.28680419921875, 4.4385986328125, 4.59039306640625, 4.7421875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 5.0, 10.0, 7.0, 10.0, 18.0, 15.0, 15.0, 21.0, 30.0, 30.0, 30.0, 33.0, 45.0, 42.0, 49.0, 54.0, 40.0, 52.0, 53.0, 52.0, 53.0, 46.0, 38.0, 38.0, 41.0, 25.0, 21.0, 25.0, 19.0, 17.0, 14.0, 9.0, 10.0, 11.0, 6.0, 3.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6015625, -2.521453857421875, -2.44134521484375, -2.361236572265625, -2.2811279296875, -2.201019287109375, -2.12091064453125, -2.040802001953125, -1.960693359375, -1.880584716796875, -1.80047607421875, -1.720367431640625, -1.6402587890625, -1.560150146484375, -1.48004150390625, -1.399932861328125, -1.31982421875, -1.239715576171875, -1.15960693359375, -1.079498291015625, -0.9993896484375, -0.919281005859375, -0.83917236328125, -0.759063720703125, -0.678955078125, -0.598846435546875, -0.51873779296875, -0.438629150390625, -0.3585205078125, -0.278411865234375, -0.19830322265625, -0.118194580078125, -0.0380859375, 0.042022705078125, 0.12213134765625, 0.202239990234375, 0.2823486328125, 0.362457275390625, 0.44256591796875, 0.522674560546875, 0.602783203125, 0.682891845703125, 0.76300048828125, 0.843109130859375, 0.9232177734375, 1.003326416015625, 1.08343505859375, 1.163543701171875, 1.24365234375, 1.323760986328125, 1.40386962890625, 1.483978271484375, 1.5640869140625, 1.644195556640625, 1.72430419921875, 1.804412841796875, 1.884521484375, 1.964630126953125, 2.04473876953125, 2.124847412109375, 2.2049560546875, 2.285064697265625, 2.36517333984375, 2.445281982421875, 2.525390625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 9.0, 9.0, 10.0, 12.0, 15.0, 18.0, 24.0, 28.0, 53.0, 84.0, 116.0, 205.0, 334.0, 734.0, 1496.0, 3593.0, 9453.0, 29647.0, 111071.0, 417815.0, 349195.0, 86831.0, 24032.0, 7968.0, 3036.0, 1338.0, 580.0, 329.0, 160.0, 105.0, 78.0, 46.0, 42.0, 28.0, 19.0, 18.0, 9.0, 4.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.8359375, -7.573974609375, -7.31201171875, -7.050048828125, -6.7880859375, -6.526123046875, -6.26416015625, -6.002197265625, -5.740234375, -5.478271484375, -5.21630859375, -4.954345703125, -4.6923828125, -4.430419921875, -4.16845703125, -3.906494140625, -3.64453125, -3.382568359375, -3.12060546875, -2.858642578125, -2.5966796875, -2.334716796875, -2.07275390625, -1.810791015625, -1.548828125, -1.286865234375, -1.02490234375, -0.762939453125, -0.5009765625, -0.239013671875, 0.02294921875, 0.284912109375, 0.546875, 0.808837890625, 1.07080078125, 1.332763671875, 1.5947265625, 1.856689453125, 2.11865234375, 2.380615234375, 2.642578125, 2.904541015625, 3.16650390625, 3.428466796875, 3.6904296875, 3.952392578125, 4.21435546875, 4.476318359375, 4.73828125, 5.000244140625, 5.26220703125, 5.524169921875, 5.7861328125, 6.048095703125, 6.31005859375, 6.572021484375, 6.833984375, 7.095947265625, 7.35791015625, 7.619873046875, 7.8818359375, 8.143798828125, 8.40576171875, 8.667724609375, 8.9296875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 7.0, 10.0, 14.0, 12.0, 18.0, 15.0, 23.0, 27.0, 22.0, 36.0, 47.0, 40.0, 42.0, 55.0, 42.0, 50.0, 54.0, 56.0, 48.0, 48.0, 59.0, 36.0, 41.0, 30.0, 29.0, 28.0, 21.0, 17.0, 18.0, 16.0, 3.0, 12.0, 11.0, 4.0, 1.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.2890625, -14.8214111328125, -14.353759765625, -13.8861083984375, -13.41845703125, -12.9508056640625, -12.483154296875, -12.0155029296875, -11.5478515625, -11.0802001953125, -10.612548828125, -10.1448974609375, -9.67724609375, -9.2095947265625, -8.741943359375, -8.2742919921875, -7.806640625, -7.3389892578125, -6.871337890625, -6.4036865234375, -5.93603515625, -5.4683837890625, -5.000732421875, -4.5330810546875, -4.0654296875, -3.5977783203125, -3.130126953125, -2.6624755859375, -2.19482421875, -1.7271728515625, -1.259521484375, -0.7918701171875, -0.32421875, 0.1434326171875, 0.611083984375, 1.0787353515625, 1.54638671875, 2.0140380859375, 2.481689453125, 2.9493408203125, 3.4169921875, 3.8846435546875, 4.352294921875, 4.8199462890625, 5.28759765625, 5.7552490234375, 6.222900390625, 6.6905517578125, 7.158203125, 7.6258544921875, 8.093505859375, 8.5611572265625, 9.02880859375, 9.4964599609375, 9.964111328125, 10.4317626953125, 10.8994140625, 11.3670654296875, 11.834716796875, 12.3023681640625, 12.77001953125, 13.2376708984375, 13.705322265625, 14.1729736328125, 14.640625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 2.0, 5.0, 7.0, 4.0, 17.0, 13.0, 14.0, 42.0, 29.0, 61.0, 87.0, 122.0, 180.0, 282.0, 502.0, 937.0, 2255.0, 6155.0, 22095.0, 106468.0, 451488.0, 357360.0, 75123.0, 16424.0, 4856.0, 1848.0, 905.0, 425.0, 272.0, 172.0, 116.0, 84.0, 45.0, 34.0, 39.0, 18.0, 14.0, 9.0, 9.0, 7.0, 6.0, 6.0, 5.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.751953125, -3.622100830078125, -3.49224853515625, -3.362396240234375, -3.2325439453125, -3.102691650390625, -2.97283935546875, -2.842987060546875, -2.713134765625, -2.583282470703125, -2.45343017578125, -2.323577880859375, -2.1937255859375, -2.063873291015625, -1.93402099609375, -1.804168701171875, -1.67431640625, -1.544464111328125, -1.41461181640625, -1.284759521484375, -1.1549072265625, -1.025054931640625, -0.89520263671875, -0.765350341796875, -0.635498046875, -0.505645751953125, -0.37579345703125, -0.245941162109375, -0.1160888671875, 0.013763427734375, 0.14361572265625, 0.273468017578125, 0.4033203125, 0.533172607421875, 0.66302490234375, 0.792877197265625, 0.9227294921875, 1.052581787109375, 1.18243408203125, 1.312286376953125, 1.442138671875, 1.571990966796875, 1.70184326171875, 1.831695556640625, 1.9615478515625, 2.091400146484375, 2.22125244140625, 2.351104736328125, 2.48095703125, 2.610809326171875, 2.74066162109375, 2.870513916015625, 3.0003662109375, 3.130218505859375, 3.26007080078125, 3.389923095703125, 3.519775390625, 3.649627685546875, 3.77947998046875, 3.909332275390625, 4.0391845703125, 4.169036865234375, 4.29888916015625, 4.428741455078125, 4.55859375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 2.0, 3.0, 4.0, 2.0, 8.0, 8.0, 20.0, 25.0, 18.0, 40.0, 39.0, 55.0, 75.0, 63.0, 85.0, 82.0, 84.0, 78.0, 65.0, 61.0, 39.0, 43.0, 26.0, 24.0, 17.0, 8.0, 7.0, 6.0, 7.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.0008087158203125, -0.0007883831858634949, -0.0007680505514144897, -0.0007477179169654846, -0.0007273852825164795, -0.0007070526480674744, -0.0006867200136184692, -0.0006663873791694641, -0.000646054744720459, -0.0006257221102714539, -0.0006053894758224487, -0.0005850568413734436, -0.0005647242069244385, -0.0005443915724754333, -0.0005240589380264282, -0.0005037263035774231, -0.00048339366912841797, -0.00046306103467941284, -0.0004427284002304077, -0.0004223957657814026, -0.00040206313133239746, -0.00038173049688339233, -0.0003613978624343872, -0.0003410652279853821, -0.00032073259353637695, -0.0003003999590873718, -0.0002800673246383667, -0.00025973469018936157, -0.00023940205574035645, -0.00021906942129135132, -0.0001987367868423462, -0.00017840415239334106, -0.00015807151794433594, -0.0001377388834953308, -0.00011740624904632568, -9.707361459732056e-05, -7.674098014831543e-05, -5.64083456993103e-05, -3.6075711250305176e-05, -1.574307680130005e-05, 4.589557647705078e-06, 2.4922192096710205e-05, 4.525482654571533e-05, 6.558746099472046e-05, 8.592009544372559e-05, 0.00010625272989273071, 0.00012658536434173584, 0.00014691799879074097, 0.0001672506332397461, 0.00018758326768875122, 0.00020791590213775635, 0.00022824853658676147, 0.0002485811710357666, 0.00026891380548477173, 0.00028924643993377686, 0.000309579074382782, 0.0003299117088317871, 0.00035024434328079224, 0.00037057697772979736, 0.0003909096121788025, 0.0004112422466278076, 0.00043157488107681274, 0.00045190751552581787, 0.000472240149974823, 0.0004925727844238281]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 0.0, 0.0, 4.0, 4.0, 4.0, 3.0, 2.0, 3.0, 6.0, 15.0, 12.0, 18.0, 29.0, 34.0, 58.0, 73.0, 136.0, 265.0, 376.0, 659.0, 1315.0, 3048.0, 7853.0, 25831.0, 97221.0, 331244.0, 398133.0, 130851.0, 33977.0, 10110.0, 3658.0, 1645.0, 819.0, 421.0, 283.0, 141.0, 109.0, 62.0, 40.0, 33.0, 18.0, 13.0, 8.0, 7.0, 5.0, 3.0, 5.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.05859375, -3.939605712890625, -3.82061767578125, -3.701629638671875, -3.5826416015625, -3.463653564453125, -3.34466552734375, -3.225677490234375, -3.106689453125, -2.987701416015625, -2.86871337890625, -2.749725341796875, -2.6307373046875, -2.511749267578125, -2.39276123046875, -2.273773193359375, -2.15478515625, -2.035797119140625, -1.91680908203125, -1.797821044921875, -1.6788330078125, -1.559844970703125, -1.44085693359375, -1.321868896484375, -1.202880859375, -1.083892822265625, -0.96490478515625, -0.845916748046875, -0.7269287109375, -0.607940673828125, -0.48895263671875, -0.369964599609375, -0.2509765625, -0.131988525390625, -0.01300048828125, 0.105987548828125, 0.2249755859375, 0.343963623046875, 0.46295166015625, 0.581939697265625, 0.700927734375, 0.819915771484375, 0.93890380859375, 1.057891845703125, 1.1768798828125, 1.295867919921875, 1.41485595703125, 1.533843994140625, 1.65283203125, 1.771820068359375, 1.89080810546875, 2.009796142578125, 2.1287841796875, 2.247772216796875, 2.36676025390625, 2.485748291015625, 2.604736328125, 2.723724365234375, 2.84271240234375, 2.961700439453125, 3.0806884765625, 3.199676513671875, 3.31866455078125, 3.437652587890625, 3.556640625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 1.0, 4.0, 7.0, 10.0, 7.0, 10.0, 16.0, 31.0, 36.0, 42.0, 61.0, 66.0, 83.0, 96.0, 105.0, 102.0, 84.0, 55.0, 52.0, 46.0, 32.0, 14.0, 18.0, 6.0, 8.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.453125, -4.26031494140625, -4.0675048828125, -3.87469482421875, -3.681884765625, -3.48907470703125, -3.2962646484375, -3.10345458984375, -2.91064453125, -2.71783447265625, -2.5250244140625, -2.33221435546875, -2.139404296875, -1.94659423828125, -1.7537841796875, -1.56097412109375, -1.3681640625, -1.17535400390625, -0.9825439453125, -0.78973388671875, -0.596923828125, -0.40411376953125, -0.2113037109375, -0.01849365234375, 0.17431640625, 0.36712646484375, 0.5599365234375, 0.75274658203125, 0.945556640625, 1.13836669921875, 1.3311767578125, 1.52398681640625, 1.716796875, 1.90960693359375, 2.1024169921875, 2.29522705078125, 2.488037109375, 2.68084716796875, 2.8736572265625, 3.06646728515625, 3.25927734375, 3.45208740234375, 3.6448974609375, 3.83770751953125, 4.030517578125, 4.22332763671875, 4.4161376953125, 4.60894775390625, 4.8017578125, 4.99456787109375, 5.1873779296875, 5.38018798828125, 5.572998046875, 5.76580810546875, 5.9586181640625, 6.15142822265625, 6.34423828125, 6.53704833984375, 6.7298583984375, 6.92266845703125, 7.115478515625, 7.30828857421875, 7.5010986328125, 7.69390869140625, 7.88671875]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 7.0, 4.0, 6.0, 12.0, 13.0, 38.0, 107.0, 130.0, 214.0, 201.0, 107.0, 80.0, 37.0, 29.0, 12.0, 9.0, 4.0, 4.0, 2.0], "bins": [-167.0768585205078, -163.9799041748047, -160.88294982910156, -157.78599548339844, -154.6890411376953, -151.59207153320312, -148.4951171875, -145.39816284179688, -142.30120849609375, -139.20425415039062, -136.1072998046875, -133.01034545898438, -129.91339111328125, -126.8164291381836, -123.71947479248047, -120.62251281738281, -117.52555847167969, -114.42860412597656, -111.33164978027344, -108.23468780517578, -105.13773345947266, -102.04077911376953, -98.9438247680664, -95.84686279296875, -92.74991607666016, -89.65296173095703, -86.5560073852539, -83.45904541015625, -80.36209106445312, -77.26513671875, -74.16818237304688, -71.07122802734375, -67.9742660522461, -64.87731170654297, -61.78035354614258, -58.68339920043945, -55.58644104003906, -52.48948669433594, -49.39253234863281, -46.29557418823242, -43.1986198425293, -40.10166549682617, -37.00470733642578, -33.907752990722656, -30.810794830322266, -27.71384048461914, -24.616884231567383, -21.519927978515625, -18.422971725463867, -15.32601547241211, -12.229059219360352, -9.13210391998291, -6.035147666931152, -2.9381914138793945, 0.15876388549804688, 3.2557201385498047, 6.3526763916015625, 9.44963264465332, 12.546588897705078, 15.64354419708252, 18.740501403808594, 21.83745574951172, 24.934412002563477, 28.031368255615234, 31.128324508666992]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 4.0, 10.0, 9.0, 16.0, 10.0, 12.0, 18.0, 21.0, 18.0, 31.0, 34.0, 39.0, 33.0, 36.0, 55.0, 50.0, 53.0, 58.0, 48.0, 37.0, 51.0, 43.0, 46.0, 32.0, 37.0, 35.0, 30.0, 25.0, 21.0, 17.0, 10.0, 8.0, 8.0, 19.0, 5.0, 8.0, 3.0, 6.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.867942810058594, -60.53141784667969, -58.19489288330078, -55.858367919921875, -53.52184295654297, -51.18531799316406, -48.84879684448242, -46.512271881103516, -44.17574691772461, -41.8392219543457, -39.5026969909668, -37.16617202758789, -34.82965087890625, -32.493125915527344, -30.156600952148438, -27.82007598876953, -25.483551025390625, -23.14702606201172, -20.810501098632812, -18.47397804260254, -16.137453079223633, -13.800928115844727, -11.464404106140137, -9.127880096435547, -6.791355133056641, -4.454830646514893, -2.1183061599731445, 0.21821832656860352, 2.5547428131103516, 4.891267776489258, 7.227791786193848, 9.564315795898438, 11.900848388671875, 14.237373352050781, 16.573898315429688, 18.91042137145996, 21.246946334838867, 23.583471298217773, 25.919994354248047, 28.256519317626953, 30.59304428100586, 32.929569244384766, 35.26609420776367, 37.60261917114258, 39.93914031982422, 42.275665283203125, 44.61219024658203, 46.94871520996094, 49.285240173339844, 51.62176513671875, 53.958290100097656, 56.29481506347656, 58.63134002685547, 60.967864990234375, 63.304386138916016, 65.64091491699219, 67.97743225097656, 70.31395721435547, 72.65048217773438, 74.98700714111328, 77.32353210449219, 79.6600570678711, 81.99658203125, 84.33309936523438, 86.66963195800781]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 8.0, 4.0, 6.0, 4.0, 9.0, 16.0, 27.0, 45.0, 42.0, 77.0, 97.0, 132.0, 231.0, 330.0, 585.0, 994.0, 1932.0, 4167.0, 9585.0, 31188.0, 259536.0, 3791520.0, 66310.0, 15477.0, 5885.0, 2685.0, 1414.0, 759.0, 440.0, 248.0, 156.0, 104.0, 87.0, 62.0, 40.0, 20.0, 18.0, 17.0, 10.0, 6.0, 8.0, 2.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.80859375, -6.55853271484375, -6.3084716796875, -6.05841064453125, -5.808349609375, -5.55828857421875, -5.3082275390625, -5.05816650390625, -4.80810546875, -4.55804443359375, -4.3079833984375, -4.05792236328125, -3.807861328125, -3.55780029296875, -3.3077392578125, -3.05767822265625, -2.8076171875, -2.55755615234375, -2.3074951171875, -2.05743408203125, -1.807373046875, -1.55731201171875, -1.3072509765625, -1.05718994140625, -0.80712890625, -0.55706787109375, -0.3070068359375, -0.05694580078125, 0.193115234375, 0.44317626953125, 0.6932373046875, 0.94329833984375, 1.193359375, 1.44342041015625, 1.6934814453125, 1.94354248046875, 2.193603515625, 2.44366455078125, 2.6937255859375, 2.94378662109375, 3.19384765625, 3.44390869140625, 3.6939697265625, 3.94403076171875, 4.194091796875, 4.44415283203125, 4.6942138671875, 4.94427490234375, 5.1943359375, 5.44439697265625, 5.6944580078125, 5.94451904296875, 6.194580078125, 6.44464111328125, 6.6947021484375, 6.94476318359375, 7.19482421875, 7.44488525390625, 7.6949462890625, 7.94500732421875, 8.195068359375, 8.44512939453125, 8.6951904296875, 8.94525146484375, 9.1953125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 5.0, 1.0, 3.0, 5.0, 7.0, 6.0, 5.0, 10.0, 9.0, 12.0, 13.0, 21.0, 29.0, 23.0, 28.0, 33.0, 37.0, 30.0, 46.0, 35.0, 52.0, 44.0, 58.0, 54.0, 44.0, 52.0, 40.0, 44.0, 44.0, 47.0, 28.0, 25.0, 26.0, 15.0, 18.0, 15.0, 12.0, 7.0, 6.0, 6.0, 3.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.8828125, -2.7855224609375, -2.688232421875, -2.5909423828125, -2.49365234375, -2.3963623046875, -2.299072265625, -2.2017822265625, -2.1044921875, -2.0072021484375, -1.909912109375, -1.8126220703125, -1.71533203125, -1.6180419921875, -1.520751953125, -1.4234619140625, -1.326171875, -1.2288818359375, -1.131591796875, -1.0343017578125, -0.93701171875, -0.8397216796875, -0.742431640625, -0.6451416015625, -0.5478515625, -0.4505615234375, -0.353271484375, -0.2559814453125, -0.15869140625, -0.0614013671875, 0.035888671875, 0.1331787109375, 0.23046875, 0.3277587890625, 0.425048828125, 0.5223388671875, 0.61962890625, 0.7169189453125, 0.814208984375, 0.9114990234375, 1.0087890625, 1.1060791015625, 1.203369140625, 1.3006591796875, 1.39794921875, 1.4952392578125, 1.592529296875, 1.6898193359375, 1.787109375, 1.8843994140625, 1.981689453125, 2.0789794921875, 2.17626953125, 2.2735595703125, 2.370849609375, 2.4681396484375, 2.5654296875, 2.6627197265625, 2.760009765625, 2.8572998046875, 2.95458984375, 3.0518798828125, 3.149169921875, 3.2464599609375, 3.34375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 5.0, 7.0, 6.0, 20.0, 20.0, 26.0, 27.0, 22.0, 33.0, 45.0, 57.0, 65.0, 121.0, 167.0, 256.0, 417.0, 720.0, 1442.0, 3083.0, 9955.0, 71493.0, 3935592.0, 147868.0, 14586.0, 4128.0, 1702.0, 910.0, 521.0, 303.0, 173.0, 129.0, 84.0, 54.0, 51.0, 29.0, 42.0, 31.0, 18.0, 18.0, 13.0, 12.0, 9.0, 4.0, 6.0, 7.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.6875, -11.31787109375, -10.9482421875, -10.57861328125, -10.208984375, -9.83935546875, -9.4697265625, -9.10009765625, -8.73046875, -8.36083984375, -7.9912109375, -7.62158203125, -7.251953125, -6.88232421875, -6.5126953125, -6.14306640625, -5.7734375, -5.40380859375, -5.0341796875, -4.66455078125, -4.294921875, -3.92529296875, -3.5556640625, -3.18603515625, -2.81640625, -2.44677734375, -2.0771484375, -1.70751953125, -1.337890625, -0.96826171875, -0.5986328125, -0.22900390625, 0.140625, 0.51025390625, 0.8798828125, 1.24951171875, 1.619140625, 1.98876953125, 2.3583984375, 2.72802734375, 3.09765625, 3.46728515625, 3.8369140625, 4.20654296875, 4.576171875, 4.94580078125, 5.3154296875, 5.68505859375, 6.0546875, 6.42431640625, 6.7939453125, 7.16357421875, 7.533203125, 7.90283203125, 8.2724609375, 8.64208984375, 9.01171875, 9.38134765625, 9.7509765625, 10.12060546875, 10.490234375, 10.85986328125, 11.2294921875, 11.59912109375, 11.96875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 10.0, 13.0, 39.0, 144.0, 2664.0, 975.0, 123.0, 46.0, 22.0, 15.0, 5.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.431640625, -2.320831298828125, -2.21002197265625, -2.099212646484375, -1.9884033203125, -1.877593994140625, -1.76678466796875, -1.655975341796875, -1.545166015625, -1.434356689453125, -1.32354736328125, -1.212738037109375, -1.1019287109375, -0.991119384765625, -0.88031005859375, -0.769500732421875, -0.65869140625, -0.547882080078125, -0.43707275390625, -0.326263427734375, -0.2154541015625, -0.104644775390625, 0.00616455078125, 0.116973876953125, 0.227783203125, 0.338592529296875, 0.44940185546875, 0.560211181640625, 0.6710205078125, 0.781829833984375, 0.89263916015625, 1.003448486328125, 1.1142578125, 1.225067138671875, 1.33587646484375, 1.446685791015625, 1.5574951171875, 1.668304443359375, 1.77911376953125, 1.889923095703125, 2.000732421875, 2.111541748046875, 2.22235107421875, 2.333160400390625, 2.4439697265625, 2.554779052734375, 2.66558837890625, 2.776397705078125, 2.88720703125, 2.998016357421875, 3.10882568359375, 3.219635009765625, 3.3304443359375, 3.441253662109375, 3.55206298828125, 3.662872314453125, 3.773681640625, 3.884490966796875, 3.99530029296875, 4.106109619140625, 4.2169189453125, 4.327728271484375, 4.43853759765625, 4.549346923828125, 4.66015625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 21.0, 21.0, 44.0, 81.0, 174.0, 173.0, 161.0, 127.0, 80.0, 52.0, 29.0, 12.0, 9.0, 6.0, 5.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.312112808227539, -9.902215957641602, -9.49232006072998, -9.08242416381836, -8.672527313232422, -8.262630462646484, -7.852734565734863, -7.442838191986084, -7.032941818237305, -6.623045444488525, -6.213149070739746, -5.803252696990967, -5.3933563232421875, -4.983459949493408, -4.573563575744629, -4.16366720199585, -3.7537708282470703, -3.343874454498291, -2.9339780807495117, -2.5240817070007324, -2.114185333251953, -1.7042889595031738, -1.2943925857543945, -0.8844962120056152, -0.47459983825683594, -0.06470346450805664, 0.34519290924072266, 0.755089282989502, 1.1649856567382812, 1.5748820304870605, 1.9847784042358398, 2.394674777984619, 2.8045711517333984, 3.2144675254821777, 3.624363899230957, 4.034260272979736, 4.444156646728516, 4.854053020477295, 5.263949394226074, 5.6738457679748535, 6.083742141723633, 6.493638515472412, 6.903534889221191, 7.313431262969971, 7.72332763671875, 8.133224487304688, 8.543120384216309, 8.95301628112793, 9.362913131713867, 9.772809982299805, 10.182705879211426, 10.592601776123047, 11.002498626708984, 11.412395477294922, 11.822291374206543, 12.232187271118164, 12.642084121704102, 13.051980972290039, 13.46187686920166, 13.871772766113281, 14.281669616699219, 14.691566467285156, 15.101462364196777, 15.511358261108398, 15.921255111694336]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 7.0, 8.0, 12.0, 13.0, 24.0, 27.0, 15.0, 26.0, 17.0, 29.0, 31.0, 34.0, 32.0, 37.0, 43.0, 36.0, 32.0, 51.0, 30.0, 42.0, 25.0, 37.0, 33.0, 42.0, 23.0, 34.0, 30.0, 20.0, 18.0, 24.0, 21.0, 21.0, 22.0, 22.0, 18.0, 11.0, 6.0, 8.0, 7.0, 7.0, 4.0, 1.0, 3.0, 5.0, 2.0, 5.0, 0.0, 1.0, 2.0], "bins": [-5.945357322692871, -5.77437686920166, -5.603396415710449, -5.432415962219238, -5.2614359855651855, -5.090455532073975, -4.919475078582764, -4.748494625091553, -4.577514171600342, -4.406533718109131, -4.23555326461792, -4.064573287963867, -3.893592596054077, -3.7226123809814453, -3.5516319274902344, -3.3806514739990234, -3.2096712589263916, -3.0386908054351807, -2.867710590362549, -2.696730136871338, -2.525749683380127, -2.354769229888916, -2.183789014816284, -2.0128085613250732, -1.8418282270431519, -1.6708478927612305, -1.4998674392700195, -1.3288871049880981, -1.1579067707061768, -0.9869263172149658, -0.8159459829330444, -0.6449655294418335, -0.4739851951599121, -0.30300480127334595, -0.13202443718910217, 0.0389559268951416, 0.20993632078170776, 0.3809167146682739, 0.5518970489501953, 0.7228775024414062, 0.8938578367233276, 1.064838171005249, 1.23581862449646, 1.4067989587783813, 1.5777792930603027, 1.7487597465515137, 1.919740080833435, 2.0907206535339355, 2.2617008686065674, 2.4326813220977783, 2.60366153717041, 2.774641990661621, 2.945622444152832, 3.116602897644043, 3.287583112716675, 3.4585635662078857, 3.6295437812805176, 3.8005242347717285, 3.9715044498443604, 4.142484664916992, 4.313465118408203, 4.484445571899414, 4.655426025390625, 4.826406478881836, 4.997386932373047]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 0.0, 3.0, 5.0, 10.0, 2.0, 9.0, 9.0, 22.0, 27.0, 37.0, 45.0, 108.0, 133.0, 238.0, 387.0, 664.0, 1150.0, 2130.0, 4049.0, 8232.0, 17663.0, 41965.0, 106652.0, 255163.0, 325444.0, 168052.0, 65371.0, 26838.0, 11931.0, 5561.0, 2955.0, 1580.0, 823.0, 464.0, 310.0, 176.0, 105.0, 80.0, 49.0, 43.0, 21.0, 23.0, 7.0, 4.0, 6.0, 6.0, 2.0, 1.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-6.7734375, -6.556640625, -6.33984375, -6.123046875, -5.90625, -5.689453125, -5.47265625, -5.255859375, -5.0390625, -4.822265625, -4.60546875, -4.388671875, -4.171875, -3.955078125, -3.73828125, -3.521484375, -3.3046875, -3.087890625, -2.87109375, -2.654296875, -2.4375, -2.220703125, -2.00390625, -1.787109375, -1.5703125, -1.353515625, -1.13671875, -0.919921875, -0.703125, -0.486328125, -0.26953125, -0.052734375, 0.1640625, 0.380859375, 0.59765625, 0.814453125, 1.03125, 1.248046875, 1.46484375, 1.681640625, 1.8984375, 2.115234375, 2.33203125, 2.548828125, 2.765625, 2.982421875, 3.19921875, 3.416015625, 3.6328125, 3.849609375, 4.06640625, 4.283203125, 4.5, 4.716796875, 4.93359375, 5.150390625, 5.3671875, 5.583984375, 5.80078125, 6.017578125, 6.234375, 6.451171875, 6.66796875, 6.884765625, 7.1015625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 6.0, 5.0, 2.0, 7.0, 4.0, 8.0, 15.0, 6.0, 10.0, 12.0, 24.0, 29.0, 23.0, 25.0, 37.0, 44.0, 36.0, 57.0, 43.0, 43.0, 43.0, 46.0, 51.0, 44.0, 51.0, 40.0, 38.0, 42.0, 36.0, 33.0, 27.0, 18.0, 22.0, 15.0, 19.0, 10.0, 12.0, 3.0, 3.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.203125, -3.097747802734375, -2.99237060546875, -2.886993408203125, -2.7816162109375, -2.676239013671875, -2.57086181640625, -2.465484619140625, -2.360107421875, -2.254730224609375, -2.14935302734375, -2.043975830078125, -1.9385986328125, -1.833221435546875, -1.72784423828125, -1.622467041015625, -1.51708984375, -1.411712646484375, -1.30633544921875, -1.200958251953125, -1.0955810546875, -0.990203857421875, -0.88482666015625, -0.779449462890625, -0.674072265625, -0.568695068359375, -0.46331787109375, -0.357940673828125, -0.2525634765625, -0.147186279296875, -0.04180908203125, 0.063568115234375, 0.1689453125, 0.274322509765625, 0.37969970703125, 0.485076904296875, 0.5904541015625, 0.695831298828125, 0.80120849609375, 0.906585693359375, 1.011962890625, 1.117340087890625, 1.22271728515625, 1.328094482421875, 1.4334716796875, 1.538848876953125, 1.64422607421875, 1.749603271484375, 1.85498046875, 1.960357666015625, 2.06573486328125, 2.171112060546875, 2.2764892578125, 2.381866455078125, 2.48724365234375, 2.592620849609375, 2.697998046875, 2.803375244140625, 2.90875244140625, 3.014129638671875, 3.1195068359375, 3.224884033203125, 3.33026123046875, 3.435638427734375, 3.541015625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 8.0, 17.0, 17.0, 18.0, 30.0, 59.0, 89.0, 134.0, 246.0, 565.0, 1174.0, 3001.0, 8845.0, 36185.0, 227739.0, 620178.0, 118496.0, 21795.0, 5994.0, 2041.0, 915.0, 430.0, 215.0, 121.0, 72.0, 51.0, 35.0, 21.0, 21.0, 12.0, 7.0, 7.0, 7.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-13.328125, -12.950927734375, -12.57373046875, -12.196533203125, -11.8193359375, -11.442138671875, -11.06494140625, -10.687744140625, -10.310546875, -9.933349609375, -9.55615234375, -9.178955078125, -8.8017578125, -8.424560546875, -8.04736328125, -7.670166015625, -7.29296875, -6.915771484375, -6.53857421875, -6.161376953125, -5.7841796875, -5.406982421875, -5.02978515625, -4.652587890625, -4.275390625, -3.898193359375, -3.52099609375, -3.143798828125, -2.7666015625, -2.389404296875, -2.01220703125, -1.635009765625, -1.2578125, -0.880615234375, -0.50341796875, -0.126220703125, 0.2509765625, 0.628173828125, 1.00537109375, 1.382568359375, 1.759765625, 2.136962890625, 2.51416015625, 2.891357421875, 3.2685546875, 3.645751953125, 4.02294921875, 4.400146484375, 4.77734375, 5.154541015625, 5.53173828125, 5.908935546875, 6.2861328125, 6.663330078125, 7.04052734375, 7.417724609375, 7.794921875, 8.172119140625, 8.54931640625, 8.926513671875, 9.3037109375, 9.680908203125, 10.05810546875, 10.435302734375, 10.8125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 4.0, 6.0, 10.0, 7.0, 16.0, 16.0, 27.0, 30.0, 24.0, 46.0, 57.0, 50.0, 63.0, 50.0, 70.0, 73.0, 62.0, 61.0, 53.0, 43.0, 42.0, 35.0, 33.0, 30.0, 17.0, 26.0, 16.0, 12.0, 5.0, 2.0, 4.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-22.65625, -21.95166015625, -21.2470703125, -20.54248046875, -19.837890625, -19.13330078125, -18.4287109375, -17.72412109375, -17.01953125, -16.31494140625, -15.6103515625, -14.90576171875, -14.201171875, -13.49658203125, -12.7919921875, -12.08740234375, -11.3828125, -10.67822265625, -9.9736328125, -9.26904296875, -8.564453125, -7.85986328125, -7.1552734375, -6.45068359375, -5.74609375, -5.04150390625, -4.3369140625, -3.63232421875, -2.927734375, -2.22314453125, -1.5185546875, -0.81396484375, -0.109375, 0.59521484375, 1.2998046875, 2.00439453125, 2.708984375, 3.41357421875, 4.1181640625, 4.82275390625, 5.52734375, 6.23193359375, 6.9365234375, 7.64111328125, 8.345703125, 9.05029296875, 9.7548828125, 10.45947265625, 11.1640625, 11.86865234375, 12.5732421875, 13.27783203125, 13.982421875, 14.68701171875, 15.3916015625, 16.09619140625, 16.80078125, 17.50537109375, 18.2099609375, 18.91455078125, 19.619140625, 20.32373046875, 21.0283203125, 21.73291015625, 22.4375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 5.0, 21.0, 15.0, 20.0, 43.0, 92.0, 262.0, 615.0, 1886.0, 7830.0, 71183.0, 817659.0, 133838.0, 11324.0, 2461.0, 789.0, 268.0, 122.0, 56.0, 24.0, 15.0, 5.0, 11.0, 4.0, 5.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.2421875, -8.98968505859375, -8.7371826171875, -8.48468017578125, -8.232177734375, -7.97967529296875, -7.7271728515625, -7.47467041015625, -7.22216796875, -6.96966552734375, -6.7171630859375, -6.46466064453125, -6.212158203125, -5.95965576171875, -5.7071533203125, -5.45465087890625, -5.2021484375, -4.94964599609375, -4.6971435546875, -4.44464111328125, -4.192138671875, -3.93963623046875, -3.6871337890625, -3.43463134765625, -3.18212890625, -2.92962646484375, -2.6771240234375, -2.42462158203125, -2.172119140625, -1.91961669921875, -1.6671142578125, -1.41461181640625, -1.162109375, -0.90960693359375, -0.6571044921875, -0.40460205078125, -0.152099609375, 0.10040283203125, 0.3529052734375, 0.60540771484375, 0.85791015625, 1.11041259765625, 1.3629150390625, 1.61541748046875, 1.867919921875, 2.12042236328125, 2.3729248046875, 2.62542724609375, 2.8779296875, 3.13043212890625, 3.3829345703125, 3.63543701171875, 3.887939453125, 4.14044189453125, 4.3929443359375, 4.64544677734375, 4.89794921875, 5.15045166015625, 5.4029541015625, 5.65545654296875, 5.907958984375, 6.16046142578125, 6.4129638671875, 6.66546630859375, 6.91796875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 6.0, 3.0, 4.0, 4.0, 4.0, 8.0, 10.0, 17.0, 21.0, 34.0, 46.0, 47.0, 64.0, 109.0, 98.0, 111.0, 90.0, 78.0, 52.0, 70.0, 32.0, 37.0, 20.0, 12.0, 8.0, 8.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0009016990661621094, -0.0008774474263191223, -0.0008531957864761353, -0.0008289441466331482, -0.0008046925067901611, -0.0007804408669471741, -0.000756189227104187, -0.0007319375872612, -0.0007076859474182129, -0.0006834343075752258, -0.0006591826677322388, -0.0006349310278892517, -0.0006106793880462646, -0.0005864277482032776, -0.0005621761083602905, -0.0005379244685173035, -0.0005136728286743164, -0.0004894211888313293, -0.0004651695489883423, -0.0004409179091453552, -0.00041666626930236816, -0.0003924146294593811, -0.00036816298961639404, -0.000343911349773407, -0.0003196597099304199, -0.00029540807008743286, -0.0002711564302444458, -0.00024690479040145874, -0.00022265315055847168, -0.00019840151071548462, -0.00017414987087249756, -0.0001498982310295105, -0.00012564659118652344, -0.00010139495134353638, -7.714331150054932e-05, -5.2891671657562256e-05, -2.8640031814575195e-05, -4.388391971588135e-06, 1.9863247871398926e-05, 4.4114887714385986e-05, 6.836652755737305e-05, 9.261816740036011e-05, 0.00011686980724334717, 0.00014112144708633423, 0.0001653730869293213, 0.00018962472677230835, 0.0002138763666152954, 0.00023812800645828247, 0.00026237964630126953, 0.0002866312861442566, 0.00031088292598724365, 0.0003351345658302307, 0.0003593862056732178, 0.00038363784551620483, 0.0004078894853591919, 0.00043214112520217896, 0.000456392765045166, 0.0004806444048881531, 0.0005048960447311401, 0.0005291476845741272, 0.0005533993244171143, 0.0005776509642601013, 0.0006019026041030884, 0.0006261542439460754, 0.0006504058837890625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 6.0, 7.0, 4.0, 8.0, 22.0, 27.0, 34.0, 68.0, 92.0, 177.0, 324.0, 739.0, 1816.0, 6002.0, 28581.0, 270752.0, 650153.0, 73065.0, 11454.0, 3101.0, 1070.0, 479.0, 239.0, 113.0, 66.0, 43.0, 39.0, 18.0, 17.0, 9.0, 5.0, 4.0, 4.0, 2.0, 4.0, 2.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0], "bins": [-7.83984375, -7.634765625, -7.4296875, -7.224609375, -7.01953125, -6.814453125, -6.609375, -6.404296875, -6.19921875, -5.994140625, -5.7890625, -5.583984375, -5.37890625, -5.173828125, -4.96875, -4.763671875, -4.55859375, -4.353515625, -4.1484375, -3.943359375, -3.73828125, -3.533203125, -3.328125, -3.123046875, -2.91796875, -2.712890625, -2.5078125, -2.302734375, -2.09765625, -1.892578125, -1.6875, -1.482421875, -1.27734375, -1.072265625, -0.8671875, -0.662109375, -0.45703125, -0.251953125, -0.046875, 0.158203125, 0.36328125, 0.568359375, 0.7734375, 0.978515625, 1.18359375, 1.388671875, 1.59375, 1.798828125, 2.00390625, 2.208984375, 2.4140625, 2.619140625, 2.82421875, 3.029296875, 3.234375, 3.439453125, 3.64453125, 3.849609375, 4.0546875, 4.259765625, 4.46484375, 4.669921875, 4.875, 5.080078125, 5.28515625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 4.0, 11.0, 11.0, 20.0, 22.0, 25.0, 39.0, 64.0, 88.0, 123.0, 119.0, 132.0, 111.0, 75.0, 51.0, 31.0, 24.0, 18.0, 10.0, 6.0, 7.0, 3.0, 2.0, 4.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.4921875, -7.2314453125, -6.970703125, -6.7099609375, -6.44921875, -6.1884765625, -5.927734375, -5.6669921875, -5.40625, -5.1455078125, -4.884765625, -4.6240234375, -4.36328125, -4.1025390625, -3.841796875, -3.5810546875, -3.3203125, -3.0595703125, -2.798828125, -2.5380859375, -2.27734375, -2.0166015625, -1.755859375, -1.4951171875, -1.234375, -0.9736328125, -0.712890625, -0.4521484375, -0.19140625, 0.0693359375, 0.330078125, 0.5908203125, 0.8515625, 1.1123046875, 1.373046875, 1.6337890625, 1.89453125, 2.1552734375, 2.416015625, 2.6767578125, 2.9375, 3.1982421875, 3.458984375, 3.7197265625, 3.98046875, 4.2412109375, 4.501953125, 4.7626953125, 5.0234375, 5.2841796875, 5.544921875, 5.8056640625, 6.06640625, 6.3271484375, 6.587890625, 6.8486328125, 7.109375, 7.3701171875, 7.630859375, 7.8916015625, 8.15234375, 8.4130859375, 8.673828125, 8.9345703125, 9.1953125]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 4.0, 17.0, 31.0, 83.0, 198.0, 297.0, 206.0, 101.0, 37.0, 22.0, 7.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-240.6915740966797, -235.83929443359375, -230.9870147705078, -226.13473510742188, -221.28245544433594, -216.43017578125, -211.57789611816406, -206.72561645507812, -201.87335205078125, -197.0210723876953, -192.16879272460938, -187.31651306152344, -182.4642333984375, -177.61195373535156, -172.75967407226562, -167.90740966796875, -163.05511474609375, -158.2028350830078, -153.35055541992188, -148.49827575683594, -143.64599609375, -138.79371643066406, -133.94143676757812, -129.08917236328125, -124.23688507080078, -119.38460540771484, -114.5323257446289, -109.68004608154297, -104.82777404785156, -99.97549438476562, -95.12321472167969, -90.27093505859375, -85.41864013671875, -80.56636047363281, -75.71408081054688, -70.86180114746094, -66.009521484375, -61.15724563598633, -56.304969787597656, -51.45269012451172, -46.60041046142578, -41.748130798339844, -36.895851135253906, -32.043575286865234, -27.191295623779297, -22.33901596069336, -17.486738204956055, -12.63446044921875, -7.7821807861328125, -2.9299020767211914, 1.9223766326904297, 6.774655342102051, 11.626934051513672, 16.47921371459961, 21.331491470336914, 26.18376922607422, 31.036048889160156, 35.888328552246094, 40.74060821533203, 45.5928840637207, 50.44516372680664, 55.29744338989258, 60.14971923828125, 65.00199890136719, 69.85427856445312]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 4.0, 5.0, 11.0, 9.0, 6.0, 9.0, 14.0, 10.0, 21.0, 18.0, 14.0, 20.0, 23.0, 26.0, 34.0, 30.0, 37.0, 26.0, 39.0, 41.0, 49.0, 42.0, 34.0, 37.0, 37.0, 43.0, 33.0, 31.0, 42.0, 27.0, 31.0, 35.0, 19.0, 21.0, 13.0, 21.0, 11.0, 7.0, 12.0, 6.0, 4.0, 7.0, 6.0, 8.0, 7.0, 5.0, 6.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0], "bins": [-64.01964569091797, -61.981971740722656, -59.94430160522461, -57.9066276550293, -55.86895751953125, -53.83128356933594, -51.793609619140625, -49.75593566894531, -47.718265533447266, -45.68059158325195, -43.642921447753906, -41.605247497558594, -39.56757354736328, -37.529903411865234, -35.49222946166992, -33.454559326171875, -31.416885375976562, -29.379213333129883, -27.341541290283203, -25.30386734008789, -23.26619529724121, -21.22852325439453, -19.19084930419922, -17.15317726135254, -15.11550521850586, -13.07783317565918, -11.040160179138184, -9.002487182617188, -6.964815139770508, -4.927143096923828, -2.889470100402832, -0.8517971038818359, 1.185882568359375, 3.223555088043213, 5.261227607727051, 7.298900127410889, 9.336572647094727, 11.374244689941406, 13.411917686462402, 15.449590682983398, 17.487262725830078, 19.524934768676758, 21.562606811523438, 23.60028076171875, 25.63795280456543, 27.67562484741211, 29.713298797607422, 31.7509708404541, 33.78864288330078, 35.826316833496094, 37.86398696899414, 39.90166091918945, 41.9393310546875, 43.97700500488281, 46.014678955078125, 48.05235290527344, 50.090023040771484, 52.1276969909668, 54.165367126464844, 56.203041076660156, 58.24071502685547, 60.278385162353516, 62.31605911254883, 64.35372924804688, 66.39140319824219]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 10.0, 7.0, 7.0, 21.0, 18.0, 36.0, 35.0, 52.0, 77.0, 85.0, 146.0, 229.0, 277.0, 418.0, 590.0, 909.0, 1482.0, 2370.0, 4693.0, 11607.0, 41480.0, 603666.0, 3447923.0, 52018.0, 13571.0, 5262.0, 2728.0, 1544.0, 954.0, 577.0, 401.0, 300.0, 198.0, 160.0, 106.0, 93.0, 52.0, 44.0, 32.0, 24.0, 15.0, 14.0, 16.0, 6.0, 8.0, 6.0, 2.0, 4.0, 0.0, 5.0, 4.0, 0.0, 0.0, 1.0, 2.0], "bins": [-6.65234375, -6.438232421875, -6.22412109375, -6.010009765625, -5.7958984375, -5.581787109375, -5.36767578125, -5.153564453125, -4.939453125, -4.725341796875, -4.51123046875, -4.297119140625, -4.0830078125, -3.868896484375, -3.65478515625, -3.440673828125, -3.2265625, -3.012451171875, -2.79833984375, -2.584228515625, -2.3701171875, -2.156005859375, -1.94189453125, -1.727783203125, -1.513671875, -1.299560546875, -1.08544921875, -0.871337890625, -0.6572265625, -0.443115234375, -0.22900390625, -0.014892578125, 0.19921875, 0.413330078125, 0.62744140625, 0.841552734375, 1.0556640625, 1.269775390625, 1.48388671875, 1.697998046875, 1.912109375, 2.126220703125, 2.34033203125, 2.554443359375, 2.7685546875, 2.982666015625, 3.19677734375, 3.410888671875, 3.625, 3.839111328125, 4.05322265625, 4.267333984375, 4.4814453125, 4.695556640625, 4.90966796875, 5.123779296875, 5.337890625, 5.552001953125, 5.76611328125, 5.980224609375, 6.1943359375, 6.408447265625, 6.62255859375, 6.836669921875, 7.05078125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 1.0, 3.0, 6.0, 5.0, 2.0, 4.0, 11.0, 12.0, 8.0, 5.0, 7.0, 11.0, 20.0, 30.0, 21.0, 30.0, 34.0, 31.0, 32.0, 38.0, 41.0, 33.0, 53.0, 44.0, 61.0, 45.0, 48.0, 50.0, 35.0, 35.0, 35.0, 36.0, 30.0, 27.0, 23.0, 15.0, 16.0, 17.0, 7.0, 4.0, 15.0, 4.0, 5.0, 1.0, 1.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-3.283203125, -3.183319091796875, -3.08343505859375, -2.983551025390625, -2.8836669921875, -2.783782958984375, -2.68389892578125, -2.584014892578125, -2.484130859375, -2.384246826171875, -2.28436279296875, -2.184478759765625, -2.0845947265625, -1.984710693359375, -1.88482666015625, -1.784942626953125, -1.68505859375, -1.585174560546875, -1.48529052734375, -1.385406494140625, -1.2855224609375, -1.185638427734375, -1.08575439453125, -0.985870361328125, -0.885986328125, -0.786102294921875, -0.68621826171875, -0.586334228515625, -0.4864501953125, -0.386566162109375, -0.28668212890625, -0.186798095703125, -0.0869140625, 0.012969970703125, 0.11285400390625, 0.212738037109375, 0.3126220703125, 0.412506103515625, 0.51239013671875, 0.612274169921875, 0.712158203125, 0.812042236328125, 0.91192626953125, 1.011810302734375, 1.1116943359375, 1.211578369140625, 1.31146240234375, 1.411346435546875, 1.51123046875, 1.611114501953125, 1.71099853515625, 1.810882568359375, 1.9107666015625, 2.010650634765625, 2.11053466796875, 2.210418701171875, 2.310302734375, 2.410186767578125, 2.51007080078125, 2.609954833984375, 2.7098388671875, 2.809722900390625, 2.90960693359375, 3.009490966796875, 3.109375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 7.0, 12.0, 18.0, 15.0, 13.0, 16.0, 22.0, 36.0, 41.0, 61.0, 84.0, 127.0, 218.0, 284.0, 482.0, 807.0, 1361.0, 2512.0, 5563.0, 16459.0, 82563.0, 3531409.0, 490055.0, 42314.0, 10746.0, 4085.0, 1968.0, 1114.0, 597.0, 412.0, 260.0, 178.0, 122.0, 83.0, 55.0, 52.0, 30.0, 21.0, 26.0, 15.0, 13.0, 8.0, 5.0, 2.0, 9.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.58203125, -7.35101318359375, -7.1199951171875, -6.88897705078125, -6.657958984375, -6.42694091796875, -6.1959228515625, -5.96490478515625, -5.73388671875, -5.50286865234375, -5.2718505859375, -5.04083251953125, -4.809814453125, -4.57879638671875, -4.3477783203125, -4.11676025390625, -3.8857421875, -3.65472412109375, -3.4237060546875, -3.19268798828125, -2.961669921875, -2.73065185546875, -2.4996337890625, -2.26861572265625, -2.03759765625, -1.80657958984375, -1.5755615234375, -1.34454345703125, -1.113525390625, -0.88250732421875, -0.6514892578125, -0.42047119140625, -0.189453125, 0.04156494140625, 0.2725830078125, 0.50360107421875, 0.734619140625, 0.96563720703125, 1.1966552734375, 1.42767333984375, 1.65869140625, 1.88970947265625, 2.1207275390625, 2.35174560546875, 2.582763671875, 2.81378173828125, 3.0447998046875, 3.27581787109375, 3.5068359375, 3.73785400390625, 3.9688720703125, 4.19989013671875, 4.430908203125, 4.66192626953125, 4.8929443359375, 5.12396240234375, 5.35498046875, 5.58599853515625, 5.8170166015625, 6.04803466796875, 6.279052734375, 6.51007080078125, 6.7410888671875, 6.97210693359375, 7.203125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 6.0, 2.0, 17.0, 25.0, 57.0, 135.0, 460.0, 2854.0, 313.0, 95.0, 41.0, 25.0, 9.0, 13.0, 4.0, 7.0, 6.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.453125, -3.36077880859375, -3.2684326171875, -3.17608642578125, -3.083740234375, -2.99139404296875, -2.8990478515625, -2.80670166015625, -2.71435546875, -2.62200927734375, -2.5296630859375, -2.43731689453125, -2.344970703125, -2.25262451171875, -2.1602783203125, -2.06793212890625, -1.9755859375, -1.88323974609375, -1.7908935546875, -1.69854736328125, -1.606201171875, -1.51385498046875, -1.4215087890625, -1.32916259765625, -1.23681640625, -1.14447021484375, -1.0521240234375, -0.95977783203125, -0.867431640625, -0.77508544921875, -0.6827392578125, -0.59039306640625, -0.498046875, -0.40570068359375, -0.3133544921875, -0.22100830078125, -0.128662109375, -0.03631591796875, 0.0560302734375, 0.14837646484375, 0.24072265625, 0.33306884765625, 0.4254150390625, 0.51776123046875, 0.610107421875, 0.70245361328125, 0.7947998046875, 0.88714599609375, 0.9794921875, 1.07183837890625, 1.1641845703125, 1.25653076171875, 1.348876953125, 1.44122314453125, 1.5335693359375, 1.62591552734375, 1.71826171875, 1.81060791015625, 1.9029541015625, 1.99530029296875, 2.087646484375, 2.17999267578125, 2.2723388671875, 2.36468505859375, 2.45703125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 11.0, 7.0, 15.0, 22.0, 28.0, 40.0, 55.0, 71.0, 92.0, 105.0, 94.0, 95.0, 90.0, 82.0, 71.0, 40.0, 25.0, 20.0, 13.0, 10.0, 9.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.574042320251465, -4.330786228179932, -4.087530136108398, -3.8442745208740234, -3.6010184288024902, -3.357762336730957, -3.114506483078003, -2.871250629425049, -2.6279945373535156, -2.3847384452819824, -2.1414825916290283, -1.8982266187667847, -1.654970645904541, -1.4117146730422974, -1.1684587001800537, -0.9252027273178101, -0.6819467544555664, -0.43869078159332275, -0.1954348087310791, 0.04782116413116455, 0.2910771369934082, 0.5343331098556519, 0.7775890827178955, 1.0208450555801392, 1.2641010284423828, 1.5073570013046265, 1.7506129741668701, 1.9938689470291138, 2.2371249198913574, 2.4803810119628906, 2.7236368656158447, 2.966892719268799, 3.210148811340332, 3.4534049034118652, 3.6966607570648193, 3.9399166107177734, 4.183172702789307, 4.42642879486084, 4.669684410095215, 4.912940502166748, 5.156196594238281, 5.3994526863098145, 5.642708778381348, 5.885964393615723, 6.129220485687256, 6.372476577758789, 6.615732192993164, 6.858988285064697, 7.1022443771362305, 7.345500469207764, 7.588756561279297, 7.832012176513672, 8.075267791748047, 8.318524360656738, 8.561779975891113, 8.805036544799805, 9.04829216003418, 9.291547775268555, 9.534804344177246, 9.778059959411621, 10.021316528320312, 10.264572143554688, 10.507827758789062, 10.751084327697754, 10.994339942932129]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 3.0, 5.0, 5.0, 8.0, 10.0, 14.0, 14.0, 22.0, 21.0, 31.0, 42.0, 40.0, 57.0, 55.0, 57.0, 67.0, 66.0, 69.0, 51.0, 64.0, 48.0, 33.0, 45.0, 40.0, 36.0, 25.0, 16.0, 15.0, 18.0, 5.0, 8.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.925815582275391, -4.720465660095215, -4.515115261077881, -4.309764862060547, -4.104414939880371, -3.899064779281616, -3.6937146186828613, -3.4883644580841064, -3.2830142974853516, -3.0776641368865967, -2.872313976287842, -2.666963815689087, -2.461613655090332, -2.256263494491577, -2.0509133338928223, -1.8455631732940674, -1.6402130126953125, -1.4348628520965576, -1.2295126914978027, -1.0241625308990479, -0.818812370300293, -0.6134622097015381, -0.4081120491027832, -0.20276188850402832, 0.0025882720947265625, 0.20793843269348145, 0.41328859329223633, 0.6186387538909912, 0.8239889144897461, 1.029339075088501, 1.2346892356872559, 1.4400393962860107, 1.6453895568847656, 1.8507397174835205, 2.0560898780822754, 2.2614400386810303, 2.466790199279785, 2.67214035987854, 2.877490520477295, 3.08284068107605, 3.2881908416748047, 3.4935410022735596, 3.6988911628723145, 3.9042413234710693, 4.109591484069824, 4.31494140625, 4.520291805267334, 4.725642204284668, 4.930992126464844, 5.1363420486450195, 5.3416924476623535, 5.5470428466796875, 5.752392768859863, 5.957742691040039, 6.163093090057373, 6.368443489074707, 6.573793411254883, 6.779143333435059, 6.984493732452393, 7.189844131469727, 7.395194053649902, 7.600543975830078, 7.805894374847412, 8.011244773864746, 8.216594696044922]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 7.0, 13.0, 18.0, 24.0, 22.0, 50.0, 84.0, 133.0, 228.0, 392.0, 818.0, 1587.0, 3387.0, 7156.0, 17225.0, 44810.0, 130876.0, 322917.0, 317203.0, 127521.0, 44034.0, 16481.0, 6896.0, 3274.0, 1515.0, 787.0, 400.0, 249.0, 156.0, 99.0, 65.0, 45.0, 30.0, 20.0, 11.0, 10.0, 4.0, 5.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.06640625, -4.8853759765625, -4.704345703125, -4.5233154296875, -4.34228515625, -4.1612548828125, -3.980224609375, -3.7991943359375, -3.6181640625, -3.4371337890625, -3.256103515625, -3.0750732421875, -2.89404296875, -2.7130126953125, -2.531982421875, -2.3509521484375, -2.169921875, -1.9888916015625, -1.807861328125, -1.6268310546875, -1.44580078125, -1.2647705078125, -1.083740234375, -0.9027099609375, -0.7216796875, -0.5406494140625, -0.359619140625, -0.1785888671875, 0.00244140625, 0.1834716796875, 0.364501953125, 0.5455322265625, 0.7265625, 0.9075927734375, 1.088623046875, 1.2696533203125, 1.45068359375, 1.6317138671875, 1.812744140625, 1.9937744140625, 2.1748046875, 2.3558349609375, 2.536865234375, 2.7178955078125, 2.89892578125, 3.0799560546875, 3.260986328125, 3.4420166015625, 3.623046875, 3.8040771484375, 3.985107421875, 4.1661376953125, 4.34716796875, 4.5281982421875, 4.709228515625, 4.8902587890625, 5.0712890625, 5.2523193359375, 5.433349609375, 5.6143798828125, 5.79541015625, 5.9764404296875, 6.157470703125, 6.3385009765625, 6.51953125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 2.0, 10.0, 5.0, 8.0, 8.0, 10.0, 8.0, 7.0, 8.0, 19.0, 17.0, 30.0, 26.0, 29.0, 43.0, 41.0, 41.0, 41.0, 49.0, 43.0, 48.0, 57.0, 48.0, 40.0, 56.0, 42.0, 43.0, 42.0, 25.0, 30.0, 24.0, 22.0, 14.0, 12.0, 10.0, 9.0, 10.0, 8.0, 3.0, 6.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.478515625, -3.372039794921875, -3.26556396484375, -3.159088134765625, -3.0526123046875, -2.946136474609375, -2.83966064453125, -2.733184814453125, -2.626708984375, -2.520233154296875, -2.41375732421875, -2.307281494140625, -2.2008056640625, -2.094329833984375, -1.98785400390625, -1.881378173828125, -1.77490234375, -1.668426513671875, -1.56195068359375, -1.455474853515625, -1.3489990234375, -1.242523193359375, -1.13604736328125, -1.029571533203125, -0.923095703125, -0.816619873046875, -0.71014404296875, -0.603668212890625, -0.4971923828125, -0.390716552734375, -0.28424072265625, -0.177764892578125, -0.0712890625, 0.035186767578125, 0.14166259765625, 0.248138427734375, 0.3546142578125, 0.461090087890625, 0.56756591796875, 0.674041748046875, 0.780517578125, 0.886993408203125, 0.99346923828125, 1.099945068359375, 1.2064208984375, 1.312896728515625, 1.41937255859375, 1.525848388671875, 1.63232421875, 1.738800048828125, 1.84527587890625, 1.951751708984375, 2.0582275390625, 2.164703369140625, 2.27117919921875, 2.377655029296875, 2.484130859375, 2.590606689453125, 2.69708251953125, 2.803558349609375, 2.9100341796875, 3.016510009765625, 3.12298583984375, 3.229461669921875, 3.3359375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 4.0, 4.0, 2.0, 4.0, 11.0, 17.0, 17.0, 24.0, 37.0, 67.0, 77.0, 137.0, 211.0, 361.0, 679.0, 1465.0, 3388.0, 10617.0, 44545.0, 258283.0, 575801.0, 118022.0, 23417.0, 6652.0, 2372.0, 1014.0, 487.0, 289.0, 180.0, 97.0, 73.0, 59.0, 44.0, 24.0, 21.0, 9.0, 11.0, 5.0, 10.0, 7.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-8.6171875, -8.35833740234375, -8.0994873046875, -7.84063720703125, -7.581787109375, -7.32293701171875, -7.0640869140625, -6.80523681640625, -6.54638671875, -6.28753662109375, -6.0286865234375, -5.76983642578125, -5.510986328125, -5.25213623046875, -4.9932861328125, -4.73443603515625, -4.4755859375, -4.21673583984375, -3.9578857421875, -3.69903564453125, -3.440185546875, -3.18133544921875, -2.9224853515625, -2.66363525390625, -2.40478515625, -2.14593505859375, -1.8870849609375, -1.62823486328125, -1.369384765625, -1.11053466796875, -0.8516845703125, -0.59283447265625, -0.333984375, -0.07513427734375, 0.1837158203125, 0.44256591796875, 0.701416015625, 0.96026611328125, 1.2191162109375, 1.47796630859375, 1.73681640625, 1.99566650390625, 2.2545166015625, 2.51336669921875, 2.772216796875, 3.03106689453125, 3.2899169921875, 3.54876708984375, 3.8076171875, 4.06646728515625, 4.3253173828125, 4.58416748046875, 4.843017578125, 5.10186767578125, 5.3607177734375, 5.61956787109375, 5.87841796875, 6.13726806640625, 6.3961181640625, 6.65496826171875, 6.913818359375, 7.17266845703125, 7.4315185546875, 7.69036865234375, 7.94921875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 5.0, 9.0, 24.0, 14.0, 17.0, 20.0, 33.0, 35.0, 35.0, 40.0, 41.0, 38.0, 53.0, 57.0, 54.0, 46.0, 60.0, 55.0, 53.0, 48.0, 36.0, 38.0, 34.0, 40.0, 22.0, 22.0, 23.0, 6.0, 11.0, 11.0, 9.0, 4.0, 2.0, 2.0, 0.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.3125, -18.7830810546875, -18.253662109375, -17.7242431640625, -17.19482421875, -16.6654052734375, -16.135986328125, -15.6065673828125, -15.0771484375, -14.5477294921875, -14.018310546875, -13.4888916015625, -12.95947265625, -12.4300537109375, -11.900634765625, -11.3712158203125, -10.841796875, -10.3123779296875, -9.782958984375, -9.2535400390625, -8.72412109375, -8.1947021484375, -7.665283203125, -7.1358642578125, -6.6064453125, -6.0770263671875, -5.547607421875, -5.0181884765625, -4.48876953125, -3.9593505859375, -3.429931640625, -2.9005126953125, -2.37109375, -1.8416748046875, -1.312255859375, -0.7828369140625, -0.25341796875, 0.2760009765625, 0.805419921875, 1.3348388671875, 1.8642578125, 2.3936767578125, 2.923095703125, 3.4525146484375, 3.98193359375, 4.5113525390625, 5.040771484375, 5.5701904296875, 6.099609375, 6.6290283203125, 7.158447265625, 7.6878662109375, 8.21728515625, 8.7467041015625, 9.276123046875, 9.8055419921875, 10.3349609375, 10.8643798828125, 11.393798828125, 11.9232177734375, 12.45263671875, 12.9820556640625, 13.511474609375, 14.0408935546875, 14.5703125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 6.0, 9.0, 10.0, 12.0, 37.0, 45.0, 71.0, 133.0, 291.0, 748.0, 2441.0, 13711.0, 179887.0, 775958.0, 65463.0, 7134.0, 1525.0, 542.0, 234.0, 111.0, 60.0, 42.0, 20.0, 24.0, 16.0, 6.0, 5.0, 4.0, 3.0, 5.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.046875, -6.85809326171875, -6.6693115234375, -6.48052978515625, -6.291748046875, -6.10296630859375, -5.9141845703125, -5.72540283203125, -5.53662109375, -5.34783935546875, -5.1590576171875, -4.97027587890625, -4.781494140625, -4.59271240234375, -4.4039306640625, -4.21514892578125, -4.0263671875, -3.83758544921875, -3.6488037109375, -3.46002197265625, -3.271240234375, -3.08245849609375, -2.8936767578125, -2.70489501953125, -2.51611328125, -2.32733154296875, -2.1385498046875, -1.94976806640625, -1.760986328125, -1.57220458984375, -1.3834228515625, -1.19464111328125, -1.005859375, -0.81707763671875, -0.6282958984375, -0.43951416015625, -0.250732421875, -0.06195068359375, 0.1268310546875, 0.31561279296875, 0.50439453125, 0.69317626953125, 0.8819580078125, 1.07073974609375, 1.259521484375, 1.44830322265625, 1.6370849609375, 1.82586669921875, 2.0146484375, 2.20343017578125, 2.3922119140625, 2.58099365234375, 2.769775390625, 2.95855712890625, 3.1473388671875, 3.33612060546875, 3.52490234375, 3.71368408203125, 3.9024658203125, 4.09124755859375, 4.280029296875, 4.46881103515625, 4.6575927734375, 4.84637451171875, 5.03515625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 2.0, 3.0, 8.0, 8.0, 11.0, 6.0, 17.0, 17.0, 34.0, 38.0, 40.0, 60.0, 57.0, 67.0, 79.0, 80.0, 77.0, 77.0, 65.0, 51.0, 51.0, 34.0, 21.0, 19.0, 12.0, 20.0, 8.0, 9.0, 10.0, 1.0, 3.0, 9.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005440711975097656, -0.0005255565047264099, -0.0005070418119430542, -0.0004885271191596985, -0.0004700124263763428, -0.00045149773359298706, -0.00043298304080963135, -0.00041446834802627563, -0.0003959536552429199, -0.0003774389624595642, -0.0003589242696762085, -0.0003404095768928528, -0.00032189488410949707, -0.00030338019132614136, -0.00028486549854278564, -0.00026635080575942993, -0.0002478361129760742, -0.0002293214201927185, -0.0002108067274093628, -0.00019229203462600708, -0.00017377734184265137, -0.00015526264905929565, -0.00013674795627593994, -0.00011823326349258423, -9.971857070922852e-05, -8.12038779258728e-05, -6.268918514251709e-05, -4.417449235916138e-05, -2.5659799575805664e-05, -7.145106792449951e-06, 1.1369585990905762e-05, 2.9884278774261475e-05, 4.839897155761719e-05, 6.69136643409729e-05, 8.542835712432861e-05, 0.00010394304990768433, 0.00012245774269104004, 0.00014097243547439575, 0.00015948712825775146, 0.00017800182104110718, 0.0001965165138244629, 0.0002150312066078186, 0.00023354589939117432, 0.00025206059217453003, 0.00027057528495788574, 0.00028908997774124146, 0.00030760467052459717, 0.0003261193633079529, 0.0003446340560913086, 0.0003631487488746643, 0.00038166344165802, 0.00040017813444137573, 0.00041869282722473145, 0.00043720752000808716, 0.00045572221279144287, 0.0004742369055747986, 0.0004927515983581543, 0.00051126629114151, 0.0005297809839248657, 0.0005482956767082214, 0.0005668103694915771, 0.0005853250622749329, 0.0006038397550582886, 0.0006223544478416443, 0.000640869140625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 6.0, 10.0, 11.0, 15.0, 22.0, 40.0, 90.0, 150.0, 361.0, 890.0, 3306.0, 28685.0, 744361.0, 256178.0, 11360.0, 2012.0, 575.0, 243.0, 106.0, 57.0, 26.0, 18.0, 13.0, 9.0, 4.0, 4.0, 0.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6640625, -8.4078369140625, -8.151611328125, -7.8953857421875, -7.63916015625, -7.3829345703125, -7.126708984375, -6.8704833984375, -6.6142578125, -6.3580322265625, -6.101806640625, -5.8455810546875, -5.58935546875, -5.3331298828125, -5.076904296875, -4.8206787109375, -4.564453125, -4.3082275390625, -4.052001953125, -3.7957763671875, -3.53955078125, -3.2833251953125, -3.027099609375, -2.7708740234375, -2.5146484375, -2.2584228515625, -2.002197265625, -1.7459716796875, -1.48974609375, -1.2335205078125, -0.977294921875, -0.7210693359375, -0.46484375, -0.2086181640625, 0.047607421875, 0.3038330078125, 0.56005859375, 0.8162841796875, 1.072509765625, 1.3287353515625, 1.5849609375, 1.8411865234375, 2.097412109375, 2.3536376953125, 2.60986328125, 2.8660888671875, 3.122314453125, 3.3785400390625, 3.634765625, 3.8909912109375, 4.147216796875, 4.4034423828125, 4.65966796875, 4.9158935546875, 5.172119140625, 5.4283447265625, 5.6845703125, 5.9407958984375, 6.197021484375, 6.4532470703125, 6.70947265625, 6.9656982421875, 7.221923828125, 7.4781494140625, 7.734375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 4.0, 15.0, 16.0, 31.0, 32.0, 69.0, 85.0, 83.0, 124.0, 118.0, 109.0, 92.0, 66.0, 50.0, 35.0, 26.0, 19.0, 12.0, 4.0, 7.0, 5.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.37890625, -7.1964111328125, -7.013916015625, -6.8314208984375, -6.64892578125, -6.4664306640625, -6.283935546875, -6.1014404296875, -5.9189453125, -5.7364501953125, -5.553955078125, -5.3714599609375, -5.18896484375, -5.0064697265625, -4.823974609375, -4.6414794921875, -4.458984375, -4.2764892578125, -4.093994140625, -3.9114990234375, -3.72900390625, -3.5465087890625, -3.364013671875, -3.1815185546875, -2.9990234375, -2.8165283203125, -2.634033203125, -2.4515380859375, -2.26904296875, -2.0865478515625, -1.904052734375, -1.7215576171875, -1.5390625, -1.3565673828125, -1.174072265625, -0.9915771484375, -0.80908203125, -0.6265869140625, -0.444091796875, -0.2615966796875, -0.0791015625, 0.1033935546875, 0.285888671875, 0.4683837890625, 0.65087890625, 0.8333740234375, 1.015869140625, 1.1983642578125, 1.380859375, 1.5633544921875, 1.745849609375, 1.9283447265625, 2.11083984375, 2.2933349609375, 2.475830078125, 2.6583251953125, 2.8408203125, 3.0233154296875, 3.205810546875, 3.3883056640625, 3.57080078125, 3.7532958984375, 3.935791015625, 4.1182861328125, 4.30078125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 4.0, 6.0, 9.0, 15.0, 22.0, 54.0, 69.0, 110.0, 162.0, 156.0, 149.0, 113.0, 60.0, 35.0, 20.0, 10.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.90678405761719, -68.56118774414062, -66.2155990600586, -63.87000274658203, -61.524410247802734, -59.17881774902344, -56.83322525024414, -54.487632751464844, -52.14203643798828, -49.796443939208984, -47.45085144042969, -45.105255126953125, -42.75966262817383, -40.41407012939453, -38.068477630615234, -35.72288513183594, -33.37729263305664, -31.031700134277344, -28.686105728149414, -26.340513229370117, -23.994918823242188, -21.64932632446289, -19.303733825683594, -16.958139419555664, -14.612546920776367, -12.266953468322754, -9.92136001586914, -7.575767517089844, -5.2301740646362305, -2.884580612182617, -0.5389881134033203, 1.8066062927246094, 4.152198791503906, 6.4977922439575195, 8.843385696411133, 11.18897819519043, 13.534571647644043, 15.880165100097656, 18.225757598876953, 20.571352005004883, 22.91694450378418, 25.262537002563477, 27.608131408691406, 29.953723907470703, 32.29931640625, 34.64491271972656, 36.990501403808594, 39.336097717285156, 41.68169021606445, 44.02728271484375, 46.37287521362305, 48.718467712402344, 51.064064025878906, 53.4096565246582, 55.7552490234375, 58.10084533691406, 60.446434020996094, 62.79202651977539, 65.13761901855469, 67.48321533203125, 69.82880401611328, 72.17440032958984, 74.51998901367188, 76.86558532714844, 79.211181640625]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 3.0, 4.0, 8.0, 5.0, 4.0, 15.0, 13.0, 14.0, 18.0, 26.0, 29.0, 47.0, 40.0, 41.0, 60.0, 45.0, 56.0, 59.0, 60.0, 46.0, 47.0, 56.0, 39.0, 50.0, 41.0, 27.0, 30.0, 31.0, 16.0, 17.0, 17.0, 11.0, 8.0, 5.0, 5.0, 4.0, 2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-77.93276977539062, -75.59931945800781, -73.265869140625, -70.93241882324219, -68.59896850585938, -66.2655258178711, -63.93207550048828, -61.59862518310547, -59.265174865722656, -56.931724548339844, -54.59827423095703, -52.264827728271484, -49.93137741088867, -47.59792709350586, -45.26448059082031, -42.9310302734375, -40.59757995605469, -38.264129638671875, -35.93067932128906, -33.597232818603516, -31.263782501220703, -28.93033218383789, -26.59688377380371, -24.26343536376953, -21.92998504638672, -19.596534729003906, -17.263086318969727, -14.92963695526123, -12.596187591552734, -10.262738227844238, -7.929288864135742, -5.5958404541015625, -3.2623825073242188, -0.9289331436157227, 1.4045162200927734, 3.7379655838012695, 6.071414947509766, 8.404864311218262, 10.738313674926758, 13.071762084960938, 15.40521240234375, 17.738662719726562, 20.072111129760742, 22.405559539794922, 24.739009857177734, 27.072460174560547, 29.405908584594727, 31.739356994628906, 34.07280731201172, 36.40625762939453, 38.739707946777344, 41.07315444946289, 43.4066047668457, 45.740055084228516, 48.07350158691406, 50.406951904296875, 52.74040222167969, 55.0738525390625, 57.40730285644531, 59.74074935913086, 62.07419967651367, 64.40764617919922, 66.74109649658203, 69.07454681396484, 71.40799713134766]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 5.0, 3.0, 9.0, 7.0, 16.0, 27.0, 37.0, 66.0, 81.0, 131.0, 230.0, 334.0, 606.0, 995.0, 2020.0, 4223.0, 10167.0, 32604.0, 223946.0, 3829912.0, 60974.0, 15821.0, 6012.0, 2722.0, 1316.0, 715.0, 417.0, 270.0, 200.0, 115.0, 99.0, 56.0, 32.0, 36.0, 23.0, 14.0, 13.0, 6.0, 6.0, 4.0, 6.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.9375, -5.753173828125, -5.56884765625, -5.384521484375, -5.2001953125, -5.015869140625, -4.83154296875, -4.647216796875, -4.462890625, -4.278564453125, -4.09423828125, -3.909912109375, -3.7255859375, -3.541259765625, -3.35693359375, -3.172607421875, -2.98828125, -2.803955078125, -2.61962890625, -2.435302734375, -2.2509765625, -2.066650390625, -1.88232421875, -1.697998046875, -1.513671875, -1.329345703125, -1.14501953125, -0.960693359375, -0.7763671875, -0.592041015625, -0.40771484375, -0.223388671875, -0.0390625, 0.145263671875, 0.32958984375, 0.513916015625, 0.6982421875, 0.882568359375, 1.06689453125, 1.251220703125, 1.435546875, 1.619873046875, 1.80419921875, 1.988525390625, 2.1728515625, 2.357177734375, 2.54150390625, 2.725830078125, 2.91015625, 3.094482421875, 3.27880859375, 3.463134765625, 3.6474609375, 3.831787109375, 4.01611328125, 4.200439453125, 4.384765625, 4.569091796875, 4.75341796875, 4.937744140625, 5.1220703125, 5.306396484375, 5.49072265625, 5.675048828125, 5.859375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 6.0, 2.0, 2.0, 5.0, 4.0, 12.0, 9.0, 14.0, 21.0, 11.0, 20.0, 23.0, 27.0, 49.0, 26.0, 32.0, 43.0, 50.0, 51.0, 44.0, 65.0, 45.0, 56.0, 42.0, 58.0, 44.0, 38.0, 31.0, 33.0, 28.0, 17.0, 20.0, 19.0, 11.0, 15.0, 10.0, 3.0, 5.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.669921875, -3.560516357421875, -3.45111083984375, -3.341705322265625, -3.2322998046875, -3.122894287109375, -3.01348876953125, -2.904083251953125, -2.794677734375, -2.685272216796875, -2.57586669921875, -2.466461181640625, -2.3570556640625, -2.247650146484375, -2.13824462890625, -2.028839111328125, -1.91943359375, -1.810028076171875, -1.70062255859375, -1.591217041015625, -1.4818115234375, -1.372406005859375, -1.26300048828125, -1.153594970703125, -1.044189453125, -0.934783935546875, -0.82537841796875, -0.715972900390625, -0.6065673828125, -0.497161865234375, -0.38775634765625, -0.278350830078125, -0.1689453125, -0.059539794921875, 0.04986572265625, 0.159271240234375, 0.2686767578125, 0.378082275390625, 0.48748779296875, 0.596893310546875, 0.706298828125, 0.815704345703125, 0.92510986328125, 1.034515380859375, 1.1439208984375, 1.253326416015625, 1.36273193359375, 1.472137451171875, 1.58154296875, 1.690948486328125, 1.80035400390625, 1.909759521484375, 2.0191650390625, 2.128570556640625, 2.23797607421875, 2.347381591796875, 2.456787109375, 2.566192626953125, 2.67559814453125, 2.785003662109375, 2.8944091796875, 3.003814697265625, 3.11322021484375, 3.222625732421875, 3.33203125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 6.0, 2.0, 2.0, 6.0, 8.0, 11.0, 12.0, 11.0, 12.0, 9.0, 22.0, 21.0, 30.0, 40.0, 44.0, 78.0, 108.0, 194.0, 325.0, 610.0, 1491.0, 5479.0, 51603.0, 4044142.0, 79762.0, 6912.0, 1632.0, 673.0, 361.0, 211.0, 125.0, 73.0, 65.0, 41.0, 37.0, 23.0, 26.0, 19.0, 9.0, 9.0, 11.0, 5.0, 10.0, 4.0, 5.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-13.625, -13.2308349609375, -12.836669921875, -12.4425048828125, -12.04833984375, -11.6541748046875, -11.260009765625, -10.8658447265625, -10.4716796875, -10.0775146484375, -9.683349609375, -9.2891845703125, -8.89501953125, -8.5008544921875, -8.106689453125, -7.7125244140625, -7.318359375, -6.9241943359375, -6.530029296875, -6.1358642578125, -5.74169921875, -5.3475341796875, -4.953369140625, -4.5592041015625, -4.1650390625, -3.7708740234375, -3.376708984375, -2.9825439453125, -2.58837890625, -2.1942138671875, -1.800048828125, -1.4058837890625, -1.01171875, -0.6175537109375, -0.223388671875, 0.1707763671875, 0.56494140625, 0.9591064453125, 1.353271484375, 1.7474365234375, 2.1416015625, 2.5357666015625, 2.929931640625, 3.3240966796875, 3.71826171875, 4.1124267578125, 4.506591796875, 4.9007568359375, 5.294921875, 5.6890869140625, 6.083251953125, 6.4774169921875, 6.87158203125, 7.2657470703125, 7.659912109375, 8.0540771484375, 8.4482421875, 8.8424072265625, 9.236572265625, 9.6307373046875, 10.02490234375, 10.4190673828125, 10.813232421875, 11.2073974609375, 11.6015625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 7.0, 16.0, 28.0, 58.0, 184.0, 3205.0, 403.0, 91.0, 37.0, 19.0, 13.0, 9.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9111328125, -1.8143768310546875, -1.717620849609375, -1.6208648681640625, -1.52410888671875, -1.4273529052734375, -1.330596923828125, -1.2338409423828125, -1.1370849609375, -1.0403289794921875, -0.943572998046875, -0.8468170166015625, -0.75006103515625, -0.6533050537109375, -0.556549072265625, -0.4597930908203125, -0.363037109375, -0.2662811279296875, -0.169525146484375, -0.0727691650390625, 0.02398681640625, 0.1207427978515625, 0.217498779296875, 0.3142547607421875, 0.4110107421875, 0.5077667236328125, 0.604522705078125, 0.7012786865234375, 0.79803466796875, 0.8947906494140625, 0.991546630859375, 1.0883026123046875, 1.18505859375, 1.2818145751953125, 1.378570556640625, 1.4753265380859375, 1.57208251953125, 1.6688385009765625, 1.765594482421875, 1.8623504638671875, 1.9591064453125, 2.0558624267578125, 2.152618408203125, 2.2493743896484375, 2.34613037109375, 2.4428863525390625, 2.539642333984375, 2.6363983154296875, 2.733154296875, 2.8299102783203125, 2.926666259765625, 3.0234222412109375, 3.12017822265625, 3.2169342041015625, 3.313690185546875, 3.4104461669921875, 3.5072021484375, 3.6039581298828125, 3.700714111328125, 3.7974700927734375, 3.89422607421875, 3.9909820556640625, 4.087738037109375, 4.1844940185546875, 4.28125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 8.0, 19.0, 44.0, 81.0, 152.0, 178.0, 204.0, 139.0, 87.0, 40.0, 26.0, 8.0, 6.0, 3.0, 2.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.838037967681885, -5.4201812744140625, -5.00232458114624, -4.584467887878418, -4.166611194610596, -3.7487547397613525, -3.3308980464935303, -2.913041353225708, -2.4951846599578857, -2.0773279666900635, -1.6594712734222412, -1.2416146993637085, -0.8237580060958862, -0.4059014320373535, 0.01195526123046875, 0.429811954498291, 0.8476686477661133, 1.2655253410339355, 1.6833820343017578, 2.10123872756958, 2.5190954208374023, 2.9369518756866455, 3.3548085689544678, 3.77266526222229, 4.190522193908691, 4.608378887176514, 5.026235580444336, 5.444092273712158, 5.8619489669799805, 6.2798051834106445, 6.697662353515625, 7.115518569946289, 7.5333757400512695, 7.951232433319092, 8.369089126586914, 8.786945343017578, 9.204802513122559, 9.622658729553223, 10.040515899658203, 10.458372116088867, 10.876229286193848, 11.294085502624512, 11.711942672729492, 12.129798889160156, 12.547656059265137, 12.9655122756958, 13.383369445800781, 13.801225662231445, 14.21908187866211, 14.636938095092773, 15.054795265197754, 15.472651481628418, 15.890508651733398, 16.308364868164062, 16.726221084594727, 17.144079208374023, 17.561935424804688, 17.97979164123535, 18.397647857666016, 18.815505981445312, 19.233362197875977, 19.65121841430664, 20.069074630737305, 20.4869327545166, 20.904788970947266]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 5.0, 4.0, 2.0, 8.0, 7.0, 7.0, 11.0, 15.0, 17.0, 16.0, 21.0, 24.0, 26.0, 36.0, 33.0, 37.0, 31.0, 52.0, 41.0, 56.0, 49.0, 48.0, 70.0, 47.0, 45.0, 39.0, 39.0, 31.0, 33.0, 19.0, 20.0, 20.0, 20.0, 19.0, 12.0, 10.0, 9.0, 11.0, 4.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.284671306610107, -4.147883415222168, -4.0110955238342285, -3.87430739402771, -3.7375192642211914, -3.600731372833252, -3.4639434814453125, -3.327155590057373, -3.1903674602508545, -3.053579568862915, -2.9167914390563965, -2.780003547668457, -2.6432156562805176, -2.506427526473999, -2.3696396350860596, -2.232851505279541, -2.0960636138916016, -1.9592756032943726, -1.8224875926971436, -1.685699701309204, -1.548911690711975, -1.412123680114746, -1.2753357887268066, -1.1385477781295776, -1.0017597675323486, -0.8649717569351196, -0.7281838059425354, -0.5913958549499512, -0.45460784435272217, -0.31781983375549316, -0.18103188276290894, -0.04424393177032471, 0.0925440788269043, 0.2293320596218109, 0.36612004041671753, 0.5029079914093018, 0.6396960020065308, 0.7764840126037598, 0.913271963596344, 1.0500599145889282, 1.1868479251861572, 1.3236359357833862, 1.4604239463806152, 1.5972118377685547, 1.7339998483657837, 1.8707878589630127, 2.007575750350952, 2.1443638801574707, 2.28115177154541, 2.4179396629333496, 2.554727792739868, 2.6915156841278076, 2.828303813934326, 2.9650917053222656, 3.101879596710205, 3.2386674880981445, 3.375455617904663, 3.5122435092926025, 3.649031639099121, 3.7858195304870605, 3.922607421875, 4.059395790100098, 4.196183681488037, 4.332971572875977, 4.469759464263916]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 6.0, 7.0, 11.0, 11.0, 24.0, 24.0, 40.0, 61.0, 102.0, 119.0, 176.0, 274.0, 419.0, 695.0, 1224.0, 1999.0, 3743.0, 7313.0, 14705.0, 30954.0, 69330.0, 157568.0, 290093.0, 248831.0, 119707.0, 52248.0, 23829.0, 11642.0, 5871.0, 3015.0, 1718.0, 1052.0, 620.0, 369.0, 224.0, 155.0, 116.0, 70.0, 59.0, 37.0, 25.0, 14.0, 14.0, 12.0, 13.0, 6.0, 7.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.65234375, -3.53387451171875, -3.4154052734375, -3.29693603515625, -3.178466796875, -3.05999755859375, -2.9415283203125, -2.82305908203125, -2.70458984375, -2.58612060546875, -2.4676513671875, -2.34918212890625, -2.230712890625, -2.11224365234375, -1.9937744140625, -1.87530517578125, -1.7568359375, -1.63836669921875, -1.5198974609375, -1.40142822265625, -1.282958984375, -1.16448974609375, -1.0460205078125, -0.92755126953125, -0.80908203125, -0.69061279296875, -0.5721435546875, -0.45367431640625, -0.335205078125, -0.21673583984375, -0.0982666015625, 0.02020263671875, 0.138671875, 0.25714111328125, 0.3756103515625, 0.49407958984375, 0.612548828125, 0.73101806640625, 0.8494873046875, 0.96795654296875, 1.08642578125, 1.20489501953125, 1.3233642578125, 1.44183349609375, 1.560302734375, 1.67877197265625, 1.7972412109375, 1.91571044921875, 2.0341796875, 2.15264892578125, 2.2711181640625, 2.38958740234375, 2.508056640625, 2.62652587890625, 2.7449951171875, 2.86346435546875, 2.98193359375, 3.10040283203125, 3.2188720703125, 3.33734130859375, 3.455810546875, 3.57427978515625, 3.6927490234375, 3.81121826171875, 3.9296875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 5.0, 0.0, 1.0, 3.0, 12.0, 9.0, 11.0, 14.0, 19.0, 26.0, 25.0, 28.0, 31.0, 36.0, 29.0, 21.0, 47.0, 48.0, 50.0, 62.0, 54.0, 45.0, 43.0, 41.0, 54.0, 47.0, 38.0, 29.0, 36.0, 21.0, 27.0, 22.0, 21.0, 12.0, 5.0, 9.0, 3.0, 5.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-4.34765625, -4.23382568359375, -4.1199951171875, -4.00616455078125, -3.892333984375, -3.77850341796875, -3.6646728515625, -3.55084228515625, -3.43701171875, -3.32318115234375, -3.2093505859375, -3.09552001953125, -2.981689453125, -2.86785888671875, -2.7540283203125, -2.64019775390625, -2.5263671875, -2.41253662109375, -2.2987060546875, -2.18487548828125, -2.071044921875, -1.95721435546875, -1.8433837890625, -1.72955322265625, -1.61572265625, -1.50189208984375, -1.3880615234375, -1.27423095703125, -1.160400390625, -1.04656982421875, -0.9327392578125, -0.81890869140625, -0.705078125, -0.59124755859375, -0.4774169921875, -0.36358642578125, -0.249755859375, -0.13592529296875, -0.0220947265625, 0.09173583984375, 0.20556640625, 0.31939697265625, 0.4332275390625, 0.54705810546875, 0.660888671875, 0.77471923828125, 0.8885498046875, 1.00238037109375, 1.1162109375, 1.23004150390625, 1.3438720703125, 1.45770263671875, 1.571533203125, 1.68536376953125, 1.7991943359375, 1.91302490234375, 2.02685546875, 2.14068603515625, 2.2545166015625, 2.36834716796875, 2.482177734375, 2.59600830078125, 2.7098388671875, 2.82366943359375, 2.9375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 9.0, 14.0, 9.0, 18.0, 28.0, 49.0, 69.0, 116.0, 235.0, 467.0, 949.0, 2657.0, 9853.0, 64623.0, 705347.0, 232531.0, 23803.0, 4905.0, 1494.0, 620.0, 309.0, 182.0, 99.0, 56.0, 36.0, 17.0, 15.0, 10.0, 8.0, 5.0, 9.0, 0.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.828125, -12.458984375, -12.08984375, -11.720703125, -11.3515625, -10.982421875, -10.61328125, -10.244140625, -9.875, -9.505859375, -9.13671875, -8.767578125, -8.3984375, -8.029296875, -7.66015625, -7.291015625, -6.921875, -6.552734375, -6.18359375, -5.814453125, -5.4453125, -5.076171875, -4.70703125, -4.337890625, -3.96875, -3.599609375, -3.23046875, -2.861328125, -2.4921875, -2.123046875, -1.75390625, -1.384765625, -1.015625, -0.646484375, -0.27734375, 0.091796875, 0.4609375, 0.830078125, 1.19921875, 1.568359375, 1.9375, 2.306640625, 2.67578125, 3.044921875, 3.4140625, 3.783203125, 4.15234375, 4.521484375, 4.890625, 5.259765625, 5.62890625, 5.998046875, 6.3671875, 6.736328125, 7.10546875, 7.474609375, 7.84375, 8.212890625, 8.58203125, 8.951171875, 9.3203125, 9.689453125, 10.05859375, 10.427734375, 10.796875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 9.0, 6.0, 10.0, 9.0, 22.0, 21.0, 21.0, 22.0, 25.0, 34.0, 37.0, 46.0, 46.0, 55.0, 57.0, 61.0, 57.0, 49.0, 57.0, 55.0, 38.0, 43.0, 35.0, 34.0, 30.0, 24.0, 20.0, 23.0, 13.0, 13.0, 8.0, 4.0, 6.0, 6.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.5, -17.885498046875, -17.27099609375, -16.656494140625, -16.0419921875, -15.427490234375, -14.81298828125, -14.198486328125, -13.583984375, -12.969482421875, -12.35498046875, -11.740478515625, -11.1259765625, -10.511474609375, -9.89697265625, -9.282470703125, -8.66796875, -8.053466796875, -7.43896484375, -6.824462890625, -6.2099609375, -5.595458984375, -4.98095703125, -4.366455078125, -3.751953125, -3.137451171875, -2.52294921875, -1.908447265625, -1.2939453125, -0.679443359375, -0.06494140625, 0.549560546875, 1.1640625, 1.778564453125, 2.39306640625, 3.007568359375, 3.6220703125, 4.236572265625, 4.85107421875, 5.465576171875, 6.080078125, 6.694580078125, 7.30908203125, 7.923583984375, 8.5380859375, 9.152587890625, 9.76708984375, 10.381591796875, 10.99609375, 11.610595703125, 12.22509765625, 12.839599609375, 13.4541015625, 14.068603515625, 14.68310546875, 15.297607421875, 15.912109375, 16.526611328125, 17.14111328125, 17.755615234375, 18.3701171875, 18.984619140625, 19.59912109375, 20.213623046875, 20.828125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 7.0, 7.0, 1.0, 13.0, 14.0, 12.0, 24.0, 41.0, 57.0, 113.0, 221.0, 640.0, 2942.0, 68549.0, 952867.0, 20394.0, 1733.0, 488.0, 179.0, 96.0, 60.0, 37.0, 19.0, 13.0, 10.0, 7.0, 5.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.03125, -8.760498046875, -8.48974609375, -8.218994140625, -7.9482421875, -7.677490234375, -7.40673828125, -7.135986328125, -6.865234375, -6.594482421875, -6.32373046875, -6.052978515625, -5.7822265625, -5.511474609375, -5.24072265625, -4.969970703125, -4.69921875, -4.428466796875, -4.15771484375, -3.886962890625, -3.6162109375, -3.345458984375, -3.07470703125, -2.803955078125, -2.533203125, -2.262451171875, -1.99169921875, -1.720947265625, -1.4501953125, -1.179443359375, -0.90869140625, -0.637939453125, -0.3671875, -0.096435546875, 0.17431640625, 0.445068359375, 0.7158203125, 0.986572265625, 1.25732421875, 1.528076171875, 1.798828125, 2.069580078125, 2.34033203125, 2.611083984375, 2.8818359375, 3.152587890625, 3.42333984375, 3.694091796875, 3.96484375, 4.235595703125, 4.50634765625, 4.777099609375, 5.0478515625, 5.318603515625, 5.58935546875, 5.860107421875, 6.130859375, 6.401611328125, 6.67236328125, 6.943115234375, 7.2138671875, 7.484619140625, 7.75537109375, 8.026123046875, 8.296875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 6.0, 7.0, 10.0, 10.0, 12.0, 21.0, 23.0, 38.0, 33.0, 47.0, 81.0, 95.0, 114.0, 109.0, 98.0, 67.0, 52.0, 44.0, 27.0, 23.0, 25.0, 17.0, 13.0, 8.0, 4.0, 5.0, 2.0, 1.0, 4.0, 6.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000530242919921875, -0.0005120262503623962, -0.0004938095808029175, -0.0004755929112434387, -0.00045737624168395996, -0.0004391595721244812, -0.00042094290256500244, -0.0004027262330055237, -0.0003845095634460449, -0.00036629289388656616, -0.0003480762243270874, -0.00032985955476760864, -0.0003116428852081299, -0.0002934262156486511, -0.00027520954608917236, -0.0002569928765296936, -0.00023877620697021484, -0.00022055953741073608, -0.00020234286785125732, -0.00018412619829177856, -0.0001659095287322998, -0.00014769285917282104, -0.00012947618961334229, -0.00011125952005386353, -9.304285049438477e-05, -7.4826180934906e-05, -5.6609511375427246e-05, -3.8392841815948486e-05, -2.0176172256469727e-05, -1.959502696990967e-06, 1.6257166862487793e-05, 3.447383642196655e-05, 5.269050598144531e-05, 7.090717554092407e-05, 8.912384510040283e-05, 0.00010734051465988159, 0.00012555718421936035, 0.0001437738537788391, 0.00016199052333831787, 0.00018020719289779663, 0.0001984238624572754, 0.00021664053201675415, 0.0002348572015762329, 0.00025307387113571167, 0.00027129054069519043, 0.0002895072102546692, 0.00030772387981414795, 0.0003259405493736267, 0.00034415721893310547, 0.00036237388849258423, 0.000380590558052063, 0.00039880722761154175, 0.0004170238971710205, 0.00043524056673049927, 0.00045345723628997803, 0.0004716739058494568, 0.0004898905754089355, 0.0005081072449684143, 0.0005263239145278931, 0.0005445405840873718, 0.0005627572536468506, 0.0005809739232063293, 0.0005991905927658081, 0.0006174072623252869, 0.0006356239318847656]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 3.0, 3.0, 7.0, 9.0, 26.0, 31.0, 38.0, 97.0, 131.0, 281.0, 591.0, 1550.0, 5183.0, 31623.0, 548247.0, 426237.0, 27127.0, 4769.0, 1417.0, 578.0, 252.0, 135.0, 84.0, 55.0, 25.0, 26.0, 11.0, 6.0, 5.0, 4.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.51171875, -5.34942626953125, -5.1871337890625, -5.02484130859375, -4.862548828125, -4.70025634765625, -4.5379638671875, -4.37567138671875, -4.21337890625, -4.05108642578125, -3.8887939453125, -3.72650146484375, -3.564208984375, -3.40191650390625, -3.2396240234375, -3.07733154296875, -2.9150390625, -2.75274658203125, -2.5904541015625, -2.42816162109375, -2.265869140625, -2.10357666015625, -1.9412841796875, -1.77899169921875, -1.61669921875, -1.45440673828125, -1.2921142578125, -1.12982177734375, -0.967529296875, -0.80523681640625, -0.6429443359375, -0.48065185546875, -0.318359375, -0.15606689453125, 0.0062255859375, 0.16851806640625, 0.330810546875, 0.49310302734375, 0.6553955078125, 0.81768798828125, 0.97998046875, 1.14227294921875, 1.3045654296875, 1.46685791015625, 1.629150390625, 1.79144287109375, 1.9537353515625, 2.11602783203125, 2.2783203125, 2.44061279296875, 2.6029052734375, 2.76519775390625, 2.927490234375, 3.08978271484375, 3.2520751953125, 3.41436767578125, 3.57666015625, 3.73895263671875, 3.9012451171875, 4.06353759765625, 4.225830078125, 4.38812255859375, 4.5504150390625, 4.71270751953125, 4.875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 4.0, 5.0, 5.0, 4.0, 14.0, 18.0, 22.0, 33.0, 50.0, 75.0, 117.0, 151.0, 137.0, 91.0, 97.0, 51.0, 40.0, 21.0, 16.0, 16.0, 6.0, 10.0, 8.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.296875, -6.12213134765625, -5.9473876953125, -5.77264404296875, -5.597900390625, -5.42315673828125, -5.2484130859375, -5.07366943359375, -4.89892578125, -4.72418212890625, -4.5494384765625, -4.37469482421875, -4.199951171875, -4.02520751953125, -3.8504638671875, -3.67572021484375, -3.5009765625, -3.32623291015625, -3.1514892578125, -2.97674560546875, -2.802001953125, -2.62725830078125, -2.4525146484375, -2.27777099609375, -2.10302734375, -1.92828369140625, -1.7535400390625, -1.57879638671875, -1.404052734375, -1.22930908203125, -1.0545654296875, -0.87982177734375, -0.705078125, -0.53033447265625, -0.3555908203125, -0.18084716796875, -0.006103515625, 0.16864013671875, 0.3433837890625, 0.51812744140625, 0.69287109375, 0.86761474609375, 1.0423583984375, 1.21710205078125, 1.391845703125, 1.56658935546875, 1.7413330078125, 1.91607666015625, 2.0908203125, 2.26556396484375, 2.4403076171875, 2.61505126953125, 2.789794921875, 2.96453857421875, 3.1392822265625, 3.31402587890625, 3.48876953125, 3.66351318359375, 3.8382568359375, 4.01300048828125, 4.187744140625, 4.36248779296875, 4.5372314453125, 4.71197509765625, 4.88671875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 8.0, 19.0, 62.0, 259.0, 418.0, 188.0, 35.0, 14.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-291.00189208984375, -285.3441162109375, -279.6863098144531, -274.0285339355469, -268.3707580566406, -262.7129821777344, -257.05517578125, -251.39739990234375, -245.7396240234375, -240.0818328857422, -234.42405700683594, -228.76626586914062, -223.10848999023438, -217.45069885253906, -211.79290771484375, -206.1351318359375, -200.4773406982422, -194.81954956054688, -189.16177368164062, -183.5039825439453, -177.84620666503906, -172.18841552734375, -166.5306396484375, -160.8728485107422, -155.21505737304688, -149.55726623535156, -143.8994903564453, -138.24169921875, -132.58392333984375, -126.92613220214844, -121.26834869384766, -115.61056518554688, -109.95279693603516, -104.29501342773438, -98.6372299194336, -92.97944641113281, -87.3216552734375, -81.66387939453125, -76.00608825683594, -70.34830474853516, -64.69052124023438, -59.032737731933594, -53.37495422363281, -47.717166900634766, -42.059383392333984, -36.4015998840332, -30.743812561035156, -25.086029052734375, -19.428245544433594, -13.770461082458496, -8.112676620483398, -2.4548912048339844, 3.202892303466797, 8.860675811767578, 14.518463134765625, 20.176246643066406, 25.834030151367188, 31.49181365966797, 37.14959716796875, 42.8073844909668, 48.46516799926758, 54.12295150756836, 59.780738830566406, 65.43852233886719, 71.09630584716797]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 0.0, 7.0, 12.0, 13.0, 7.0, 8.0, 14.0, 16.0, 23.0, 14.0, 34.0, 34.0, 25.0, 30.0, 44.0, 49.0, 40.0, 39.0, 42.0, 59.0, 42.0, 53.0, 48.0, 33.0, 40.0, 40.0, 29.0, 26.0, 37.0, 19.0, 18.0, 16.0, 17.0, 7.0, 8.0, 15.0, 8.0, 7.0, 7.0, 4.0, 4.0, 6.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-61.720909118652344, -59.628684997558594, -57.536460876464844, -55.444236755371094, -53.352012634277344, -51.259788513183594, -49.167564392089844, -47.075340270996094, -44.983116149902344, -42.890892028808594, -40.798667907714844, -38.706443786621094, -36.614219665527344, -34.521995544433594, -32.429771423339844, -30.337547302246094, -28.245323181152344, -26.153099060058594, -24.060874938964844, -21.968650817871094, -19.876426696777344, -17.784202575683594, -15.691978454589844, -13.599754333496094, -11.507530212402344, -9.415306091308594, -7.323081970214844, -5.230857849121094, -3.1386337280273438, -1.0464096069335938, 1.0458145141601562, 3.1380386352539062, 5.2302703857421875, 7.3224945068359375, 9.414718627929688, 11.506942749023438, 13.599166870117188, 15.691390991210938, 17.783615112304688, 19.875839233398438, 21.968063354492188, 24.060287475585938, 26.152511596679688, 28.244735717773438, 30.336959838867188, 32.42918395996094, 34.52140808105469, 36.61363220214844, 38.70585632324219, 40.79808044433594, 42.89030456542969, 44.98252868652344, 47.07475280761719, 49.16697692871094, 51.25920104980469, 53.35142517089844, 55.44364929199219, 57.53587341308594, 59.62809753417969, 61.72032165527344, 63.81254577636719, 65.90476989746094, 67.99699401855469, 70.08921813964844, 72.18144226074219]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 7.0, 10.0, 9.0, 14.0, 30.0, 33.0, 44.0, 83.0, 143.0, 264.0, 408.0, 816.0, 1714.0, 4488.0, 13435.0, 62386.0, 3610556.0, 446585.0, 37046.0, 9624.0, 3412.0, 1538.0, 691.0, 387.0, 217.0, 118.0, 78.0, 45.0, 31.0, 20.0, 16.0, 14.0, 3.0, 7.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.19140625, -6.008544921875, -5.82568359375, -5.642822265625, -5.4599609375, -5.277099609375, -5.09423828125, -4.911376953125, -4.728515625, -4.545654296875, -4.36279296875, -4.179931640625, -3.9970703125, -3.814208984375, -3.63134765625, -3.448486328125, -3.265625, -3.082763671875, -2.89990234375, -2.717041015625, -2.5341796875, -2.351318359375, -2.16845703125, -1.985595703125, -1.802734375, -1.619873046875, -1.43701171875, -1.254150390625, -1.0712890625, -0.888427734375, -0.70556640625, -0.522705078125, -0.33984375, -0.156982421875, 0.02587890625, 0.208740234375, 0.3916015625, 0.574462890625, 0.75732421875, 0.940185546875, 1.123046875, 1.305908203125, 1.48876953125, 1.671630859375, 1.8544921875, 2.037353515625, 2.22021484375, 2.403076171875, 2.5859375, 2.768798828125, 2.95166015625, 3.134521484375, 3.3173828125, 3.500244140625, 3.68310546875, 3.865966796875, 4.048828125, 4.231689453125, 4.41455078125, 4.597412109375, 4.7802734375, 4.963134765625, 5.14599609375, 5.328857421875, 5.51171875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 6.0, 3.0, 7.0, 3.0, 2.0, 6.0, 9.0, 9.0, 8.0, 19.0, 24.0, 21.0, 26.0, 39.0, 45.0, 41.0, 51.0, 52.0, 53.0, 57.0, 63.0, 67.0, 55.0, 58.0, 37.0, 48.0, 37.0, 37.0, 31.0, 17.0, 18.0, 18.0, 11.0, 9.0, 3.0, 4.0, 4.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.416015625, -3.294891357421875, -3.17376708984375, -3.052642822265625, -2.9315185546875, -2.810394287109375, -2.68927001953125, -2.568145751953125, -2.447021484375, -2.325897216796875, -2.20477294921875, -2.083648681640625, -1.9625244140625, -1.841400146484375, -1.72027587890625, -1.599151611328125, -1.47802734375, -1.356903076171875, -1.23577880859375, -1.114654541015625, -0.9935302734375, -0.872406005859375, -0.75128173828125, -0.630157470703125, -0.509033203125, -0.387908935546875, -0.26678466796875, -0.145660400390625, -0.0245361328125, 0.096588134765625, 0.21771240234375, 0.338836669921875, 0.4599609375, 0.581085205078125, 0.70220947265625, 0.823333740234375, 0.9444580078125, 1.065582275390625, 1.18670654296875, 1.307830810546875, 1.428955078125, 1.550079345703125, 1.67120361328125, 1.792327880859375, 1.9134521484375, 2.034576416015625, 2.15570068359375, 2.276824951171875, 2.39794921875, 2.519073486328125, 2.64019775390625, 2.761322021484375, 2.8824462890625, 3.003570556640625, 3.12469482421875, 3.245819091796875, 3.366943359375, 3.488067626953125, 3.60919189453125, 3.730316162109375, 3.8514404296875, 3.972564697265625, 4.09368896484375, 4.214813232421875, 4.3359375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 2.0, 6.0, 6.0, 5.0, 7.0, 17.0, 17.0, 24.0, 25.0, 33.0, 47.0, 72.0, 80.0, 129.0, 161.0, 246.0, 307.0, 433.0, 696.0, 956.0, 1640.0, 3155.0, 7401.0, 25116.0, 180308.0, 3779136.0, 155940.0, 23301.0, 7097.0, 3005.0, 1621.0, 1001.0, 666.0, 469.0, 285.0, 250.0, 175.0, 126.0, 95.0, 65.0, 52.0, 35.0, 16.0, 26.0, 15.0, 5.0, 11.0, 6.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.1875, -5.00531005859375, -4.8231201171875, -4.64093017578125, -4.458740234375, -4.27655029296875, -4.0943603515625, -3.91217041015625, -3.72998046875, -3.54779052734375, -3.3656005859375, -3.18341064453125, -3.001220703125, -2.81903076171875, -2.6368408203125, -2.45465087890625, -2.2724609375, -2.09027099609375, -1.9080810546875, -1.72589111328125, -1.543701171875, -1.36151123046875, -1.1793212890625, -0.99713134765625, -0.81494140625, -0.63275146484375, -0.4505615234375, -0.26837158203125, -0.086181640625, 0.09600830078125, 0.2781982421875, 0.46038818359375, 0.642578125, 0.82476806640625, 1.0069580078125, 1.18914794921875, 1.371337890625, 1.55352783203125, 1.7357177734375, 1.91790771484375, 2.10009765625, 2.28228759765625, 2.4644775390625, 2.64666748046875, 2.828857421875, 3.01104736328125, 3.1932373046875, 3.37542724609375, 3.5576171875, 3.73980712890625, 3.9219970703125, 4.10418701171875, 4.286376953125, 4.46856689453125, 4.6507568359375, 4.83294677734375, 5.01513671875, 5.19732666015625, 5.3795166015625, 5.56170654296875, 5.743896484375, 5.92608642578125, 6.1082763671875, 6.29046630859375, 6.47265625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 8.0, 9.0, 13.0, 22.0, 37.0, 111.0, 419.0, 2888.0, 364.0, 104.0, 38.0, 26.0, 10.0, 8.0, 6.0, 3.0, 3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.38671875, -4.2471923828125, -4.107666015625, -3.9681396484375, -3.82861328125, -3.6890869140625, -3.549560546875, -3.4100341796875, -3.2705078125, -3.1309814453125, -2.991455078125, -2.8519287109375, -2.71240234375, -2.5728759765625, -2.433349609375, -2.2938232421875, -2.154296875, -2.0147705078125, -1.875244140625, -1.7357177734375, -1.59619140625, -1.4566650390625, -1.317138671875, -1.1776123046875, -1.0380859375, -0.8985595703125, -0.759033203125, -0.6195068359375, -0.47998046875, -0.3404541015625, -0.200927734375, -0.0614013671875, 0.078125, 0.2176513671875, 0.357177734375, 0.4967041015625, 0.63623046875, 0.7757568359375, 0.915283203125, 1.0548095703125, 1.1943359375, 1.3338623046875, 1.473388671875, 1.6129150390625, 1.75244140625, 1.8919677734375, 2.031494140625, 2.1710205078125, 2.310546875, 2.4500732421875, 2.589599609375, 2.7291259765625, 2.86865234375, 3.0081787109375, 3.147705078125, 3.2872314453125, 3.4267578125, 3.5662841796875, 3.705810546875, 3.8453369140625, 3.98486328125, 4.1243896484375, 4.263916015625, 4.4034423828125, 4.54296875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 9.0, 19.0, 23.0, 73.0, 97.0, 141.0, 183.0, 152.0, 108.0, 63.0, 56.0, 30.0, 16.0, 14.0, 5.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.977409362792969, -11.444223403930664, -10.91103744506836, -10.377851486206055, -9.84466552734375, -9.311479568481445, -8.778292655944824, -8.24510669708252, -7.711920738220215, -7.17873477935791, -6.6455488204956055, -6.112362384796143, -5.579176425933838, -5.045990467071533, -4.51280403137207, -3.9796180725097656, -3.446432113647461, -2.9132461547851562, -2.3800599575042725, -1.8468738794326782, -1.313687801361084, -0.7805018424987793, -0.2473156452178955, 0.2858705520629883, 0.819056510925293, 1.3522425889968872, 1.8854286670684814, 2.4186148643493652, 2.95180082321167, 3.4849867820739746, 4.0181732177734375, 4.551359176635742, 5.084545135498047, 5.617731094360352, 6.150917053222656, 6.684103488922119, 7.217289447784424, 7.7504754066467285, 8.283661842346191, 8.816847801208496, 9.3500337600708, 9.883219718933105, 10.41640567779541, 10.949591636657715, 11.482778549194336, 12.01596450805664, 12.549150466918945, 13.08233642578125, 13.615522384643555, 14.14870834350586, 14.681894302368164, 15.215080261230469, 15.748266220092773, 16.281452178955078, 16.814638137817383, 17.347824096679688, 17.881011962890625, 18.41419792175293, 18.947383880615234, 19.48056983947754, 20.013755798339844, 20.54694175720215, 21.080127716064453, 21.61331558227539, 22.146499633789062]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 8.0, 1.0, 3.0, 8.0, 3.0, 11.0, 13.0, 10.0, 23.0, 23.0, 33.0, 31.0, 29.0, 41.0, 37.0, 52.0, 37.0, 41.0, 53.0, 50.0, 49.0, 53.0, 36.0, 48.0, 46.0, 52.0, 22.0, 30.0, 25.0, 31.0, 19.0, 17.0, 12.0, 11.0, 14.0, 14.0, 5.0, 6.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.870329856872559, -6.616978645324707, -6.3636274337768555, -6.110276222229004, -5.856925010681152, -5.603573799133301, -5.350222587585449, -5.096871376037598, -4.843520164489746, -4.5901689529418945, -4.336817741394043, -4.083466529846191, -3.83011531829834, -3.5767641067504883, -3.3234126567840576, -3.070061445236206, -2.8167099952697754, -2.563358783721924, -2.3100075721740723, -2.0566563606262207, -1.8033050298690796, -1.549953818321228, -1.296602487564087, -1.0432512760162354, -0.7899000644683838, -0.5365488529205322, -0.2831975817680359, -0.02984631061553955, 0.223504900932312, 0.4768561124801636, 0.7302074432373047, 0.9835586547851562, 1.2369098663330078, 1.4902610778808594, 1.743612289428711, 1.996963620185852, 2.250314712524414, 2.5036659240722656, 2.7570173740386963, 3.010368585586548, 3.2637197971343994, 3.517071008682251, 3.7704222202301025, 4.023773670196533, 4.277124881744385, 4.530476093292236, 4.783827304840088, 5.0371785163879395, 5.290529727935791, 5.543880939483643, 5.797232151031494, 6.050583362579346, 6.303934574127197, 6.557285785675049, 6.810637474060059, 7.06398868560791, 7.317339897155762, 7.570691108703613, 7.824042320251465, 8.077393531799316, 8.330744743347168, 8.58409595489502, 8.837447166442871, 9.090798377990723, 9.344149589538574]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 9.0, 10.0, 17.0, 16.0, 25.0, 35.0, 56.0, 79.0, 136.0, 253.0, 383.0, 654.0, 1242.0, 2582.0, 6131.0, 15447.0, 44591.0, 142836.0, 376354.0, 303956.0, 100641.0, 32075.0, 11675.0, 4720.0, 2162.0, 998.0, 556.0, 336.0, 187.0, 117.0, 80.0, 58.0, 33.0, 26.0, 15.0, 21.0, 9.0, 5.0, 11.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-5.5390625, -5.380126953125, -5.22119140625, -5.062255859375, -4.9033203125, -4.744384765625, -4.58544921875, -4.426513671875, -4.267578125, -4.108642578125, -3.94970703125, -3.790771484375, -3.6318359375, -3.472900390625, -3.31396484375, -3.155029296875, -2.99609375, -2.837158203125, -2.67822265625, -2.519287109375, -2.3603515625, -2.201416015625, -2.04248046875, -1.883544921875, -1.724609375, -1.565673828125, -1.40673828125, -1.247802734375, -1.0888671875, -0.929931640625, -0.77099609375, -0.612060546875, -0.453125, -0.294189453125, -0.13525390625, 0.023681640625, 0.1826171875, 0.341552734375, 0.50048828125, 0.659423828125, 0.818359375, 0.977294921875, 1.13623046875, 1.295166015625, 1.4541015625, 1.613037109375, 1.77197265625, 1.930908203125, 2.08984375, 2.248779296875, 2.40771484375, 2.566650390625, 2.7255859375, 2.884521484375, 3.04345703125, 3.202392578125, 3.361328125, 3.520263671875, 3.67919921875, 3.838134765625, 3.9970703125, 4.156005859375, 4.31494140625, 4.473876953125, 4.6328125]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 3.0, 3.0, 1.0, 3.0, 3.0, 4.0, 7.0, 5.0, 10.0, 9.0, 8.0, 18.0, 12.0, 30.0, 30.0, 28.0, 32.0, 38.0, 36.0, 63.0, 55.0, 44.0, 54.0, 41.0, 58.0, 55.0, 48.0, 49.0, 42.0, 29.0, 40.0, 37.0, 18.0, 21.0, 10.0, 12.0, 15.0, 10.0, 8.0, 4.0, 4.0, 3.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.111328125, -2.997039794921875, -2.88275146484375, -2.768463134765625, -2.6541748046875, -2.539886474609375, -2.42559814453125, -2.311309814453125, -2.197021484375, -2.082733154296875, -1.96844482421875, -1.854156494140625, -1.7398681640625, -1.625579833984375, -1.51129150390625, -1.397003173828125, -1.28271484375, -1.168426513671875, -1.05413818359375, -0.939849853515625, -0.8255615234375, -0.711273193359375, -0.59698486328125, -0.482696533203125, -0.368408203125, -0.254119873046875, -0.13983154296875, -0.025543212890625, 0.0887451171875, 0.203033447265625, 0.31732177734375, 0.431610107421875, 0.5458984375, 0.660186767578125, 0.77447509765625, 0.888763427734375, 1.0030517578125, 1.117340087890625, 1.23162841796875, 1.345916748046875, 1.460205078125, 1.574493408203125, 1.68878173828125, 1.803070068359375, 1.9173583984375, 2.031646728515625, 2.14593505859375, 2.260223388671875, 2.37451171875, 2.488800048828125, 2.60308837890625, 2.717376708984375, 2.8316650390625, 2.945953369140625, 3.06024169921875, 3.174530029296875, 3.288818359375, 3.403106689453125, 3.51739501953125, 3.631683349609375, 3.7459716796875, 3.860260009765625, 3.97454833984375, 4.088836669921875, 4.203125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 7.0, 6.0, 6.0, 21.0, 25.0, 43.0, 50.0, 88.0, 167.0, 347.0, 888.0, 3133.0, 25317.0, 730585.0, 272563.0, 12043.0, 1991.0, 646.0, 272.0, 123.0, 70.0, 42.0, 35.0, 26.0, 18.0, 14.0, 9.0, 6.0, 3.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.65625, -16.1641845703125, -15.672119140625, -15.1800537109375, -14.68798828125, -14.1959228515625, -13.703857421875, -13.2117919921875, -12.7197265625, -12.2276611328125, -11.735595703125, -11.2435302734375, -10.75146484375, -10.2593994140625, -9.767333984375, -9.2752685546875, -8.783203125, -8.2911376953125, -7.799072265625, -7.3070068359375, -6.81494140625, -6.3228759765625, -5.830810546875, -5.3387451171875, -4.8466796875, -4.3546142578125, -3.862548828125, -3.3704833984375, -2.87841796875, -2.3863525390625, -1.894287109375, -1.4022216796875, -0.91015625, -0.4180908203125, 0.073974609375, 0.5660400390625, 1.05810546875, 1.5501708984375, 2.042236328125, 2.5343017578125, 3.0263671875, 3.5184326171875, 4.010498046875, 4.5025634765625, 4.99462890625, 5.4866943359375, 5.978759765625, 6.4708251953125, 6.962890625, 7.4549560546875, 7.947021484375, 8.4390869140625, 8.93115234375, 9.4232177734375, 9.915283203125, 10.4073486328125, 10.8994140625, 11.3914794921875, 11.883544921875, 12.3756103515625, 12.86767578125, 13.3597412109375, 13.851806640625, 14.3438720703125, 14.8359375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 4.0, 4.0, 2.0, 11.0, 8.0, 14.0, 13.0, 17.0, 17.0, 25.0, 25.0, 33.0, 40.0, 35.0, 48.0, 51.0, 49.0, 64.0, 47.0, 56.0, 55.0, 57.0, 51.0, 48.0, 40.0, 26.0, 42.0, 16.0, 17.0, 16.0, 20.0, 11.0, 13.0, 9.0, 5.0, 7.0, 5.0, 6.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.421875, -17.9102783203125, -17.398681640625, -16.8870849609375, -16.37548828125, -15.8638916015625, -15.352294921875, -14.8406982421875, -14.3291015625, -13.8175048828125, -13.305908203125, -12.7943115234375, -12.28271484375, -11.7711181640625, -11.259521484375, -10.7479248046875, -10.236328125, -9.7247314453125, -9.213134765625, -8.7015380859375, -8.18994140625, -7.6783447265625, -7.166748046875, -6.6551513671875, -6.1435546875, -5.6319580078125, -5.120361328125, -4.6087646484375, -4.09716796875, -3.5855712890625, -3.073974609375, -2.5623779296875, -2.05078125, -1.5391845703125, -1.027587890625, -0.5159912109375, -0.00439453125, 0.5072021484375, 1.018798828125, 1.5303955078125, 2.0419921875, 2.5535888671875, 3.065185546875, 3.5767822265625, 4.08837890625, 4.5999755859375, 5.111572265625, 5.6231689453125, 6.134765625, 6.6463623046875, 7.157958984375, 7.6695556640625, 8.18115234375, 8.6927490234375, 9.204345703125, 9.7159423828125, 10.2275390625, 10.7391357421875, 11.250732421875, 11.7623291015625, 12.27392578125, 12.7855224609375, 13.297119140625, 13.8087158203125, 14.3203125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 5.0, 9.0, 5.0, 16.0, 21.0, 30.0, 51.0, 54.0, 93.0, 163.0, 338.0, 716.0, 2377.0, 12778.0, 186004.0, 786365.0, 51611.0, 5515.0, 1312.0, 473.0, 251.0, 145.0, 71.0, 48.0, 35.0, 21.0, 18.0, 8.0, 6.0, 7.0, 5.0, 1.0, 1.0, 0.0, 3.0], "bins": [-5.921875, -5.78814697265625, -5.6544189453125, -5.52069091796875, -5.386962890625, -5.25323486328125, -5.1195068359375, -4.98577880859375, -4.85205078125, -4.71832275390625, -4.5845947265625, -4.45086669921875, -4.317138671875, -4.18341064453125, -4.0496826171875, -3.91595458984375, -3.7822265625, -3.64849853515625, -3.5147705078125, -3.38104248046875, -3.247314453125, -3.11358642578125, -2.9798583984375, -2.84613037109375, -2.71240234375, -2.57867431640625, -2.4449462890625, -2.31121826171875, -2.177490234375, -2.04376220703125, -1.9100341796875, -1.77630615234375, -1.642578125, -1.50885009765625, -1.3751220703125, -1.24139404296875, -1.107666015625, -0.97393798828125, -0.8402099609375, -0.70648193359375, -0.57275390625, -0.43902587890625, -0.3052978515625, -0.17156982421875, -0.037841796875, 0.09588623046875, 0.2296142578125, 0.36334228515625, 0.4970703125, 0.63079833984375, 0.7645263671875, 0.89825439453125, 1.031982421875, 1.16571044921875, 1.2994384765625, 1.43316650390625, 1.56689453125, 1.70062255859375, 1.8343505859375, 1.96807861328125, 2.101806640625, 2.23553466796875, 2.3692626953125, 2.50299072265625, 2.63671875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 2.0, 6.0, 6.0, 10.0, 6.0, 15.0, 19.0, 12.0, 22.0, 21.0, 31.0, 50.0, 53.0, 83.0, 120.0, 157.0, 100.0, 47.0, 42.0, 34.0, 37.0, 30.0, 20.0, 24.0, 12.0, 7.0, 9.0, 8.0, 7.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007152557373046875, -0.0006960704922676086, -0.0006768852472305298, -0.0006577000021934509, -0.0006385147571563721, -0.0006193295121192932, -0.0006001442670822144, -0.0005809590220451355, -0.0005617737770080566, -0.0005425885319709778, -0.0005234032869338989, -0.0005042180418968201, -0.0004850327968597412, -0.00046584755182266235, -0.0004466623067855835, -0.00042747706174850464, -0.0004082918167114258, -0.0003891065716743469, -0.00036992132663726807, -0.0003507360816001892, -0.00033155083656311035, -0.0003123655915260315, -0.00029318034648895264, -0.0002739951014518738, -0.0002548098564147949, -0.00023562461137771606, -0.0002164393663406372, -0.00019725412130355835, -0.0001780688762664795, -0.00015888363122940063, -0.00013969838619232178, -0.00012051314115524292, -0.00010132789611816406, -8.21426510810852e-05, -6.295740604400635e-05, -4.377216100692749e-05, -2.4586915969848633e-05, -5.401670932769775e-06, 1.3783574104309082e-05, 3.296881914138794e-05, 5.21540641784668e-05, 7.133930921554565e-05, 9.052455425262451e-05, 0.00010970979928970337, 0.00012889504432678223, 0.00014808028936386108, 0.00016726553440093994, 0.0001864507794380188, 0.00020563602447509766, 0.00022482126951217651, 0.00024400651454925537, 0.00026319175958633423, 0.0002823770046234131, 0.00030156224966049194, 0.0003207474946975708, 0.00033993273973464966, 0.0003591179847717285, 0.0003783032298088074, 0.00039748847484588623, 0.0004166737198829651, 0.00043585896492004395, 0.0004550442099571228, 0.00047422945499420166, 0.0004934147000312805, 0.0005125999450683594]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 4.0, 7.0, 4.0, 9.0, 9.0, 21.0, 16.0, 46.0, 81.0, 132.0, 243.0, 586.0, 1489.0, 4739.0, 25433.0, 446387.0, 533415.0, 28146.0, 5077.0, 1531.0, 600.0, 254.0, 118.0, 68.0, 40.0, 22.0, 18.0, 12.0, 7.0, 6.0, 11.0, 1.0, 3.0, 2.0, 3.0, 3.0, 1.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.38671875, -5.218505859375, -5.05029296875, -4.882080078125, -4.7138671875, -4.545654296875, -4.37744140625, -4.209228515625, -4.041015625, -3.872802734375, -3.70458984375, -3.536376953125, -3.3681640625, -3.199951171875, -3.03173828125, -2.863525390625, -2.6953125, -2.527099609375, -2.35888671875, -2.190673828125, -2.0224609375, -1.854248046875, -1.68603515625, -1.517822265625, -1.349609375, -1.181396484375, -1.01318359375, -0.844970703125, -0.6767578125, -0.508544921875, -0.34033203125, -0.172119140625, -0.00390625, 0.164306640625, 0.33251953125, 0.500732421875, 0.6689453125, 0.837158203125, 1.00537109375, 1.173583984375, 1.341796875, 1.510009765625, 1.67822265625, 1.846435546875, 2.0146484375, 2.182861328125, 2.35107421875, 2.519287109375, 2.6875, 2.855712890625, 3.02392578125, 3.192138671875, 3.3603515625, 3.528564453125, 3.69677734375, 3.864990234375, 4.033203125, 4.201416015625, 4.36962890625, 4.537841796875, 4.7060546875, 4.874267578125, 5.04248046875, 5.210693359375, 5.37890625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 1.0, 6.0, 2.0, 1.0, 9.0, 7.0, 7.0, 11.0, 16.0, 16.0, 24.0, 29.0, 60.0, 47.0, 51.0, 76.0, 83.0, 115.0, 111.0, 68.0, 70.0, 35.0, 38.0, 30.0, 20.0, 17.0, 14.0, 10.0, 5.0, 5.0, 7.0, 5.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.36328125, -3.253173828125, -3.14306640625, -3.032958984375, -2.9228515625, -2.812744140625, -2.70263671875, -2.592529296875, -2.482421875, -2.372314453125, -2.26220703125, -2.152099609375, -2.0419921875, -1.931884765625, -1.82177734375, -1.711669921875, -1.6015625, -1.491455078125, -1.38134765625, -1.271240234375, -1.1611328125, -1.051025390625, -0.94091796875, -0.830810546875, -0.720703125, -0.610595703125, -0.50048828125, -0.390380859375, -0.2802734375, -0.170166015625, -0.06005859375, 0.050048828125, 0.16015625, 0.270263671875, 0.38037109375, 0.490478515625, 0.6005859375, 0.710693359375, 0.82080078125, 0.930908203125, 1.041015625, 1.151123046875, 1.26123046875, 1.371337890625, 1.4814453125, 1.591552734375, 1.70166015625, 1.811767578125, 1.921875, 2.031982421875, 2.14208984375, 2.252197265625, 2.3623046875, 2.472412109375, 2.58251953125, 2.692626953125, 2.802734375, 2.912841796875, 3.02294921875, 3.133056640625, 3.2431640625, 3.353271484375, 3.46337890625, 3.573486328125, 3.68359375]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 8.0, 10.0, 32.0, 87.0, 283.0, 332.0, 181.0, 44.0, 16.0, 8.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-140.99026489257812, -136.7591552734375, -132.52804565429688, -128.29693603515625, -124.0658187866211, -119.83470916748047, -115.60359191894531, -111.37248229980469, -107.14137268066406, -102.91026306152344, -98.67915344238281, -94.44803619384766, -90.21692657470703, -85.9858169555664, -81.75469970703125, -77.52359008789062, -73.29248046875, -69.06137084960938, -64.83026123046875, -60.599143981933594, -56.36803436279297, -52.136924743652344, -47.90581130981445, -43.67469787597656, -39.44358825683594, -35.21247863769531, -30.981365203857422, -26.750253677368164, -22.519142150878906, -18.28803062438965, -14.05691909790039, -9.825807571411133, -5.594696044921875, -1.3635845184326172, 2.8675270080566406, 7.098638534545898, 11.329750061035156, 15.560861587524414, 19.791973114013672, 24.02308464050293, 28.254196166992188, 32.48530578613281, 36.7164192199707, 40.947532653808594, 45.17864227294922, 49.409751892089844, 53.640865325927734, 57.871978759765625, 62.10308837890625, 66.33419799804688, 70.5653076171875, 74.79642486572266, 79.02753448486328, 83.2586441040039, 87.48976135253906, 91.72087097167969, 95.95198059082031, 100.18309020996094, 104.41419982910156, 108.64531707763672, 112.87642669677734, 117.10753631591797, 121.33865356445312, 125.56976318359375, 129.80087280273438]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 8.0, 5.0, 5.0, 8.0, 10.0, 19.0, 11.0, 18.0, 19.0, 19.0, 19.0, 31.0, 26.0, 32.0, 47.0, 33.0, 46.0, 39.0, 51.0, 51.0, 43.0, 58.0, 32.0, 39.0, 26.0, 46.0, 32.0, 42.0, 23.0, 22.0, 23.0, 14.0, 19.0, 18.0, 10.0, 7.0, 6.0, 5.0, 5.0, 4.0, 8.0, 6.0, 4.0, 2.0, 2.0, 3.0, 5.0, 0.0, 1.0, 1.0, 2.0], "bins": [-56.064056396484375, -54.36747741699219, -52.670902252197266, -50.97432327270508, -49.27774429321289, -47.58116912841797, -45.88459014892578, -44.188011169433594, -42.491432189941406, -40.79485321044922, -39.0982780456543, -37.40169906616211, -35.70512008666992, -34.008544921875, -32.31196594238281, -30.615386962890625, -28.91880989074707, -27.222232818603516, -25.525653839111328, -23.829076766967773, -22.132497787475586, -20.43592071533203, -18.739341735839844, -17.04276466369629, -15.346186637878418, -13.649608612060547, -11.953030586242676, -10.256452560424805, -8.55987548828125, -6.863297462463379, -5.166719436645508, -3.4701414108276367, -1.7735633850097656, -0.07698547840118408, 1.6195924282073975, 3.3161702156066895, 5.0127482414245605, 6.709325790405273, 8.405903816223145, 10.102481842041016, 11.799059867858887, 13.495637893676758, 15.192215919494629, 16.8887939453125, 18.585371017456055, 20.28194808959961, 21.978527069091797, 23.675106048583984, 25.37168312072754, 27.068260192871094, 28.76483917236328, 30.461416244506836, 32.15799331665039, 33.85457229614258, 35.551151275634766, 37.24772644042969, 38.944305419921875, 40.64088439941406, 42.337459564208984, 44.03403854370117, 45.73061752319336, 47.42719268798828, 49.12377166748047, 50.820350646972656, 52.516929626464844]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 4.0, 11.0, 10.0, 19.0, 32.0, 69.0, 141.0, 273.0, 587.0, 1229.0, 2921.0, 8644.0, 40727.0, 1043783.0, 2995361.0, 81271.0, 12385.0, 4010.0, 1460.0, 646.0, 338.0, 169.0, 83.0, 44.0, 22.0, 17.0, 14.0, 7.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.59375, -8.3848876953125, -8.176025390625, -7.9671630859375, -7.75830078125, -7.5494384765625, -7.340576171875, -7.1317138671875, -6.9228515625, -6.7139892578125, -6.505126953125, -6.2962646484375, -6.08740234375, -5.8785400390625, -5.669677734375, -5.4608154296875, -5.251953125, -5.0430908203125, -4.834228515625, -4.6253662109375, -4.41650390625, -4.2076416015625, -3.998779296875, -3.7899169921875, -3.5810546875, -3.3721923828125, -3.163330078125, -2.9544677734375, -2.74560546875, -2.5367431640625, -2.327880859375, -2.1190185546875, -1.91015625, -1.7012939453125, -1.492431640625, -1.2835693359375, -1.07470703125, -0.8658447265625, -0.656982421875, -0.4481201171875, -0.2392578125, -0.0303955078125, 0.178466796875, 0.3873291015625, 0.59619140625, 0.8050537109375, 1.013916015625, 1.2227783203125, 1.431640625, 1.6405029296875, 1.849365234375, 2.0582275390625, 2.26708984375, 2.4759521484375, 2.684814453125, 2.8936767578125, 3.1025390625, 3.3114013671875, 3.520263671875, 3.7291259765625, 3.93798828125, 4.1468505859375, 4.355712890625, 4.5645751953125, 4.7734375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 3.0, 5.0, 3.0, 6.0, 6.0, 9.0, 12.0, 11.0, 11.0, 22.0, 28.0, 28.0, 18.0, 49.0, 53.0, 57.0, 44.0, 64.0, 59.0, 57.0, 57.0, 67.0, 40.0, 66.0, 29.0, 32.0, 44.0, 20.0, 26.0, 25.0, 14.0, 11.0, 4.0, 4.0, 5.0, 6.0, 6.0, 1.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.009765625, -2.899139404296875, -2.78851318359375, -2.677886962890625, -2.5672607421875, -2.456634521484375, -2.34600830078125, -2.235382080078125, -2.124755859375, -2.014129638671875, -1.90350341796875, -1.792877197265625, -1.6822509765625, -1.571624755859375, -1.46099853515625, -1.350372314453125, -1.23974609375, -1.129119873046875, -1.01849365234375, -0.907867431640625, -0.7972412109375, -0.686614990234375, -0.57598876953125, -0.465362548828125, -0.354736328125, -0.244110107421875, -0.13348388671875, -0.022857666015625, 0.0877685546875, 0.198394775390625, 0.30902099609375, 0.419647216796875, 0.5302734375, 0.640899658203125, 0.75152587890625, 0.862152099609375, 0.9727783203125, 1.083404541015625, 1.19403076171875, 1.304656982421875, 1.415283203125, 1.525909423828125, 1.63653564453125, 1.747161865234375, 1.8577880859375, 1.968414306640625, 2.07904052734375, 2.189666748046875, 2.30029296875, 2.410919189453125, 2.52154541015625, 2.632171630859375, 2.7427978515625, 2.853424072265625, 2.96405029296875, 3.074676513671875, 3.185302734375, 3.295928955078125, 3.40655517578125, 3.517181396484375, 3.6278076171875, 3.738433837890625, 3.84906005859375, 3.959686279296875, 4.0703125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 3.0, 4.0, 6.0, 6.0, 6.0, 7.0, 14.0, 18.0, 43.0, 62.0, 121.0, 311.0, 834.0, 2931.0, 12059.0, 114034.0, 3912780.0, 132727.0, 13267.0, 3300.0, 1028.0, 385.0, 151.0, 59.0, 42.0, 18.0, 16.0, 10.0, 10.0, 4.0, 6.0, 7.0, 0.0, 4.0, 2.0, 4.0, 4.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.5234375, -10.1895751953125, -9.855712890625, -9.5218505859375, -9.18798828125, -8.8541259765625, -8.520263671875, -8.1864013671875, -7.8525390625, -7.5186767578125, -7.184814453125, -6.8509521484375, -6.51708984375, -6.1832275390625, -5.849365234375, -5.5155029296875, -5.181640625, -4.8477783203125, -4.513916015625, -4.1800537109375, -3.84619140625, -3.5123291015625, -3.178466796875, -2.8446044921875, -2.5107421875, -2.1768798828125, -1.843017578125, -1.5091552734375, -1.17529296875, -0.8414306640625, -0.507568359375, -0.1737060546875, 0.16015625, 0.4940185546875, 0.827880859375, 1.1617431640625, 1.49560546875, 1.8294677734375, 2.163330078125, 2.4971923828125, 2.8310546875, 3.1649169921875, 3.498779296875, 3.8326416015625, 4.16650390625, 4.5003662109375, 4.834228515625, 5.1680908203125, 5.501953125, 5.8358154296875, 6.169677734375, 6.5035400390625, 6.83740234375, 7.1712646484375, 7.505126953125, 7.8389892578125, 8.1728515625, 8.5067138671875, 8.840576171875, 9.1744384765625, 9.50830078125, 9.8421630859375, 10.176025390625, 10.5098876953125, 10.84375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 0.0, 5.0, 8.0, 8.0, 15.0, 27.0, 20.0, 64.0, 93.0, 188.0, 372.0, 935.0, 1139.0, 625.0, 242.0, 131.0, 57.0, 37.0, 22.0, 19.0, 12.0, 10.0, 10.0, 8.0, 6.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.98828125, -5.75042724609375, -5.5125732421875, -5.27471923828125, -5.036865234375, -4.79901123046875, -4.5611572265625, -4.32330322265625, -4.08544921875, -3.84759521484375, -3.6097412109375, -3.37188720703125, -3.134033203125, -2.89617919921875, -2.6583251953125, -2.42047119140625, -2.1826171875, -1.94476318359375, -1.7069091796875, -1.46905517578125, -1.231201171875, -0.99334716796875, -0.7554931640625, -0.51763916015625, -0.27978515625, -0.04193115234375, 0.1959228515625, 0.43377685546875, 0.671630859375, 0.90948486328125, 1.1473388671875, 1.38519287109375, 1.623046875, 1.86090087890625, 2.0987548828125, 2.33660888671875, 2.574462890625, 2.81231689453125, 3.0501708984375, 3.28802490234375, 3.52587890625, 3.76373291015625, 4.0015869140625, 4.23944091796875, 4.477294921875, 4.71514892578125, 4.9530029296875, 5.19085693359375, 5.4287109375, 5.66656494140625, 5.9044189453125, 6.14227294921875, 6.380126953125, 6.61798095703125, 6.8558349609375, 7.09368896484375, 7.33154296875, 7.56939697265625, 7.8072509765625, 8.04510498046875, 8.282958984375, 8.52081298828125, 8.7586669921875, 8.99652099609375, 9.234375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 7.0, 12.0, 20.0, 44.0, 114.0, 164.0, 223.0, 181.0, 112.0, 68.0, 18.0, 13.0, 9.0, 4.0, 2.0, 1.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.09721374511719, -70.97959899902344, -68.86198425292969, -66.7443618774414, -64.62674713134766, -62.509132385253906, -60.391517639160156, -58.27389907836914, -56.156280517578125, -54.038665771484375, -51.92104721069336, -49.80343246459961, -47.685813903808594, -45.568199157714844, -43.450584411621094, -41.33296585083008, -39.21535110473633, -37.09773635864258, -34.98011779785156, -32.86250305175781, -30.744884490966797, -28.627269744873047, -26.509653091430664, -24.39203643798828, -22.2744197845459, -20.156803131103516, -18.039186477661133, -15.921570777893066, -13.803954124450684, -11.6863374710083, -9.568721771240234, -7.451105117797852, -5.333484649658203, -3.2158682346343994, -1.0982518196105957, 1.019364356994629, 3.1369810104370117, 5.2545976638793945, 7.372213363647461, 9.489830017089844, 11.607446670532227, 13.72506332397461, 15.842679977416992, 17.960296630859375, 20.077911376953125, 22.19552993774414, 24.31314468383789, 26.430761337280273, 28.548377990722656, 30.66599464416504, 32.78361129760742, 34.90122604370117, 37.01884460449219, 39.13645935058594, 41.25407409667969, 43.3716926574707, 45.48931121826172, 47.60692596435547, 49.724544525146484, 51.842159271240234, 53.95977783203125, 56.077392578125, 58.19500732421875, 60.312625885009766, 62.430240631103516]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 7.0, 7.0, 9.0, 5.0, 15.0, 17.0, 17.0, 13.0, 17.0, 16.0, 27.0, 41.0, 35.0, 30.0, 43.0, 43.0, 48.0, 44.0, 36.0, 32.0, 49.0, 44.0, 38.0, 39.0, 42.0, 47.0, 33.0, 31.0, 39.0, 21.0, 27.0, 19.0, 12.0, 10.0, 13.0, 5.0, 4.0, 5.0, 4.0, 3.0, 4.0, 0.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-29.870325088500977, -29.03856658935547, -28.206806182861328, -27.375045776367188, -26.54328727722168, -25.711528778076172, -24.87976837158203, -24.04800796508789, -23.216249465942383, -22.384490966796875, -21.552730560302734, -20.720970153808594, -19.889211654663086, -19.057453155517578, -18.225692749023438, -17.393932342529297, -16.56217384338379, -15.730414390563965, -14.89865493774414, -14.066895484924316, -13.235136032104492, -12.403376579284668, -11.571617126464844, -10.73985767364502, -9.908098220825195, -9.076338768005371, -8.244579315185547, -7.412819862365723, -6.581060409545898, -5.749300956726074, -4.91754150390625, -4.085782051086426, -3.2540225982666016, -2.4222631454467773, -1.5905036926269531, -0.7587442398071289, 0.07301521301269531, 0.9047746658325195, 1.7365341186523438, 2.568293571472168, 3.400053024291992, 4.231812477111816, 5.063571929931641, 5.895331382751465, 6.727090835571289, 7.558850288391113, 8.390609741210938, 9.222369194030762, 10.054128646850586, 10.88588809967041, 11.717647552490234, 12.549407005310059, 13.381166458129883, 14.212925910949707, 15.044685363769531, 15.876444816589355, 16.70820426940918, 17.539962768554688, 18.371723175048828, 19.20348358154297, 20.035242080688477, 20.867000579833984, 21.698760986328125, 22.530521392822266, 23.362279891967773]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 1.0, 3.0, 4.0, 1.0, 9.0, 14.0, 13.0, 20.0, 17.0, 63.0, 54.0, 102.0, 106.0, 182.0, 332.0, 482.0, 820.0, 1345.0, 2442.0, 4574.0, 8901.0, 17916.0, 39022.0, 87098.0, 195251.0, 317756.0, 202176.0, 90606.0, 40510.0, 18806.0, 9192.0, 4620.0, 2467.0, 1377.0, 857.0, 472.0, 307.0, 203.0, 126.0, 96.0, 62.0, 39.0, 21.0, 27.0, 21.0, 14.0, 4.0, 11.0, 8.0, 4.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0], "bins": [-3.400390625, -3.29583740234375, -3.1912841796875, -3.08673095703125, -2.982177734375, -2.87762451171875, -2.7730712890625, -2.66851806640625, -2.56396484375, -2.45941162109375, -2.3548583984375, -2.25030517578125, -2.145751953125, -2.04119873046875, -1.9366455078125, -1.83209228515625, -1.7275390625, -1.62298583984375, -1.5184326171875, -1.41387939453125, -1.309326171875, -1.20477294921875, -1.1002197265625, -0.99566650390625, -0.89111328125, -0.78656005859375, -0.6820068359375, -0.57745361328125, -0.472900390625, -0.36834716796875, -0.2637939453125, -0.15924072265625, -0.0546875, 0.04986572265625, 0.1544189453125, 0.25897216796875, 0.363525390625, 0.46807861328125, 0.5726318359375, 0.67718505859375, 0.78173828125, 0.88629150390625, 0.9908447265625, 1.09539794921875, 1.199951171875, 1.30450439453125, 1.4090576171875, 1.51361083984375, 1.6181640625, 1.72271728515625, 1.8272705078125, 1.93182373046875, 2.036376953125, 2.14093017578125, 2.2454833984375, 2.35003662109375, 2.45458984375, 2.55914306640625, 2.6636962890625, 2.76824951171875, 2.872802734375, 2.97735595703125, 3.0819091796875, 3.18646240234375, 3.291015625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 6.0, 5.0, 4.0, 7.0, 6.0, 8.0, 17.0, 12.0, 13.0, 12.0, 22.0, 36.0, 31.0, 39.0, 30.0, 43.0, 58.0, 51.0, 43.0, 54.0, 61.0, 48.0, 54.0, 52.0, 31.0, 40.0, 36.0, 34.0, 26.0, 31.0, 15.0, 10.0, 16.0, 14.0, 15.0, 4.0, 6.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.251953125, -3.1585693359375, -3.065185546875, -2.9718017578125, -2.87841796875, -2.7850341796875, -2.691650390625, -2.5982666015625, -2.5048828125, -2.4114990234375, -2.318115234375, -2.2247314453125, -2.13134765625, -2.0379638671875, -1.944580078125, -1.8511962890625, -1.7578125, -1.6644287109375, -1.571044921875, -1.4776611328125, -1.38427734375, -1.2908935546875, -1.197509765625, -1.1041259765625, -1.0107421875, -0.9173583984375, -0.823974609375, -0.7305908203125, -0.63720703125, -0.5438232421875, -0.450439453125, -0.3570556640625, -0.263671875, -0.1702880859375, -0.076904296875, 0.0164794921875, 0.10986328125, 0.2032470703125, 0.296630859375, 0.3900146484375, 0.4833984375, 0.5767822265625, 0.670166015625, 0.7635498046875, 0.85693359375, 0.9503173828125, 1.043701171875, 1.1370849609375, 1.23046875, 1.3238525390625, 1.417236328125, 1.5106201171875, 1.60400390625, 1.6973876953125, 1.790771484375, 1.8841552734375, 1.9775390625, 2.0709228515625, 2.164306640625, 2.2576904296875, 2.35107421875, 2.4444580078125, 2.537841796875, 2.6312255859375, 2.724609375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 2.0, 3.0, 6.0, 7.0, 10.0, 16.0, 18.0, 47.0, 53.0, 129.0, 173.0, 312.0, 785.0, 2416.0, 14965.0, 670621.0, 345060.0, 10637.0, 1907.0, 725.0, 294.0, 141.0, 94.0, 47.0, 40.0, 16.0, 9.0, 9.0, 8.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.6484375, -15.1256103515625, -14.602783203125, -14.0799560546875, -13.55712890625, -13.0343017578125, -12.511474609375, -11.9886474609375, -11.4658203125, -10.9429931640625, -10.420166015625, -9.8973388671875, -9.37451171875, -8.8516845703125, -8.328857421875, -7.8060302734375, -7.283203125, -6.7603759765625, -6.237548828125, -5.7147216796875, -5.19189453125, -4.6690673828125, -4.146240234375, -3.6234130859375, -3.1005859375, -2.5777587890625, -2.054931640625, -1.5321044921875, -1.00927734375, -0.4864501953125, 0.036376953125, 0.5592041015625, 1.08203125, 1.6048583984375, 2.127685546875, 2.6505126953125, 3.17333984375, 3.6961669921875, 4.218994140625, 4.7418212890625, 5.2646484375, 5.7874755859375, 6.310302734375, 6.8331298828125, 7.35595703125, 7.8787841796875, 8.401611328125, 8.9244384765625, 9.447265625, 9.9700927734375, 10.492919921875, 11.0157470703125, 11.53857421875, 12.0614013671875, 12.584228515625, 13.1070556640625, 13.6298828125, 14.1527099609375, 14.675537109375, 15.1983642578125, 15.72119140625, 16.2440185546875, 16.766845703125, 17.2896728515625, 17.8125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 4.0, 1.0, 5.0, 6.0, 16.0, 9.0, 18.0, 14.0, 19.0, 27.0, 32.0, 32.0, 47.0, 54.0, 44.0, 74.0, 67.0, 67.0, 66.0, 56.0, 73.0, 46.0, 45.0, 27.0, 28.0, 21.0, 22.0, 21.0, 13.0, 11.0, 6.0, 9.0, 4.0, 4.0, 7.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.671875, -17.1937255859375, -16.715576171875, -16.2374267578125, -15.75927734375, -15.2811279296875, -14.802978515625, -14.3248291015625, -13.8466796875, -13.3685302734375, -12.890380859375, -12.4122314453125, -11.93408203125, -11.4559326171875, -10.977783203125, -10.4996337890625, -10.021484375, -9.5433349609375, -9.065185546875, -8.5870361328125, -8.10888671875, -7.6307373046875, -7.152587890625, -6.6744384765625, -6.1962890625, -5.7181396484375, -5.239990234375, -4.7618408203125, -4.28369140625, -3.8055419921875, -3.327392578125, -2.8492431640625, -2.37109375, -1.8929443359375, -1.414794921875, -0.9366455078125, -0.45849609375, 0.0196533203125, 0.497802734375, 0.9759521484375, 1.4541015625, 1.9322509765625, 2.410400390625, 2.8885498046875, 3.36669921875, 3.8448486328125, 4.322998046875, 4.8011474609375, 5.279296875, 5.7574462890625, 6.235595703125, 6.7137451171875, 7.19189453125, 7.6700439453125, 8.148193359375, 8.6263427734375, 9.1044921875, 9.5826416015625, 10.060791015625, 10.5389404296875, 11.01708984375, 11.4952392578125, 11.973388671875, 12.4515380859375, 12.9296875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 4.0, 0.0, 4.0, 6.0, 10.0, 11.0, 20.0, 20.0, 52.0, 116.0, 422.0, 10522.0, 1034660.0, 2275.0, 241.0, 80.0, 50.0, 19.0, 15.0, 8.0, 3.0, 5.0, 6.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-33.40625, -32.534912109375, -31.66357421875, -30.792236328125, -29.9208984375, -29.049560546875, -28.17822265625, -27.306884765625, -26.435546875, -25.564208984375, -24.69287109375, -23.821533203125, -22.9501953125, -22.078857421875, -21.20751953125, -20.336181640625, -19.46484375, -18.593505859375, -17.72216796875, -16.850830078125, -15.9794921875, -15.108154296875, -14.23681640625, -13.365478515625, -12.494140625, -11.622802734375, -10.75146484375, -9.880126953125, -9.0087890625, -8.137451171875, -7.26611328125, -6.394775390625, -5.5234375, -4.652099609375, -3.78076171875, -2.909423828125, -2.0380859375, -1.166748046875, -0.29541015625, 0.575927734375, 1.447265625, 2.318603515625, 3.18994140625, 4.061279296875, 4.9326171875, 5.803955078125, 6.67529296875, 7.546630859375, 8.41796875, 9.289306640625, 10.16064453125, 11.031982421875, 11.9033203125, 12.774658203125, 13.64599609375, 14.517333984375, 15.388671875, 16.260009765625, 17.13134765625, 18.002685546875, 18.8740234375, 19.745361328125, 20.61669921875, 21.488037109375, 22.359375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 9.0, 5.0, 5.0, 16.0, 17.0, 17.0, 19.0, 31.0, 57.0, 98.0, 198.0, 225.0, 98.0, 65.0, 31.0, 35.0, 24.0, 15.0, 6.0, 11.0, 7.0, 3.0, 2.0, 8.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0009441375732421875, -0.0009063631296157837, -0.0008685886859893799, -0.0008308142423629761, -0.0007930397987365723, -0.0007552653551101685, -0.0007174909114837646, -0.0006797164678573608, -0.000641942024230957, -0.0006041675806045532, -0.0005663931369781494, -0.0005286186933517456, -0.0004908442497253418, -0.000453069806098938, -0.0004152953624725342, -0.00037752091884613037, -0.00033974647521972656, -0.00030197203159332275, -0.00026419758796691895, -0.00022642314434051514, -0.00018864870071411133, -0.00015087425708770752, -0.00011309981346130371, -7.53253698348999e-05, -3.7550926208496094e-05, 2.2351741790771484e-07, 3.7997961044311523e-05, 7.577240467071533e-05, 0.00011354684829711914, 0.00015132129192352295, 0.00018909573554992676, 0.00022687017917633057, 0.0002646446228027344, 0.0003024190664291382, 0.000340193510055542, 0.0003779679536819458, 0.0004157423973083496, 0.0004535168409347534, 0.0004912912845611572, 0.000529065728187561, 0.0005668401718139648, 0.0006046146154403687, 0.0006423890590667725, 0.0006801635026931763, 0.0007179379463195801, 0.0007557123899459839, 0.0007934868335723877, 0.0008312612771987915, 0.0008690357208251953, 0.0009068101644515991, 0.0009445846080780029, 0.0009823590517044067, 0.0010201334953308105, 0.0010579079389572144, 0.0010956823825836182, 0.001133456826210022, 0.0011712312698364258, 0.0012090057134628296, 0.0012467801570892334, 0.0012845546007156372, 0.001322329044342041, 0.0013601034879684448, 0.0013978779315948486, 0.0014356523752212524, 0.0014734268188476562]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 1.0, 2.0, 3.0, 3.0, 2.0, 6.0, 6.0, 7.0, 9.0, 14.0, 16.0, 24.0, 35.0, 43.0, 80.0, 171.0, 318.0, 773.0, 1927.0, 6716.0, 434678.0, 593383.0, 6833.0, 1945.0, 737.0, 374.0, 168.0, 88.0, 56.0, 40.0, 21.0, 12.0, 21.0, 9.0, 9.0, 7.0, 6.0, 4.0, 7.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.0, -23.314453125, -22.62890625, -21.943359375, -21.2578125, -20.572265625, -19.88671875, -19.201171875, -18.515625, -17.830078125, -17.14453125, -16.458984375, -15.7734375, -15.087890625, -14.40234375, -13.716796875, -13.03125, -12.345703125, -11.66015625, -10.974609375, -10.2890625, -9.603515625, -8.91796875, -8.232421875, -7.546875, -6.861328125, -6.17578125, -5.490234375, -4.8046875, -4.119140625, -3.43359375, -2.748046875, -2.0625, -1.376953125, -0.69140625, -0.005859375, 0.6796875, 1.365234375, 2.05078125, 2.736328125, 3.421875, 4.107421875, 4.79296875, 5.478515625, 6.1640625, 6.849609375, 7.53515625, 8.220703125, 8.90625, 9.591796875, 10.27734375, 10.962890625, 11.6484375, 12.333984375, 13.01953125, 13.705078125, 14.390625, 15.076171875, 15.76171875, 16.447265625, 17.1328125, 17.818359375, 18.50390625, 19.189453125, 19.875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 8.0, 4.0, 7.0, 10.0, 19.0, 34.0, 61.0, 154.0, 323.0, 216.0, 82.0, 26.0, 12.0, 12.0, 6.0, 6.0, 2.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.171875, -10.78173828125, -10.3916015625, -10.00146484375, -9.611328125, -9.22119140625, -8.8310546875, -8.44091796875, -8.05078125, -7.66064453125, -7.2705078125, -6.88037109375, -6.490234375, -6.10009765625, -5.7099609375, -5.31982421875, -4.9296875, -4.53955078125, -4.1494140625, -3.75927734375, -3.369140625, -2.97900390625, -2.5888671875, -2.19873046875, -1.80859375, -1.41845703125, -1.0283203125, -0.63818359375, -0.248046875, 0.14208984375, 0.5322265625, 0.92236328125, 1.3125, 1.70263671875, 2.0927734375, 2.48291015625, 2.873046875, 3.26318359375, 3.6533203125, 4.04345703125, 4.43359375, 4.82373046875, 5.2138671875, 5.60400390625, 5.994140625, 6.38427734375, 6.7744140625, 7.16455078125, 7.5546875, 7.94482421875, 8.3349609375, 8.72509765625, 9.115234375, 9.50537109375, 9.8955078125, 10.28564453125, 10.67578125, 11.06591796875, 11.4560546875, 11.84619140625, 12.236328125, 12.62646484375, 13.0166015625, 13.40673828125, 13.796875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 12.0, 25.0, 93.0, 341.0, 371.0, 112.0, 35.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-250.1065673828125, -244.0308380126953, -237.95510864257812, -231.87937927246094, -225.80364990234375, -219.72792053222656, -213.65219116210938, -207.5764617919922, -201.500732421875, -195.4250030517578, -189.34927368164062, -183.27354431152344, -177.19781494140625, -171.12208557128906, -165.04635620117188, -158.9706268310547, -152.8948974609375, -146.8191680908203, -140.74343872070312, -134.66770935058594, -128.59197998046875, -122.51625061035156, -116.44052124023438, -110.36479187011719, -104.2890625, -98.21333312988281, -92.13760375976562, -86.06187438964844, -79.98614501953125, -73.91041564941406, -67.83468627929688, -61.75895690917969, -55.6832275390625, -49.60749816894531, -43.531768798828125, -37.45603942871094, -31.38031005859375, -25.304580688476562, -19.228851318359375, -13.153121948242188, -7.077392578125, -1.0016632080078125, 5.074066162109375, 11.149795532226562, 17.22552490234375, 23.301254272460938, 29.376983642578125, 35.45271301269531, 41.5284423828125, 47.60417175292969, 53.679901123046875, 59.75563049316406, 65.83135986328125, 71.90708923339844, 77.98281860351562, 84.05854797363281, 90.13427734375, 96.21000671386719, 102.28573608398438, 108.36146545410156, 114.43719482421875, 120.51292419433594, 126.58865356445312, 132.6643829345703, 138.7401123046875]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 7.0, 7.0, 12.0, 10.0, 12.0, 17.0, 25.0, 30.0, 30.0, 31.0, 56.0, 51.0, 65.0, 77.0, 79.0, 60.0, 73.0, 68.0, 66.0, 39.0, 38.0, 35.0, 33.0, 14.0, 15.0, 19.0, 13.0, 6.0, 7.0, 5.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-86.08047485351562, -83.86880493164062, -81.65713500976562, -79.4454574584961, -77.2337875366211, -75.0221176147461, -72.8104476928711, -70.5987777709961, -68.38710021972656, -66.17543029785156, -63.9637565612793, -61.7520866394043, -59.54041290283203, -57.32874298095703, -55.11707305908203, -52.90540313720703, -50.69373321533203, -48.48206329345703, -46.270389556884766, -44.058719635009766, -41.8470458984375, -39.6353759765625, -37.4237060546875, -35.2120361328125, -33.000362396240234, -30.7886905670166, -28.57701873779297, -26.36534881591797, -24.153676986694336, -21.942005157470703, -19.730335235595703, -17.51866340637207, -15.306999206542969, -13.095327377319336, -10.88365650177002, -8.671985626220703, -6.46031379699707, -4.2486419677734375, -2.036971092224121, 0.1746997833251953, 2.386371612548828, 4.598042964935303, 6.809714317321777, 9.021385192871094, 11.233057022094727, 13.44472885131836, 15.656399726867676, 17.868070602416992, 20.079742431640625, 22.291414260864258, 24.50308609008789, 26.71475601196289, 28.926427841186523, 31.138099670410156, 33.349769592285156, 35.561439514160156, 37.77311325073242, 39.98478317260742, 42.19645690917969, 44.40812683105469, 46.61979675292969, 48.83147048950195, 51.04314041137695, 53.25481414794922, 55.46648406982422]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 3.0, 6.0, 7.0, 16.0, 21.0, 29.0, 37.0, 78.0, 127.0, 236.0, 814.0, 199158.0, 3991465.0, 1627.0, 301.0, 147.0, 77.0, 58.0, 22.0, 17.0, 12.0, 8.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.6875, -42.510009765625, -41.33251953125, -40.155029296875, -38.9775390625, -37.800048828125, -36.62255859375, -35.445068359375, -34.267578125, -33.090087890625, -31.91259765625, -30.735107421875, -29.5576171875, -28.380126953125, -27.20263671875, -26.025146484375, -24.84765625, -23.670166015625, -22.49267578125, -21.315185546875, -20.1376953125, -18.960205078125, -17.78271484375, -16.605224609375, -15.427734375, -14.250244140625, -13.07275390625, -11.895263671875, -10.7177734375, -9.540283203125, -8.36279296875, -7.185302734375, -6.0078125, -4.830322265625, -3.65283203125, -2.475341796875, -1.2978515625, -0.120361328125, 1.05712890625, 2.234619140625, 3.412109375, 4.589599609375, 5.76708984375, 6.944580078125, 8.1220703125, 9.299560546875, 10.47705078125, 11.654541015625, 12.83203125, 14.009521484375, 15.18701171875, 16.364501953125, 17.5419921875, 18.719482421875, 19.89697265625, 21.074462890625, 22.251953125, 23.429443359375, 24.60693359375, 25.784423828125, 26.9619140625, 28.139404296875, 29.31689453125, 30.494384765625, 31.671875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 5.0, 2.0, 8.0, 10.0, 13.0, 23.0, 33.0, 37.0, 44.0, 57.0, 68.0, 74.0, 57.0, 95.0, 76.0, 87.0, 58.0, 76.0, 47.0, 34.0, 28.0, 26.0, 18.0, 10.0, 7.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.1328125, -5.981292724609375, -5.82977294921875, -5.678253173828125, -5.5267333984375, -5.375213623046875, -5.22369384765625, -5.072174072265625, -4.920654296875, -4.769134521484375, -4.61761474609375, -4.466094970703125, -4.3145751953125, -4.163055419921875, -4.01153564453125, -3.860015869140625, -3.70849609375, -3.556976318359375, -3.40545654296875, -3.253936767578125, -3.1024169921875, -2.950897216796875, -2.79937744140625, -2.647857666015625, -2.496337890625, -2.344818115234375, -2.19329833984375, -2.041778564453125, -1.8902587890625, -1.738739013671875, -1.58721923828125, -1.435699462890625, -1.2841796875, -1.132659912109375, -0.98114013671875, -0.829620361328125, -0.6781005859375, -0.526580810546875, -0.37506103515625, -0.223541259765625, -0.072021484375, 0.079498291015625, 0.23101806640625, 0.382537841796875, 0.5340576171875, 0.685577392578125, 0.83709716796875, 0.988616943359375, 1.14013671875, 1.291656494140625, 1.44317626953125, 1.594696044921875, 1.7462158203125, 1.897735595703125, 2.04925537109375, 2.200775146484375, 2.352294921875, 2.503814697265625, 2.65533447265625, 2.806854248046875, 2.9583740234375, 3.109893798828125, 3.26141357421875, 3.412933349609375, 3.564453125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 1.0, 7.0, 4.0, 2.0, 6.0, 12.0, 9.0, 19.0, 20.0, 31.0, 26.0, 52.0, 61.0, 54.0, 95.0, 140.0, 245.0, 541.0, 1308.0, 3794.0, 12864.0, 67372.0, 2681492.0, 1363881.0, 47074.0, 10107.0, 2970.0, 997.0, 426.0, 234.0, 132.0, 81.0, 57.0, 39.0, 33.0, 32.0, 21.0, 17.0, 12.0, 6.0, 3.0, 6.0, 5.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.54296875, -6.29986572265625, -6.0567626953125, -5.81365966796875, -5.570556640625, -5.32745361328125, -5.0843505859375, -4.84124755859375, -4.59814453125, -4.35504150390625, -4.1119384765625, -3.86883544921875, -3.625732421875, -3.38262939453125, -3.1395263671875, -2.89642333984375, -2.6533203125, -2.41021728515625, -2.1671142578125, -1.92401123046875, -1.680908203125, -1.43780517578125, -1.1947021484375, -0.95159912109375, -0.70849609375, -0.46539306640625, -0.2222900390625, 0.02081298828125, 0.263916015625, 0.50701904296875, 0.7501220703125, 0.99322509765625, 1.236328125, 1.47943115234375, 1.7225341796875, 1.96563720703125, 2.208740234375, 2.45184326171875, 2.6949462890625, 2.93804931640625, 3.18115234375, 3.42425537109375, 3.6673583984375, 3.91046142578125, 4.153564453125, 4.39666748046875, 4.6397705078125, 4.88287353515625, 5.1259765625, 5.36907958984375, 5.6121826171875, 5.85528564453125, 6.098388671875, 6.34149169921875, 6.5845947265625, 6.82769775390625, 7.07080078125, 7.31390380859375, 7.5570068359375, 7.80010986328125, 8.043212890625, 8.28631591796875, 8.5294189453125, 8.77252197265625, 9.015625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 5.0, 1.0, 1.0, 0.0, 5.0, 2.0, 6.0, 6.0, 3.0, 6.0, 11.0, 6.0, 15.0, 7.0, 23.0, 38.0, 65.0, 114.0, 210.0, 374.0, 690.0, 887.0, 689.0, 412.0, 190.0, 132.0, 62.0, 36.0, 17.0, 14.0, 12.0, 10.0, 10.0, 8.0, 6.0, 1.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0], "bins": [-7.3125, -7.13629150390625, -6.9600830078125, -6.78387451171875, -6.607666015625, -6.43145751953125, -6.2552490234375, -6.07904052734375, -5.90283203125, -5.72662353515625, -5.5504150390625, -5.37420654296875, -5.197998046875, -5.02178955078125, -4.8455810546875, -4.66937255859375, -4.4931640625, -4.31695556640625, -4.1407470703125, -3.96453857421875, -3.788330078125, -3.61212158203125, -3.4359130859375, -3.25970458984375, -3.08349609375, -2.90728759765625, -2.7310791015625, -2.55487060546875, -2.378662109375, -2.20245361328125, -2.0262451171875, -1.85003662109375, -1.673828125, -1.49761962890625, -1.3214111328125, -1.14520263671875, -0.968994140625, -0.79278564453125, -0.6165771484375, -0.44036865234375, -0.26416015625, -0.08795166015625, 0.0882568359375, 0.26446533203125, 0.440673828125, 0.61688232421875, 0.7930908203125, 0.96929931640625, 1.1455078125, 1.32171630859375, 1.4979248046875, 1.67413330078125, 1.850341796875, 2.02655029296875, 2.2027587890625, 2.37896728515625, 2.55517578125, 2.73138427734375, 2.9075927734375, 3.08380126953125, 3.260009765625, 3.43621826171875, 3.6124267578125, 3.78863525390625, 3.96484375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 11.0, 24.0, 42.0, 122.0, 236.0, 272.0, 184.0, 69.0, 23.0, 12.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-140.1982421875, -137.35736083984375, -134.51649475097656, -131.6756134033203, -128.83474731445312, -125.9938735961914, -123.15299987792969, -120.31211853027344, -117.47125244140625, -114.63037872314453, -111.78950500488281, -108.9486312866211, -106.10775756835938, -103.26688385009766, -100.42601013183594, -97.58512878417969, -94.74425506591797, -91.90338134765625, -89.06250762939453, -86.22163391113281, -83.3807601928711, -80.53988647460938, -77.69900512695312, -74.85813903808594, -72.01725769042969, -69.17638397216797, -66.33551025390625, -63.49463653564453, -60.65376281738281, -57.812889099121094, -54.97201156616211, -52.13113784790039, -49.290260314941406, -46.44938659667969, -43.60851287841797, -40.76763916015625, -37.92676544189453, -35.08589172363281, -32.24501419067383, -29.40414047241211, -26.56326675415039, -23.722393035888672, -20.881519317626953, -18.0406436920166, -15.199769973754883, -12.358896255493164, -9.518020629882812, -6.677146911621094, -3.836273193359375, -0.995398998260498, 1.845475196838379, 4.686349868774414, 7.527223587036133, 10.368097305297852, 13.208972930908203, 16.049846649169922, 18.89072036743164, 21.73159408569336, 24.572467803955078, 27.41334342956543, 30.25421714782715, 33.0950927734375, 35.93596649169922, 38.77684020996094, 41.617713928222656]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 6.0, 1.0, 2.0, 1.0, 7.0, 6.0, 8.0, 11.0, 13.0, 17.0, 22.0, 25.0, 28.0, 48.0, 22.0, 43.0, 41.0, 44.0, 59.0, 52.0, 50.0, 53.0, 66.0, 60.0, 38.0, 37.0, 39.0, 36.0, 27.0, 27.0, 20.0, 19.0, 16.0, 17.0, 5.0, 7.0, 8.0, 7.0, 2.0, 3.0, 3.0, 2.0, 6.0, 3.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-27.459341049194336, -26.670984268188477, -25.88262939453125, -25.09427261352539, -24.30591583251953, -23.517560958862305, -22.729204177856445, -21.94084930419922, -21.15249252319336, -20.3641357421875, -19.575780868530273, -18.787424087524414, -17.999069213867188, -17.210712432861328, -16.42235565185547, -15.633999824523926, -14.845643997192383, -14.05728816986084, -13.268932342529297, -12.480575561523438, -11.692219734191895, -10.903863906860352, -10.115507125854492, -9.32715129852295, -8.538795471191406, -7.750439643859863, -6.962083339691162, -6.173727035522461, -5.385371208190918, -4.597015380859375, -3.808659076690674, -3.0203027725219727, -2.2319488525390625, -1.4435927867889404, -0.6552367210388184, 0.1331193447113037, 0.9214754104614258, 1.7098314762115479, 2.49818754196167, 3.286543846130371, 4.074899673461914, 4.863255500793457, 5.651611804962158, 6.439968109130859, 7.228323936462402, 8.016679763793945, 8.805036544799805, 9.593392372131348, 10.38174819946289, 11.170104026794434, 11.958459854125977, 12.746816635131836, 13.535172462463379, 14.323528289794922, 15.111885070800781, 15.900240898132324, 16.688596725463867, 17.476953506469727, 18.265308380126953, 19.053665161132812, 19.842021942138672, 20.6303768157959, 21.418733596801758, 22.207088470458984, 22.995445251464844]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 8.0, 8.0, 10.0, 23.0, 29.0, 63.0, 135.0, 256.0, 823.0, 4263.0, 47029.0, 770152.0, 210846.0, 12387.0, 1756.0, 410.0, 172.0, 69.0, 38.0, 25.0, 17.0, 13.0, 5.0, 5.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.8125, -15.3701171875, -14.927734375, -14.4853515625, -14.04296875, -13.6005859375, -13.158203125, -12.7158203125, -12.2734375, -11.8310546875, -11.388671875, -10.9462890625, -10.50390625, -10.0615234375, -9.619140625, -9.1767578125, -8.734375, -8.2919921875, -7.849609375, -7.4072265625, -6.96484375, -6.5224609375, -6.080078125, -5.6376953125, -5.1953125, -4.7529296875, -4.310546875, -3.8681640625, -3.42578125, -2.9833984375, -2.541015625, -2.0986328125, -1.65625, -1.2138671875, -0.771484375, -0.3291015625, 0.11328125, 0.5556640625, 0.998046875, 1.4404296875, 1.8828125, 2.3251953125, 2.767578125, 3.2099609375, 3.65234375, 4.0947265625, 4.537109375, 4.9794921875, 5.421875, 5.8642578125, 6.306640625, 6.7490234375, 7.19140625, 7.6337890625, 8.076171875, 8.5185546875, 8.9609375, 9.4033203125, 9.845703125, 10.2880859375, 10.73046875, 11.1728515625, 11.615234375, 12.0576171875, 12.5]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 2.0, 2.0, 5.0, 1.0, 6.0, 3.0, 9.0, 11.0, 11.0, 18.0, 19.0, 24.0, 38.0, 29.0, 38.0, 61.0, 54.0, 71.0, 69.0, 47.0, 68.0, 58.0, 70.0, 49.0, 58.0, 40.0, 33.0, 30.0, 20.0, 13.0, 13.0, 7.0, 12.0, 4.0, 5.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.22265625, -4.10321044921875, -3.9837646484375, -3.86431884765625, -3.744873046875, -3.62542724609375, -3.5059814453125, -3.38653564453125, -3.26708984375, -3.14764404296875, -3.0281982421875, -2.90875244140625, -2.789306640625, -2.66986083984375, -2.5504150390625, -2.43096923828125, -2.3115234375, -2.19207763671875, -2.0726318359375, -1.95318603515625, -1.833740234375, -1.71429443359375, -1.5948486328125, -1.47540283203125, -1.35595703125, -1.23651123046875, -1.1170654296875, -0.99761962890625, -0.878173828125, -0.75872802734375, -0.6392822265625, -0.51983642578125, -0.400390625, -0.28094482421875, -0.1614990234375, -0.04205322265625, 0.077392578125, 0.19683837890625, 0.3162841796875, 0.43572998046875, 0.55517578125, 0.67462158203125, 0.7940673828125, 0.91351318359375, 1.032958984375, 1.15240478515625, 1.2718505859375, 1.39129638671875, 1.5107421875, 1.63018798828125, 1.7496337890625, 1.86907958984375, 1.988525390625, 2.10797119140625, 2.2274169921875, 2.34686279296875, 2.46630859375, 2.58575439453125, 2.7052001953125, 2.82464599609375, 2.944091796875, 3.06353759765625, 3.1829833984375, 3.30242919921875, 3.421875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 6.0, 5.0, 12.0, 5.0, 15.0, 9.0, 10.0, 24.0, 20.0, 29.0, 56.0, 68.0, 82.0, 133.0, 226.0, 349.0, 663.0, 1497.0, 3643.0, 10918.0, 44998.0, 287100.0, 591734.0, 80256.0, 17373.0, 5201.0, 1964.0, 919.0, 410.0, 266.0, 160.0, 94.0, 72.0, 53.0, 49.0, 30.0, 25.0, 14.0, 18.0, 10.0, 11.0, 5.0, 7.0, 7.0, 4.0, 2.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.6171875, -8.349365234375, -8.08154296875, -7.813720703125, -7.5458984375, -7.278076171875, -7.01025390625, -6.742431640625, -6.474609375, -6.206787109375, -5.93896484375, -5.671142578125, -5.4033203125, -5.135498046875, -4.86767578125, -4.599853515625, -4.33203125, -4.064208984375, -3.79638671875, -3.528564453125, -3.2607421875, -2.992919921875, -2.72509765625, -2.457275390625, -2.189453125, -1.921630859375, -1.65380859375, -1.385986328125, -1.1181640625, -0.850341796875, -0.58251953125, -0.314697265625, -0.046875, 0.220947265625, 0.48876953125, 0.756591796875, 1.0244140625, 1.292236328125, 1.56005859375, 1.827880859375, 2.095703125, 2.363525390625, 2.63134765625, 2.899169921875, 3.1669921875, 3.434814453125, 3.70263671875, 3.970458984375, 4.23828125, 4.506103515625, 4.77392578125, 5.041748046875, 5.3095703125, 5.577392578125, 5.84521484375, 6.113037109375, 6.380859375, 6.648681640625, 6.91650390625, 7.184326171875, 7.4521484375, 7.719970703125, 7.98779296875, 8.255615234375, 8.5234375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 7.0, 5.0, 9.0, 9.0, 9.0, 10.0, 12.0, 13.0, 34.0, 24.0, 23.0, 28.0, 39.0, 32.0, 43.0, 51.0, 49.0, 67.0, 70.0, 43.0, 56.0, 56.0, 42.0, 54.0, 33.0, 27.0, 30.0, 24.0, 21.0, 21.0, 7.0, 9.0, 19.0, 6.0, 5.0, 3.0, 6.0, 3.0, 1.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-14.8046875, -14.3795166015625, -13.954345703125, -13.5291748046875, -13.10400390625, -12.6788330078125, -12.253662109375, -11.8284912109375, -11.4033203125, -10.9781494140625, -10.552978515625, -10.1278076171875, -9.70263671875, -9.2774658203125, -8.852294921875, -8.4271240234375, -8.001953125, -7.5767822265625, -7.151611328125, -6.7264404296875, -6.30126953125, -5.8760986328125, -5.450927734375, -5.0257568359375, -4.6005859375, -4.1754150390625, -3.750244140625, -3.3250732421875, -2.89990234375, -2.4747314453125, -2.049560546875, -1.6243896484375, -1.19921875, -0.7740478515625, -0.348876953125, 0.0762939453125, 0.50146484375, 0.9266357421875, 1.351806640625, 1.7769775390625, 2.2021484375, 2.6273193359375, 3.052490234375, 3.4776611328125, 3.90283203125, 4.3280029296875, 4.753173828125, 5.1783447265625, 5.603515625, 6.0286865234375, 6.453857421875, 6.8790283203125, 7.30419921875, 7.7293701171875, 8.154541015625, 8.5797119140625, 9.0048828125, 9.4300537109375, 9.855224609375, 10.2803955078125, 10.70556640625, 11.1307373046875, 11.555908203125, 11.9810791015625, 12.40625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 8.0, 21.0, 41.0, 91.0, 320.0, 2409.0, 694280.0, 348760.0, 2150.0, 319.0, 74.0, 29.0, 23.0, 12.0, 11.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.265625, -19.514404296875, -18.76318359375, -18.011962890625, -17.2607421875, -16.509521484375, -15.75830078125, -15.007080078125, -14.255859375, -13.504638671875, -12.75341796875, -12.002197265625, -11.2509765625, -10.499755859375, -9.74853515625, -8.997314453125, -8.24609375, -7.494873046875, -6.74365234375, -5.992431640625, -5.2412109375, -4.489990234375, -3.73876953125, -2.987548828125, -2.236328125, -1.485107421875, -0.73388671875, 0.017333984375, 0.7685546875, 1.519775390625, 2.27099609375, 3.022216796875, 3.7734375, 4.524658203125, 5.27587890625, 6.027099609375, 6.7783203125, 7.529541015625, 8.28076171875, 9.031982421875, 9.783203125, 10.534423828125, 11.28564453125, 12.036865234375, 12.7880859375, 13.539306640625, 14.29052734375, 15.041748046875, 15.79296875, 16.544189453125, 17.29541015625, 18.046630859375, 18.7978515625, 19.549072265625, 20.30029296875, 21.051513671875, 21.802734375, 22.553955078125, 23.30517578125, 24.056396484375, 24.8076171875, 25.558837890625, 26.31005859375, 27.061279296875, 27.8125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 8.0, 7.0, 10.0, 11.0, 16.0, 23.0, 25.0, 38.0, 46.0, 54.0, 106.0, 158.0, 173.0, 94.0, 66.0, 44.0, 27.0, 21.0, 19.0, 14.0, 6.0, 9.0, 8.0, 9.0, 0.0, 2.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0007009506225585938, -0.0006676614284515381, -0.0006343722343444824, -0.0006010830402374268, -0.0005677938461303711, -0.0005345046520233154, -0.0005012154579162598, -0.0004679262638092041, -0.00043463706970214844, -0.0004013478755950928, -0.0003680586814880371, -0.00033476948738098145, -0.0003014802932739258, -0.0002681910991668701, -0.00023490190505981445, -0.0002016127109527588, -0.00016832351684570312, -0.00013503432273864746, -0.0001017451286315918, -6.845593452453613e-05, -3.516674041748047e-05, -1.8775463104248047e-06, 3.141164779663086e-05, 6.470084190368652e-05, 9.799003601074219e-05, 0.00013127923011779785, 0.00016456842422485352, 0.00019785761833190918, 0.00023114681243896484, 0.0002644360065460205, 0.00029772520065307617, 0.00033101439476013184, 0.0003643035888671875, 0.00039759278297424316, 0.00043088197708129883, 0.0004641711711883545, 0.0004974603652954102, 0.0005307495594024658, 0.0005640387535095215, 0.0005973279476165771, 0.0006306171417236328, 0.0006639063358306885, 0.0006971955299377441, 0.0007304847240447998, 0.0007637739181518555, 0.0007970631122589111, 0.0008303523063659668, 0.0008636415004730225, 0.0008969306945800781, 0.0009302198886871338, 0.0009635090827941895, 0.0009967982769012451, 0.0010300874710083008, 0.0010633766651153564, 0.0010966658592224121, 0.0011299550533294678, 0.0011632442474365234, 0.001196533441543579, 0.0012298226356506348, 0.0012631118297576904, 0.001296401023864746, 0.0013296902179718018, 0.0013629794120788574, 0.001396268606185913, 0.0014295578002929688]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 9.0, 7.0, 9.0, 23.0, 28.0, 54.0, 96.0, 187.0, 374.0, 933.0, 2909.0, 13124.0, 144780.0, 836124.0, 40701.0, 6308.0, 1669.0, 574.0, 268.0, 148.0, 90.0, 47.0, 31.0, 21.0, 14.0, 11.0, 6.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.140625, -9.8824462890625, -9.624267578125, -9.3660888671875, -9.10791015625, -8.8497314453125, -8.591552734375, -8.3333740234375, -8.0751953125, -7.8170166015625, -7.558837890625, -7.3006591796875, -7.04248046875, -6.7843017578125, -6.526123046875, -6.2679443359375, -6.009765625, -5.7515869140625, -5.493408203125, -5.2352294921875, -4.97705078125, -4.7188720703125, -4.460693359375, -4.2025146484375, -3.9443359375, -3.6861572265625, -3.427978515625, -3.1697998046875, -2.91162109375, -2.6534423828125, -2.395263671875, -2.1370849609375, -1.87890625, -1.6207275390625, -1.362548828125, -1.1043701171875, -0.84619140625, -0.5880126953125, -0.329833984375, -0.0716552734375, 0.1865234375, 0.4447021484375, 0.702880859375, 0.9610595703125, 1.21923828125, 1.4774169921875, 1.735595703125, 1.9937744140625, 2.251953125, 2.5101318359375, 2.768310546875, 3.0264892578125, 3.28466796875, 3.5428466796875, 3.801025390625, 4.0592041015625, 4.3173828125, 4.5755615234375, 4.833740234375, 5.0919189453125, 5.35009765625, 5.6082763671875, 5.866455078125, 6.1246337890625, 6.3828125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 0.0, 6.0, 3.0, 5.0, 8.0, 3.0, 10.0, 11.0, 12.0, 18.0, 19.0, 20.0, 48.0, 56.0, 108.0, 135.0, 158.0, 118.0, 76.0, 49.0, 37.0, 17.0, 18.0, 14.0, 16.0, 9.0, 8.0, 5.0, 2.0, 6.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.2890625, -6.1243896484375, -5.959716796875, -5.7950439453125, -5.63037109375, -5.4656982421875, -5.301025390625, -5.1363525390625, -4.9716796875, -4.8070068359375, -4.642333984375, -4.4776611328125, -4.31298828125, -4.1483154296875, -3.983642578125, -3.8189697265625, -3.654296875, -3.4896240234375, -3.324951171875, -3.1602783203125, -2.99560546875, -2.8309326171875, -2.666259765625, -2.5015869140625, -2.3369140625, -2.1722412109375, -2.007568359375, -1.8428955078125, -1.67822265625, -1.5135498046875, -1.348876953125, -1.1842041015625, -1.01953125, -0.8548583984375, -0.690185546875, -0.5255126953125, -0.36083984375, -0.1961669921875, -0.031494140625, 0.1331787109375, 0.2978515625, 0.4625244140625, 0.627197265625, 0.7918701171875, 0.95654296875, 1.1212158203125, 1.285888671875, 1.4505615234375, 1.615234375, 1.7799072265625, 1.944580078125, 2.1092529296875, 2.27392578125, 2.4385986328125, 2.603271484375, 2.7679443359375, 2.9326171875, 3.0972900390625, 3.261962890625, 3.4266357421875, 3.59130859375, 3.7559814453125, 3.920654296875, 4.0853271484375, 4.25]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 11.0, 11.0, 24.0, 177.0, 511.0, 201.0, 43.0, 14.0, 4.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-214.90744018554688, -208.07186889648438, -201.23629760742188, -194.40072631835938, -187.56517028808594, -180.72959899902344, -173.89402770996094, -167.05845642089844, -160.22288513183594, -153.38731384277344, -146.55174255371094, -139.7161865234375, -132.880615234375, -126.0450439453125, -119.20947265625, -112.3739013671875, -105.53833770751953, -98.70276641845703, -91.86720275878906, -85.03163146972656, -78.19606018066406, -71.36048889160156, -64.5249252319336, -57.689353942871094, -50.85378646850586, -44.018218994140625, -37.182647705078125, -30.34708023071289, -23.511510848999023, -16.675941467285156, -9.840373992919922, -3.004802703857422, 3.8307647705078125, 10.66633415222168, 17.501903533935547, 24.33747100830078, 31.17304039001465, 38.008609771728516, 44.84417724609375, 51.67974853515625, 58.515316009521484, 65.35088348388672, 72.18645477294922, 79.02201843261719, 85.85758972167969, 92.69316101074219, 99.52873229980469, 106.36430358886719, 113.19986724853516, 120.03543853759766, 126.87100219726562, 133.70657348632812, 140.54214477539062, 147.37771606445312, 154.21328735351562, 161.04885864257812, 167.88441467285156, 174.71998596191406, 181.55555725097656, 188.39111328125, 195.2266845703125, 202.062255859375, 208.8978271484375, 215.7333984375, 222.5689697265625]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 3.0, 5.0, 0.0, 5.0, 3.0, 4.0, 12.0, 10.0, 14.0, 23.0, 9.0, 16.0, 14.0, 32.0, 31.0, 26.0, 39.0, 43.0, 49.0, 48.0, 64.0, 59.0, 71.0, 66.0, 51.0, 44.0, 38.0, 32.0, 35.0, 34.0, 26.0, 15.0, 13.0, 20.0, 14.0, 3.0, 7.0, 4.0, 10.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.06634521484375, -45.186431884765625, -43.306522369384766, -41.42660903930664, -39.54669952392578, -37.666786193847656, -35.78687286376953, -33.906959533691406, -32.02705001831055, -30.147138595581055, -28.267227172851562, -26.387313842773438, -24.507402420043945, -22.627490997314453, -20.747577667236328, -18.867666244506836, -16.987754821777344, -15.107843399047852, -13.227931022644043, -11.348018646240234, -9.468107223510742, -7.58819580078125, -5.708283424377441, -3.828371047973633, -1.9484596252441406, -0.06854772567749023, 1.8113641738891602, 3.6912760734558105, 5.571187973022461, 7.451099395751953, 9.331011772155762, 11.21092414855957, 13.090835571289062, 14.970746994018555, 16.850658416748047, 18.730571746826172, 20.610483169555664, 22.490394592285156, 24.37030792236328, 26.250219345092773, 28.130130767822266, 30.010042190551758, 31.88995361328125, 33.769866943359375, 35.6497802734375, 37.52968978881836, 39.409603118896484, 41.289512634277344, 43.16942596435547, 45.049339294433594, 46.92924880981445, 48.80916213989258, 50.68907165527344, 52.56898498535156, 54.44889831542969, 56.32881164550781, 58.20872116088867, 60.0886344909668, 61.968544006347656, 63.84845733642578, 65.7283706665039, 67.6082763671875, 69.48818969726562, 71.36810302734375, 73.24801635742188]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 6.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 3.0, 5.0, 7.0, 3.0, 4.0, 7.0, 9.0, 16.0, 30.0, 51.0, 64.0, 125.0, 253.0, 587.0, 1756.0, 8332.0, 115132.0, 3865147.0, 187832.0, 10876.0, 2454.0, 895.0, 354.0, 143.0, 83.0, 34.0, 22.0, 10.0, 10.0, 9.0, 6.0, 4.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.4609375, -13.1290283203125, -12.797119140625, -12.4652099609375, -12.13330078125, -11.8013916015625, -11.469482421875, -11.1375732421875, -10.8056640625, -10.4737548828125, -10.141845703125, -9.8099365234375, -9.47802734375, -9.1461181640625, -8.814208984375, -8.4822998046875, -8.150390625, -7.8184814453125, -7.486572265625, -7.1546630859375, -6.82275390625, -6.4908447265625, -6.158935546875, -5.8270263671875, -5.4951171875, -5.1632080078125, -4.831298828125, -4.4993896484375, -4.16748046875, -3.8355712890625, -3.503662109375, -3.1717529296875, -2.83984375, -2.5079345703125, -2.176025390625, -1.8441162109375, -1.51220703125, -1.1802978515625, -0.848388671875, -0.5164794921875, -0.1845703125, 0.1473388671875, 0.479248046875, 0.8111572265625, 1.14306640625, 1.4749755859375, 1.806884765625, 2.1387939453125, 2.470703125, 2.8026123046875, 3.134521484375, 3.4664306640625, 3.79833984375, 4.1302490234375, 4.462158203125, 4.7940673828125, 5.1259765625, 5.4578857421875, 5.789794921875, 6.1217041015625, 6.45361328125, 6.7855224609375, 7.117431640625, 7.4493408203125, 7.78125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 1.0, 2.0, 1.0, 4.0, 2.0, 5.0, 6.0, 9.0, 14.0, 13.0, 26.0, 30.0, 23.0, 40.0, 49.0, 61.0, 73.0, 68.0, 58.0, 47.0, 70.0, 70.0, 72.0, 50.0, 41.0, 36.0, 34.0, 24.0, 19.0, 10.0, 6.0, 14.0, 7.0, 7.0, 7.0, 5.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0], "bins": [-4.73046875, -4.615570068359375, -4.50067138671875, -4.385772705078125, -4.2708740234375, -4.155975341796875, -4.04107666015625, -3.926177978515625, -3.811279296875, -3.696380615234375, -3.58148193359375, -3.466583251953125, -3.3516845703125, -3.236785888671875, -3.12188720703125, -3.006988525390625, -2.89208984375, -2.777191162109375, -2.66229248046875, -2.547393798828125, -2.4324951171875, -2.317596435546875, -2.20269775390625, -2.087799072265625, -1.972900390625, -1.858001708984375, -1.74310302734375, -1.628204345703125, -1.5133056640625, -1.398406982421875, -1.28350830078125, -1.168609619140625, -1.0537109375, -0.938812255859375, -0.82391357421875, -0.709014892578125, -0.5941162109375, -0.479217529296875, -0.36431884765625, -0.249420166015625, -0.134521484375, -0.019622802734375, 0.09527587890625, 0.210174560546875, 0.3250732421875, 0.439971923828125, 0.55487060546875, 0.669769287109375, 0.78466796875, 0.899566650390625, 1.01446533203125, 1.129364013671875, 1.2442626953125, 1.359161376953125, 1.47406005859375, 1.588958740234375, 1.703857421875, 1.818756103515625, 1.93365478515625, 2.048553466796875, 2.1634521484375, 2.278350830078125, 2.39324951171875, 2.508148193359375, 2.623046875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 3.0, 5.0, 3.0, 4.0, 7.0, 12.0, 13.0, 15.0, 23.0, 28.0, 65.0, 79.0, 104.0, 188.0, 318.0, 663.0, 1926.0, 7609.0, 49660.0, 1856533.0, 2207771.0, 56935.0, 8638.0, 2084.0, 753.0, 316.0, 171.0, 116.0, 69.0, 53.0, 38.0, 20.0, 14.0, 16.0, 10.0, 9.0, 4.0, 4.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4375, -8.1363525390625, -7.835205078125, -7.5340576171875, -7.23291015625, -6.9317626953125, -6.630615234375, -6.3294677734375, -6.0283203125, -5.7271728515625, -5.426025390625, -5.1248779296875, -4.82373046875, -4.5225830078125, -4.221435546875, -3.9202880859375, -3.619140625, -3.3179931640625, -3.016845703125, -2.7156982421875, -2.41455078125, -2.1134033203125, -1.812255859375, -1.5111083984375, -1.2099609375, -0.9088134765625, -0.607666015625, -0.3065185546875, -0.00537109375, 0.2957763671875, 0.596923828125, 0.8980712890625, 1.19921875, 1.5003662109375, 1.801513671875, 2.1026611328125, 2.40380859375, 2.7049560546875, 3.006103515625, 3.3072509765625, 3.6083984375, 3.9095458984375, 4.210693359375, 4.5118408203125, 4.81298828125, 5.1141357421875, 5.415283203125, 5.7164306640625, 6.017578125, 6.3187255859375, 6.619873046875, 6.9210205078125, 7.22216796875, 7.5233154296875, 7.824462890625, 8.1256103515625, 8.4267578125, 8.7279052734375, 9.029052734375, 9.3302001953125, 9.63134765625, 9.9324951171875, 10.233642578125, 10.5347900390625, 10.8359375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 2.0, 11.0, 9.0, 9.0, 18.0, 35.0, 55.0, 79.0, 157.0, 360.0, 765.0, 1035.0, 744.0, 364.0, 162.0, 98.0, 64.0, 34.0, 19.0, 12.0, 13.0, 10.0, 4.0, 2.0, 6.0, 1.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.1875, -9.90802001953125, -9.6285400390625, -9.34906005859375, -9.069580078125, -8.79010009765625, -8.5106201171875, -8.23114013671875, -7.95166015625, -7.67218017578125, -7.3927001953125, -7.11322021484375, -6.833740234375, -6.55426025390625, -6.2747802734375, -5.99530029296875, -5.7158203125, -5.43634033203125, -5.1568603515625, -4.87738037109375, -4.597900390625, -4.31842041015625, -4.0389404296875, -3.75946044921875, -3.47998046875, -3.20050048828125, -2.9210205078125, -2.64154052734375, -2.362060546875, -2.08258056640625, -1.8031005859375, -1.52362060546875, -1.244140625, -0.96466064453125, -0.6851806640625, -0.40570068359375, -0.126220703125, 0.15325927734375, 0.4327392578125, 0.71221923828125, 0.99169921875, 1.27117919921875, 1.5506591796875, 1.83013916015625, 2.109619140625, 2.38909912109375, 2.6685791015625, 2.94805908203125, 3.2275390625, 3.50701904296875, 3.7864990234375, 4.06597900390625, 4.345458984375, 4.62493896484375, 4.9044189453125, 5.18389892578125, 5.46337890625, 5.74285888671875, 6.0223388671875, 6.30181884765625, 6.581298828125, 6.86077880859375, 7.1402587890625, 7.41973876953125, 7.69921875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 3.0, 8.0, 23.0, 40.0, 87.0, 164.0, 222.0, 230.0, 115.0, 57.0, 19.0, 7.0, 6.0, 9.0, 5.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.66506576538086, -52.85368347167969, -50.042301177978516, -47.230918884277344, -44.41954040527344, -41.608158111572266, -38.796775817871094, -35.98539733886719, -33.17401123046875, -30.362628936767578, -27.55124855041504, -24.739866256713867, -21.928485870361328, -19.117103576660156, -16.305721282958984, -13.494340896606445, -10.682960510253906, -7.871579170227051, -5.060197353363037, -2.2488155364990234, 0.562565803527832, 3.3739471435546875, 6.185329437255859, 8.996709823608398, 11.80809211730957, 14.619473457336426, 17.43085479736328, 20.242237091064453, 23.053619384765625, 25.864999771118164, 28.676382064819336, 31.487762451171875, 34.29914855957031, 37.110530853271484, 39.921913146972656, 42.73329162597656, 45.544673919677734, 48.356056213378906, 51.16743850708008, 53.97882080078125, 56.790199279785156, 59.60158157348633, 62.4129638671875, 65.2243423461914, 68.03572845458984, 70.84710693359375, 73.65849304199219, 76.4698715209961, 79.28125, 82.0926284790039, 84.90401458740234, 87.71539306640625, 90.52677917480469, 93.3381576538086, 96.1495361328125, 98.96092224121094, 101.77230834960938, 104.58368682861328, 107.39507293701172, 110.20645141601562, 113.01783752441406, 115.82921600341797, 118.64059448242188, 121.45198059082031, 124.26335906982422]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 8.0, 10.0, 5.0, 22.0, 15.0, 19.0, 27.0, 32.0, 27.0, 40.0, 32.0, 40.0, 52.0, 56.0, 60.0, 60.0, 52.0, 62.0, 52.0, 52.0, 51.0, 29.0, 35.0, 28.0, 26.0, 17.0, 16.0, 14.0, 16.0, 11.0, 5.0, 8.0, 4.0, 5.0, 4.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0], "bins": [-39.43090057373047, -38.29712677001953, -37.163352966308594, -36.02958297729492, -34.895809173583984, -33.76203536987305, -32.628265380859375, -31.494491577148438, -30.3607177734375, -29.226943969726562, -28.093172073364258, -26.959400177001953, -25.825626373291016, -24.691852569580078, -23.558080673217773, -22.42430877685547, -21.29053497314453, -20.156761169433594, -19.02298927307129, -17.889217376708984, -16.755443572998047, -15.621670722961426, -14.487897872924805, -13.354125022888184, -12.220352172851562, -11.086579322814941, -9.95280647277832, -8.8190336227417, -7.685260772705078, -6.551487922668457, -5.417715072631836, -4.283942222595215, -3.1501731872558594, -2.0164003372192383, -0.8826274871826172, 0.2511453628540039, 1.384918212890625, 2.518691062927246, 3.652463912963867, 4.786236763000488, 5.920009613037109, 7.0537824630737305, 8.187555313110352, 9.321328163146973, 10.455101013183594, 11.588873863220215, 12.722646713256836, 13.856419563293457, 14.990192413330078, 16.123966217041016, 17.25773811340332, 18.391510009765625, 19.525283813476562, 20.6590576171875, 21.792829513549805, 22.92660140991211, 24.060375213623047, 25.194149017333984, 26.32792091369629, 27.461692810058594, 28.59546661376953, 29.72924041748047, 30.863012313842773, 31.996784210205078, 33.130558013916016]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 1.0, 5.0, 8.0, 7.0, 5.0, 9.0, 9.0, 12.0, 19.0, 29.0, 44.0, 107.0, 226.0, 697.0, 3159.0, 25790.0, 391726.0, 580001.0, 41089.0, 4239.0, 835.0, 257.0, 118.0, 48.0, 29.0, 28.0, 17.0, 17.0, 10.0, 3.0, 7.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.8125, -11.3919677734375, -10.971435546875, -10.5509033203125, -10.13037109375, -9.7098388671875, -9.289306640625, -8.8687744140625, -8.4482421875, -8.0277099609375, -7.607177734375, -7.1866455078125, -6.76611328125, -6.3455810546875, -5.925048828125, -5.5045166015625, -5.083984375, -4.6634521484375, -4.242919921875, -3.8223876953125, -3.40185546875, -2.9813232421875, -2.560791015625, -2.1402587890625, -1.7197265625, -1.2991943359375, -0.878662109375, -0.4581298828125, -0.03759765625, 0.3829345703125, 0.803466796875, 1.2239990234375, 1.64453125, 2.0650634765625, 2.485595703125, 2.9061279296875, 3.32666015625, 3.7471923828125, 4.167724609375, 4.5882568359375, 5.0087890625, 5.4293212890625, 5.849853515625, 6.2703857421875, 6.69091796875, 7.1114501953125, 7.531982421875, 7.9525146484375, 8.373046875, 8.7935791015625, 9.214111328125, 9.6346435546875, 10.05517578125, 10.4757080078125, 10.896240234375, 11.3167724609375, 11.7373046875, 12.1578369140625, 12.578369140625, 12.9989013671875, 13.41943359375, 13.8399658203125, 14.260498046875, 14.6810302734375, 15.1015625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 1.0, 2.0, 4.0, 4.0, 10.0, 6.0, 18.0, 18.0, 27.0, 22.0, 45.0, 48.0, 47.0, 65.0, 64.0, 76.0, 68.0, 77.0, 81.0, 51.0, 57.0, 38.0, 41.0, 37.0, 24.0, 18.0, 15.0, 13.0, 9.0, 9.0, 6.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.546875, -4.418792724609375, -4.29071044921875, -4.162628173828125, -4.0345458984375, -3.906463623046875, -3.77838134765625, -3.650299072265625, -3.522216796875, -3.394134521484375, -3.26605224609375, -3.137969970703125, -3.0098876953125, -2.881805419921875, -2.75372314453125, -2.625640869140625, -2.49755859375, -2.369476318359375, -2.24139404296875, -2.113311767578125, -1.9852294921875, -1.857147216796875, -1.72906494140625, -1.600982666015625, -1.472900390625, -1.344818115234375, -1.21673583984375, -1.088653564453125, -0.9605712890625, -0.832489013671875, -0.70440673828125, -0.576324462890625, -0.4482421875, -0.320159912109375, -0.19207763671875, -0.063995361328125, 0.0640869140625, 0.192169189453125, 0.32025146484375, 0.448333740234375, 0.576416015625, 0.704498291015625, 0.83258056640625, 0.960662841796875, 1.0887451171875, 1.216827392578125, 1.34490966796875, 1.472991943359375, 1.60107421875, 1.729156494140625, 1.85723876953125, 1.985321044921875, 2.1134033203125, 2.241485595703125, 2.36956787109375, 2.497650146484375, 2.625732421875, 2.753814697265625, 2.88189697265625, 3.009979248046875, 3.1380615234375, 3.266143798828125, 3.39422607421875, 3.522308349609375, 3.650390625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 7.0, 11.0, 11.0, 15.0, 30.0, 29.0, 70.0, 85.0, 159.0, 300.0, 633.0, 1529.0, 4576.0, 33670.0, 819600.0, 172510.0, 10939.0, 2414.0, 941.0, 428.0, 226.0, 137.0, 85.0, 55.0, 31.0, 23.0, 13.0, 11.0, 10.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.703125, -19.13623046875, -18.5693359375, -18.00244140625, -17.435546875, -16.86865234375, -16.3017578125, -15.73486328125, -15.16796875, -14.60107421875, -14.0341796875, -13.46728515625, -12.900390625, -12.33349609375, -11.7666015625, -11.19970703125, -10.6328125, -10.06591796875, -9.4990234375, -8.93212890625, -8.365234375, -7.79833984375, -7.2314453125, -6.66455078125, -6.09765625, -5.53076171875, -4.9638671875, -4.39697265625, -3.830078125, -3.26318359375, -2.6962890625, -2.12939453125, -1.5625, -0.99560546875, -0.4287109375, 0.13818359375, 0.705078125, 1.27197265625, 1.8388671875, 2.40576171875, 2.97265625, 3.53955078125, 4.1064453125, 4.67333984375, 5.240234375, 5.80712890625, 6.3740234375, 6.94091796875, 7.5078125, 8.07470703125, 8.6416015625, 9.20849609375, 9.775390625, 10.34228515625, 10.9091796875, 11.47607421875, 12.04296875, 12.60986328125, 13.1767578125, 13.74365234375, 14.310546875, 14.87744140625, 15.4443359375, 16.01123046875, 16.578125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 5.0, 4.0, 12.0, 16.0, 14.0, 21.0, 27.0, 24.0, 38.0, 31.0, 46.0, 61.0, 54.0, 60.0, 85.0, 70.0, 71.0, 63.0, 46.0, 56.0, 57.0, 26.0, 27.0, 19.0, 21.0, 11.0, 12.0, 8.0, 9.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-20.46875, -19.896484375, -19.32421875, -18.751953125, -18.1796875, -17.607421875, -17.03515625, -16.462890625, -15.890625, -15.318359375, -14.74609375, -14.173828125, -13.6015625, -13.029296875, -12.45703125, -11.884765625, -11.3125, -10.740234375, -10.16796875, -9.595703125, -9.0234375, -8.451171875, -7.87890625, -7.306640625, -6.734375, -6.162109375, -5.58984375, -5.017578125, -4.4453125, -3.873046875, -3.30078125, -2.728515625, -2.15625, -1.583984375, -1.01171875, -0.439453125, 0.1328125, 0.705078125, 1.27734375, 1.849609375, 2.421875, 2.994140625, 3.56640625, 4.138671875, 4.7109375, 5.283203125, 5.85546875, 6.427734375, 7.0, 7.572265625, 8.14453125, 8.716796875, 9.2890625, 9.861328125, 10.43359375, 11.005859375, 11.578125, 12.150390625, 12.72265625, 13.294921875, 13.8671875, 14.439453125, 15.01171875, 15.583984375, 16.15625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 4.0, 7.0, 8.0, 20.0, 17.0, 38.0, 72.0, 115.0, 241.0, 454.0, 1113.0, 3278.0, 13189.0, 114296.0, 847084.0, 55863.0, 8639.0, 2395.0, 849.0, 419.0, 173.0, 120.0, 55.0, 25.0, 27.0, 18.0, 12.0, 4.0, 9.0, 1.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.609375, -7.3587646484375, -7.108154296875, -6.8575439453125, -6.60693359375, -6.3563232421875, -6.105712890625, -5.8551025390625, -5.6044921875, -5.3538818359375, -5.103271484375, -4.8526611328125, -4.60205078125, -4.3514404296875, -4.100830078125, -3.8502197265625, -3.599609375, -3.3489990234375, -3.098388671875, -2.8477783203125, -2.59716796875, -2.3465576171875, -2.095947265625, -1.8453369140625, -1.5947265625, -1.3441162109375, -1.093505859375, -0.8428955078125, -0.59228515625, -0.3416748046875, -0.091064453125, 0.1595458984375, 0.41015625, 0.6607666015625, 0.911376953125, 1.1619873046875, 1.41259765625, 1.6632080078125, 1.913818359375, 2.1644287109375, 2.4150390625, 2.6656494140625, 2.916259765625, 3.1668701171875, 3.41748046875, 3.6680908203125, 3.918701171875, 4.1693115234375, 4.419921875, 4.6705322265625, 4.921142578125, 5.1717529296875, 5.42236328125, 5.6729736328125, 5.923583984375, 6.1741943359375, 6.4248046875, 6.6754150390625, 6.926025390625, 7.1766357421875, 7.42724609375, 7.6778564453125, 7.928466796875, 8.1790771484375, 8.4296875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 1.0, 6.0, 6.0, 8.0, 6.0, 7.0, 10.0, 10.0, 16.0, 25.0, 23.0, 43.0, 39.0, 69.0, 86.0, 133.0, 147.0, 100.0, 53.0, 52.0, 33.0, 27.0, 30.0, 15.0, 18.0, 9.0, 9.0, 7.0, 9.0, 4.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0013027191162109375, -0.0012646615505218506, -0.0012266039848327637, -0.0011885464191436768, -0.0011504888534545898, -0.001112431287765503, -0.001074373722076416, -0.001036316156387329, -0.0009982585906982422, -0.0009602010250091553, -0.0009221434593200684, -0.0008840858936309814, -0.0008460283279418945, -0.0008079707622528076, -0.0007699131965637207, -0.0007318556308746338, -0.0006937980651855469, -0.00065574049949646, -0.000617682933807373, -0.0005796253681182861, -0.0005415678024291992, -0.0005035102367401123, -0.0004654526710510254, -0.0004273951053619385, -0.00038933753967285156, -0.00035127997398376465, -0.00031322240829467773, -0.0002751648426055908, -0.0002371072769165039, -0.000199049711227417, -0.00016099214553833008, -0.00012293457984924316, -8.487701416015625e-05, -4.6819448471069336e-05, -8.761882781982422e-06, 2.9295682907104492e-05, 6.73532485961914e-05, 0.00010541081428527832, 0.00014346837997436523, 0.00018152594566345215, 0.00021958351135253906, 0.000257641077041626, 0.0002956986427307129, 0.0003337562084197998, 0.0003718137741088867, 0.00040987133979797363, 0.00044792890548706055, 0.00048598647117614746, 0.0005240440368652344, 0.0005621016025543213, 0.0006001591682434082, 0.0006382167339324951, 0.000676274299621582, 0.0007143318653106689, 0.0007523894309997559, 0.0007904469966888428, 0.0008285045623779297, 0.0008665621280670166, 0.0009046196937561035, 0.0009426772594451904, 0.0009807348251342773, 0.0010187923908233643, 0.0010568499565124512, 0.001094907522201538, 0.001132965087890625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 8.0, 9.0, 6.0, 7.0, 12.0, 20.0, 33.0, 42.0, 44.0, 110.0, 144.0, 255.0, 457.0, 883.0, 2102.0, 5488.0, 18199.0, 88245.0, 776388.0, 122656.0, 22355.0, 6494.0, 2361.0, 1013.0, 506.0, 249.0, 172.0, 96.0, 66.0, 40.0, 23.0, 26.0, 17.0, 10.0, 14.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.83984375, -6.6298828125, -6.419921875, -6.2099609375, -6.0, -5.7900390625, -5.580078125, -5.3701171875, -5.16015625, -4.9501953125, -4.740234375, -4.5302734375, -4.3203125, -4.1103515625, -3.900390625, -3.6904296875, -3.48046875, -3.2705078125, -3.060546875, -2.8505859375, -2.640625, -2.4306640625, -2.220703125, -2.0107421875, -1.80078125, -1.5908203125, -1.380859375, -1.1708984375, -0.9609375, -0.7509765625, -0.541015625, -0.3310546875, -0.12109375, 0.0888671875, 0.298828125, 0.5087890625, 0.71875, 0.9287109375, 1.138671875, 1.3486328125, 1.55859375, 1.7685546875, 1.978515625, 2.1884765625, 2.3984375, 2.6083984375, 2.818359375, 3.0283203125, 3.23828125, 3.4482421875, 3.658203125, 3.8681640625, 4.078125, 4.2880859375, 4.498046875, 4.7080078125, 4.91796875, 5.1279296875, 5.337890625, 5.5478515625, 5.7578125, 5.9677734375, 6.177734375, 6.3876953125, 6.59765625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 4.0, 2.0, 0.0, 2.0, 9.0, 5.0, 2.0, 3.0, 8.0, 7.0, 10.0, 13.0, 11.0, 13.0, 15.0, 22.0, 27.0, 25.0, 30.0, 47.0, 36.0, 62.0, 113.0, 99.0, 77.0, 62.0, 49.0, 42.0, 36.0, 22.0, 23.0, 18.0, 17.0, 17.0, 14.0, 10.0, 7.0, 4.0, 9.0, 4.0, 1.0, 2.0, 8.0, 3.0, 2.0, 9.0, 1.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-4.2421875, -4.115386962890625, -3.98858642578125, -3.861785888671875, -3.7349853515625, -3.608184814453125, -3.48138427734375, -3.354583740234375, -3.227783203125, -3.100982666015625, -2.97418212890625, -2.847381591796875, -2.7205810546875, -2.593780517578125, -2.46697998046875, -2.340179443359375, -2.21337890625, -2.086578369140625, -1.95977783203125, -1.832977294921875, -1.7061767578125, -1.579376220703125, -1.45257568359375, -1.325775146484375, -1.198974609375, -1.072174072265625, -0.94537353515625, -0.818572998046875, -0.6917724609375, -0.564971923828125, -0.43817138671875, -0.311370849609375, -0.1845703125, -0.057769775390625, 0.06903076171875, 0.195831298828125, 0.3226318359375, 0.449432373046875, 0.57623291015625, 0.703033447265625, 0.829833984375, 0.956634521484375, 1.08343505859375, 1.210235595703125, 1.3370361328125, 1.463836669921875, 1.59063720703125, 1.717437744140625, 1.84423828125, 1.971038818359375, 2.09783935546875, 2.224639892578125, 2.3514404296875, 2.478240966796875, 2.60504150390625, 2.731842041015625, 2.858642578125, 2.985443115234375, 3.11224365234375, 3.239044189453125, 3.3658447265625, 3.492645263671875, 3.61944580078125, 3.746246337890625, 3.873046875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 4.0, 6.0, 7.0, 15.0, 25.0, 64.0, 125.0, 248.0, 214.0, 132.0, 71.0, 35.0, 24.0, 6.0, 7.0, 8.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.33662414550781, -96.98323059082031, -93.62983703613281, -90.27644348144531, -86.92304992675781, -83.56965637207031, -80.21625518798828, -76.86286163330078, -73.50946807861328, -70.15607452392578, -66.80268096923828, -63.449283599853516, -60.095890045166016, -56.742496490478516, -53.38909912109375, -50.03570556640625, -46.68231201171875, -43.32891845703125, -39.97552490234375, -36.622127532958984, -33.268733978271484, -29.915340423583984, -26.56194496154785, -23.20854949951172, -19.85515594482422, -16.50176239013672, -13.148366928100586, -9.79497241973877, -6.441577911376953, -3.088184356689453, 0.2652111053466797, 3.6186065673828125, 6.9720001220703125, 10.325394630432129, 13.678789138793945, 17.032184600830078, 20.385578155517578, 23.738971710205078, 27.09236717224121, 30.445762634277344, 33.799156188964844, 37.152549743652344, 40.505943298339844, 43.85934066772461, 47.21273422241211, 50.56612777709961, 53.919525146484375, 57.272918701171875, 60.626312255859375, 63.979705810546875, 67.33309936523438, 70.68649291992188, 74.03988647460938, 77.39328002929688, 80.7466812133789, 84.1000747680664, 87.4534683227539, 90.8068618774414, 94.1602554321289, 97.5136489868164, 100.86705017089844, 104.22044372558594, 107.57383728027344, 110.92723083496094, 114.28062438964844]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 7.0, 9.0, 11.0, 9.0, 16.0, 15.0, 21.0, 19.0, 26.0, 21.0, 27.0, 29.0, 28.0, 45.0, 46.0, 51.0, 56.0, 69.0, 77.0, 66.0, 47.0, 45.0, 37.0, 44.0, 19.0, 22.0, 31.0, 16.0, 18.0, 12.0, 13.0, 14.0, 11.0, 2.0, 5.0, 6.0, 6.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.255550384521484, -51.40003967285156, -49.544532775878906, -47.689022064208984, -45.83351135253906, -43.978004455566406, -42.122493743896484, -40.26698303222656, -38.411476135253906, -36.555965423583984, -34.70045852661133, -32.844947814941406, -30.989437103271484, -29.133928298950195, -27.278419494628906, -25.422908782958984, -23.567398071289062, -21.711889266967773, -19.85637855529785, -18.000869750976562, -16.14535903930664, -14.289850234985352, -12.434341430664062, -10.578831672668457, -8.723321914672852, -6.867812156677246, -5.012302875518799, -3.1567935943603516, -1.301283836364746, 0.5542259216308594, 2.4097347259521484, 4.265244483947754, 6.120750427246094, 7.976260185241699, 9.831769943237305, 11.687278747558594, 13.5427885055542, 15.398298263549805, 17.253807067871094, 19.109317779541016, 20.964826583862305, 22.820335388183594, 24.675846099853516, 26.531354904174805, 28.386863708496094, 30.242374420166016, 32.09788513183594, 33.953392028808594, 35.808902740478516, 37.66441345214844, 39.519920349121094, 41.375431060791016, 43.23094177246094, 45.086448669433594, 46.941959381103516, 48.79747009277344, 50.652976989746094, 52.508487701416016, 54.36399459838867, 56.219505310058594, 58.075016021728516, 59.93052673339844, 61.786033630371094, 63.641544342041016, 65.49705505371094]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 1.0, 3.0, 6.0, 7.0, 7.0, 10.0, 23.0, 31.0, 40.0, 81.0, 135.0, 284.0, 852.0, 3424.0, 27844.0, 2436267.0, 1697260.0, 22860.0, 3471.0, 990.0, 404.0, 151.0, 64.0, 23.0, 18.0, 11.0, 4.0, 4.0, 1.0, 0.0, 1.0, 4.0, 1.0], "bins": [-16.796875, -16.439208984375, -16.08154296875, -15.723876953125, -15.3662109375, -15.008544921875, -14.65087890625, -14.293212890625, -13.935546875, -13.577880859375, -13.22021484375, -12.862548828125, -12.5048828125, -12.147216796875, -11.78955078125, -11.431884765625, -11.07421875, -10.716552734375, -10.35888671875, -10.001220703125, -9.6435546875, -9.285888671875, -8.92822265625, -8.570556640625, -8.212890625, -7.855224609375, -7.49755859375, -7.139892578125, -6.7822265625, -6.424560546875, -6.06689453125, -5.709228515625, -5.3515625, -4.993896484375, -4.63623046875, -4.278564453125, -3.9208984375, -3.563232421875, -3.20556640625, -2.847900390625, -2.490234375, -2.132568359375, -1.77490234375, -1.417236328125, -1.0595703125, -0.701904296875, -0.34423828125, 0.013427734375, 0.37109375, 0.728759765625, 1.08642578125, 1.444091796875, 1.8017578125, 2.159423828125, 2.51708984375, 2.874755859375, 3.232421875, 3.590087890625, 3.94775390625, 4.305419921875, 4.6630859375, 5.020751953125, 5.37841796875, 5.736083984375, 6.09375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 0.0, 3.0, 5.0, 6.0, 4.0, 10.0, 11.0, 25.0, 22.0, 24.0, 43.0, 43.0, 63.0, 61.0, 67.0, 77.0, 81.0, 67.0, 64.0, 80.0, 48.0, 44.0, 49.0, 33.0, 17.0, 16.0, 14.0, 10.0, 5.0, 7.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-5.16796875, -5.036712646484375, -4.90545654296875, -4.774200439453125, -4.6429443359375, -4.511688232421875, -4.38043212890625, -4.249176025390625, -4.117919921875, -3.986663818359375, -3.85540771484375, -3.724151611328125, -3.5928955078125, -3.461639404296875, -3.33038330078125, -3.199127197265625, -3.06787109375, -2.936614990234375, -2.80535888671875, -2.674102783203125, -2.5428466796875, -2.411590576171875, -2.28033447265625, -2.149078369140625, -2.017822265625, -1.886566162109375, -1.75531005859375, -1.624053955078125, -1.4927978515625, -1.361541748046875, -1.23028564453125, -1.099029541015625, -0.9677734375, -0.836517333984375, -0.70526123046875, -0.574005126953125, -0.4427490234375, -0.311492919921875, -0.18023681640625, -0.048980712890625, 0.082275390625, 0.213531494140625, 0.34478759765625, 0.476043701171875, 0.6072998046875, 0.738555908203125, 0.86981201171875, 1.001068115234375, 1.13232421875, 1.263580322265625, 1.39483642578125, 1.526092529296875, 1.6573486328125, 1.788604736328125, 1.91986083984375, 2.051116943359375, 2.182373046875, 2.313629150390625, 2.44488525390625, 2.576141357421875, 2.7073974609375, 2.838653564453125, 2.96990966796875, 3.101165771484375, 3.232421875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 10.0, 6.0, 18.0, 20.0, 21.0, 35.0, 62.0, 104.0, 178.0, 333.0, 660.0, 1304.0, 3083.0, 8855.0, 37153.0, 409046.0, 3487577.0, 207065.0, 26211.0, 7031.0, 2637.0, 1231.0, 680.0, 369.0, 202.0, 144.0, 76.0, 49.0, 33.0, 28.0, 15.0, 17.0, 9.0, 8.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0], "bins": [-8.65625, -8.41168212890625, -8.1671142578125, -7.92254638671875, -7.677978515625, -7.43341064453125, -7.1888427734375, -6.94427490234375, -6.69970703125, -6.45513916015625, -6.2105712890625, -5.96600341796875, -5.721435546875, -5.47686767578125, -5.2322998046875, -4.98773193359375, -4.7431640625, -4.49859619140625, -4.2540283203125, -4.00946044921875, -3.764892578125, -3.52032470703125, -3.2757568359375, -3.03118896484375, -2.78662109375, -2.54205322265625, -2.2974853515625, -2.05291748046875, -1.808349609375, -1.56378173828125, -1.3192138671875, -1.07464599609375, -0.830078125, -0.58551025390625, -0.3409423828125, -0.09637451171875, 0.148193359375, 0.39276123046875, 0.6373291015625, 0.88189697265625, 1.12646484375, 1.37103271484375, 1.6156005859375, 1.86016845703125, 2.104736328125, 2.34930419921875, 2.5938720703125, 2.83843994140625, 3.0830078125, 3.32757568359375, 3.5721435546875, 3.81671142578125, 4.061279296875, 4.30584716796875, 4.5504150390625, 4.79498291015625, 5.03955078125, 5.28411865234375, 5.5286865234375, 5.77325439453125, 6.017822265625, 6.26239013671875, 6.5069580078125, 6.75152587890625, 6.99609375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 3.0, 7.0, 6.0, 8.0, 10.0, 21.0, 33.0, 49.0, 99.0, 192.0, 446.0, 946.0, 1087.0, 644.0, 236.0, 121.0, 76.0, 29.0, 20.0, 18.0, 6.0, 3.0, 7.0, 8.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.625, -6.3115234375, -5.998046875, -5.6845703125, -5.37109375, -5.0576171875, -4.744140625, -4.4306640625, -4.1171875, -3.8037109375, -3.490234375, -3.1767578125, -2.86328125, -2.5498046875, -2.236328125, -1.9228515625, -1.609375, -1.2958984375, -0.982421875, -0.6689453125, -0.35546875, -0.0419921875, 0.271484375, 0.5849609375, 0.8984375, 1.2119140625, 1.525390625, 1.8388671875, 2.15234375, 2.4658203125, 2.779296875, 3.0927734375, 3.40625, 3.7197265625, 4.033203125, 4.3466796875, 4.66015625, 4.9736328125, 5.287109375, 5.6005859375, 5.9140625, 6.2275390625, 6.541015625, 6.8544921875, 7.16796875, 7.4814453125, 7.794921875, 8.1083984375, 8.421875, 8.7353515625, 9.048828125, 9.3623046875, 9.67578125, 9.9892578125, 10.302734375, 10.6162109375, 10.9296875, 11.2431640625, 11.556640625, 11.8701171875, 12.18359375, 12.4970703125, 12.810546875, 13.1240234375, 13.4375]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 5.0, 14.0, 18.0, 50.0, 91.0, 202.0, 248.0, 182.0, 95.0, 38.0, 24.0, 13.0, 7.0, 5.0, 2.0, 4.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.48509216308594, -60.520179748535156, -57.55527114868164, -54.59035873413086, -51.625450134277344, -48.66053771972656, -45.69562530517578, -42.730716705322266, -39.76580810546875, -36.80089569091797, -33.83598709106445, -30.871074676513672, -27.906166076660156, -24.941253662109375, -21.976343154907227, -19.011432647705078, -16.046520233154297, -13.081609725952148, -10.11669921875, -7.151787757873535, -4.186877250671387, -1.2219667434692383, 1.7429447174072266, 4.707855224609375, 7.672765731811523, 10.637676239013672, 13.60258674621582, 16.56749725341797, 19.53240966796875, 22.497318267822266, 25.462230682373047, 28.427141189575195, 31.392051696777344, 34.356964111328125, 37.32187271118164, 40.28678512573242, 43.25169372558594, 46.21660614013672, 49.1815185546875, 52.146427154541016, 55.11133575439453, 58.07624816894531, 61.04115676879883, 64.00606536865234, 66.97097778320312, 69.9358901977539, 72.90080261230469, 75.86570739746094, 78.83062744140625, 81.79553985595703, 84.76045227050781, 87.72535705566406, 90.69026947021484, 93.65518188476562, 96.6200942993164, 99.58500671386719, 102.54991149902344, 105.51482391357422, 108.479736328125, 111.44464111328125, 114.40955352783203, 117.37446594238281, 120.3393783569336, 123.30429077148438, 126.26919555664062]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 4.0, 5.0, 6.0, 0.0, 12.0, 15.0, 12.0, 26.0, 37.0, 29.0, 41.0, 43.0, 68.0, 73.0, 65.0, 64.0, 54.0, 71.0, 81.0, 57.0, 46.0, 42.0, 41.0, 33.0, 22.0, 17.0, 13.0, 8.0, 8.0, 5.0, 10.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.485008239746094, -26.17704963684082, -24.869091033935547, -23.561134338378906, -22.253175735473633, -20.94521713256836, -19.63726043701172, -18.329301834106445, -17.021343231201172, -15.713384628295898, -14.405426979064941, -13.097469329833984, -11.789510726928711, -10.481552124023438, -9.17359447479248, -7.865636825561523, -6.55767822265625, -5.249720096588135, -3.9417619705200195, -2.6338038444519043, -1.325845718383789, -0.017887592315673828, 1.2900705337524414, 2.5980281829833984, 3.905986785888672, 5.213944911956787, 6.521903038024902, 7.829861164093018, 9.137819290161133, 10.445777893066406, 11.753735542297363, 13.06169319152832, 14.369651794433594, 15.677610397338867, 16.98556900024414, 18.29352569580078, 19.601484298706055, 20.909442901611328, 22.21739959716797, 23.525358200073242, 24.833316802978516, 26.14127540588379, 27.449234008789062, 28.757190704345703, 30.065149307250977, 31.37310791015625, 32.68106460571289, 33.98902130126953, 35.29698181152344, 36.60493850708008, 37.912899017333984, 39.220855712890625, 40.52881622314453, 41.83677291870117, 43.14472961425781, 44.45269012451172, 45.76064682006836, 47.068603515625, 48.376564025878906, 49.68452072143555, 50.99247741699219, 52.300437927246094, 53.608394622802734, 54.916351318359375, 56.22431182861328]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 4.0, 3.0, 7.0, 14.0, 7.0, 13.0, 16.0, 26.0, 43.0, 60.0, 91.0, 162.0, 291.0, 500.0, 1023.0, 2387.0, 7130.0, 25585.0, 123673.0, 537114.0, 278730.0, 51898.0, 12535.0, 3972.0, 1569.0, 751.0, 352.0, 201.0, 131.0, 84.0, 54.0, 37.0, 35.0, 11.0, 8.0, 10.0, 5.0, 9.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-9.0234375, -8.77093505859375, -8.5184326171875, -8.26593017578125, -8.013427734375, -7.76092529296875, -7.5084228515625, -7.25592041015625, -7.00341796875, -6.75091552734375, -6.4984130859375, -6.24591064453125, -5.993408203125, -5.74090576171875, -5.4884033203125, -5.23590087890625, -4.9833984375, -4.73089599609375, -4.4783935546875, -4.22589111328125, -3.973388671875, -3.72088623046875, -3.4683837890625, -3.21588134765625, -2.96337890625, -2.71087646484375, -2.4583740234375, -2.20587158203125, -1.953369140625, -1.70086669921875, -1.4483642578125, -1.19586181640625, -0.943359375, -0.69085693359375, -0.4383544921875, -0.18585205078125, 0.066650390625, 0.31915283203125, 0.5716552734375, 0.82415771484375, 1.07666015625, 1.32916259765625, 1.5816650390625, 1.83416748046875, 2.086669921875, 2.33917236328125, 2.5916748046875, 2.84417724609375, 3.0966796875, 3.34918212890625, 3.6016845703125, 3.85418701171875, 4.106689453125, 4.35919189453125, 4.6116943359375, 4.86419677734375, 5.11669921875, 5.36920166015625, 5.6217041015625, 5.87420654296875, 6.126708984375, 6.37921142578125, 6.6317138671875, 6.88421630859375, 7.13671875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 12.0, 13.0, 10.0, 20.0, 18.0, 29.0, 22.0, 20.0, 48.0, 44.0, 54.0, 56.0, 50.0, 56.0, 63.0, 54.0, 65.0, 60.0, 53.0, 38.0, 32.0, 29.0, 31.0, 23.0, 27.0, 11.0, 13.0, 10.0, 8.0, 7.0, 3.0, 7.0, 4.0, 4.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.984375, -2.876678466796875, -2.76898193359375, -2.661285400390625, -2.5535888671875, -2.445892333984375, -2.33819580078125, -2.230499267578125, -2.122802734375, -2.015106201171875, -1.90740966796875, -1.799713134765625, -1.6920166015625, -1.584320068359375, -1.47662353515625, -1.368927001953125, -1.26123046875, -1.153533935546875, -1.04583740234375, -0.938140869140625, -0.8304443359375, -0.722747802734375, -0.61505126953125, -0.507354736328125, -0.399658203125, -0.291961669921875, -0.18426513671875, -0.076568603515625, 0.0311279296875, 0.138824462890625, 0.24652099609375, 0.354217529296875, 0.4619140625, 0.569610595703125, 0.67730712890625, 0.785003662109375, 0.8927001953125, 1.000396728515625, 1.10809326171875, 1.215789794921875, 1.323486328125, 1.431182861328125, 1.53887939453125, 1.646575927734375, 1.7542724609375, 1.861968994140625, 1.96966552734375, 2.077362060546875, 2.18505859375, 2.292755126953125, 2.40045166015625, 2.508148193359375, 2.6158447265625, 2.723541259765625, 2.83123779296875, 2.938934326171875, 3.046630859375, 3.154327392578125, 3.26202392578125, 3.369720458984375, 3.4774169921875, 3.585113525390625, 3.69281005859375, 3.800506591796875, 3.908203125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 7.0, 9.0, 9.0, 13.0, 19.0, 26.0, 43.0, 79.0, 98.0, 146.0, 310.0, 548.0, 1250.0, 3198.0, 13485.0, 152667.0, 821291.0, 44401.0, 6945.0, 2156.0, 885.0, 377.0, 209.0, 116.0, 79.0, 54.0, 37.0, 28.0, 14.0, 10.0, 11.0, 8.0, 4.0, 4.0, 2.0, 2.0, 6.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.9140625, -14.3868408203125, -13.859619140625, -13.3323974609375, -12.80517578125, -12.2779541015625, -11.750732421875, -11.2235107421875, -10.6962890625, -10.1690673828125, -9.641845703125, -9.1146240234375, -8.58740234375, -8.0601806640625, -7.532958984375, -7.0057373046875, -6.478515625, -5.9512939453125, -5.424072265625, -4.8968505859375, -4.36962890625, -3.8424072265625, -3.315185546875, -2.7879638671875, -2.2607421875, -1.7335205078125, -1.206298828125, -0.6790771484375, -0.15185546875, 0.3753662109375, 0.902587890625, 1.4298095703125, 1.95703125, 2.4842529296875, 3.011474609375, 3.5386962890625, 4.06591796875, 4.5931396484375, 5.120361328125, 5.6475830078125, 6.1748046875, 6.7020263671875, 7.229248046875, 7.7564697265625, 8.28369140625, 8.8109130859375, 9.338134765625, 9.8653564453125, 10.392578125, 10.9197998046875, 11.447021484375, 11.9742431640625, 12.50146484375, 13.0286865234375, 13.555908203125, 14.0831298828125, 14.6103515625, 15.1375732421875, 15.664794921875, 16.1920166015625, 16.71923828125, 17.2464599609375, 17.773681640625, 18.3009033203125, 18.828125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 7.0, 11.0, 17.0, 16.0, 29.0, 36.0, 41.0, 38.0, 58.0, 65.0, 93.0, 90.0, 69.0, 73.0, 85.0, 54.0, 53.0, 37.0, 36.0, 15.0, 22.0, 21.0, 15.0, 4.0, 1.0, 7.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.40625, -20.791748046875, -20.17724609375, -19.562744140625, -18.9482421875, -18.333740234375, -17.71923828125, -17.104736328125, -16.490234375, -15.875732421875, -15.26123046875, -14.646728515625, -14.0322265625, -13.417724609375, -12.80322265625, -12.188720703125, -11.57421875, -10.959716796875, -10.34521484375, -9.730712890625, -9.1162109375, -8.501708984375, -7.88720703125, -7.272705078125, -6.658203125, -6.043701171875, -5.42919921875, -4.814697265625, -4.2001953125, -3.585693359375, -2.97119140625, -2.356689453125, -1.7421875, -1.127685546875, -0.51318359375, 0.101318359375, 0.7158203125, 1.330322265625, 1.94482421875, 2.559326171875, 3.173828125, 3.788330078125, 4.40283203125, 5.017333984375, 5.6318359375, 6.246337890625, 6.86083984375, 7.475341796875, 8.08984375, 8.704345703125, 9.31884765625, 9.933349609375, 10.5478515625, 11.162353515625, 11.77685546875, 12.391357421875, 13.005859375, 13.620361328125, 14.23486328125, 14.849365234375, 15.4638671875, 16.078369140625, 16.69287109375, 17.307373046875, 17.921875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 5.0, 5.0, 5.0, 4.0, 6.0, 13.0, 16.0, 18.0, 32.0, 32.0, 59.0, 94.0, 120.0, 217.0, 379.0, 774.0, 1902.0, 5705.0, 20679.0, 115909.0, 792219.0, 85356.0, 16937.0, 4818.0, 1610.0, 727.0, 350.0, 189.0, 90.0, 84.0, 49.0, 44.0, 29.0, 17.0, 19.0, 8.0, 11.0, 10.0, 9.0, 3.0, 1.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.8515625, -5.676513671875, -5.50146484375, -5.326416015625, -5.1513671875, -4.976318359375, -4.80126953125, -4.626220703125, -4.451171875, -4.276123046875, -4.10107421875, -3.926025390625, -3.7509765625, -3.575927734375, -3.40087890625, -3.225830078125, -3.05078125, -2.875732421875, -2.70068359375, -2.525634765625, -2.3505859375, -2.175537109375, -2.00048828125, -1.825439453125, -1.650390625, -1.475341796875, -1.30029296875, -1.125244140625, -0.9501953125, -0.775146484375, -0.60009765625, -0.425048828125, -0.25, -0.074951171875, 0.10009765625, 0.275146484375, 0.4501953125, 0.625244140625, 0.80029296875, 0.975341796875, 1.150390625, 1.325439453125, 1.50048828125, 1.675537109375, 1.8505859375, 2.025634765625, 2.20068359375, 2.375732421875, 2.55078125, 2.725830078125, 2.90087890625, 3.075927734375, 3.2509765625, 3.426025390625, 3.60107421875, 3.776123046875, 3.951171875, 4.126220703125, 4.30126953125, 4.476318359375, 4.6513671875, 4.826416015625, 5.00146484375, 5.176513671875, 5.3515625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 10.0, 7.0, 7.0, 9.0, 10.0, 8.0, 6.0, 28.0, 20.0, 32.0, 42.0, 78.0, 157.0, 245.0, 130.0, 61.0, 47.0, 32.0, 20.0, 18.0, 5.0, 11.0, 4.0, 3.0, 3.0, 2.0, 5.0, 1.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016689300537109375, -0.0016138255596160889, -0.0015587210655212402, -0.0015036165714263916, -0.001448512077331543, -0.0013934075832366943, -0.0013383030891418457, -0.001283198595046997, -0.0012280941009521484, -0.0011729896068572998, -0.0011178851127624512, -0.0010627806186676025, -0.001007676124572754, -0.0009525716304779053, -0.0008974671363830566, -0.000842362642288208, -0.0007872581481933594, -0.0007321536540985107, -0.0006770491600036621, -0.0006219446659088135, -0.0005668401718139648, -0.0005117356777191162, -0.0004566311836242676, -0.00040152668952941895, -0.0003464221954345703, -0.0002913177013397217, -0.00023621320724487305, -0.00018110871315002441, -0.00012600421905517578, -7.089972496032715e-05, -1.5795230865478516e-05, 3.930926322937012e-05, 9.441375732421875e-05, 0.00014951825141906738, 0.00020462274551391602, 0.00025972723960876465, 0.0003148317337036133, 0.0003699362277984619, 0.00042504072189331055, 0.0004801452159881592, 0.0005352497100830078, 0.0005903542041778564, 0.0006454586982727051, 0.0007005631923675537, 0.0007556676864624023, 0.000810772180557251, 0.0008658766746520996, 0.0009209811687469482, 0.0009760856628417969, 0.0010311901569366455, 0.0010862946510314941, 0.0011413991451263428, 0.0011965036392211914, 0.00125160813331604, 0.0013067126274108887, 0.0013618171215057373, 0.001416921615600586, 0.0014720261096954346, 0.0015271306037902832, 0.0015822350978851318, 0.0016373395919799805, 0.001692444086074829, 0.0017475485801696777, 0.0018026530742645264, 0.001857757568359375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 4.0, 9.0, 16.0, 19.0, 29.0, 59.0, 68.0, 142.0, 199.0, 365.0, 756.0, 1972.0, 6691.0, 28306.0, 196033.0, 735931.0, 59823.0, 12542.0, 3285.0, 1116.0, 518.0, 258.0, 150.0, 88.0, 63.0, 39.0, 21.0, 21.0, 7.0, 6.0, 5.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.08984375, -5.90087890625, -5.7119140625, -5.52294921875, -5.333984375, -5.14501953125, -4.9560546875, -4.76708984375, -4.578125, -4.38916015625, -4.2001953125, -4.01123046875, -3.822265625, -3.63330078125, -3.4443359375, -3.25537109375, -3.06640625, -2.87744140625, -2.6884765625, -2.49951171875, -2.310546875, -2.12158203125, -1.9326171875, -1.74365234375, -1.5546875, -1.36572265625, -1.1767578125, -0.98779296875, -0.798828125, -0.60986328125, -0.4208984375, -0.23193359375, -0.04296875, 0.14599609375, 0.3349609375, 0.52392578125, 0.712890625, 0.90185546875, 1.0908203125, 1.27978515625, 1.46875, 1.65771484375, 1.8466796875, 2.03564453125, 2.224609375, 2.41357421875, 2.6025390625, 2.79150390625, 2.98046875, 3.16943359375, 3.3583984375, 3.54736328125, 3.736328125, 3.92529296875, 4.1142578125, 4.30322265625, 4.4921875, 4.68115234375, 4.8701171875, 5.05908203125, 5.248046875, 5.43701171875, 5.6259765625, 5.81494140625, 6.00390625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 3.0, 3.0, 1.0, 5.0, 8.0, 9.0, 13.0, 16.0, 11.0, 12.0, 31.0, 27.0, 44.0, 51.0, 66.0, 126.0, 138.0, 114.0, 93.0, 62.0, 44.0, 23.0, 24.0, 12.0, 17.0, 10.0, 8.0, 8.0, 7.0, 3.0, 5.0, 3.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.51953125, -4.380615234375, -4.24169921875, -4.102783203125, -3.9638671875, -3.824951171875, -3.68603515625, -3.547119140625, -3.408203125, -3.269287109375, -3.13037109375, -2.991455078125, -2.8525390625, -2.713623046875, -2.57470703125, -2.435791015625, -2.296875, -2.157958984375, -2.01904296875, -1.880126953125, -1.7412109375, -1.602294921875, -1.46337890625, -1.324462890625, -1.185546875, -1.046630859375, -0.90771484375, -0.768798828125, -0.6298828125, -0.490966796875, -0.35205078125, -0.213134765625, -0.07421875, 0.064697265625, 0.20361328125, 0.342529296875, 0.4814453125, 0.620361328125, 0.75927734375, 0.898193359375, 1.037109375, 1.176025390625, 1.31494140625, 1.453857421875, 1.5927734375, 1.731689453125, 1.87060546875, 2.009521484375, 2.1484375, 2.287353515625, 2.42626953125, 2.565185546875, 2.7041015625, 2.843017578125, 2.98193359375, 3.120849609375, 3.259765625, 3.398681640625, 3.53759765625, 3.676513671875, 3.8154296875, 3.954345703125, 4.09326171875, 4.232177734375, 4.37109375]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 2.0, 1.0, 5.0, 5.0, 6.0, 14.0, 21.0, 53.0, 75.0, 153.0, 240.0, 189.0, 92.0, 63.0, 27.0, 14.0, 11.0, 8.0, 4.0, 1.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-85.1076889038086, -82.6568603515625, -80.20602416992188, -77.75519561767578, -75.30436706542969, -72.85353088378906, -70.40270233154297, -67.95187377929688, -65.50103759765625, -63.05020523071289, -60.59937286376953, -58.14854431152344, -55.69771194458008, -53.24687957763672, -50.796051025390625, -48.345218658447266, -45.894386291503906, -43.44355392456055, -40.99272155761719, -38.541893005371094, -36.091060638427734, -33.640228271484375, -31.18939781188965, -28.738567352294922, -26.287734985351562, -23.836902618408203, -21.386072158813477, -18.93524169921875, -16.48440933227539, -14.033577919006348, -11.582746505737305, -9.131916046142578, -6.6810760498046875, -4.2302446365356445, -1.7794132232666016, 0.6714181900024414, 3.1222496032714844, 5.573081016540527, 8.02391242980957, 10.474742889404297, 12.925575256347656, 15.3764066696167, 17.827238082885742, 20.27806854248047, 22.728900909423828, 25.179733276367188, 27.630563735961914, 30.08139419555664, 32.5322265625, 34.98305892944336, 37.43389129638672, 39.88471984863281, 42.33555221557617, 44.78638458251953, 47.237213134765625, 49.688045501708984, 52.138877868652344, 54.5897102355957, 57.04054260253906, 59.491371154785156, 61.942203521728516, 64.39303588867188, 66.84386444091797, 69.29469299316406, 71.74552917480469]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 9.0, 6.0, 6.0, 10.0, 5.0, 11.0, 11.0, 15.0, 14.0, 19.0, 23.0, 28.0, 28.0, 30.0, 42.0, 39.0, 49.0, 67.0, 65.0, 75.0, 62.0, 55.0, 42.0, 25.0, 42.0, 44.0, 33.0, 25.0, 16.0, 37.0, 10.0, 16.0, 5.0, 16.0, 5.0, 6.0, 4.0, 1.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-61.93077087402344, -60.2968864440918, -58.663002014160156, -57.029117584228516, -55.395233154296875, -53.761348724365234, -52.127464294433594, -50.49357986450195, -48.85969543457031, -47.22581100463867, -45.59192657470703, -43.95804214477539, -42.32415771484375, -40.69027328491211, -39.05638885498047, -37.42250442504883, -35.78861999511719, -34.15473556518555, -32.520851135253906, -30.886966705322266, -29.253082275390625, -27.619197845458984, -25.985313415527344, -24.351428985595703, -22.717544555664062, -21.083660125732422, -19.44977569580078, -17.81589126586914, -16.1820068359375, -14.54812240600586, -12.914237976074219, -11.280353546142578, -9.646469116210938, -8.012584686279297, -6.378700256347656, -4.744815826416016, -3.110931396484375, -1.4770469665527344, 0.15683746337890625, 1.7907218933105469, 3.4246063232421875, 5.058490753173828, 6.692375183105469, 8.32625961303711, 9.96014404296875, 11.59402847290039, 13.227912902832031, 14.861797332763672, 16.495681762695312, 18.129566192626953, 19.763450622558594, 21.397335052490234, 23.031219482421875, 24.665103912353516, 26.298988342285156, 27.932872772216797, 29.566757202148438, 31.200641632080078, 32.83452606201172, 34.46841049194336, 36.102294921875, 37.73617935180664, 39.37006378173828, 41.00394821166992, 42.63783264160156]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 6.0, 2.0, 4.0, 7.0, 12.0, 14.0, 33.0, 68.0, 150.0, 360.0, 1368.0, 7222.0, 223484.0, 3920355.0, 35792.0, 3850.0, 1040.0, 312.0, 103.0, 47.0, 26.0, 16.0, 3.0, 3.0, 6.0], "bins": [-24.296875, -23.83233642578125, -23.3677978515625, -22.90325927734375, -22.438720703125, -21.97418212890625, -21.5096435546875, -21.04510498046875, -20.58056640625, -20.11602783203125, -19.6514892578125, -19.18695068359375, -18.722412109375, -18.25787353515625, -17.7933349609375, -17.32879638671875, -16.8642578125, -16.39971923828125, -15.9351806640625, -15.47064208984375, -15.006103515625, -14.54156494140625, -14.0770263671875, -13.61248779296875, -13.14794921875, -12.68341064453125, -12.2188720703125, -11.75433349609375, -11.289794921875, -10.82525634765625, -10.3607177734375, -9.89617919921875, -9.431640625, -8.96710205078125, -8.5025634765625, -8.03802490234375, -7.573486328125, -7.10894775390625, -6.6444091796875, -6.17987060546875, -5.71533203125, -5.25079345703125, -4.7862548828125, -4.32171630859375, -3.857177734375, -3.39263916015625, -2.9281005859375, -2.46356201171875, -1.9990234375, -1.53448486328125, -1.0699462890625, -0.60540771484375, -0.140869140625, 0.32366943359375, 0.7882080078125, 1.25274658203125, 1.71728515625, 2.18182373046875, 2.6463623046875, 3.11090087890625, 3.575439453125, 4.03997802734375, 4.5045166015625, 4.96905517578125, 5.43359375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 6.0, 3.0, 11.0, 14.0, 15.0, 30.0, 37.0, 52.0, 66.0, 77.0, 79.0, 100.0, 86.0, 81.0, 81.0, 72.0, 59.0, 45.0, 40.0, 15.0, 13.0, 11.0, 9.0, 6.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.55078125, -7.38330078125, -7.2158203125, -7.04833984375, -6.880859375, -6.71337890625, -6.5458984375, -6.37841796875, -6.2109375, -6.04345703125, -5.8759765625, -5.70849609375, -5.541015625, -5.37353515625, -5.2060546875, -5.03857421875, -4.87109375, -4.70361328125, -4.5361328125, -4.36865234375, -4.201171875, -4.03369140625, -3.8662109375, -3.69873046875, -3.53125, -3.36376953125, -3.1962890625, -3.02880859375, -2.861328125, -2.69384765625, -2.5263671875, -2.35888671875, -2.19140625, -2.02392578125, -1.8564453125, -1.68896484375, -1.521484375, -1.35400390625, -1.1865234375, -1.01904296875, -0.8515625, -0.68408203125, -0.5166015625, -0.34912109375, -0.181640625, -0.01416015625, 0.1533203125, 0.32080078125, 0.48828125, 0.65576171875, 0.8232421875, 0.99072265625, 1.158203125, 1.32568359375, 1.4931640625, 1.66064453125, 1.828125, 1.99560546875, 2.1630859375, 2.33056640625, 2.498046875, 2.66552734375, 2.8330078125, 3.00048828125, 3.16796875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 11.0, 13.0, 20.0, 29.0, 38.0, 100.0, 164.0, 322.0, 694.0, 2006.0, 8843.0, 230732.0, 3915381.0, 30461.0, 3533.0, 1088.0, 432.0, 215.0, 82.0, 55.0, 27.0, 9.0, 10.0, 7.0, 7.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.65625, -18.095458984375, -17.53466796875, -16.973876953125, -16.4130859375, -15.852294921875, -15.29150390625, -14.730712890625, -14.169921875, -13.609130859375, -13.04833984375, -12.487548828125, -11.9267578125, -11.365966796875, -10.80517578125, -10.244384765625, -9.68359375, -9.122802734375, -8.56201171875, -8.001220703125, -7.4404296875, -6.879638671875, -6.31884765625, -5.758056640625, -5.197265625, -4.636474609375, -4.07568359375, -3.514892578125, -2.9541015625, -2.393310546875, -1.83251953125, -1.271728515625, -0.7109375, -0.150146484375, 0.41064453125, 0.971435546875, 1.5322265625, 2.093017578125, 2.65380859375, 3.214599609375, 3.775390625, 4.336181640625, 4.89697265625, 5.457763671875, 6.0185546875, 6.579345703125, 7.14013671875, 7.700927734375, 8.26171875, 8.822509765625, 9.38330078125, 9.944091796875, 10.5048828125, 11.065673828125, 11.62646484375, 12.187255859375, 12.748046875, 13.308837890625, 13.86962890625, 14.430419921875, 14.9912109375, 15.552001953125, 16.11279296875, 16.673583984375, 17.234375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 8.0, 11.0, 14.0, 19.0, 29.0, 49.0, 87.0, 180.0, 408.0, 953.0, 1154.0, 653.0, 260.0, 107.0, 55.0, 35.0, 17.0, 11.0, 10.0, 9.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 1.0], "bins": [-14.4765625, -14.1563720703125, -13.836181640625, -13.5159912109375, -13.19580078125, -12.8756103515625, -12.555419921875, -12.2352294921875, -11.9150390625, -11.5948486328125, -11.274658203125, -10.9544677734375, -10.63427734375, -10.3140869140625, -9.993896484375, -9.6737060546875, -9.353515625, -9.0333251953125, -8.713134765625, -8.3929443359375, -8.07275390625, -7.7525634765625, -7.432373046875, -7.1121826171875, -6.7919921875, -6.4718017578125, -6.151611328125, -5.8314208984375, -5.51123046875, -5.1910400390625, -4.870849609375, -4.5506591796875, -4.23046875, -3.9102783203125, -3.590087890625, -3.2698974609375, -2.94970703125, -2.6295166015625, -2.309326171875, -1.9891357421875, -1.6689453125, -1.3487548828125, -1.028564453125, -0.7083740234375, -0.38818359375, -0.0679931640625, 0.252197265625, 0.5723876953125, 0.892578125, 1.2127685546875, 1.532958984375, 1.8531494140625, 2.17333984375, 2.4935302734375, 2.813720703125, 3.1339111328125, 3.4541015625, 3.7742919921875, 4.094482421875, 4.4146728515625, 4.73486328125, 5.0550537109375, 5.375244140625, 5.6954345703125, 6.015625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 5.0, 1.0, 1.0, 5.0, 5.0, 6.0, 24.0, 52.0, 142.0, 279.0, 287.0, 130.0, 43.0, 12.0, 8.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-188.53944396972656, -184.6129150390625, -180.68638610839844, -176.7598419189453, -172.83331298828125, -168.9067840576172, -164.98025512695312, -161.05372619628906, -157.127197265625, -153.20066833496094, -149.27413940429688, -145.34759521484375, -141.4210662841797, -137.49453735351562, -133.56800842285156, -129.6414794921875, -125.71493530273438, -121.78840637207031, -117.86186981201172, -113.93534088134766, -110.00880432128906, -106.082275390625, -102.15574645996094, -98.22921752929688, -94.30268096923828, -90.37615203857422, -86.44961547851562, -82.52308654785156, -78.5965576171875, -74.6700210571289, -70.74349212646484, -66.81695556640625, -62.89042663574219, -58.96389389038086, -55.03736114501953, -51.11083221435547, -47.18429946899414, -43.25776672363281, -39.33123779296875, -35.40470504760742, -31.478172302246094, -27.551639556884766, -23.62510871887207, -19.698577880859375, -15.772045135498047, -11.845512390136719, -7.918981552124023, -3.992450714111328, -0.06591796875, 3.8606138229370117, 7.787145614624023, 11.713677406311035, 15.640209197998047, 19.566741943359375, 23.49327278137207, 27.419803619384766, 31.346336364746094, 35.27286911010742, 39.19940185546875, 43.12593078613281, 47.05246353149414, 50.97899627685547, 54.90552520751953, 58.83205795288086, 62.75859069824219]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 2.0, 4.0, 8.0, 4.0, 8.0, 17.0, 17.0, 48.0, 44.0, 44.0, 73.0, 108.0, 88.0, 97.0, 96.0, 98.0, 79.0, 53.0, 39.0, 30.0, 23.0, 15.0, 7.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.262285232543945, -27.4180908203125, -25.573894500732422, -23.729698181152344, -21.8855037689209, -20.041309356689453, -18.197113037109375, -16.352916717529297, -14.508722305297852, -12.66452693939209, -10.820331573486328, -8.976136207580566, -7.131940841674805, -5.287745475769043, -3.4435501098632812, -1.5993547439575195, 0.2448406219482422, 2.089035987854004, 3.9332313537597656, 5.777426719665527, 7.621622085571289, 9.46581745147705, 11.310012817382812, 13.154208183288574, 14.998403549194336, 16.84259796142578, 18.68679428100586, 20.530990600585938, 22.375185012817383, 24.219379425048828, 26.063575744628906, 27.907772064208984, 29.751968383789062, 31.59616470336914, 33.44036102294922, 35.28455352783203, 37.12874984741211, 38.97294616699219, 40.817138671875, 42.66133499145508, 44.505531311035156, 46.349727630615234, 48.19392395019531, 50.038116455078125, 51.8823127746582, 53.72650909423828, 55.570701599121094, 57.41489791870117, 59.25909423828125, 61.10329055786133, 62.947486877441406, 64.79167938232422, 66.63587951660156, 68.48007202148438, 70.32426452636719, 72.16846466064453, 74.01265716552734, 75.85684967041016, 77.7010498046875, 79.54524230957031, 81.38943481445312, 83.23363494873047, 85.07782745361328, 86.92202758789062, 88.76622009277344]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 1.0, 4.0, 6.0, 7.0, 11.0, 13.0, 19.0, 26.0, 30.0, 49.0, 71.0, 118.0, 207.0, 331.0, 772.0, 1797.0, 4813.0, 15916.0, 63845.0, 315496.0, 486210.0, 119692.0, 26452.0, 7669.0, 2636.0, 1108.0, 498.0, 287.0, 151.0, 93.0, 64.0, 44.0, 33.0, 33.0, 13.0, 13.0, 4.0, 4.0, 3.0, 4.0, 5.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.23046875, -6.03076171875, -5.8310546875, -5.63134765625, -5.431640625, -5.23193359375, -5.0322265625, -4.83251953125, -4.6328125, -4.43310546875, -4.2333984375, -4.03369140625, -3.833984375, -3.63427734375, -3.4345703125, -3.23486328125, -3.03515625, -2.83544921875, -2.6357421875, -2.43603515625, -2.236328125, -2.03662109375, -1.8369140625, -1.63720703125, -1.4375, -1.23779296875, -1.0380859375, -0.83837890625, -0.638671875, -0.43896484375, -0.2392578125, -0.03955078125, 0.16015625, 0.35986328125, 0.5595703125, 0.75927734375, 0.958984375, 1.15869140625, 1.3583984375, 1.55810546875, 1.7578125, 1.95751953125, 2.1572265625, 2.35693359375, 2.556640625, 2.75634765625, 2.9560546875, 3.15576171875, 3.35546875, 3.55517578125, 3.7548828125, 3.95458984375, 4.154296875, 4.35400390625, 4.5537109375, 4.75341796875, 4.953125, 5.15283203125, 5.3525390625, 5.55224609375, 5.751953125, 5.95166015625, 6.1513671875, 6.35107421875, 6.55078125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 6.0, 8.0, 12.0, 17.0, 18.0, 31.0, 44.0, 61.0, 51.0, 85.0, 78.0, 88.0, 88.0, 79.0, 74.0, 61.0, 58.0, 38.0, 28.0, 27.0, 18.0, 13.0, 9.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8515625, -4.6949462890625, -4.538330078125, -4.3817138671875, -4.22509765625, -4.0684814453125, -3.911865234375, -3.7552490234375, -3.5986328125, -3.4420166015625, -3.285400390625, -3.1287841796875, -2.97216796875, -2.8155517578125, -2.658935546875, -2.5023193359375, -2.345703125, -2.1890869140625, -2.032470703125, -1.8758544921875, -1.71923828125, -1.5626220703125, -1.406005859375, -1.2493896484375, -1.0927734375, -0.9361572265625, -0.779541015625, -0.6229248046875, -0.46630859375, -0.3096923828125, -0.153076171875, 0.0035400390625, 0.16015625, 0.3167724609375, 0.473388671875, 0.6300048828125, 0.78662109375, 0.9432373046875, 1.099853515625, 1.2564697265625, 1.4130859375, 1.5697021484375, 1.726318359375, 1.8829345703125, 2.03955078125, 2.1961669921875, 2.352783203125, 2.5093994140625, 2.666015625, 2.8226318359375, 2.979248046875, 3.1358642578125, 3.29248046875, 3.4490966796875, 3.605712890625, 3.7623291015625, 3.9189453125, 4.0755615234375, 4.232177734375, 4.3887939453125, 4.54541015625, 4.7020263671875, 4.858642578125, 5.0152587890625, 5.171875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 5.0, 8.0, 9.0, 9.0, 16.0, 33.0, 48.0, 68.0, 141.0, 330.0, 914.0, 3236.0, 17225.0, 172693.0, 763627.0, 77335.0, 9699.0, 2043.0, 599.0, 225.0, 123.0, 70.0, 34.0, 28.0, 12.0, 12.0, 1.0, 7.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.859375, -9.534423828125, -9.20947265625, -8.884521484375, -8.5595703125, -8.234619140625, -7.90966796875, -7.584716796875, -7.259765625, -6.934814453125, -6.60986328125, -6.284912109375, -5.9599609375, -5.635009765625, -5.31005859375, -4.985107421875, -4.66015625, -4.335205078125, -4.01025390625, -3.685302734375, -3.3603515625, -3.035400390625, -2.71044921875, -2.385498046875, -2.060546875, -1.735595703125, -1.41064453125, -1.085693359375, -0.7607421875, -0.435791015625, -0.11083984375, 0.214111328125, 0.5390625, 0.864013671875, 1.18896484375, 1.513916015625, 1.8388671875, 2.163818359375, 2.48876953125, 2.813720703125, 3.138671875, 3.463623046875, 3.78857421875, 4.113525390625, 4.4384765625, 4.763427734375, 5.08837890625, 5.413330078125, 5.73828125, 6.063232421875, 6.38818359375, 6.713134765625, 7.0380859375, 7.363037109375, 7.68798828125, 8.012939453125, 8.337890625, 8.662841796875, 8.98779296875, 9.312744140625, 9.6376953125, 9.962646484375, 10.28759765625, 10.612548828125, 10.9375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 4.0, 4.0, 6.0, 7.0, 14.0, 15.0, 15.0, 28.0, 38.0, 34.0, 30.0, 33.0, 29.0, 49.0, 52.0, 54.0, 59.0, 70.0, 48.0, 42.0, 45.0, 38.0, 45.0, 29.0, 36.0, 28.0, 24.0, 20.0, 22.0, 13.0, 11.0, 10.0, 13.0, 7.0, 7.0, 7.0, 8.0, 4.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.390625, -11.0426025390625, -10.694580078125, -10.3465576171875, -9.99853515625, -9.6505126953125, -9.302490234375, -8.9544677734375, -8.6064453125, -8.2584228515625, -7.910400390625, -7.5623779296875, -7.21435546875, -6.8663330078125, -6.518310546875, -6.1702880859375, -5.822265625, -5.4742431640625, -5.126220703125, -4.7781982421875, -4.43017578125, -4.0821533203125, -3.734130859375, -3.3861083984375, -3.0380859375, -2.6900634765625, -2.342041015625, -1.9940185546875, -1.64599609375, -1.2979736328125, -0.949951171875, -0.6019287109375, -0.25390625, 0.0941162109375, 0.442138671875, 0.7901611328125, 1.13818359375, 1.4862060546875, 1.834228515625, 2.1822509765625, 2.5302734375, 2.8782958984375, 3.226318359375, 3.5743408203125, 3.92236328125, 4.2703857421875, 4.618408203125, 4.9664306640625, 5.314453125, 5.6624755859375, 6.010498046875, 6.3585205078125, 6.70654296875, 7.0545654296875, 7.402587890625, 7.7506103515625, 8.0986328125, 8.4466552734375, 8.794677734375, 9.1427001953125, 9.49072265625, 9.8387451171875, 10.186767578125, 10.5347900390625, 10.8828125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 6.0, 12.0, 7.0, 18.0, 24.0, 56.0, 97.0, 207.0, 422.0, 990.0, 2683.0, 8531.0, 36822.0, 274568.0, 641400.0, 64196.0, 12446.0, 3683.0, 1281.0, 575.0, 255.0, 137.0, 66.0, 34.0, 22.0, 10.0, 4.0, 7.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.36328125, -3.2586669921875, -3.154052734375, -3.0494384765625, -2.94482421875, -2.8402099609375, -2.735595703125, -2.6309814453125, -2.5263671875, -2.4217529296875, -2.317138671875, -2.2125244140625, -2.10791015625, -2.0032958984375, -1.898681640625, -1.7940673828125, -1.689453125, -1.5848388671875, -1.480224609375, -1.3756103515625, -1.27099609375, -1.1663818359375, -1.061767578125, -0.9571533203125, -0.8525390625, -0.7479248046875, -0.643310546875, -0.5386962890625, -0.43408203125, -0.3294677734375, -0.224853515625, -0.1202392578125, -0.015625, 0.0889892578125, 0.193603515625, 0.2982177734375, 0.40283203125, 0.5074462890625, 0.612060546875, 0.7166748046875, 0.8212890625, 0.9259033203125, 1.030517578125, 1.1351318359375, 1.23974609375, 1.3443603515625, 1.448974609375, 1.5535888671875, 1.658203125, 1.7628173828125, 1.867431640625, 1.9720458984375, 2.07666015625, 2.1812744140625, 2.285888671875, 2.3905029296875, 2.4951171875, 2.5997314453125, 2.704345703125, 2.8089599609375, 2.91357421875, 3.0181884765625, 3.122802734375, 3.2274169921875, 3.33203125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 5.0, 5.0, 5.0, 19.0, 11.0, 27.0, 42.0, 78.0, 114.0, 139.0, 152.0, 127.0, 79.0, 65.0, 43.0, 28.0, 16.0, 9.0, 14.0, 6.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0009713172912597656, -0.000942133367061615, -0.0009129494428634644, -0.0008837655186653137, -0.0008545815944671631, -0.0008253976702690125, -0.0007962137460708618, -0.0007670298218727112, -0.0007378458976745605, -0.0007086619734764099, -0.0006794780492782593, -0.0006502941250801086, -0.000621110200881958, -0.0005919262766838074, -0.0005627423524856567, -0.0005335584282875061, -0.0005043745040893555, -0.00047519057989120483, -0.0004460066556930542, -0.00041682273149490356, -0.00038763880729675293, -0.0003584548830986023, -0.00032927095890045166, -0.000300087034702301, -0.0002709031105041504, -0.00024171918630599976, -0.00021253526210784912, -0.00018335133790969849, -0.00015416741371154785, -0.00012498348951339722, -9.579956531524658e-05, -6.661564111709595e-05, -3.743171691894531e-05, -8.247792720794678e-06, 2.0936131477355957e-05, 5.012005567550659e-05, 7.930397987365723e-05, 0.00010848790407180786, 0.0001376718282699585, 0.00016685575246810913, 0.00019603967666625977, 0.0002252236008644104, 0.00025440752506256104, 0.00028359144926071167, 0.0003127753734588623, 0.00034195929765701294, 0.0003711432218551636, 0.0004003271460533142, 0.00042951107025146484, 0.0004586949944496155, 0.0004878789186477661, 0.0005170628428459167, 0.0005462467670440674, 0.000575430691242218, 0.0006046146154403687, 0.0006337985396385193, 0.0006629824638366699, 0.0006921663880348206, 0.0007213503122329712, 0.0007505342364311218, 0.0007797181606292725, 0.0008089020848274231, 0.0008380860090255737, 0.0008672699332237244, 0.000896453857421875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 7.0, 5.0, 13.0, 19.0, 28.0, 39.0, 60.0, 124.0, 270.0, 664.0, 1878.0, 5734.0, 20534.0, 105494.0, 689648.0, 180987.0, 30974.0, 7993.0, 2533.0, 850.0, 346.0, 162.0, 68.0, 55.0, 27.0, 16.0, 6.0, 10.0, 8.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.55078125, -2.44287109375, -2.3349609375, -2.22705078125, -2.119140625, -2.01123046875, -1.9033203125, -1.79541015625, -1.6875, -1.57958984375, -1.4716796875, -1.36376953125, -1.255859375, -1.14794921875, -1.0400390625, -0.93212890625, -0.82421875, -0.71630859375, -0.6083984375, -0.50048828125, -0.392578125, -0.28466796875, -0.1767578125, -0.06884765625, 0.0390625, 0.14697265625, 0.2548828125, 0.36279296875, 0.470703125, 0.57861328125, 0.6865234375, 0.79443359375, 0.90234375, 1.01025390625, 1.1181640625, 1.22607421875, 1.333984375, 1.44189453125, 1.5498046875, 1.65771484375, 1.765625, 1.87353515625, 1.9814453125, 2.08935546875, 2.197265625, 2.30517578125, 2.4130859375, 2.52099609375, 2.62890625, 2.73681640625, 2.8447265625, 2.95263671875, 3.060546875, 3.16845703125, 3.2763671875, 3.38427734375, 3.4921875, 3.60009765625, 3.7080078125, 3.81591796875, 3.923828125, 4.03173828125, 4.1396484375, 4.24755859375, 4.35546875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 5.0, 7.0, 6.0, 5.0, 8.0, 9.0, 9.0, 7.0, 18.0, 21.0, 27.0, 38.0, 44.0, 56.0, 97.0, 88.0, 106.0, 96.0, 78.0, 66.0, 58.0, 37.0, 25.0, 23.0, 17.0, 10.0, 9.0, 9.0, 7.0, 5.0, 7.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.75, -2.668365478515625, -2.58673095703125, -2.505096435546875, -2.4234619140625, -2.341827392578125, -2.26019287109375, -2.178558349609375, -2.096923828125, -2.015289306640625, -1.93365478515625, -1.852020263671875, -1.7703857421875, -1.688751220703125, -1.60711669921875, -1.525482177734375, -1.44384765625, -1.362213134765625, -1.28057861328125, -1.198944091796875, -1.1173095703125, -1.035675048828125, -0.95404052734375, -0.872406005859375, -0.790771484375, -0.709136962890625, -0.62750244140625, -0.545867919921875, -0.4642333984375, -0.382598876953125, -0.30096435546875, -0.219329833984375, -0.1376953125, -0.056060791015625, 0.02557373046875, 0.107208251953125, 0.1888427734375, 0.270477294921875, 0.35211181640625, 0.433746337890625, 0.515380859375, 0.597015380859375, 0.67864990234375, 0.760284423828125, 0.8419189453125, 0.923553466796875, 1.00518798828125, 1.086822509765625, 1.16845703125, 1.250091552734375, 1.33172607421875, 1.413360595703125, 1.4949951171875, 1.576629638671875, 1.65826416015625, 1.739898681640625, 1.821533203125, 1.903167724609375, 1.98480224609375, 2.066436767578125, 2.1480712890625, 2.229705810546875, 2.31134033203125, 2.392974853515625, 2.474609375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 8.0, 8.0, 17.0, 81.0, 209.0, 412.0, 164.0, 60.0, 24.0, 14.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-107.77953338623047, -104.3449478149414, -100.91035461425781, -97.47576904296875, -94.04118347167969, -90.6065902709961, -87.17200469970703, -83.73741149902344, -80.30282592773438, -76.86824035644531, -73.43364715576172, -69.99906158447266, -66.56446838378906, -63.1298828125, -59.69529724121094, -56.26070785522461, -52.82611846923828, -49.39152908325195, -45.956939697265625, -42.52235412597656, -39.087764739990234, -35.653175354003906, -32.218589782714844, -28.784000396728516, -25.349411010742188, -21.91482162475586, -18.480234146118164, -15.045645713806152, -11.61105728149414, -8.176467895507812, -4.741880416870117, -1.3072929382324219, 2.1273040771484375, 5.561892509460449, 8.996480941772461, 12.431069374084473, 15.865657806396484, 19.300247192382812, 22.734834671020508, 26.169422149658203, 29.60401153564453, 33.03860092163086, 36.47319030761719, 39.90777587890625, 43.34236526489258, 46.776954650878906, 50.21154022216797, 53.6461296081543, 57.080718994140625, 60.51530838012695, 63.94989776611328, 67.38448333740234, 70.81907653808594, 74.253662109375, 77.68824768066406, 81.12283325195312, 84.55742645263672, 87.99201202392578, 91.42660522460938, 94.86119079589844, 98.2957763671875, 101.7303695678711, 105.16495513916016, 108.59954833984375, 112.03413391113281]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 4.0, 3.0, 4.0, 5.0, 4.0, 12.0, 10.0, 11.0, 16.0, 10.0, 17.0, 27.0, 25.0, 37.0, 40.0, 41.0, 45.0, 63.0, 84.0, 92.0, 76.0, 52.0, 42.0, 49.0, 32.0, 23.0, 23.0, 22.0, 30.0, 24.0, 15.0, 10.0, 16.0, 10.0, 13.0, 6.0, 2.0, 2.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.996734619140625, -39.50214385986328, -38.00755310058594, -36.512962341308594, -35.01837158203125, -33.52377700805664, -32.0291862487793, -30.534595489501953, -29.04000473022461, -27.545413970947266, -26.050823211669922, -24.556230545043945, -23.0616397857666, -21.567049026489258, -20.07245635986328, -18.577865600585938, -17.083274841308594, -15.58868408203125, -14.09409236907959, -12.59950065612793, -11.104909896850586, -9.610319137573242, -8.115727424621582, -6.621135711669922, -5.126544952392578, -3.631953716278076, -2.137362480163574, -0.6427712440490723, 0.8518199920654297, 2.3464112281799316, 3.8410024642944336, 5.335594177246094, 6.830181121826172, 8.324771881103516, 9.819363594055176, 11.313955307006836, 12.80854606628418, 14.303136825561523, 15.797728538513184, 17.292320251464844, 18.786911010742188, 20.28150177001953, 21.776092529296875, 23.27068519592285, 24.765275955200195, 26.25986671447754, 27.754459381103516, 29.24905014038086, 30.743640899658203, 32.23823165893555, 33.73282241821289, 35.227413177490234, 36.722007751464844, 38.21659851074219, 39.71118927001953, 41.205780029296875, 42.70037078857422, 44.19496154785156, 45.689552307128906, 47.18414306640625, 48.678733825683594, 50.1733283996582, 51.66791915893555, 53.16250991821289, 54.657100677490234]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 8.0, 6.0, 4.0, 8.0, 11.0, 14.0, 44.0, 93.0, 248.0, 742.0, 3134.0, 33449.0, 3973090.0, 174925.0, 6303.0, 1517.0, 470.0, 145.0, 45.0, 12.0, 5.0, 2.0, 7.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.84375, -17.3939208984375, -16.944091796875, -16.4942626953125, -16.04443359375, -15.5946044921875, -15.144775390625, -14.6949462890625, -14.2451171875, -13.7952880859375, -13.345458984375, -12.8956298828125, -12.44580078125, -11.9959716796875, -11.546142578125, -11.0963134765625, -10.646484375, -10.1966552734375, -9.746826171875, -9.2969970703125, -8.84716796875, -8.3973388671875, -7.947509765625, -7.4976806640625, -7.0478515625, -6.5980224609375, -6.148193359375, -5.6983642578125, -5.24853515625, -4.7987060546875, -4.348876953125, -3.8990478515625, -3.44921875, -2.9993896484375, -2.549560546875, -2.0997314453125, -1.64990234375, -1.2000732421875, -0.750244140625, -0.3004150390625, 0.1494140625, 0.5992431640625, 1.049072265625, 1.4989013671875, 1.94873046875, 2.3985595703125, 2.848388671875, 3.2982177734375, 3.748046875, 4.1978759765625, 4.647705078125, 5.0975341796875, 5.54736328125, 5.9971923828125, 6.447021484375, 6.8968505859375, 7.3466796875, 7.7965087890625, 8.246337890625, 8.6961669921875, 9.14599609375, 9.5958251953125, 10.045654296875, 10.4954833984375, 10.9453125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 10.0, 11.0, 24.0, 37.0, 51.0, 49.0, 83.0, 80.0, 83.0, 95.0, 100.0, 107.0, 79.0, 60.0, 60.0, 30.0, 18.0, 12.0, 7.0, 3.0, 7.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.5390625, -8.351776123046875, -8.16448974609375, -7.977203369140625, -7.7899169921875, -7.602630615234375, -7.41534423828125, -7.228057861328125, -7.040771484375, -6.853485107421875, -6.66619873046875, -6.478912353515625, -6.2916259765625, -6.104339599609375, -5.91705322265625, -5.729766845703125, -5.54248046875, -5.355194091796875, -5.16790771484375, -4.980621337890625, -4.7933349609375, -4.606048583984375, -4.41876220703125, -4.231475830078125, -4.044189453125, -3.856903076171875, -3.66961669921875, -3.482330322265625, -3.2950439453125, -3.107757568359375, -2.92047119140625, -2.733184814453125, -2.5458984375, -2.358612060546875, -2.17132568359375, -1.984039306640625, -1.7967529296875, -1.609466552734375, -1.42218017578125, -1.234893798828125, -1.047607421875, -0.860321044921875, -0.67303466796875, -0.485748291015625, -0.2984619140625, -0.111175537109375, 0.07611083984375, 0.263397216796875, 0.45068359375, 0.637969970703125, 0.82525634765625, 1.012542724609375, 1.1998291015625, 1.387115478515625, 1.57440185546875, 1.761688232421875, 1.948974609375, 2.136260986328125, 2.32354736328125, 2.510833740234375, 2.6981201171875, 2.885406494140625, 3.07269287109375, 3.259979248046875, 3.447265625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 8.0, 7.0, 14.0, 14.0, 18.0, 45.0, 65.0, 75.0, 171.0, 446.0, 1931.0, 20443.0, 3781665.0, 380512.0, 7264.0, 981.0, 301.0, 124.0, 76.0, 45.0, 26.0, 18.0, 11.0, 11.0, 7.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.1875, -18.6517333984375, -18.115966796875, -17.5802001953125, -17.04443359375, -16.5086669921875, -15.972900390625, -15.4371337890625, -14.9013671875, -14.3656005859375, -13.829833984375, -13.2940673828125, -12.75830078125, -12.2225341796875, -11.686767578125, -11.1510009765625, -10.615234375, -10.0794677734375, -9.543701171875, -9.0079345703125, -8.47216796875, -7.9364013671875, -7.400634765625, -6.8648681640625, -6.3291015625, -5.7933349609375, -5.257568359375, -4.7218017578125, -4.18603515625, -3.6502685546875, -3.114501953125, -2.5787353515625, -2.04296875, -1.5072021484375, -0.971435546875, -0.4356689453125, 0.10009765625, 0.6358642578125, 1.171630859375, 1.7073974609375, 2.2431640625, 2.7789306640625, 3.314697265625, 3.8504638671875, 4.38623046875, 4.9219970703125, 5.457763671875, 5.9935302734375, 6.529296875, 7.0650634765625, 7.600830078125, 8.1365966796875, 8.67236328125, 9.2081298828125, 9.743896484375, 10.2796630859375, 10.8154296875, 11.3511962890625, 11.886962890625, 12.4227294921875, 12.95849609375, 13.4942626953125, 14.030029296875, 14.5657958984375, 15.1015625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 6.0, 3.0, 6.0, 3.0, 8.0, 14.0, 16.0, 32.0, 49.0, 89.0, 181.0, 346.0, 768.0, 1055.0, 769.0, 342.0, 158.0, 84.0, 58.0, 33.0, 23.0, 12.0, 8.0, 7.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-11.28125, -11.02203369140625, -10.7628173828125, -10.50360107421875, -10.244384765625, -9.98516845703125, -9.7259521484375, -9.46673583984375, -9.20751953125, -8.94830322265625, -8.6890869140625, -8.42987060546875, -8.170654296875, -7.91143798828125, -7.6522216796875, -7.39300537109375, -7.1337890625, -6.87457275390625, -6.6153564453125, -6.35614013671875, -6.096923828125, -5.83770751953125, -5.5784912109375, -5.31927490234375, -5.06005859375, -4.80084228515625, -4.5416259765625, -4.28240966796875, -4.023193359375, -3.76397705078125, -3.5047607421875, -3.24554443359375, -2.986328125, -2.72711181640625, -2.4678955078125, -2.20867919921875, -1.949462890625, -1.69024658203125, -1.4310302734375, -1.17181396484375, -0.91259765625, -0.65338134765625, -0.3941650390625, -0.13494873046875, 0.124267578125, 0.38348388671875, 0.6427001953125, 0.90191650390625, 1.1611328125, 1.42034912109375, 1.6795654296875, 1.93878173828125, 2.197998046875, 2.45721435546875, 2.7164306640625, 2.97564697265625, 3.23486328125, 3.49407958984375, 3.7532958984375, 4.01251220703125, 4.271728515625, 4.53094482421875, 4.7901611328125, 5.04937744140625, 5.30859375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 10.0, 17.0, 35.0, 59.0, 101.0, 135.0, 172.0, 183.0, 126.0, 72.0, 34.0, 25.0, 16.0, 4.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.9763069152832, -62.090187072753906, -60.204063415527344, -58.31794357299805, -56.43182373046875, -54.54570007324219, -52.65958023071289, -50.773460388183594, -48.88733673095703, -47.001216888427734, -45.11509323120117, -43.228973388671875, -41.34285354614258, -39.45673370361328, -37.57061004638672, -35.68449020385742, -33.798370361328125, -31.912248611450195, -30.0261287689209, -28.14000701904297, -26.253887176513672, -24.367765426635742, -22.481643676757812, -20.595523834228516, -18.709402084350586, -16.823280334472656, -14.93716049194336, -13.05103874206543, -11.164917945861816, -9.278797149658203, -7.392675399780273, -5.50655460357666, -3.6204376220703125, -1.7343165874481201, 0.15180444717407227, 2.0379257202148438, 3.924046516418457, 5.81016731262207, 7.6962890625, 9.582409858703613, 11.468530654907227, 13.35465145111084, 15.240772247314453, 17.126893997192383, 19.013015747070312, 20.89913558959961, 22.78525733947754, 24.67137908935547, 26.557498931884766, 28.443620681762695, 30.329740524291992, 32.21586227416992, 34.10198211669922, 35.98810577392578, 37.87422561645508, 39.760345458984375, 41.64646911621094, 43.532588958740234, 45.4187126159668, 47.304832458496094, 49.19095230102539, 51.07707214355469, 52.96319580078125, 54.84931564331055, 56.735435485839844]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0, 4.0, 1.0, 2.0, 7.0, 8.0, 6.0, 13.0, 14.0, 17.0, 14.0, 16.0, 22.0, 26.0, 32.0, 39.0, 37.0, 31.0, 37.0, 44.0, 31.0, 34.0, 30.0, 48.0, 41.0, 39.0, 37.0, 49.0, 37.0, 37.0, 33.0, 36.0, 30.0, 14.0, 24.0, 19.0, 17.0, 16.0, 9.0, 10.0, 8.0, 12.0, 6.0, 9.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-21.838489532470703, -21.08622932434082, -20.333969116210938, -19.581708908081055, -18.829448699951172, -18.07718849182129, -17.324928283691406, -16.572669982910156, -15.820408821105957, -15.068148612976074, -14.315888404846191, -13.563629150390625, -12.811368942260742, -12.05910873413086, -11.306848526000977, -10.554588317871094, -9.802328109741211, -9.050067901611328, -8.297807693481445, -7.545547962188721, -6.793287754058838, -6.041027545928955, -5.2887678146362305, -4.536507606506348, -3.784247398376465, -3.031987190246582, -2.2797272205352783, -1.5274672508239746, -0.7752070426940918, -0.022946834564208984, 0.7293128967285156, 1.4815731048583984, 2.2338333129882812, 2.986093521118164, 3.7383534908294678, 4.4906134605407715, 5.242873668670654, 5.995133876800537, 6.747393608093262, 7.4996538162231445, 8.251914024353027, 9.00417423248291, 9.756434440612793, 10.50869369506836, 11.260953903198242, 12.013214111328125, 12.765474319458008, 13.51773452758789, 14.269994735717773, 15.022254943847656, 15.774515151977539, 16.526775360107422, 17.279035568237305, 18.031295776367188, 18.783554077148438, 19.535816192626953, 20.288074493408203, 21.040334701538086, 21.79259490966797, 22.54485511779785, 23.297115325927734, 24.049375534057617, 24.8016357421875, 25.55389404296875, 26.306156158447266]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 4.0, 10.0, 2.0, 8.0, 17.0, 33.0, 48.0, 74.0, 149.0, 266.0, 628.0, 1544.0, 4680.0, 20301.0, 125945.0, 676924.0, 182321.0, 26197.0, 6209.0, 1763.0, 701.0, 331.0, 157.0, 86.0, 54.0, 26.0, 19.0, 13.0, 15.0, 8.0, 4.0, 6.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-10.1015625, -9.78173828125, -9.4619140625, -9.14208984375, -8.822265625, -8.50244140625, -8.1826171875, -7.86279296875, -7.54296875, -7.22314453125, -6.9033203125, -6.58349609375, -6.263671875, -5.94384765625, -5.6240234375, -5.30419921875, -4.984375, -4.66455078125, -4.3447265625, -4.02490234375, -3.705078125, -3.38525390625, -3.0654296875, -2.74560546875, -2.42578125, -2.10595703125, -1.7861328125, -1.46630859375, -1.146484375, -0.82666015625, -0.5068359375, -0.18701171875, 0.1328125, 0.45263671875, 0.7724609375, 1.09228515625, 1.412109375, 1.73193359375, 2.0517578125, 2.37158203125, 2.69140625, 3.01123046875, 3.3310546875, 3.65087890625, 3.970703125, 4.29052734375, 4.6103515625, 4.93017578125, 5.25, 5.56982421875, 5.8896484375, 6.20947265625, 6.529296875, 6.84912109375, 7.1689453125, 7.48876953125, 7.80859375, 8.12841796875, 8.4482421875, 8.76806640625, 9.087890625, 9.40771484375, 9.7275390625, 10.04736328125, 10.3671875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 14.0, 11.0, 18.0, 32.0, 33.0, 46.0, 47.0, 72.0, 80.0, 79.0, 78.0, 84.0, 86.0, 68.0, 67.0, 51.0, 50.0, 37.0, 14.0, 9.0, 12.0, 9.0, 3.0, 2.0, 2.0, 1.0, 4.0, 1.0], "bins": [-7.85546875, -7.6873779296875, -7.519287109375, -7.3511962890625, -7.18310546875, -7.0150146484375, -6.846923828125, -6.6788330078125, -6.5107421875, -6.3426513671875, -6.174560546875, -6.0064697265625, -5.83837890625, -5.6702880859375, -5.502197265625, -5.3341064453125, -5.166015625, -4.9979248046875, -4.829833984375, -4.6617431640625, -4.49365234375, -4.3255615234375, -4.157470703125, -3.9893798828125, -3.8212890625, -3.6531982421875, -3.485107421875, -3.3170166015625, -3.14892578125, -2.9808349609375, -2.812744140625, -2.6446533203125, -2.4765625, -2.3084716796875, -2.140380859375, -1.9722900390625, -1.80419921875, -1.6361083984375, -1.468017578125, -1.2999267578125, -1.1318359375, -0.9637451171875, -0.795654296875, -0.6275634765625, -0.45947265625, -0.2913818359375, -0.123291015625, 0.0447998046875, 0.212890625, 0.3809814453125, 0.549072265625, 0.7171630859375, 0.88525390625, 1.0533447265625, 1.221435546875, 1.3895263671875, 1.5576171875, 1.7257080078125, 1.893798828125, 2.0618896484375, 2.22998046875, 2.3980712890625, 2.566162109375, 2.7342529296875, 2.90234375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 5.0, 3.0, 6.0, 8.0, 13.0, 13.0, 32.0, 37.0, 67.0, 105.0, 156.0, 285.0, 446.0, 872.0, 2182.0, 5722.0, 21613.0, 133080.0, 753310.0, 103656.0, 18134.0, 5094.0, 1796.0, 823.0, 407.0, 254.0, 145.0, 91.0, 56.0, 46.0, 27.0, 25.0, 10.0, 13.0, 8.0, 4.0, 3.0, 5.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.3984375, -10.11309814453125, -9.8277587890625, -9.54241943359375, -9.257080078125, -8.97174072265625, -8.6864013671875, -8.40106201171875, -8.11572265625, -7.83038330078125, -7.5450439453125, -7.25970458984375, -6.974365234375, -6.68902587890625, -6.4036865234375, -6.11834716796875, -5.8330078125, -5.54766845703125, -5.2623291015625, -4.97698974609375, -4.691650390625, -4.40631103515625, -4.1209716796875, -3.83563232421875, -3.55029296875, -3.26495361328125, -2.9796142578125, -2.69427490234375, -2.408935546875, -2.12359619140625, -1.8382568359375, -1.55291748046875, -1.267578125, -0.98223876953125, -0.6968994140625, -0.41156005859375, -0.126220703125, 0.15911865234375, 0.4444580078125, 0.72979736328125, 1.01513671875, 1.30047607421875, 1.5858154296875, 1.87115478515625, 2.156494140625, 2.44183349609375, 2.7271728515625, 3.01251220703125, 3.2978515625, 3.58319091796875, 3.8685302734375, 4.15386962890625, 4.439208984375, 4.72454833984375, 5.0098876953125, 5.29522705078125, 5.58056640625, 5.86590576171875, 6.1512451171875, 6.43658447265625, 6.721923828125, 7.00726318359375, 7.2926025390625, 7.57794189453125, 7.86328125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 5.0, 6.0, 7.0, 6.0, 6.0, 8.0, 17.0, 13.0, 26.0, 23.0, 27.0, 26.0, 38.0, 47.0, 59.0, 46.0, 54.0, 53.0, 61.0, 57.0, 56.0, 50.0, 56.0, 29.0, 34.0, 30.0, 32.0, 26.0, 19.0, 17.0, 20.0, 7.0, 12.0, 4.0, 8.0, 4.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.3203125, -12.9134521484375, -12.506591796875, -12.0997314453125, -11.69287109375, -11.2860107421875, -10.879150390625, -10.4722900390625, -10.0654296875, -9.6585693359375, -9.251708984375, -8.8448486328125, -8.43798828125, -8.0311279296875, -7.624267578125, -7.2174072265625, -6.810546875, -6.4036865234375, -5.996826171875, -5.5899658203125, -5.18310546875, -4.7762451171875, -4.369384765625, -3.9625244140625, -3.5556640625, -3.1488037109375, -2.741943359375, -2.3350830078125, -1.92822265625, -1.5213623046875, -1.114501953125, -0.7076416015625, -0.30078125, 0.1060791015625, 0.512939453125, 0.9197998046875, 1.32666015625, 1.7335205078125, 2.140380859375, 2.5472412109375, 2.9541015625, 3.3609619140625, 3.767822265625, 4.1746826171875, 4.58154296875, 4.9884033203125, 5.395263671875, 5.8021240234375, 6.208984375, 6.6158447265625, 7.022705078125, 7.4295654296875, 7.83642578125, 8.2432861328125, 8.650146484375, 9.0570068359375, 9.4638671875, 9.8707275390625, 10.277587890625, 10.6844482421875, 11.09130859375, 11.4981689453125, 11.905029296875, 12.3118896484375, 12.71875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 4.0, 4.0, 9.0, 11.0, 22.0, 19.0, 37.0, 46.0, 54.0, 85.0, 129.0, 169.0, 274.0, 403.0, 620.0, 940.0, 1504.0, 2581.0, 4431.0, 8701.0, 19601.0, 50909.0, 212055.0, 618381.0, 76221.0, 26287.0, 11399.0, 5614.0, 3159.0, 1719.0, 1079.0, 678.0, 436.0, 264.0, 220.0, 131.0, 119.0, 64.0, 56.0, 43.0, 16.0, 19.0, 13.0, 12.0, 8.0, 4.0, 5.0, 2.0, 6.0, 1.0, 0.0, 1.0], "bins": [-3.759765625, -3.652862548828125, -3.54595947265625, -3.439056396484375, -3.3321533203125, -3.225250244140625, -3.11834716796875, -3.011444091796875, -2.904541015625, -2.797637939453125, -2.69073486328125, -2.583831787109375, -2.4769287109375, -2.370025634765625, -2.26312255859375, -2.156219482421875, -2.04931640625, -1.942413330078125, -1.83551025390625, -1.728607177734375, -1.6217041015625, -1.514801025390625, -1.40789794921875, -1.300994873046875, -1.194091796875, -1.087188720703125, -0.98028564453125, -0.873382568359375, -0.7664794921875, -0.659576416015625, -0.55267333984375, -0.445770263671875, -0.3388671875, -0.231964111328125, -0.12506103515625, -0.018157958984375, 0.0887451171875, 0.195648193359375, 0.30255126953125, 0.409454345703125, 0.516357421875, 0.623260498046875, 0.73016357421875, 0.837066650390625, 0.9439697265625, 1.050872802734375, 1.15777587890625, 1.264678955078125, 1.37158203125, 1.478485107421875, 1.58538818359375, 1.692291259765625, 1.7991943359375, 1.906097412109375, 2.01300048828125, 2.119903564453125, 2.226806640625, 2.333709716796875, 2.44061279296875, 2.547515869140625, 2.6544189453125, 2.761322021484375, 2.86822509765625, 2.975128173828125, 3.08203125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 1.0, 3.0, 3.0, 1.0, 4.0, 4.0, 5.0, 8.0, 8.0, 3.0, 14.0, 24.0, 20.0, 26.0, 57.0, 63.0, 99.0, 180.0, 175.0, 92.0, 74.0, 53.0, 25.0, 17.0, 11.0, 7.0, 4.0, 8.0, 4.0, 3.0, 7.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.001674652099609375, -0.0016317814588546753, -0.0015889108180999756, -0.0015460401773452759, -0.0015031695365905762, -0.0014602988958358765, -0.0014174282550811768, -0.001374557614326477, -0.0013316869735717773, -0.0012888163328170776, -0.001245945692062378, -0.0012030750513076782, -0.0011602044105529785, -0.0011173337697982788, -0.001074463129043579, -0.0010315924882888794, -0.0009887218475341797, -0.00094585120677948, -0.0009029805660247803, -0.0008601099252700806, -0.0008172392845153809, -0.0007743686437606812, -0.0007314980030059814, -0.0006886273622512817, -0.000645756721496582, -0.0006028860807418823, -0.0005600154399871826, -0.0005171447992324829, -0.0004742741584777832, -0.0004314035177230835, -0.0003885328769683838, -0.0003456622362136841, -0.0003027915954589844, -0.00025992095470428467, -0.00021705031394958496, -0.00017417967319488525, -0.00013130903244018555, -8.843839168548584e-05, -4.556775093078613e-05, -2.6971101760864258e-06, 4.017353057861328e-05, 8.304417133331299e-05, 0.0001259148120880127, 0.0001687854528427124, 0.0002116560935974121, 0.0002545267343521118, 0.0002973973751068115, 0.00034026801586151123, 0.00038313865661621094, 0.00042600929737091064, 0.00046887993812561035, 0.0005117505788803101, 0.0005546212196350098, 0.0005974918603897095, 0.0006403625011444092, 0.0006832331418991089, 0.0007261037826538086, 0.0007689744234085083, 0.000811845064163208, 0.0008547157049179077, 0.0008975863456726074, 0.0009404569864273071, 0.0009833276271820068, 0.0010261982679367065, 0.0010690689086914062]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 10.0, 9.0, 14.0, 23.0, 31.0, 51.0, 83.0, 177.0, 351.0, 831.0, 2639.0, 10889.0, 83740.0, 871936.0, 64711.0, 9298.0, 2308.0, 762.0, 298.0, 143.0, 82.0, 70.0, 30.0, 19.0, 12.0, 16.0, 6.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.93359375, -7.67303466796875, -7.4124755859375, -7.15191650390625, -6.891357421875, -6.63079833984375, -6.3702392578125, -6.10968017578125, -5.84912109375, -5.58856201171875, -5.3280029296875, -5.06744384765625, -4.806884765625, -4.54632568359375, -4.2857666015625, -4.02520751953125, -3.7646484375, -3.50408935546875, -3.2435302734375, -2.98297119140625, -2.722412109375, -2.46185302734375, -2.2012939453125, -1.94073486328125, -1.68017578125, -1.41961669921875, -1.1590576171875, -0.89849853515625, -0.637939453125, -0.37738037109375, -0.1168212890625, 0.14373779296875, 0.404296875, 0.66485595703125, 0.9254150390625, 1.18597412109375, 1.446533203125, 1.70709228515625, 1.9676513671875, 2.22821044921875, 2.48876953125, 2.74932861328125, 3.0098876953125, 3.27044677734375, 3.531005859375, 3.79156494140625, 4.0521240234375, 4.31268310546875, 4.5732421875, 4.83380126953125, 5.0943603515625, 5.35491943359375, 5.615478515625, 5.87603759765625, 6.1365966796875, 6.39715576171875, 6.65771484375, 6.91827392578125, 7.1788330078125, 7.43939208984375, 7.699951171875, 7.96051025390625, 8.2210693359375, 8.48162841796875, 8.7421875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 4.0, 4.0, 6.0, 6.0, 8.0, 4.0, 9.0, 8.0, 11.0, 15.0, 18.0, 19.0, 23.0, 49.0, 45.0, 75.0, 82.0, 121.0, 105.0, 82.0, 81.0, 45.0, 45.0, 30.0, 21.0, 26.0, 16.0, 9.0, 14.0, 10.0, 4.0, 2.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.931640625, -3.8310546875, -3.73046875, -3.6298828125, -3.529296875, -3.4287109375, -3.328125, -3.2275390625, -3.126953125, -3.0263671875, -2.92578125, -2.8251953125, -2.724609375, -2.6240234375, -2.5234375, -2.4228515625, -2.322265625, -2.2216796875, -2.12109375, -2.0205078125, -1.919921875, -1.8193359375, -1.71875, -1.6181640625, -1.517578125, -1.4169921875, -1.31640625, -1.2158203125, -1.115234375, -1.0146484375, -0.9140625, -0.8134765625, -0.712890625, -0.6123046875, -0.51171875, -0.4111328125, -0.310546875, -0.2099609375, -0.109375, -0.0087890625, 0.091796875, 0.1923828125, 0.29296875, 0.3935546875, 0.494140625, 0.5947265625, 0.6953125, 0.7958984375, 0.896484375, 0.9970703125, 1.09765625, 1.1982421875, 1.298828125, 1.3994140625, 1.5, 1.6005859375, 1.701171875, 1.8017578125, 1.90234375, 2.0029296875, 2.103515625, 2.2041015625, 2.3046875, 2.4052734375, 2.505859375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 3.0, 11.0, 20.0, 60.0, 147.0, 328.0, 157.0, 118.0, 51.0, 39.0, 22.0, 15.0, 9.0, 5.0, 4.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.82377624511719, -97.62581634521484, -94.42784881591797, -91.22988891601562, -88.03192138671875, -84.8339614868164, -81.63600158691406, -78.43803405761719, -75.24006652832031, -72.04210662841797, -68.8441390991211, -65.64617919921875, -62.448211669921875, -59.25025177001953, -56.05228805541992, -52.85432434082031, -49.65636444091797, -46.45840072631836, -43.26043701171875, -40.062477111816406, -36.86450958251953, -33.66654968261719, -30.468585968017578, -27.27062225341797, -24.07265853881836, -20.87469482421875, -17.67673110961914, -14.478769302368164, -11.280805587768555, -8.082841873168945, -4.884880065917969, -1.6869163513183594, 1.51104736328125, 4.709010601043701, 7.906973838806152, 11.104936599731445, 14.302900314331055, 17.500864028930664, 20.69882583618164, 23.89678955078125, 27.09475326538086, 30.29271697998047, 33.49068069458008, 36.68864440917969, 39.88660430908203, 43.084571838378906, 46.28253173828125, 49.48049545288086, 52.67845916748047, 55.87642288208008, 59.07438659667969, 62.27234649658203, 65.4703140258789, 68.66827392578125, 71.86624145507812, 75.06420135498047, 78.26216125488281, 81.46012115478516, 84.65808868408203, 87.85604858398438, 91.05401611328125, 94.2519760131836, 97.44993591308594, 100.64790344238281, 103.84587097167969]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 6.0, 4.0, 9.0, 4.0, 4.0, 7.0, 5.0, 14.0, 18.0, 16.0, 18.0, 23.0, 27.0, 32.0, 30.0, 32.0, 21.0, 50.0, 53.0, 91.0, 107.0, 86.0, 52.0, 29.0, 34.0, 26.0, 23.0, 24.0, 28.0, 29.0, 23.0, 12.0, 13.0, 9.0, 9.0, 7.0, 14.0, 7.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-45.551727294921875, -43.94677734375, -42.34182357788086, -40.736873626708984, -39.13192367553711, -37.52696990966797, -35.922019958496094, -34.31707000732422, -32.712120056152344, -31.107168197631836, -29.50221824645996, -27.897266387939453, -26.292316436767578, -24.68736457824707, -23.082412719726562, -21.477462768554688, -19.872509002685547, -18.26755714416504, -16.662607192993164, -15.057655334472656, -13.452704429626465, -11.847753524780273, -10.242801666259766, -8.637850761413574, -7.032899856567383, -5.427948951721191, -3.822997570037842, -2.218046188354492, -0.6130952835083008, 0.9918556213378906, 2.5968074798583984, 4.20175838470459, 5.806709289550781, 7.411660194396973, 9.016611099243164, 10.621562957763672, 12.226513862609863, 13.831464767456055, 15.436416625976562, 17.041366577148438, 18.646318435668945, 20.251270294189453, 21.856220245361328, 23.461172103881836, 25.066123962402344, 26.67107391357422, 28.276025772094727, 29.880977630615234, 31.48592758178711, 33.090877532958984, 34.695831298828125, 36.30078125, 37.905731201171875, 39.51068115234375, 41.11563491821289, 42.720584869384766, 44.325538635253906, 45.93048858642578, 47.53544235229492, 49.1403923034668, 50.74534225463867, 52.35029602050781, 53.95524597167969, 55.56019592285156, 57.16514587402344]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 9.0, 12.0, 23.0, 35.0, 43.0, 67.0, 114.0, 218.0, 413.0, 1190.0, 5520.0, 150746.0, 4000428.0, 30549.0, 3369.0, 850.0, 345.0, 142.0, 90.0, 37.0, 25.0, 18.0, 12.0, 7.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-26.578125, -25.9786376953125, -25.379150390625, -24.7796630859375, -24.18017578125, -23.5806884765625, -22.981201171875, -22.3817138671875, -21.7822265625, -21.1827392578125, -20.583251953125, -19.9837646484375, -19.38427734375, -18.7847900390625, -18.185302734375, -17.5858154296875, -16.986328125, -16.3868408203125, -15.787353515625, -15.1878662109375, -14.58837890625, -13.9888916015625, -13.389404296875, -12.7899169921875, -12.1904296875, -11.5909423828125, -10.991455078125, -10.3919677734375, -9.79248046875, -9.1929931640625, -8.593505859375, -7.9940185546875, -7.39453125, -6.7950439453125, -6.195556640625, -5.5960693359375, -4.99658203125, -4.3970947265625, -3.797607421875, -3.1981201171875, -2.5986328125, -1.9991455078125, -1.399658203125, -0.8001708984375, -0.20068359375, 0.3988037109375, 0.998291015625, 1.5977783203125, 2.197265625, 2.7967529296875, 3.396240234375, 3.9957275390625, 4.59521484375, 5.1947021484375, 5.794189453125, 6.3936767578125, 6.9931640625, 7.5926513671875, 8.192138671875, 8.7916259765625, 9.39111328125, 9.9906005859375, 10.590087890625, 11.1895751953125, 11.7890625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 6.0, 6.0, 10.0, 9.0, 14.0, 13.0, 23.0, 21.0, 24.0, 34.0, 35.0, 46.0, 58.0, 56.0, 55.0, 65.0, 45.0, 55.0, 56.0, 44.0, 59.0, 44.0, 37.0, 36.0, 32.0, 31.0, 24.0, 11.0, 13.0, 9.0, 8.0, 5.0, 9.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.236328125, -3.118865966796875, -3.00140380859375, -2.883941650390625, -2.7664794921875, -2.649017333984375, -2.53155517578125, -2.414093017578125, -2.296630859375, -2.179168701171875, -2.06170654296875, -1.944244384765625, -1.8267822265625, -1.709320068359375, -1.59185791015625, -1.474395751953125, -1.35693359375, -1.239471435546875, -1.12200927734375, -1.004547119140625, -0.8870849609375, -0.769622802734375, -0.65216064453125, -0.534698486328125, -0.417236328125, -0.299774169921875, -0.18231201171875, -0.064849853515625, 0.0526123046875, 0.170074462890625, 0.28753662109375, 0.404998779296875, 0.5224609375, 0.639923095703125, 0.75738525390625, 0.874847412109375, 0.9923095703125, 1.109771728515625, 1.22723388671875, 1.344696044921875, 1.462158203125, 1.579620361328125, 1.69708251953125, 1.814544677734375, 1.9320068359375, 2.049468994140625, 2.16693115234375, 2.284393310546875, 2.40185546875, 2.519317626953125, 2.63677978515625, 2.754241943359375, 2.8717041015625, 2.989166259765625, 3.10662841796875, 3.224090576171875, 3.341552734375, 3.459014892578125, 3.57647705078125, 3.693939208984375, 3.8114013671875, 3.928863525390625, 4.04632568359375, 4.163787841796875, 4.28125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 4.0, 4.0, 4.0, 6.0, 12.0, 21.0, 23.0, 38.0, 79.0, 142.0, 259.0, 563.0, 1675.0, 11358.0, 2611832.0, 1555981.0, 9779.0, 1463.0, 533.0, 236.0, 111.0, 69.0, 37.0, 24.0, 12.0, 11.0, 6.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.1875, -15.51220703125, -14.8369140625, -14.16162109375, -13.486328125, -12.81103515625, -12.1357421875, -11.46044921875, -10.78515625, -10.10986328125, -9.4345703125, -8.75927734375, -8.083984375, -7.40869140625, -6.7333984375, -6.05810546875, -5.3828125, -4.70751953125, -4.0322265625, -3.35693359375, -2.681640625, -2.00634765625, -1.3310546875, -0.65576171875, 0.01953125, 0.69482421875, 1.3701171875, 2.04541015625, 2.720703125, 3.39599609375, 4.0712890625, 4.74658203125, 5.421875, 6.09716796875, 6.7724609375, 7.44775390625, 8.123046875, 8.79833984375, 9.4736328125, 10.14892578125, 10.82421875, 11.49951171875, 12.1748046875, 12.85009765625, 13.525390625, 14.20068359375, 14.8759765625, 15.55126953125, 16.2265625, 16.90185546875, 17.5771484375, 18.25244140625, 18.927734375, 19.60302734375, 20.2783203125, 20.95361328125, 21.62890625, 22.30419921875, 22.9794921875, 23.65478515625, 24.330078125, 25.00537109375, 25.6806640625, 26.35595703125, 27.03125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 4.0, 2.0, 11.0, 13.0, 17.0, 19.0, 33.0, 39.0, 74.0, 141.0, 279.0, 521.0, 884.0, 867.0, 535.0, 303.0, 128.0, 77.0, 34.0, 27.0, 20.0, 10.0, 12.0, 7.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.1171875, -9.820068359375, -9.52294921875, -9.225830078125, -8.9287109375, -8.631591796875, -8.33447265625, -8.037353515625, -7.740234375, -7.443115234375, -7.14599609375, -6.848876953125, -6.5517578125, -6.254638671875, -5.95751953125, -5.660400390625, -5.36328125, -5.066162109375, -4.76904296875, -4.471923828125, -4.1748046875, -3.877685546875, -3.58056640625, -3.283447265625, -2.986328125, -2.689208984375, -2.39208984375, -2.094970703125, -1.7978515625, -1.500732421875, -1.20361328125, -0.906494140625, -0.609375, -0.312255859375, -0.01513671875, 0.281982421875, 0.5791015625, 0.876220703125, 1.17333984375, 1.470458984375, 1.767578125, 2.064697265625, 2.36181640625, 2.658935546875, 2.9560546875, 3.253173828125, 3.55029296875, 3.847412109375, 4.14453125, 4.441650390625, 4.73876953125, 5.035888671875, 5.3330078125, 5.630126953125, 5.92724609375, 6.224365234375, 6.521484375, 6.818603515625, 7.11572265625, 7.412841796875, 7.7099609375, 8.007080078125, 8.30419921875, 8.601318359375, 8.8984375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 7.0, 1.0, 5.0, 8.0, 10.0, 9.0, 14.0, 17.0, 31.0, 51.0, 77.0, 136.0, 160.0, 191.0, 131.0, 71.0, 32.0, 25.0, 11.0, 8.0, 3.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.07937622070312, -96.48065948486328, -93.88194274902344, -91.2832260131836, -88.68450927734375, -86.0857925415039, -83.48707580566406, -80.88835906982422, -78.28964233398438, -75.69092559814453, -73.09220886230469, -70.49349212646484, -67.894775390625, -65.29605865478516, -62.69734191894531, -60.09862518310547, -57.499908447265625, -54.90119171142578, -52.30247497558594, -49.703758239746094, -47.10504150390625, -44.506324768066406, -41.90760803222656, -39.30889129638672, -36.710174560546875, -34.11145782470703, -31.512741088867188, -28.914024353027344, -26.3153076171875, -23.716590881347656, -21.117874145507812, -18.51915740966797, -15.920440673828125, -13.321723937988281, -10.723007202148438, -8.124290466308594, -5.52557373046875, -2.9268569946289062, -0.3281402587890625, 2.2705764770507812, 4.869293212890625, 7.468009948730469, 10.066726684570312, 12.665443420410156, 15.26416015625, 17.862876892089844, 20.461593627929688, 23.06031036376953, 25.659027099609375, 28.25774383544922, 30.856460571289062, 33.455177307128906, 36.05389404296875, 38.652610778808594, 41.25132751464844, 43.85004425048828, 46.448760986328125, 49.04747772216797, 51.64619445800781, 54.244911193847656, 56.8436279296875, 59.442344665527344, 62.04106140136719, 64.63977813720703, 67.23849487304688]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 7.0, 5.0, 12.0, 10.0, 24.0, 10.0, 24.0, 31.0, 30.0, 32.0, 29.0, 42.0, 39.0, 39.0, 51.0, 55.0, 41.0, 44.0, 52.0, 44.0, 42.0, 50.0, 32.0, 35.0, 37.0, 45.0, 26.0, 19.0, 17.0, 19.0, 9.0, 10.0, 9.0, 8.0, 7.0, 4.0, 4.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-31.138973236083984, -29.904857635498047, -28.67074203491211, -27.43662452697754, -26.2025089263916, -24.968393325805664, -23.734275817871094, -22.500160217285156, -21.26604461669922, -20.03192901611328, -18.797813415527344, -17.563695907592773, -16.329580307006836, -15.095464706420898, -13.861348152160645, -12.62723159790039, -11.393115997314453, -10.159000396728516, -8.924883842468262, -7.690767765045166, -6.45665168762207, -5.222535610198975, -3.988419532775879, -2.754302978515625, -1.5201873779296875, -0.2860713005065918, 0.9480447769165039, 2.1821608543395996, 3.4162769317626953, 4.650393009185791, 5.884509086608887, 7.118625640869141, 8.352745056152344, 9.586860656738281, 10.820977210998535, 12.055093765258789, 13.289209365844727, 14.523324966430664, 15.757441520690918, 16.991558074951172, 18.22567367553711, 19.459789276123047, 20.693904876708984, 21.928022384643555, 23.162137985229492, 24.39625358581543, 25.63037109375, 26.864486694335938, 28.098602294921875, 29.332717895507812, 30.56683349609375, 31.80095100402832, 33.035064697265625, 34.26918411254883, 35.503299713134766, 36.7374153137207, 37.97153091430664, 39.20564651489258, 40.439762115478516, 41.67387771606445, 42.907997131347656, 44.142112731933594, 45.37622833251953, 46.61034393310547, 47.844459533691406]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 10.0, 8.0, 23.0, 29.0, 54.0, 127.0, 228.0, 690.0, 2766.0, 16681.0, 182825.0, 758936.0, 74856.0, 8842.0, 1667.0, 455.0, 177.0, 76.0, 41.0, 26.0, 12.0, 14.0, 7.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0390625, -8.6676025390625, -8.296142578125, -7.9246826171875, -7.55322265625, -7.1817626953125, -6.810302734375, -6.4388427734375, -6.0673828125, -5.6959228515625, -5.324462890625, -4.9530029296875, -4.58154296875, -4.2100830078125, -3.838623046875, -3.4671630859375, -3.095703125, -2.7242431640625, -2.352783203125, -1.9813232421875, -1.60986328125, -1.2384033203125, -0.866943359375, -0.4954833984375, -0.1240234375, 0.2474365234375, 0.618896484375, 0.9903564453125, 1.36181640625, 1.7332763671875, 2.104736328125, 2.4761962890625, 2.84765625, 3.2191162109375, 3.590576171875, 3.9620361328125, 4.33349609375, 4.7049560546875, 5.076416015625, 5.4478759765625, 5.8193359375, 6.1907958984375, 6.562255859375, 6.9337158203125, 7.30517578125, 7.6766357421875, 8.048095703125, 8.4195556640625, 8.791015625, 9.1624755859375, 9.533935546875, 9.9053955078125, 10.27685546875, 10.6483154296875, 11.019775390625, 11.3912353515625, 11.7626953125, 12.1341552734375, 12.505615234375, 12.8770751953125, 13.24853515625, 13.6199951171875, 13.991455078125, 14.3629150390625, 14.734375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 6.0, 7.0, 14.0, 10.0, 20.0, 27.0, 43.0, 55.0, 58.0, 73.0, 84.0, 76.0, 78.0, 80.0, 72.0, 58.0, 50.0, 49.0, 49.0, 38.0, 22.0, 11.0, 10.0, 7.0, 3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.875, -6.691162109375, -6.50732421875, -6.323486328125, -6.1396484375, -5.955810546875, -5.77197265625, -5.588134765625, -5.404296875, -5.220458984375, -5.03662109375, -4.852783203125, -4.6689453125, -4.485107421875, -4.30126953125, -4.117431640625, -3.93359375, -3.749755859375, -3.56591796875, -3.382080078125, -3.1982421875, -3.014404296875, -2.83056640625, -2.646728515625, -2.462890625, -2.279052734375, -2.09521484375, -1.911376953125, -1.7275390625, -1.543701171875, -1.35986328125, -1.176025390625, -0.9921875, -0.808349609375, -0.62451171875, -0.440673828125, -0.2568359375, -0.072998046875, 0.11083984375, 0.294677734375, 0.478515625, 0.662353515625, 0.84619140625, 1.030029296875, 1.2138671875, 1.397705078125, 1.58154296875, 1.765380859375, 1.94921875, 2.133056640625, 2.31689453125, 2.500732421875, 2.6845703125, 2.868408203125, 3.05224609375, 3.236083984375, 3.419921875, 3.603759765625, 3.78759765625, 3.971435546875, 4.1552734375, 4.339111328125, 4.52294921875, 4.706787109375, 4.890625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 4.0, 4.0, 7.0, 10.0, 18.0, 22.0, 29.0, 42.0, 66.0, 94.0, 188.0, 334.0, 707.0, 1735.0, 6870.0, 79908.0, 908782.0, 41976.0, 5030.0, 1390.0, 582.0, 290.0, 163.0, 104.0, 60.0, 44.0, 34.0, 18.0, 9.0, 15.0, 4.0, 6.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.2734375, -14.802001953125, -14.33056640625, -13.859130859375, -13.3876953125, -12.916259765625, -12.44482421875, -11.973388671875, -11.501953125, -11.030517578125, -10.55908203125, -10.087646484375, -9.6162109375, -9.144775390625, -8.67333984375, -8.201904296875, -7.73046875, -7.259033203125, -6.78759765625, -6.316162109375, -5.8447265625, -5.373291015625, -4.90185546875, -4.430419921875, -3.958984375, -3.487548828125, -3.01611328125, -2.544677734375, -2.0732421875, -1.601806640625, -1.13037109375, -0.658935546875, -0.1875, 0.283935546875, 0.75537109375, 1.226806640625, 1.6982421875, 2.169677734375, 2.64111328125, 3.112548828125, 3.583984375, 4.055419921875, 4.52685546875, 4.998291015625, 5.4697265625, 5.941162109375, 6.41259765625, 6.884033203125, 7.35546875, 7.826904296875, 8.29833984375, 8.769775390625, 9.2412109375, 9.712646484375, 10.18408203125, 10.655517578125, 11.126953125, 11.598388671875, 12.06982421875, 12.541259765625, 13.0126953125, 13.484130859375, 13.95556640625, 14.427001953125, 14.8984375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 6.0, 11.0, 7.0, 15.0, 19.0, 28.0, 29.0, 49.0, 52.0, 86.0, 78.0, 82.0, 91.0, 91.0, 83.0, 56.0, 51.0, 43.0, 39.0, 17.0, 21.0, 12.0, 10.0, 5.0, 8.0, 6.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.59375, -18.87548828125, -18.1572265625, -17.43896484375, -16.720703125, -16.00244140625, -15.2841796875, -14.56591796875, -13.84765625, -13.12939453125, -12.4111328125, -11.69287109375, -10.974609375, -10.25634765625, -9.5380859375, -8.81982421875, -8.1015625, -7.38330078125, -6.6650390625, -5.94677734375, -5.228515625, -4.51025390625, -3.7919921875, -3.07373046875, -2.35546875, -1.63720703125, -0.9189453125, -0.20068359375, 0.517578125, 1.23583984375, 1.9541015625, 2.67236328125, 3.390625, 4.10888671875, 4.8271484375, 5.54541015625, 6.263671875, 6.98193359375, 7.7001953125, 8.41845703125, 9.13671875, 9.85498046875, 10.5732421875, 11.29150390625, 12.009765625, 12.72802734375, 13.4462890625, 14.16455078125, 14.8828125, 15.60107421875, 16.3193359375, 17.03759765625, 17.755859375, 18.47412109375, 19.1923828125, 19.91064453125, 20.62890625, 21.34716796875, 22.0654296875, 22.78369140625, 23.501953125, 24.22021484375, 24.9384765625, 25.65673828125, 26.375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 6.0, 1.0, 5.0, 6.0, 3.0, 8.0, 10.0, 15.0, 22.0, 18.0, 21.0, 45.0, 51.0, 87.0, 140.0, 241.0, 381.0, 792.0, 1836.0, 4942.0, 16634.0, 94434.0, 828256.0, 77989.0, 14630.0, 4490.0, 1716.0, 766.0, 402.0, 201.0, 116.0, 79.0, 58.0, 35.0, 35.0, 26.0, 15.0, 11.0, 9.0, 6.0, 3.0, 4.0, 3.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.8671875, -3.75811767578125, -3.6490478515625, -3.53997802734375, -3.430908203125, -3.32183837890625, -3.2127685546875, -3.10369873046875, -2.99462890625, -2.88555908203125, -2.7764892578125, -2.66741943359375, -2.558349609375, -2.44927978515625, -2.3402099609375, -2.23114013671875, -2.1220703125, -2.01300048828125, -1.9039306640625, -1.79486083984375, -1.685791015625, -1.57672119140625, -1.4676513671875, -1.35858154296875, -1.24951171875, -1.14044189453125, -1.0313720703125, -0.92230224609375, -0.813232421875, -0.70416259765625, -0.5950927734375, -0.48602294921875, -0.376953125, -0.26788330078125, -0.1588134765625, -0.04974365234375, 0.059326171875, 0.16839599609375, 0.2774658203125, 0.38653564453125, 0.49560546875, 0.60467529296875, 0.7137451171875, 0.82281494140625, 0.931884765625, 1.04095458984375, 1.1500244140625, 1.25909423828125, 1.3681640625, 1.47723388671875, 1.5863037109375, 1.69537353515625, 1.804443359375, 1.91351318359375, 2.0225830078125, 2.13165283203125, 2.24072265625, 2.34979248046875, 2.4588623046875, 2.56793212890625, 2.677001953125, 2.78607177734375, 2.8951416015625, 3.00421142578125, 3.11328125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 1.0, 3.0, 2.0, 2.0, 9.0, 2.0, 16.0, 16.0, 27.0, 29.0, 90.0, 174.0, 269.0, 165.0, 87.0, 41.0, 17.0, 15.0, 4.0, 12.0, 4.0, 7.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009775161743164062, -0.0009319484233856201, -0.000886380672454834, -0.0008408129215240479, -0.0007952451705932617, -0.0007496774196624756, -0.0007041096687316895, -0.0006585419178009033, -0.0006129741668701172, -0.0005674064159393311, -0.0005218386650085449, -0.0004762709140777588, -0.00043070316314697266, -0.0003851354122161865, -0.0003395676612854004, -0.00029399991035461426, -0.0002484321594238281, -0.000202864408493042, -0.00015729665756225586, -0.00011172890663146973, -6.61611557006836e-05, -2.059340476989746e-05, 2.4974346160888672e-05, 7.05420970916748e-05, 0.00011610984802246094, 0.00016167759895324707, 0.0002072453498840332, 0.00025281310081481934, 0.00029838085174560547, 0.0003439486026763916, 0.00038951635360717773, 0.00043508410453796387, 0.00048065185546875, 0.0005262196063995361, 0.0005717873573303223, 0.0006173551082611084, 0.0006629228591918945, 0.0007084906101226807, 0.0007540583610534668, 0.0007996261119842529, 0.0008451938629150391, 0.0008907616138458252, 0.0009363293647766113, 0.0009818971157073975, 0.0010274648666381836, 0.0010730326175689697, 0.0011186003684997559, 0.001164168119430542, 0.0012097358703613281, 0.0012553036212921143, 0.0013008713722229004, 0.0013464391231536865, 0.0013920068740844727, 0.0014375746250152588, 0.001483142375946045, 0.001528710126876831, 0.0015742778778076172, 0.0016198456287384033, 0.0016654133796691895, 0.0017109811305999756, 0.0017565488815307617, 0.0018021166324615479, 0.001847684383392334, 0.0018932521343231201, 0.0019388198852539062]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 7.0, 4.0, 10.0, 6.0, 10.0, 16.0, 12.0, 22.0, 35.0, 49.0, 88.0, 145.0, 250.0, 437.0, 774.0, 1587.0, 3715.0, 10285.0, 36753.0, 226655.0, 682974.0, 60569.0, 15007.0, 4989.0, 2033.0, 902.0, 482.0, 304.0, 152.0, 87.0, 61.0, 43.0, 25.0, 18.0, 17.0, 8.0, 7.0, 7.0, 6.0, 2.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.09375, -2.007080078125, -1.92041015625, -1.833740234375, -1.7470703125, -1.660400390625, -1.57373046875, -1.487060546875, -1.400390625, -1.313720703125, -1.22705078125, -1.140380859375, -1.0537109375, -0.967041015625, -0.88037109375, -0.793701171875, -0.70703125, -0.620361328125, -0.53369140625, -0.447021484375, -0.3603515625, -0.273681640625, -0.18701171875, -0.100341796875, -0.013671875, 0.072998046875, 0.15966796875, 0.246337890625, 0.3330078125, 0.419677734375, 0.50634765625, 0.593017578125, 0.6796875, 0.766357421875, 0.85302734375, 0.939697265625, 1.0263671875, 1.113037109375, 1.19970703125, 1.286376953125, 1.373046875, 1.459716796875, 1.54638671875, 1.633056640625, 1.7197265625, 1.806396484375, 1.89306640625, 1.979736328125, 2.06640625, 2.153076171875, 2.23974609375, 2.326416015625, 2.4130859375, 2.499755859375, 2.58642578125, 2.673095703125, 2.759765625, 2.846435546875, 2.93310546875, 3.019775390625, 3.1064453125, 3.193115234375, 3.27978515625, 3.366455078125, 3.453125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 0.0, 5.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 8.0, 3.0, 5.0, 3.0, 9.0, 7.0, 10.0, 18.0, 15.0, 19.0, 25.0, 21.0, 41.0, 35.0, 52.0, 66.0, 90.0, 64.0, 72.0, 75.0, 54.0, 50.0, 59.0, 30.0, 33.0, 15.0, 20.0, 16.0, 18.0, 6.0, 13.0, 10.0, 4.0, 5.0, 5.0, 4.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7412109375, -1.6834716796875, -1.625732421875, -1.5679931640625, -1.51025390625, -1.4525146484375, -1.394775390625, -1.3370361328125, -1.279296875, -1.2215576171875, -1.163818359375, -1.1060791015625, -1.04833984375, -0.9906005859375, -0.932861328125, -0.8751220703125, -0.8173828125, -0.7596435546875, -0.701904296875, -0.6441650390625, -0.58642578125, -0.5286865234375, -0.470947265625, -0.4132080078125, -0.35546875, -0.2977294921875, -0.239990234375, -0.1822509765625, -0.12451171875, -0.0667724609375, -0.009033203125, 0.0487060546875, 0.1064453125, 0.1641845703125, 0.221923828125, 0.2796630859375, 0.33740234375, 0.3951416015625, 0.452880859375, 0.5106201171875, 0.568359375, 0.6260986328125, 0.683837890625, 0.7415771484375, 0.79931640625, 0.8570556640625, 0.914794921875, 0.9725341796875, 1.0302734375, 1.0880126953125, 1.145751953125, 1.2034912109375, 1.26123046875, 1.3189697265625, 1.376708984375, 1.4344482421875, 1.4921875, 1.5499267578125, 1.607666015625, 1.6654052734375, 1.72314453125, 1.7808837890625, 1.838623046875, 1.8963623046875, 1.9541015625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 8.0, 36.0, 152.0, 588.0, 175.0, 31.0, 5.0, 2.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-183.16714477539062, -176.7618865966797, -170.3566131591797, -163.95135498046875, -157.5460968017578, -151.1408233642578, -144.73556518554688, -138.33029174804688, -131.92503356933594, -125.51976776123047, -119.11450958251953, -112.70924377441406, -106.3039779663086, -99.89871215820312, -93.49345397949219, -87.08818817138672, -80.68292999267578, -74.27766418457031, -67.87240600585938, -61.467140197753906, -55.06187438964844, -48.656612396240234, -42.25135040283203, -35.84608459472656, -29.44082260131836, -23.035558700561523, -16.630294799804688, -10.225032806396484, -3.8197689056396484, 2.5854949951171875, 8.99075698852539, 15.39602279663086, 21.801284790039062, 28.2065486907959, 34.611812591552734, 41.01707458496094, 47.422340393066406, 53.82760238647461, 60.23286437988281, 66.63813018798828, 73.04339599609375, 79.44866180419922, 85.85391998291016, 92.25918579101562, 98.6644515991211, 105.06971740722656, 111.4749755859375, 117.88024139404297, 124.2854995727539, 130.69076538085938, 137.0960235595703, 143.50128173828125, 149.90655517578125, 156.3118133544922, 162.71707153320312, 169.12234497070312, 175.52760314941406, 181.932861328125, 188.338134765625, 194.74339294433594, 201.14865112304688, 207.55392456054688, 213.9591827392578, 220.36444091796875, 226.76971435546875]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 2.0, 7.0, 8.0, 11.0, 7.0, 9.0, 21.0, 18.0, 18.0, 23.0, 34.0, 32.0, 20.0, 49.0, 52.0, 57.0, 144.0, 134.0, 54.0, 55.0, 35.0, 40.0, 24.0, 25.0, 24.0, 21.0, 13.0, 13.0, 15.0, 13.0, 5.0, 6.0, 6.0, 5.0, 2.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 2.0], "bins": [-86.34188842773438, -84.12348175048828, -81.90506744384766, -79.68666076660156, -77.46825408935547, -75.24983978271484, -73.03143310546875, -70.81302642822266, -68.59461212158203, -66.37620544433594, -64.15779113769531, -61.93938446044922, -59.72097396850586, -57.5025634765625, -55.284156799316406, -53.06574630737305, -50.84733963012695, -48.628929138183594, -46.4105224609375, -44.19211196899414, -41.97370147705078, -39.75529479980469, -37.53688430786133, -35.31847381591797, -33.100067138671875, -30.88165855407715, -28.66324806213379, -26.444839477539062, -24.226428985595703, -22.008020401000977, -19.78961181640625, -17.57120132446289, -15.352787017822266, -13.134377479553223, -10.91596794128418, -8.697559356689453, -6.47914981842041, -4.260740280151367, -2.0423316955566406, 0.17607784271240234, 2.3944873809814453, 4.612896919250488, 6.831305980682373, 9.049715042114258, 11.2681245803833, 13.486534118652344, 15.70494270324707, 17.923351287841797, 20.141761779785156, 22.360170364379883, 24.578580856323242, 26.79698944091797, 29.015399932861328, 31.233808517456055, 33.45221710205078, 35.67062759399414, 37.8890380859375, 40.10744857788086, 42.32585525512695, 44.54426574707031, 46.76267623901367, 48.98108673095703, 51.199493408203125, 53.417903900146484, 55.63631057739258]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 3.0, 5.0, 7.0, 21.0, 15.0, 20.0, 24.0, 55.0, 77.0, 143.0, 336.0, 820.0, 2774.0, 12388.0, 182744.0, 3555789.0, 412636.0, 20113.0, 4276.0, 1251.0, 434.0, 179.0, 73.0, 45.0, 24.0, 9.0, 10.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.8125, -20.3458251953125, -19.879150390625, -19.4124755859375, -18.94580078125, -18.4791259765625, -18.012451171875, -17.5457763671875, -17.0791015625, -16.6124267578125, -16.145751953125, -15.6790771484375, -15.21240234375, -14.7457275390625, -14.279052734375, -13.8123779296875, -13.345703125, -12.8790283203125, -12.412353515625, -11.9456787109375, -11.47900390625, -11.0123291015625, -10.545654296875, -10.0789794921875, -9.6123046875, -9.1456298828125, -8.678955078125, -8.2122802734375, -7.74560546875, -7.2789306640625, -6.812255859375, -6.3455810546875, -5.87890625, -5.4122314453125, -4.945556640625, -4.4788818359375, -4.01220703125, -3.5455322265625, -3.078857421875, -2.6121826171875, -2.1455078125, -1.6788330078125, -1.212158203125, -0.7454833984375, -0.27880859375, 0.1878662109375, 0.654541015625, 1.1212158203125, 1.587890625, 2.0545654296875, 2.521240234375, 2.9879150390625, 3.45458984375, 3.9212646484375, 4.387939453125, 4.8546142578125, 5.3212890625, 5.7879638671875, 6.254638671875, 6.7213134765625, 7.18798828125, 7.6546630859375, 8.121337890625, 8.5880126953125, 9.0546875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 6.0, 7.0, 10.0, 7.0, 10.0, 10.0, 13.0, 26.0, 30.0, 23.0, 47.0, 30.0, 49.0, 54.0, 56.0, 61.0, 58.0, 69.0, 49.0, 58.0, 51.0, 55.0, 45.0, 50.0, 30.0, 27.0, 19.0, 19.0, 14.0, 10.0, 5.0, 5.0, 2.0, 1.0, 1.0, 4.0, 1.0], "bins": [-5.89453125, -5.75970458984375, -5.6248779296875, -5.49005126953125, -5.355224609375, -5.22039794921875, -5.0855712890625, -4.95074462890625, -4.81591796875, -4.68109130859375, -4.5462646484375, -4.41143798828125, -4.276611328125, -4.14178466796875, -4.0069580078125, -3.87213134765625, -3.7373046875, -3.60247802734375, -3.4676513671875, -3.33282470703125, -3.197998046875, -3.06317138671875, -2.9283447265625, -2.79351806640625, -2.65869140625, -2.52386474609375, -2.3890380859375, -2.25421142578125, -2.119384765625, -1.98455810546875, -1.8497314453125, -1.71490478515625, -1.580078125, -1.44525146484375, -1.3104248046875, -1.17559814453125, -1.040771484375, -0.90594482421875, -0.7711181640625, -0.63629150390625, -0.50146484375, -0.36663818359375, -0.2318115234375, -0.09698486328125, 0.037841796875, 0.17266845703125, 0.3074951171875, 0.44232177734375, 0.5771484375, 0.71197509765625, 0.8468017578125, 0.98162841796875, 1.116455078125, 1.25128173828125, 1.3861083984375, 1.52093505859375, 1.65576171875, 1.79058837890625, 1.9254150390625, 2.06024169921875, 2.195068359375, 2.32989501953125, 2.4647216796875, 2.59954833984375, 2.734375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 13.0, 25.0, 23.0, 57.0, 112.0, 270.0, 982.0, 6457.0, 4123920.0, 59474.0, 2125.0, 507.0, 186.0, 57.0, 39.0, 14.0, 4.0, 2.0, 6.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.3125, -62.51318359375, -60.7138671875, -58.91455078125, -57.115234375, -55.31591796875, -53.5166015625, -51.71728515625, -49.91796875, -48.11865234375, -46.3193359375, -44.52001953125, -42.720703125, -40.92138671875, -39.1220703125, -37.32275390625, -35.5234375, -33.72412109375, -31.9248046875, -30.12548828125, -28.326171875, -26.52685546875, -24.7275390625, -22.92822265625, -21.12890625, -19.32958984375, -17.5302734375, -15.73095703125, -13.931640625, -12.13232421875, -10.3330078125, -8.53369140625, -6.734375, -4.93505859375, -3.1357421875, -1.33642578125, 0.462890625, 2.26220703125, 4.0615234375, 5.86083984375, 7.66015625, 9.45947265625, 11.2587890625, 13.05810546875, 14.857421875, 16.65673828125, 18.4560546875, 20.25537109375, 22.0546875, 23.85400390625, 25.6533203125, 27.45263671875, 29.251953125, 31.05126953125, 32.8505859375, 34.64990234375, 36.44921875, 38.24853515625, 40.0478515625, 41.84716796875, 43.646484375, 45.44580078125, 47.2451171875, 49.04443359375, 50.84375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 9.0, 16.0, 29.0, 72.0, 195.0, 457.0, 1305.0, 1213.0, 475.0, 162.0, 78.0, 33.0, 17.0, 10.0, 4.0, 4.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.0, -43.0638427734375, -42.127685546875, -41.1915283203125, -40.25537109375, -39.3192138671875, -38.383056640625, -37.4468994140625, -36.5107421875, -35.5745849609375, -34.638427734375, -33.7022705078125, -32.76611328125, -31.8299560546875, -30.893798828125, -29.9576416015625, -29.021484375, -28.0853271484375, -27.149169921875, -26.2130126953125, -25.27685546875, -24.3406982421875, -23.404541015625, -22.4683837890625, -21.5322265625, -20.5960693359375, -19.659912109375, -18.7237548828125, -17.78759765625, -16.8514404296875, -15.915283203125, -14.9791259765625, -14.04296875, -13.1068115234375, -12.170654296875, -11.2344970703125, -10.29833984375, -9.3621826171875, -8.426025390625, -7.4898681640625, -6.5537109375, -5.6175537109375, -4.681396484375, -3.7452392578125, -2.80908203125, -1.8729248046875, -0.936767578125, -0.0006103515625, 0.935546875, 1.8717041015625, 2.807861328125, 3.7440185546875, 4.68017578125, 5.6163330078125, 6.552490234375, 7.4886474609375, 8.4248046875, 9.3609619140625, 10.297119140625, 11.2332763671875, 12.16943359375, 13.1055908203125, 14.041748046875, 14.9779052734375, 15.9140625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 2.0, 4.0, 5.0, 6.0, 5.0, 9.0, 12.0, 30.0, 59.0, 125.0, 211.0, 225.0, 151.0, 73.0, 34.0, 16.0, 12.0, 10.0, 3.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-147.0352325439453, -140.95846557617188, -134.88169860839844, -128.804931640625, -122.72816467285156, -116.65139770507812, -110.57463073730469, -104.49786376953125, -98.42109680175781, -92.34432983398438, -86.26756286621094, -80.1907958984375, -74.11402893066406, -68.03726196289062, -61.96049499511719, -55.88372802734375, -49.80696105957031, -43.730194091796875, -37.65342712402344, -31.57666015625, -25.499893188476562, -19.423126220703125, -13.346359252929688, -7.26959228515625, -1.1928253173828125, 4.883941650390625, 10.960708618164062, 17.0374755859375, 23.114242553710938, 29.191009521484375, 35.26777648925781, 41.34454345703125, 47.42132568359375, 53.49809265136719, 59.574859619140625, 65.65162658691406, 71.7283935546875, 77.80516052246094, 83.88192749023438, 89.95869445800781, 96.03546142578125, 102.11222839355469, 108.18899536132812, 114.26576232910156, 120.342529296875, 126.41929626464844, 132.49606323242188, 138.5728302001953, 144.64959716796875, 150.7263641357422, 156.80313110351562, 162.87989807128906, 168.9566650390625, 175.03343200683594, 181.11019897460938, 187.1869659423828, 193.26373291015625, 199.3404998779297, 205.41726684570312, 211.49403381347656, 217.57080078125, 223.64756774902344, 229.72433471679688, 235.8011016845703, 241.87786865234375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 10.0, 10.0, 8.0, 10.0, 18.0, 16.0, 28.0, 35.0, 59.0, 53.0, 71.0, 73.0, 89.0, 113.0, 80.0, 76.0, 53.0, 41.0, 30.0, 27.0, 22.0, 22.0, 22.0, 9.0, 3.0, 8.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-97.29942321777344, -93.79444885253906, -90.28946685791016, -86.78449249267578, -83.27951049804688, -79.7745361328125, -76.26956176757812, -72.76457977294922, -69.25959777832031, -65.75462341308594, -62.24964141845703, -58.744667053222656, -55.23968505859375, -51.734710693359375, -48.229732513427734, -44.724754333496094, -41.21977996826172, -37.71480178833008, -34.20982360839844, -30.70484733581543, -27.19986915588379, -23.69489097595215, -20.18991470336914, -16.6849365234375, -13.17995834350586, -9.674980163574219, -6.1700029373168945, -2.6650257110595703, 0.8399524688720703, 4.344930648803711, 7.849906921386719, 11.35488510131836, 14.859855651855469, 18.36483383178711, 21.86981201171875, 25.374788284301758, 28.8797664642334, 32.384742736816406, 35.88972091674805, 39.39469909667969, 42.89967727661133, 46.40465545654297, 49.90963363647461, 53.41461181640625, 56.919586181640625, 60.42456817626953, 63.929542541503906, 67.43452453613281, 70.93949890136719, 74.44447326660156, 77.94945526123047, 81.45442962646484, 84.95941162109375, 88.46438598632812, 91.9693603515625, 95.4743423461914, 98.97932434082031, 102.48429870605469, 105.9892807006836, 109.49425506591797, 112.99923706054688, 116.50421142578125, 120.00918579101562, 123.51416778564453, 127.0191421508789]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 2.0, 6.0, 19.0, 11.0, 25.0, 53.0, 45.0, 84.0, 151.0, 257.0, 408.0, 876.0, 1985.0, 5252.0, 19716.0, 128497.0, 764974.0, 101054.0, 16832.0, 4767.0, 1785.0, 753.0, 408.0, 230.0, 121.0, 81.0, 50.0, 47.0, 22.0, 13.0, 15.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.109375, -8.8197021484375, -8.530029296875, -8.2403564453125, -7.95068359375, -7.6610107421875, -7.371337890625, -7.0816650390625, -6.7919921875, -6.5023193359375, -6.212646484375, -5.9229736328125, -5.63330078125, -5.3436279296875, -5.053955078125, -4.7642822265625, -4.474609375, -4.1849365234375, -3.895263671875, -3.6055908203125, -3.31591796875, -3.0262451171875, -2.736572265625, -2.4468994140625, -2.1572265625, -1.8675537109375, -1.577880859375, -1.2882080078125, -0.99853515625, -0.7088623046875, -0.419189453125, -0.1295166015625, 0.16015625, 0.4498291015625, 0.739501953125, 1.0291748046875, 1.31884765625, 1.6085205078125, 1.898193359375, 2.1878662109375, 2.4775390625, 2.7672119140625, 3.056884765625, 3.3465576171875, 3.63623046875, 3.9259033203125, 4.215576171875, 4.5052490234375, 4.794921875, 5.0845947265625, 5.374267578125, 5.6639404296875, 5.95361328125, 6.2432861328125, 6.532958984375, 6.8226318359375, 7.1123046875, 7.4019775390625, 7.691650390625, 7.9813232421875, 8.27099609375, 8.5606689453125, 8.850341796875, 9.1400146484375, 9.4296875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 9.0, 11.0, 16.0, 23.0, 12.0, 21.0, 42.0, 59.0, 74.0, 80.0, 77.0, 94.0, 87.0, 86.0, 74.0, 61.0, 57.0, 38.0, 33.0, 13.0, 13.0, 11.0, 11.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.0546875, -8.8013916015625, -8.548095703125, -8.2947998046875, -8.04150390625, -7.7882080078125, -7.534912109375, -7.2816162109375, -7.0283203125, -6.7750244140625, -6.521728515625, -6.2684326171875, -6.01513671875, -5.7618408203125, -5.508544921875, -5.2552490234375, -5.001953125, -4.7486572265625, -4.495361328125, -4.2420654296875, -3.98876953125, -3.7354736328125, -3.482177734375, -3.2288818359375, -2.9755859375, -2.7222900390625, -2.468994140625, -2.2156982421875, -1.96240234375, -1.7091064453125, -1.455810546875, -1.2025146484375, -0.94921875, -0.6959228515625, -0.442626953125, -0.1893310546875, 0.06396484375, 0.3172607421875, 0.570556640625, 0.8238525390625, 1.0771484375, 1.3304443359375, 1.583740234375, 1.8370361328125, 2.09033203125, 2.3436279296875, 2.596923828125, 2.8502197265625, 3.103515625, 3.3568115234375, 3.610107421875, 3.8634033203125, 4.11669921875, 4.3699951171875, 4.623291015625, 4.8765869140625, 5.1298828125, 5.3831787109375, 5.636474609375, 5.8897705078125, 6.14306640625, 6.3963623046875, 6.649658203125, 6.9029541015625, 7.15625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 2.0, 5.0, 7.0, 6.0, 13.0, 10.0, 10.0, 24.0, 18.0, 34.0, 39.0, 67.0, 91.0, 120.0, 206.0, 380.0, 724.0, 1863.0, 6650.0, 54050.0, 915498.0, 58082.0, 6965.0, 1833.0, 751.0, 387.0, 227.0, 152.0, 92.0, 54.0, 49.0, 30.0, 35.0, 18.0, 8.0, 17.0, 12.0, 6.0, 5.0, 8.0, 2.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-10.1015625, -9.781005859375, -9.46044921875, -9.139892578125, -8.8193359375, -8.498779296875, -8.17822265625, -7.857666015625, -7.537109375, -7.216552734375, -6.89599609375, -6.575439453125, -6.2548828125, -5.934326171875, -5.61376953125, -5.293212890625, -4.97265625, -4.652099609375, -4.33154296875, -4.010986328125, -3.6904296875, -3.369873046875, -3.04931640625, -2.728759765625, -2.408203125, -2.087646484375, -1.76708984375, -1.446533203125, -1.1259765625, -0.805419921875, -0.48486328125, -0.164306640625, 0.15625, 0.476806640625, 0.79736328125, 1.117919921875, 1.4384765625, 1.759033203125, 2.07958984375, 2.400146484375, 2.720703125, 3.041259765625, 3.36181640625, 3.682373046875, 4.0029296875, 4.323486328125, 4.64404296875, 4.964599609375, 5.28515625, 5.605712890625, 5.92626953125, 6.246826171875, 6.5673828125, 6.887939453125, 7.20849609375, 7.529052734375, 7.849609375, 8.170166015625, 8.49072265625, 8.811279296875, 9.1318359375, 9.452392578125, 9.77294921875, 10.093505859375, 10.4140625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 4.0, 5.0, 9.0, 6.0, 10.0, 7.0, 15.0, 11.0, 25.0, 27.0, 29.0, 35.0, 34.0, 44.0, 49.0, 65.0, 72.0, 90.0, 76.0, 63.0, 49.0, 49.0, 47.0, 35.0, 32.0, 22.0, 21.0, 20.0, 14.0, 14.0, 4.0, 6.0, 8.0, 4.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.21875, -17.576904296875, -16.93505859375, -16.293212890625, -15.6513671875, -15.009521484375, -14.36767578125, -13.725830078125, -13.083984375, -12.442138671875, -11.80029296875, -11.158447265625, -10.5166015625, -9.874755859375, -9.23291015625, -8.591064453125, -7.94921875, -7.307373046875, -6.66552734375, -6.023681640625, -5.3818359375, -4.739990234375, -4.09814453125, -3.456298828125, -2.814453125, -2.172607421875, -1.53076171875, -0.888916015625, -0.2470703125, 0.394775390625, 1.03662109375, 1.678466796875, 2.3203125, 2.962158203125, 3.60400390625, 4.245849609375, 4.8876953125, 5.529541015625, 6.17138671875, 6.813232421875, 7.455078125, 8.096923828125, 8.73876953125, 9.380615234375, 10.0224609375, 10.664306640625, 11.30615234375, 11.947998046875, 12.58984375, 13.231689453125, 13.87353515625, 14.515380859375, 15.1572265625, 15.799072265625, 16.44091796875, 17.082763671875, 17.724609375, 18.366455078125, 19.00830078125, 19.650146484375, 20.2919921875, 20.933837890625, 21.57568359375, 22.217529296875, 22.859375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 3.0, 2.0, 2.0, 6.0, 5.0, 11.0, 14.0, 20.0, 34.0, 60.0, 95.0, 203.0, 448.0, 1210.0, 5101.0, 55131.0, 957649.0, 23786.0, 3183.0, 835.0, 328.0, 155.0, 108.0, 57.0, 39.0, 19.0, 23.0, 9.0, 10.0, 3.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.884765625, -2.7864990234375, -2.688232421875, -2.5899658203125, -2.49169921875, -2.3934326171875, -2.295166015625, -2.1968994140625, -2.0986328125, -2.0003662109375, -1.902099609375, -1.8038330078125, -1.70556640625, -1.6072998046875, -1.509033203125, -1.4107666015625, -1.3125, -1.2142333984375, -1.115966796875, -1.0177001953125, -0.91943359375, -0.8211669921875, -0.722900390625, -0.6246337890625, -0.5263671875, -0.4281005859375, -0.329833984375, -0.2315673828125, -0.13330078125, -0.0350341796875, 0.063232421875, 0.1614990234375, 0.259765625, 0.3580322265625, 0.456298828125, 0.5545654296875, 0.65283203125, 0.7510986328125, 0.849365234375, 0.9476318359375, 1.0458984375, 1.1441650390625, 1.242431640625, 1.3406982421875, 1.43896484375, 1.5372314453125, 1.635498046875, 1.7337646484375, 1.83203125, 1.9302978515625, 2.028564453125, 2.1268310546875, 2.22509765625, 2.3233642578125, 2.421630859375, 2.5198974609375, 2.6181640625, 2.7164306640625, 2.814697265625, 2.9129638671875, 3.01123046875, 3.1094970703125, 3.207763671875, 3.3060302734375, 3.404296875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 4.0, 6.0, 7.0, 12.0, 10.0, 18.0, 23.0, 50.0, 57.0, 148.0, 229.0, 192.0, 92.0, 40.0, 35.0, 21.0, 10.0, 8.0, 9.0, 4.0, 11.0, 2.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007281303405761719, -0.0007044821977615356, -0.0006808340549468994, -0.0006571859121322632, -0.000633537769317627, -0.0006098896265029907, -0.0005862414836883545, -0.0005625933408737183, -0.000538945198059082, -0.0005152970552444458, -0.0004916489124298096, -0.00046800076961517334, -0.0004443526268005371, -0.0004207044839859009, -0.00039705634117126465, -0.0003734081983566284, -0.0003497600555419922, -0.00032611191272735596, -0.0003024637699127197, -0.0002788156270980835, -0.00025516748428344727, -0.00023151934146881104, -0.0002078711986541748, -0.00018422305583953857, -0.00016057491302490234, -0.0001369267702102661, -0.00011327862739562988, -8.963048458099365e-05, -6.598234176635742e-05, -4.233419895172119e-05, -1.868605613708496e-05, 4.9620866775512695e-06, 2.86102294921875e-05, 5.225837230682373e-05, 7.590651512145996e-05, 9.955465793609619e-05, 0.00012320280075073242, 0.00014685094356536865, 0.00017049908638000488, 0.0001941472291946411, 0.00021779537200927734, 0.00024144351482391357, 0.0002650916576385498, 0.00028873980045318604, 0.00031238794326782227, 0.0003360360860824585, 0.0003596842288970947, 0.00038333237171173096, 0.0004069805145263672, 0.0004306286573410034, 0.00045427680015563965, 0.0004779249429702759, 0.0005015730857849121, 0.0005252212285995483, 0.0005488693714141846, 0.0005725175142288208, 0.000596165657043457, 0.0006198137998580933, 0.0006434619426727295, 0.0006671100854873657, 0.000690758228302002, 0.0007144063711166382, 0.0007380545139312744, 0.0007617026567459106, 0.0007853507995605469]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 8.0, 11.0, 20.0, 29.0, 45.0, 72.0, 154.0, 295.0, 630.0, 1556.0, 5149.0, 24820.0, 828984.0, 165490.0, 15387.0, 3644.0, 1190.0, 492.0, 232.0, 134.0, 69.0, 50.0, 28.0, 17.0, 16.0, 14.0, 5.0, 5.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.390625, -2.31317138671875, -2.2357177734375, -2.15826416015625, -2.080810546875, -2.00335693359375, -1.9259033203125, -1.84844970703125, -1.77099609375, -1.69354248046875, -1.6160888671875, -1.53863525390625, -1.461181640625, -1.38372802734375, -1.3062744140625, -1.22882080078125, -1.1513671875, -1.07391357421875, -0.9964599609375, -0.91900634765625, -0.841552734375, -0.76409912109375, -0.6866455078125, -0.60919189453125, -0.53173828125, -0.45428466796875, -0.3768310546875, -0.29937744140625, -0.221923828125, -0.14447021484375, -0.0670166015625, 0.01043701171875, 0.087890625, 0.16534423828125, 0.2427978515625, 0.32025146484375, 0.397705078125, 0.47515869140625, 0.5526123046875, 0.63006591796875, 0.70751953125, 0.78497314453125, 0.8624267578125, 0.93988037109375, 1.017333984375, 1.09478759765625, 1.1722412109375, 1.24969482421875, 1.3271484375, 1.40460205078125, 1.4820556640625, 1.55950927734375, 1.636962890625, 1.71441650390625, 1.7918701171875, 1.86932373046875, 1.94677734375, 2.02423095703125, 2.1016845703125, 2.17913818359375, 2.256591796875, 2.33404541015625, 2.4114990234375, 2.48895263671875, 2.56640625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 5.0, 2.0, 7.0, 3.0, 6.0, 12.0, 11.0, 11.0, 15.0, 20.0, 22.0, 29.0, 44.0, 58.0, 99.0, 131.0, 108.0, 118.0, 73.0, 63.0, 31.0, 24.0, 21.0, 16.0, 19.0, 8.0, 12.0, 5.0, 8.0, 8.0, 6.0, 5.0, 4.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.6259765625, -1.5701141357421875, -1.514251708984375, -1.4583892822265625, -1.40252685546875, -1.3466644287109375, -1.290802001953125, -1.2349395751953125, -1.1790771484375, -1.1232147216796875, -1.067352294921875, -1.0114898681640625, -0.95562744140625, -0.8997650146484375, -0.843902587890625, -0.7880401611328125, -0.732177734375, -0.6763153076171875, -0.620452880859375, -0.5645904541015625, -0.50872802734375, -0.4528656005859375, -0.397003173828125, -0.3411407470703125, -0.2852783203125, -0.2294158935546875, -0.173553466796875, -0.1176910400390625, -0.06182861328125, -0.0059661865234375, 0.049896240234375, 0.1057586669921875, 0.16162109375, 0.2174835205078125, 0.273345947265625, 0.3292083740234375, 0.38507080078125, 0.4409332275390625, 0.496795654296875, 0.5526580810546875, 0.6085205078125, 0.6643829345703125, 0.720245361328125, 0.7761077880859375, 0.83197021484375, 0.8878326416015625, 0.943695068359375, 0.9995574951171875, 1.055419921875, 1.1112823486328125, 1.167144775390625, 1.2230072021484375, 1.27886962890625, 1.3347320556640625, 1.390594482421875, 1.4464569091796875, 1.5023193359375, 1.5581817626953125, 1.614044189453125, 1.6699066162109375, 1.72576904296875, 1.7816314697265625, 1.837493896484375, 1.8933563232421875, 1.94921875]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 14.0, 29.0, 76.0, 190.0, 498.0, 99.0, 40.0, 24.0, 9.0, 3.0, 5.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.94486999511719, -46.84848403930664, -43.752098083496094, -40.65570831298828, -37.559322357177734, -34.46293640136719, -31.36655044555664, -28.27016258239746, -25.173776626586914, -22.077390670776367, -18.981002807617188, -15.88461685180664, -12.788229942321777, -9.691843032836914, -6.595457077026367, -3.4990692138671875, -0.4026832580566406, 2.6937034130096436, 5.790090084075928, 8.886476516723633, 11.982863426208496, 15.07925033569336, 18.175636291503906, 21.272024154663086, 24.368410110473633, 27.46479606628418, 30.56118392944336, 33.657569885253906, 36.75395584106445, 39.850341796875, 42.94673156738281, 46.04311752319336, 49.139503479003906, 52.23588943481445, 55.332275390625, 58.42866516113281, 61.52505111694336, 64.6214370727539, 67.71781921386719, 70.814208984375, 73.91059875488281, 77.00698852539062, 80.1033706665039, 83.19976043701172, 86.296142578125, 89.39253234863281, 92.48892211914062, 95.5853042602539, 98.68168640136719, 101.778076171875, 104.87445831298828, 107.9708480834961, 111.06723022460938, 114.16361999511719, 117.260009765625, 120.35639190673828, 123.4527816772461, 126.5491714477539, 129.6455535888672, 132.741943359375, 135.8383331298828, 138.93472290039062, 142.03109741210938, 145.1274871826172, 148.223876953125]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 9.0, 15.0, 22.0, 27.0, 43.0, 49.0, 91.0, 390.0, 134.0, 56.0, 40.0, 36.0, 36.0, 18.0, 6.0, 10.0, 5.0, 7.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-132.80511474609375, -129.36587524414062, -125.9266357421875, -122.48739624023438, -119.04815673828125, -115.60891723632812, -112.169677734375, -108.73043823242188, -105.29119873046875, -101.85195922851562, -98.4127197265625, -94.97348022460938, -91.53424072265625, -88.09500122070312, -84.65576171875, -81.21652221679688, -77.77729034423828, -74.33805084228516, -70.89881134033203, -67.4595718383789, -64.02033233642578, -60.581092834472656, -57.1418571472168, -53.70261764526367, -50.26337814331055, -46.82413864135742, -43.3848991394043, -39.94566345214844, -36.50642395019531, -33.06718444824219, -29.627944946289062, -26.188705444335938, -22.749465942382812, -19.310226440429688, -15.870987892150879, -12.43174934387207, -8.992509841918945, -5.55327033996582, -2.114032745361328, 1.3252067565917969, 4.764446258544922, 8.203685760498047, 11.642924308776855, 15.082162857055664, 18.52140235900879, 21.960641860961914, 25.399879455566406, 28.83911895751953, 32.278358459472656, 35.71759796142578, 39.156837463378906, 42.59607696533203, 46.035316467285156, 49.47455596923828, 52.91379165649414, 56.353031158447266, 59.79227066040039, 63.231510162353516, 66.67074584960938, 70.1099853515625, 73.54922485351562, 76.98846435546875, 80.42770385742188, 83.866943359375, 87.30618286132812]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 1.0, 4.0, 8.0, 6.0, 11.0, 12.0, 17.0, 35.0, 32.0, 59.0, 54.0, 123.0, 294.0, 67.0, 74.0, 55.0, 30.0, 30.0, 28.0, 16.0, 9.0, 12.0, 8.0, 5.0, 1.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.375, -7.1539306640625, -6.932861328125, -6.7117919921875, -6.49072265625, -6.2696533203125, -6.048583984375, -5.8275146484375, -5.6064453125, -5.3853759765625, -5.164306640625, -4.9432373046875, -4.72216796875, -4.5010986328125, -4.280029296875, -4.0589599609375, -3.837890625, -3.6168212890625, -3.395751953125, -3.1746826171875, -2.95361328125, -2.7325439453125, -2.511474609375, -2.2904052734375, -2.0693359375, -1.8482666015625, -1.627197265625, -1.4061279296875, -1.18505859375, -0.9639892578125, -0.742919921875, -0.5218505859375, -0.30078125, -0.0797119140625, 0.141357421875, 0.3624267578125, 0.58349609375, 0.8045654296875, 1.025634765625, 1.2467041015625, 1.4677734375, 1.6888427734375, 1.909912109375, 2.1309814453125, 2.35205078125, 2.5731201171875, 2.794189453125, 3.0152587890625, 3.236328125, 3.4573974609375, 3.678466796875, 3.8995361328125, 4.12060546875, 4.3416748046875, 4.562744140625, 4.7838134765625, 5.0048828125, 5.2259521484375, 5.447021484375, 5.6680908203125, 5.88916015625, 6.1102294921875, 6.331298828125, 6.5523681640625, 6.7734375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 11.0, 5.0, 1.0, 6.0, 15.0, 16.0, 28.0, 32.0, 96.0, 139.0, 316.0, 1561.0, 22387.0, 8358579.0, 4280.0, 658.0, 214.0, 71.0, 58.0, 44.0, 17.0, 10.0, 14.0, 8.0, 10.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 6.0], "bins": [-73.26998138427734, -70.76465606689453, -68.25933837890625, -65.75401306152344, -63.248695373535156, -60.74337387084961, -58.23805236816406, -55.73272705078125, -53.22740936279297, -50.72208786010742, -48.216766357421875, -45.71144485473633, -43.20612335205078, -40.700801849365234, -38.19548034667969, -35.690155029296875, -33.18483352661133, -30.67951202392578, -28.174190521240234, -25.668869018554688, -23.16354751586914, -20.658226013183594, -18.152902603149414, -15.647581100463867, -13.14225959777832, -10.636938095092773, -8.131616592407227, -5.626294136047363, -3.1209726333618164, -0.6156511306762695, 1.8896713256835938, 4.394992828369141, 6.9003143310546875, 9.405635833740234, 11.910957336425781, 14.416279792785645, 16.921600341796875, 19.426921844482422, 21.9322452545166, 24.43756675720215, 26.942888259887695, 29.448209762573242, 31.95353126525879, 34.45885467529297, 36.964176177978516, 39.46949768066406, 41.97481918334961, 44.480140686035156, 46.9854621887207, 49.49078369140625, 51.9961051940918, 54.501426696777344, 57.00674819946289, 59.51206970214844, 62.01739501953125, 64.52271270751953, 67.02803802490234, 69.53336334228516, 72.03868103027344, 74.54400634765625, 77.04932403564453, 79.55464935302734, 82.05996704101562, 84.56529235839844, 87.07061004638672]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 2.0, 4.0, 7.0, 2.0, 5.0, 4.0, 7.0, 2.0, 5.0, 3.0, 1.0, 6.0, 3.0, 4.0, 3.0, 5.0, 2.0, 5.0, 6.0, 3.0, 1.0, 3.0, 1.0, 5.0, 2.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.47355651855469, -63.188907623291016, -60.904258728027344, -58.61960983276367, -56.3349609375, -54.05030822753906, -51.76565933227539, -49.48101043701172, -47.19636154174805, -44.911712646484375, -42.6270637512207, -40.34241485595703, -38.057762145996094, -35.77311706542969, -33.48846435546875, -31.203815460205078, -28.919166564941406, -26.634517669677734, -24.349868774414062, -22.065217971801758, -19.780569076538086, -17.495920181274414, -15.211270332336426, -12.926620483398438, -10.641971588134766, -8.357322692871094, -6.0726728439331055, -3.7880234718322754, -1.5033740997314453, 0.7812747955322266, 3.065924644470215, 5.350574493408203, 7.635231018066406, 9.919879913330078, 12.204529762268066, 14.489179611206055, 16.773828506469727, 19.0584774017334, 21.343128204345703, 23.627777099609375, 25.912425994873047, 28.19707489013672, 30.48172378540039, 32.76637268066406, 35.051025390625, 37.335670471191406, 39.620323181152344, 41.904972076416016, 44.18962097167969, 46.47426986694336, 48.75891876220703, 51.0435676574707, 53.328216552734375, 55.61286926269531, 57.897518157958984, 60.182167053222656, 62.46681594848633, 64.75146484375, 67.03611755371094, 69.32076263427734, 71.60541534423828, 73.89006042480469, 76.17471313476562, 78.45936584472656, 80.74401092529297]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 9.0, 13.0, 7.0, 6.0, 15.0, 26.0, 29.0, 41.0, 54.0, 81.0, 96.0, 123.0, 111.0, 104.0, 82.0, 65.0, 45.0, 29.0, 24.0, 22.0, 12.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.16796875, -3.069976806640625, -2.97198486328125, -2.873992919921875, -2.7760009765625, -2.678009033203125, -2.58001708984375, -2.482025146484375, -2.384033203125, -2.286041259765625, -2.18804931640625, -2.090057373046875, -1.9920654296875, -1.894073486328125, -1.79608154296875, -1.698089599609375, -1.60009765625, -1.502105712890625, -1.40411376953125, -1.306121826171875, -1.2081298828125, -1.110137939453125, -1.01214599609375, -0.914154052734375, -0.816162109375, -0.718170166015625, -0.62017822265625, -0.522186279296875, -0.4241943359375, -0.326202392578125, -0.22821044921875, -0.130218505859375, -0.0322265625, 0.065765380859375, 0.16375732421875, 0.261749267578125, 0.3597412109375, 0.457733154296875, 0.55572509765625, 0.653717041015625, 0.751708984375, 0.849700927734375, 0.94769287109375, 1.045684814453125, 1.1436767578125, 1.241668701171875, 1.33966064453125, 1.437652587890625, 1.53564453125, 1.633636474609375, 1.73162841796875, 1.829620361328125, 1.9276123046875, 2.025604248046875, 2.12359619140625, 2.221588134765625, 2.319580078125, 2.417572021484375, 2.51556396484375, 2.613555908203125, 2.7115478515625, 2.809539794921875, 2.90753173828125, 3.005523681640625, 3.103515625]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 6.0, 1.0, 3.0, 11.0, 10.0, 16.0, 14.0, 20.0, 43.0, 104.0, 160.0, 342.0, 757.0, 2190.0, 7876.0, 43583.0, 252545.0, 180232.0, 27736.0, 5566.0, 1754.0, 670.0, 301.0, 150.0, 69.0, 53.0, 22.0, 9.0, 7.0, 8.0, 4.0, 1.0, 2.0], "bins": [-80.875, -79.18603515625, -77.4970703125, -75.80810546875, -74.119140625, -72.43017578125, -70.7412109375, -69.05224609375, -67.36328125, -65.67431640625, -63.9853515625, -62.29638671875, -60.607421875, -58.91845703125, -57.2294921875, -55.54052734375, -53.8515625, -52.16259765625, -50.4736328125, -48.78466796875, -47.095703125, -45.40673828125, -43.7177734375, -42.02880859375, -40.33984375, -38.65087890625, -36.9619140625, -35.27294921875, -33.583984375, -31.89501953125, -30.2060546875, -28.51708984375, -26.828125, -25.13916015625, -23.4501953125, -21.76123046875, -20.072265625, -18.38330078125, -16.6943359375, -15.00537109375, -13.31640625, -11.62744140625, -9.9384765625, -8.24951171875, -6.560546875, -4.87158203125, -3.1826171875, -1.49365234375, 0.1953125, 1.88427734375, 3.5732421875, 5.26220703125, 6.951171875, 8.64013671875, 10.3291015625, 12.01806640625, 13.70703125, 15.39599609375, 17.0849609375, 18.77392578125, 20.462890625, 22.15185546875, 23.8408203125, 25.52978515625, 27.21875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 0.0, 7.0, 4.0, 8.0, 21.0, 22.0, 26.0, 33.0, 48.0, 53.0, 97.0, 87.0, 91.0, 114.0, 80.0, 72.0, 65.0, 39.0, 38.0, 27.0, 19.0, 17.0, 11.0, 7.0, 6.0, 3.0, 1.0, 1.0, 5.0, 1.0, 3.0, 1.0], "bins": [-10.8671875, -10.62615966796875, -10.3851318359375, -10.14410400390625, -9.903076171875, -9.66204833984375, -9.4210205078125, -9.17999267578125, -8.93896484375, -8.69793701171875, -8.4569091796875, -8.21588134765625, -7.974853515625, -7.73382568359375, -7.4927978515625, -7.25177001953125, -7.0107421875, -6.76971435546875, -6.5286865234375, -6.28765869140625, -6.046630859375, -5.80560302734375, -5.5645751953125, -5.32354736328125, -5.08251953125, -4.84149169921875, -4.6004638671875, -4.35943603515625, -4.118408203125, -3.87738037109375, -3.6363525390625, -3.39532470703125, -3.154296875, -2.91326904296875, -2.6722412109375, -2.43121337890625, -2.190185546875, -1.94915771484375, -1.7081298828125, -1.46710205078125, -1.22607421875, -0.98504638671875, -0.7440185546875, -0.50299072265625, -0.261962890625, -0.02093505859375, 0.2200927734375, 0.46112060546875, 0.7021484375, 0.94317626953125, 1.1842041015625, 1.42523193359375, 1.666259765625, 1.90728759765625, 2.1483154296875, 2.38934326171875, 2.63037109375, 2.87139892578125, 3.1124267578125, 3.35345458984375, 3.594482421875, 3.83551025390625, 4.0765380859375, 4.31756591796875, 4.55859375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 7.0, 5.0, 8.0, 18.0, 28.0, 38.0, 68.0, 75.0, 72.0, 66.0, 30.0, 19.0, 14.0, 3.0, 7.0, 5.0, 7.0, 1.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.89596176147461, -31.626115798950195, -30.356271743774414, -29.08642578125, -27.81658172607422, -26.546735763549805, -25.27688980102539, -24.00704574584961, -22.737199783325195, -21.46735382080078, -20.197509765625, -18.927663803100586, -17.657817840576172, -16.38797378540039, -15.118127822875977, -13.848282814025879, -12.578437805175781, -11.308592796325684, -10.038747787475586, -8.768901824951172, -7.499056816101074, -6.229211807250977, -4.959366321563721, -3.689520835876465, -2.419675827026367, -1.1498305797576904, 0.12001466751098633, 1.389859914779663, 2.65970516204834, 3.9295501708984375, 5.199395656585693, 6.469241142272949, 7.7390899658203125, 9.00893497467041, 10.278779983520508, 11.548625946044922, 12.81847095489502, 14.088315963745117, 15.358161926269531, 16.628005981445312, 17.897851943969727, 19.16769790649414, 20.437541961669922, 21.707387924194336, 22.97723388671875, 24.24707794189453, 25.516923904418945, 26.78676986694336, 28.05661392211914, 29.326459884643555, 30.596303939819336, 31.86614990234375, 33.13599395751953, 34.40583801269531, 35.67568588256836, 36.94552993774414, 38.21537780761719, 39.48522186279297, 40.755069732666016, 42.0249137878418, 43.29475784301758, 44.564605712890625, 45.834449768066406, 47.10429382324219, 48.37413787841797]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 3.0, 2.0, 5.0, 3.0, 8.0, 10.0, 20.0, 22.0, 32.0, 58.0, 67.0, 76.0, 51.0, 36.0, 27.0, 17.0, 14.0, 10.0, 5.0, 3.0, 6.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-34.92654800415039, -33.86155700683594, -32.79656982421875, -31.73158073425293, -30.66659164428711, -29.60160255432129, -28.53661346435547, -27.47162437438965, -26.406635284423828, -25.341646194458008, -24.276657104492188, -23.211668014526367, -22.146678924560547, -21.081689834594727, -20.016700744628906, -18.951711654663086, -17.886722564697266, -16.821733474731445, -15.756744384765625, -14.691755294799805, -13.626766204833984, -12.561777114868164, -11.496788024902344, -10.431798934936523, -9.366809844970703, -8.301820755004883, -7.2368316650390625, -6.171842575073242, -5.106853485107422, -4.041864395141602, -2.9768753051757812, -1.911886215209961, -0.846893310546875, 0.2180957794189453, 1.2830848693847656, 2.348073959350586, 3.4130630493164062, 4.478052139282227, 5.543041229248047, 6.608030319213867, 7.6730194091796875, 8.738008499145508, 9.802997589111328, 10.867986679077148, 11.932975769042969, 12.997964859008789, 14.06295394897461, 15.12794303894043, 16.19293212890625, 17.25792121887207, 18.32291030883789, 19.38789939880371, 20.45288848876953, 21.51787757873535, 22.582866668701172, 23.647855758666992, 24.712844848632812, 25.777833938598633, 26.842823028564453, 27.907812118530273, 28.972801208496094, 30.037790298461914, 31.102779388427734, 32.16777038574219, 33.232757568359375]}, "eval/loss": 5.443604946136475, "eval/wer": 1.5227687425624752, "eval/runtime": 664.731, "eval/samples_per_second": 3.975, "eval/steps_per_second": 0.498} \ No newline at end of file