diff --git "a/wandb/run-20220323_165914-1vl16ira/files/wandb-summary.json" "b/wandb/run-20220323_165914-1vl16ira/files/wandb-summary.json" --- "a/wandb/run-20220323_165914-1vl16ira/files/wandb-summary.json" +++ "b/wandb/run-20220323_165914-1vl16ira/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 0.0607, "train/learning_rate": 6.936416184971098e-07, "train/epoch": 5.0, "train/global_step": 2230, "_runtime": 27450, "_timestamp": 1648082204, "_step": 2235, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 9.0, 68.0, 378.0, 461.0, 73.0, 23.0, 5.0], "bins": [-18.02739143371582, -17.72731590270996, -17.4272403717041, -17.127166748046875, -16.827091217041016, -16.527015686035156, -16.226940155029297, -15.926865577697754, -15.626791000366211, -15.326715469360352, -15.026640892028809, -14.72656536102295, -14.426490783691406, -14.126415252685547, -13.826340675354004, -13.526265144348145, -13.226189613342285, -12.926114082336426, -12.626039505004883, -12.325963973999023, -12.02588939666748, -11.725813865661621, -11.425739288330078, -11.125663757324219, -10.82558822631836, -10.5255126953125, -10.225438117980957, -9.925362586975098, -9.625288009643555, -9.325212478637695, -9.025137901306152, -8.725062370300293, -8.42498779296875, -8.12491226196289, -7.824837684631348, -7.5247626304626465, -7.224687576293945, -6.924612045288086, -6.624536991119385, -6.324461936950684, -6.024386882781982, -5.724311828613281, -5.42423677444458, -5.124161720275879, -4.8240861892700195, -4.524011611938477, -4.223936080932617, -3.923861026763916, -3.623785972595215, -3.3237109184265137, -3.0236358642578125, -2.7235605716705322, -2.423485517501831, -2.12341046333313, -1.8233352899551392, -1.5232601165771484, -1.2231850624084473, -0.9231099486351013, -0.6230348348617554, -0.3229597210884094, -0.022884607315063477, 0.2771904468536377, 0.5772656202316284, 0.8773407936096191, 1.1774158477783203]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 5.0, 5.0, 4.0, 11.0, 14.0, 14.0, 20.0, 26.0, 20.0, 29.0, 30.0, 47.0, 41.0, 36.0, 27.0, 36.0, 39.0, 42.0, 64.0, 43.0, 57.0, 43.0, 37.0, 54.0, 40.0, 31.0, 31.0, 27.0, 24.0, 22.0, 22.0, 21.0, 7.0, 10.0, 10.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.5585064888000488, -1.5144308805465698, -1.4703552722930908, -1.4262796640396118, -1.3822040557861328, -1.3381283283233643, -1.2940528392791748, -1.2499771118164062, -1.2059015035629272, -1.1618258953094482, -1.1177502870559692, -1.0736746788024902, -1.0295990705490112, -0.9855234026908875, -0.9414477944374084, -0.8973721265792847, -0.8532965779304504, -0.8092209696769714, -0.7651453614234924, -0.7210696935653687, -0.6769940853118896, -0.6329184770584106, -0.5888428688049316, -0.5447672605514526, -0.5006916522979736, -0.45661604404449463, -0.41254040598869324, -0.36846479773521423, -0.32438915967941284, -0.28031355142593384, -0.23623794317245483, -0.19216230511665344, -0.14808666706085205, -0.10401104390621185, -0.05993542820215225, -0.01585981249809265, 0.028215810656547546, 0.07229143381118774, 0.11636704206466675, 0.16044268012046814, 0.20451828837394714, 0.24859391152858734, 0.29266953468322754, 0.33674514293670654, 0.38082075119018555, 0.42489638924598694, 0.46897199749946594, 0.5130476355552673, 0.5571232438087463, 0.6011988520622253, 0.6452744603157043, 0.6893501281738281, 0.7334257364273071, 0.7775013446807861, 0.8215769529342651, 0.8656525611877441, 0.9097281694412231, 0.9538037776947021, 0.9978793859481812, 1.0419549942016602, 1.0860306024551392, 1.1301062107086182, 1.1741819381713867, 1.2182575464248657, 1.2623331546783447]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 3.0, 2.0, 5.0, 3.0, 5.0, 15.0, 18.0, 25.0, 39.0, 64.0, 77.0, 122.0, 168.0, 265.0, 409.0, 597.0, 977.0, 1516.0, 2377.0, 3912.0, 7508.0, 26892.0, 350221.0, 3272449.0, 467680.0, 39875.0, 8556.0, 4066.0, 2386.0, 1466.0, 911.0, 571.0, 376.0, 238.0, 168.0, 115.0, 81.0, 39.0, 27.0, 22.0, 20.0, 7.0, 7.0, 2.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.64453125, -4.497314453125, -4.35009765625, -4.202880859375, -4.0556640625, -3.908447265625, -3.76123046875, -3.614013671875, -3.466796875, -3.319580078125, -3.17236328125, -3.025146484375, -2.8779296875, -2.730712890625, -2.58349609375, -2.436279296875, -2.2890625, -2.141845703125, -1.99462890625, -1.847412109375, -1.7001953125, -1.552978515625, -1.40576171875, -1.258544921875, -1.111328125, -0.964111328125, -0.81689453125, -0.669677734375, -0.5224609375, -0.375244140625, -0.22802734375, -0.080810546875, 0.06640625, 0.213623046875, 0.36083984375, 0.508056640625, 0.6552734375, 0.802490234375, 0.94970703125, 1.096923828125, 1.244140625, 1.391357421875, 1.53857421875, 1.685791015625, 1.8330078125, 1.980224609375, 2.12744140625, 2.274658203125, 2.421875, 2.569091796875, 2.71630859375, 2.863525390625, 3.0107421875, 3.157958984375, 3.30517578125, 3.452392578125, 3.599609375, 3.746826171875, 3.89404296875, 4.041259765625, 4.1884765625, 4.335693359375, 4.48291015625, 4.630126953125, 4.77734375]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 5.0, 6.0, 4.0, 8.0, 8.0, 12.0, 9.0, 15.0, 17.0, 23.0, 21.0, 27.0, 31.0, 29.0, 33.0, 34.0, 27.0, 40.0, 35.0, 35.0, 55.0, 54.0, 52.0, 42.0, 45.0, 38.0, 34.0, 50.0, 24.0, 26.0, 26.0, 29.0, 12.0, 17.0, 22.0, 13.0, 6.0, 10.0, 7.0, 10.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0], "bins": [-2.458984375, -2.390777587890625, -2.32257080078125, -2.254364013671875, -2.1861572265625, -2.117950439453125, -2.04974365234375, -1.981536865234375, -1.913330078125, -1.845123291015625, -1.77691650390625, -1.708709716796875, -1.6405029296875, -1.572296142578125, -1.50408935546875, -1.435882568359375, -1.36767578125, -1.299468994140625, -1.23126220703125, -1.163055419921875, -1.0948486328125, -1.026641845703125, -0.95843505859375, -0.890228271484375, -0.822021484375, -0.753814697265625, -0.68560791015625, -0.617401123046875, -0.5491943359375, -0.480987548828125, -0.41278076171875, -0.344573974609375, -0.2763671875, -0.208160400390625, -0.13995361328125, -0.071746826171875, -0.0035400390625, 0.064666748046875, 0.13287353515625, 0.201080322265625, 0.269287109375, 0.337493896484375, 0.40570068359375, 0.473907470703125, 0.5421142578125, 0.610321044921875, 0.67852783203125, 0.746734619140625, 0.81494140625, 0.883148193359375, 0.95135498046875, 1.019561767578125, 1.0877685546875, 1.155975341796875, 1.22418212890625, 1.292388916015625, 1.360595703125, 1.428802490234375, 1.49700927734375, 1.565216064453125, 1.6334228515625, 1.701629638671875, 1.76983642578125, 1.838043212890625, 1.90625]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 5.0, 7.0, 10.0, 21.0, 21.0, 29.0, 86.0, 312.0, 6910.0, 4183939.0, 2593.0, 203.0, 59.0, 28.0, 21.0, 15.0, 9.0, 3.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-51.5, -50.001953125, -48.50390625, -47.005859375, -45.5078125, -44.009765625, -42.51171875, -41.013671875, -39.515625, -38.017578125, -36.51953125, -35.021484375, -33.5234375, -32.025390625, -30.52734375, -29.029296875, -27.53125, -26.033203125, -24.53515625, -23.037109375, -21.5390625, -20.041015625, -18.54296875, -17.044921875, -15.546875, -14.048828125, -12.55078125, -11.052734375, -9.5546875, -8.056640625, -6.55859375, -5.060546875, -3.5625, -2.064453125, -0.56640625, 0.931640625, 2.4296875, 3.927734375, 5.42578125, 6.923828125, 8.421875, 9.919921875, 11.41796875, 12.916015625, 14.4140625, 15.912109375, 17.41015625, 18.908203125, 20.40625, 21.904296875, 23.40234375, 24.900390625, 26.3984375, 27.896484375, 29.39453125, 30.892578125, 32.390625, 33.888671875, 35.38671875, 36.884765625, 38.3828125, 39.880859375, 41.37890625, 42.876953125, 44.375]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 8.0, 9.0, 20.0, 16.0, 29.0, 66.0, 144.0, 864.0, 2344.0, 370.0, 80.0, 45.0, 16.0, 23.0, 14.0, 7.0, 5.0, 4.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.607421875, -2.533538818359375, -2.45965576171875, -2.385772705078125, -2.3118896484375, -2.238006591796875, -2.16412353515625, -2.090240478515625, -2.016357421875, -1.942474365234375, -1.86859130859375, -1.794708251953125, -1.7208251953125, -1.646942138671875, -1.57305908203125, -1.499176025390625, -1.42529296875, -1.351409912109375, -1.27752685546875, -1.203643798828125, -1.1297607421875, -1.055877685546875, -0.98199462890625, -0.908111572265625, -0.834228515625, -0.760345458984375, -0.68646240234375, -0.612579345703125, -0.5386962890625, -0.464813232421875, -0.39093017578125, -0.317047119140625, -0.2431640625, -0.169281005859375, -0.09539794921875, -0.021514892578125, 0.0523681640625, 0.126251220703125, 0.20013427734375, 0.274017333984375, 0.347900390625, 0.421783447265625, 0.49566650390625, 0.569549560546875, 0.6434326171875, 0.717315673828125, 0.79119873046875, 0.865081787109375, 0.93896484375, 1.012847900390625, 1.08673095703125, 1.160614013671875, 1.2344970703125, 1.308380126953125, 1.38226318359375, 1.456146240234375, 1.530029296875, 1.603912353515625, 1.67779541015625, 1.751678466796875, 1.8255615234375, 1.899444580078125, 1.97332763671875, 2.047210693359375, 2.12109375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 5.0, 7.0, 6.0, 2.0, 4.0, 8.0, 13.0, 14.0, 20.0, 23.0, 24.0, 29.0, 54.0, 62.0, 87.0, 85.0, 102.0, 96.0, 86.0, 60.0, 49.0, 35.0, 28.0, 20.0, 25.0, 10.0, 12.0, 6.0, 5.0, 8.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.95149827003479, -2.8608500957489014, -2.7702019214630127, -2.679553985595703, -2.5889058113098145, -2.498257637023926, -2.407609462738037, -2.3169612884521484, -2.2263131141662598, -2.135664939880371, -2.0450167655944824, -1.9543687105178833, -1.8637206554412842, -1.7730724811553955, -1.6824243068695068, -1.5917761325836182, -1.5011281967163086, -1.41048002243042, -1.3198319673538208, -1.2291837930679321, -1.138535737991333, -1.0478875637054443, -0.9572393894195557, -0.8665912747383118, -0.7759431600570679, -0.685295045375824, -0.5946469306945801, -0.5039987564086914, -0.4133506417274475, -0.3227025270462036, -0.23205435276031494, -0.14140623807907104, -0.05075812339782715, 0.03989000618457794, 0.13053813576698303, 0.22118628025054932, 0.3118343949317932, 0.4024825096130371, 0.4931306838989258, 0.5837787985801697, 0.6744269132614136, 0.7650750279426575, 0.8557231426239014, 0.94637131690979, 1.0370194911956787, 1.1276675462722778, 1.2183157205581665, 1.3089637756347656, 1.3996119499206543, 1.490260124206543, 1.580908179283142, 1.6715563535690308, 1.7622044086456299, 1.8528525829315186, 1.9435007572174072, 2.034148931503296, 2.1247968673706055, 2.215445041656494, 2.306093215942383, 2.3967413902282715, 2.487389326095581, 2.5780375003814697, 2.6686856746673584, 2.759333848953247, 2.8499820232391357]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 5.0, 4.0, 4.0, 1.0, 5.0, 9.0, 6.0, 12.0, 13.0, 15.0, 19.0, 20.0, 22.0, 32.0, 32.0, 28.0, 35.0, 31.0, 33.0, 36.0, 44.0, 40.0, 29.0, 58.0, 43.0, 46.0, 36.0, 34.0, 40.0, 33.0, 30.0, 26.0, 21.0, 26.0, 20.0, 18.0, 20.0, 18.0, 9.0, 15.0, 8.0, 10.0, 7.0, 3.0, 5.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.039533853530884, -1.9769076108932495, -1.9142814874649048, -1.8516552448272705, -1.7890291213989258, -1.7264028787612915, -1.6637766361236572, -1.6011505126953125, -1.5385242700576782, -1.475898027420044, -1.4132719039916992, -1.350645661354065, -1.2880194187164307, -1.225393295288086, -1.1627670526504517, -1.1001408100128174, -1.0375146865844727, -0.9748885035514832, -0.9122623205184937, -0.8496360778808594, -0.7870098948478699, -0.7243837118148804, -0.6617574691772461, -0.5991312861442566, -0.5365051031112671, -0.4738789200782776, -0.4112527072429657, -0.3486264944076538, -0.2860003113746643, -0.2233741283416748, -0.16074791550636292, -0.09812170267105103, -0.03549528121948242, 0.027130916714668274, 0.08975711464881897, 0.15238331258296967, 0.21500951051712036, 0.27763569355010986, 0.34026190638542175, 0.40288811922073364, 0.46551430225372314, 0.5281404852867126, 0.5907666683197021, 0.6533929109573364, 0.7160190939903259, 0.7786452770233154, 0.8412715196609497, 0.9038977026939392, 0.9665238857269287, 1.029150128364563, 1.0917762517929077, 1.154402494430542, 1.2170286178588867, 1.279654860496521, 1.3422811031341553, 1.4049072265625, 1.4675334692001343, 1.5301597118377686, 1.5927858352661133, 1.6554120779037476, 1.7180383205413818, 1.7806644439697266, 1.8432906866073608, 1.9059169292449951, 1.9685430526733398]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 8.0, 8.0, 13.0, 12.0, 19.0, 36.0, 41.0, 56.0, 86.0, 116.0, 169.0, 263.0, 363.0, 556.0, 840.0, 1318.0, 2252.0, 3521.0, 6272.0, 11190.0, 21637.0, 44246.0, 99651.0, 244308.0, 335984.0, 148025.0, 63239.0, 29368.0, 14888.0, 8000.0, 4501.0, 2753.0, 1727.0, 1051.0, 682.0, 442.0, 298.0, 176.0, 135.0, 94.0, 63.0, 46.0, 39.0, 23.0, 16.0, 11.0, 11.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.708984375, -0.6876449584960938, -0.6663055419921875, -0.6449661254882812, -0.623626708984375, -0.6022872924804688, -0.5809478759765625, -0.5596084594726562, -0.53826904296875, -0.5169296264648438, -0.4955902099609375, -0.47425079345703125, -0.452911376953125, -0.43157196044921875, -0.4102325439453125, -0.38889312744140625, -0.3675537109375, -0.34621429443359375, -0.3248748779296875, -0.30353546142578125, -0.282196044921875, -0.26085662841796875, -0.2395172119140625, -0.21817779541015625, -0.19683837890625, -0.17549896240234375, -0.1541595458984375, -0.13282012939453125, -0.111480712890625, -0.09014129638671875, -0.0688018798828125, -0.04746246337890625, -0.026123046875, -0.00478363037109375, 0.0165557861328125, 0.03789520263671875, 0.059234619140625, 0.08057403564453125, 0.1019134521484375, 0.12325286865234375, 0.14459228515625, 0.16593170166015625, 0.1872711181640625, 0.20861053466796875, 0.229949951171875, 0.25128936767578125, 0.2726287841796875, 0.29396820068359375, 0.3153076171875, 0.33664703369140625, 0.3579864501953125, 0.37932586669921875, 0.400665283203125, 0.42200469970703125, 0.4433441162109375, 0.46468353271484375, 0.48602294921875, 0.5073623657226562, 0.5287017822265625, 0.5500411987304688, 0.571380615234375, 0.5927200317382812, 0.6140594482421875, 0.6353988647460938, 0.65673828125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 3.0, 2.0, 4.0, 6.0, 7.0, 22.0, 9.0, 18.0, 14.0, 19.0, 39.0, 32.0, 31.0, 30.0, 41.0, 42.0, 52.0, 53.0, 45.0, 48.0, 65.0, 56.0, 41.0, 54.0, 32.0, 40.0, 24.0, 37.0, 10.0, 19.0, 18.0, 17.0, 16.0, 18.0, 12.0, 5.0, 9.0, 4.0, 1.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8525390625, -1.7936248779296875, -1.734710693359375, -1.6757965087890625, -1.61688232421875, -1.5579681396484375, -1.499053955078125, -1.4401397705078125, -1.3812255859375, -1.3223114013671875, -1.263397216796875, -1.2044830322265625, -1.14556884765625, -1.0866546630859375, -1.027740478515625, -0.9688262939453125, -0.909912109375, -0.8509979248046875, -0.792083740234375, -0.7331695556640625, -0.67425537109375, -0.6153411865234375, -0.556427001953125, -0.4975128173828125, -0.4385986328125, -0.3796844482421875, -0.320770263671875, -0.2618560791015625, -0.20294189453125, -0.1440277099609375, -0.085113525390625, -0.0261993408203125, 0.03271484375, 0.0916290283203125, 0.150543212890625, 0.2094573974609375, 0.26837158203125, 0.3272857666015625, 0.386199951171875, 0.4451141357421875, 0.5040283203125, 0.5629425048828125, 0.621856689453125, 0.6807708740234375, 0.73968505859375, 0.7985992431640625, 0.857513427734375, 0.9164276123046875, 0.975341796875, 1.0342559814453125, 1.093170166015625, 1.1520843505859375, 1.21099853515625, 1.2699127197265625, 1.328826904296875, 1.3877410888671875, 1.4466552734375, 1.5055694580078125, 1.564483642578125, 1.6233978271484375, 1.68231201171875, 1.7412261962890625, 1.800140380859375, 1.8590545654296875, 1.91796875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 2.0, 7.0, 5.0, 6.0, 5.0, 8.0, 14.0, 16.0, 34.0, 42.0, 48.0, 80.0, 104.0, 115.0, 207.0, 283.0, 366.0, 585.0, 890.0, 1314.0, 2122.0, 3317.0, 5547.0, 10256.0, 21772.0, 56196.0, 187567.0, 465487.0, 187973.0, 56884.0, 21818.0, 10281.0, 5666.0, 3281.0, 2050.0, 1350.0, 884.0, 591.0, 455.0, 271.0, 169.0, 132.0, 92.0, 66.0, 57.0, 36.0, 26.0, 27.0, 22.0, 8.0, 7.0, 8.0, 6.0, 6.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.70849609375, -0.6852645874023438, -0.6620330810546875, -0.6388015747070312, -0.615570068359375, -0.5923385620117188, -0.5691070556640625, -0.5458755493164062, -0.52264404296875, -0.49941253662109375, -0.4761810302734375, -0.45294952392578125, -0.429718017578125, -0.40648651123046875, -0.3832550048828125, -0.36002349853515625, -0.3367919921875, -0.31356048583984375, -0.2903289794921875, -0.26709747314453125, -0.243865966796875, -0.22063446044921875, -0.1974029541015625, -0.17417144775390625, -0.15093994140625, -0.12770843505859375, -0.1044769287109375, -0.08124542236328125, -0.058013916015625, -0.03478240966796875, -0.0115509033203125, 0.01168060302734375, 0.034912109375, 0.05814361572265625, 0.0813751220703125, 0.10460662841796875, 0.127838134765625, 0.15106964111328125, 0.1743011474609375, 0.19753265380859375, 0.22076416015625, 0.24399566650390625, 0.2672271728515625, 0.29045867919921875, 0.313690185546875, 0.33692169189453125, 0.3601531982421875, 0.38338470458984375, 0.4066162109375, 0.42984771728515625, 0.4530792236328125, 0.47631072998046875, 0.499542236328125, 0.5227737426757812, 0.5460052490234375, 0.5692367553710938, 0.59246826171875, 0.6156997680664062, 0.6389312744140625, 0.6621627807617188, 0.685394287109375, 0.7086257934570312, 0.7318572998046875, 0.7550888061523438, 0.7783203125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 1.0, 4.0, 6.0, 5.0, 7.0, 7.0, 6.0, 12.0, 12.0, 20.0, 16.0, 7.0, 22.0, 28.0, 39.0, 35.0, 30.0, 56.0, 34.0, 43.0, 49.0, 45.0, 39.0, 41.0, 43.0, 51.0, 32.0, 50.0, 40.0, 23.0, 25.0, 24.0, 27.0, 18.0, 9.0, 19.0, 11.0, 14.0, 12.0, 12.0, 4.0, 5.0, 7.0, 6.0, 6.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.44921875, -3.3392333984375, -3.229248046875, -3.1192626953125, -3.00927734375, -2.8992919921875, -2.789306640625, -2.6793212890625, -2.5693359375, -2.4593505859375, -2.349365234375, -2.2393798828125, -2.12939453125, -2.0194091796875, -1.909423828125, -1.7994384765625, -1.689453125, -1.5794677734375, -1.469482421875, -1.3594970703125, -1.24951171875, -1.1395263671875, -1.029541015625, -0.9195556640625, -0.8095703125, -0.6995849609375, -0.589599609375, -0.4796142578125, -0.36962890625, -0.2596435546875, -0.149658203125, -0.0396728515625, 0.0703125, 0.1802978515625, 0.290283203125, 0.4002685546875, 0.51025390625, 0.6202392578125, 0.730224609375, 0.8402099609375, 0.9501953125, 1.0601806640625, 1.170166015625, 1.2801513671875, 1.39013671875, 1.5001220703125, 1.610107421875, 1.7200927734375, 1.830078125, 1.9400634765625, 2.050048828125, 2.1600341796875, 2.27001953125, 2.3800048828125, 2.489990234375, 2.5999755859375, 2.7099609375, 2.8199462890625, 2.929931640625, 3.0399169921875, 3.14990234375, 3.2598876953125, 3.369873046875, 3.4798583984375, 3.58984375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 9.0, 5.0, 14.0, 18.0, 23.0, 37.0, 57.0, 74.0, 125.0, 217.0, 385.0, 715.0, 1460.0, 3476.0, 10271.0, 44002.0, 572482.0, 365937.0, 34546.0, 8662.0, 3029.0, 1363.0, 666.0, 366.0, 205.0, 133.0, 82.0, 61.0, 39.0, 29.0, 21.0, 17.0, 8.0, 6.0, 4.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.338134765625, -0.326446533203125, -0.31475830078125, -0.303070068359375, -0.2913818359375, -0.279693603515625, -0.26800537109375, -0.256317138671875, -0.24462890625, -0.232940673828125, -0.22125244140625, -0.209564208984375, -0.1978759765625, -0.186187744140625, -0.17449951171875, -0.162811279296875, -0.151123046875, -0.139434814453125, -0.12774658203125, -0.116058349609375, -0.1043701171875, -0.092681884765625, -0.08099365234375, -0.069305419921875, -0.0576171875, -0.045928955078125, -0.03424072265625, -0.022552490234375, -0.0108642578125, 0.000823974609375, 0.01251220703125, 0.024200439453125, 0.035888671875, 0.047576904296875, 0.05926513671875, 0.070953369140625, 0.0826416015625, 0.094329833984375, 0.10601806640625, 0.117706298828125, 0.12939453125, 0.141082763671875, 0.15277099609375, 0.164459228515625, 0.1761474609375, 0.187835693359375, 0.19952392578125, 0.211212158203125, 0.222900390625, 0.234588623046875, 0.24627685546875, 0.257965087890625, 0.2696533203125, 0.281341552734375, 0.29302978515625, 0.304718017578125, 0.31640625, 0.328094482421875, 0.33978271484375, 0.351470947265625, 0.3631591796875, 0.374847412109375, 0.38653564453125, 0.398223876953125, 0.409912109375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 3.0, 9.0, 3.0, 6.0, 10.0, 17.0, 14.0, 41.0, 69.0, 100.0, 209.0, 223.0, 124.0, 60.0, 39.0, 24.0, 12.0, 10.0, 10.0, 4.0, 6.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002739429473876953, -0.0002659037709236145, -0.0002578645944595337, -0.0002498254179954529, -0.00024178624153137207, -0.00023374706506729126, -0.00022570788860321045, -0.00021766871213912964, -0.00020962953567504883, -0.00020159035921096802, -0.0001935511827468872, -0.0001855120062828064, -0.00017747282981872559, -0.00016943365335464478, -0.00016139447689056396, -0.00015335530042648315, -0.00014531612396240234, -0.00013727694749832153, -0.00012923777103424072, -0.00012119859457015991, -0.0001131594181060791, -0.00010512024164199829, -9.708106517791748e-05, -8.904188871383667e-05, -8.100271224975586e-05, -7.296353578567505e-05, -6.492435932159424e-05, -5.688518285751343e-05, -4.884600639343262e-05, -4.080682992935181e-05, -3.2767653465270996e-05, -2.4728477001190186e-05, -1.6689300537109375e-05, -8.650124073028564e-06, -6.109476089477539e-07, 7.428228855133057e-06, 1.5467405319213867e-05, 2.3506581783294678e-05, 3.154575824737549e-05, 3.95849347114563e-05, 4.762411117553711e-05, 5.566328763961792e-05, 6.370246410369873e-05, 7.174164056777954e-05, 7.978081703186035e-05, 8.781999349594116e-05, 9.585916996002197e-05, 0.00010389834642410278, 0.0001119375228881836, 0.0001199766993522644, 0.00012801587581634521, 0.00013605505228042603, 0.00014409422874450684, 0.00015213340520858765, 0.00016017258167266846, 0.00016821175813674927, 0.00017625093460083008, 0.0001842901110649109, 0.0001923292875289917, 0.0002003684639930725, 0.00020840764045715332, 0.00021644681692123413, 0.00022448599338531494, 0.00023252516984939575, 0.00024056434631347656]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 5.0, 10.0, 6.0, 12.0, 27.0, 44.0, 101.0, 160.0, 367.0, 973.0, 2628.0, 9675.0, 47184.0, 656701.0, 291334.0, 29329.0, 6594.0, 2026.0, 759.0, 324.0, 131.0, 66.0, 35.0, 11.0, 12.0, 12.0, 10.0, 3.0, 6.0, 1.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.67333984375, -0.6534576416015625, -0.633575439453125, -0.6136932373046875, -0.59381103515625, -0.5739288330078125, -0.554046630859375, -0.5341644287109375, -0.5142822265625, -0.4944000244140625, -0.474517822265625, -0.4546356201171875, -0.43475341796875, -0.4148712158203125, -0.394989013671875, -0.3751068115234375, -0.355224609375, -0.3353424072265625, -0.315460205078125, -0.2955780029296875, -0.27569580078125, -0.2558135986328125, -0.235931396484375, -0.2160491943359375, -0.1961669921875, -0.1762847900390625, -0.156402587890625, -0.1365203857421875, -0.11663818359375, -0.0967559814453125, -0.076873779296875, -0.0569915771484375, -0.037109375, -0.0172271728515625, 0.002655029296875, 0.0225372314453125, 0.04241943359375, 0.0623016357421875, 0.082183837890625, 0.1020660400390625, 0.1219482421875, 0.1418304443359375, 0.161712646484375, 0.1815948486328125, 0.20147705078125, 0.2213592529296875, 0.241241455078125, 0.2611236572265625, 0.281005859375, 0.3008880615234375, 0.320770263671875, 0.3406524658203125, 0.36053466796875, 0.3804168701171875, 0.400299072265625, 0.4201812744140625, 0.4400634765625, 0.4599456787109375, 0.479827880859375, 0.4997100830078125, 0.51959228515625, 0.5394744873046875, 0.559356689453125, 0.5792388916015625, 0.59912109375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 1.0, 7.0, 5.0, 2.0, 4.0, 13.0, 18.0, 20.0, 29.0, 28.0, 34.0, 47.0, 67.0, 99.0, 104.0, 140.0, 93.0, 73.0, 52.0, 45.0, 26.0, 28.0, 10.0, 13.0, 8.0, 6.0, 7.0, 8.0, 3.0, 3.0, 2.0, 3.0, 1.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.137939453125, -0.13399505615234375, -0.1300506591796875, -0.12610626220703125, -0.122161865234375, -0.11821746826171875, -0.1142730712890625, -0.11032867431640625, -0.10638427734375, -0.10243988037109375, -0.0984954833984375, -0.09455108642578125, -0.090606689453125, -0.08666229248046875, -0.0827178955078125, -0.07877349853515625, -0.0748291015625, -0.07088470458984375, -0.0669403076171875, -0.06299591064453125, -0.059051513671875, -0.05510711669921875, -0.0511627197265625, -0.04721832275390625, -0.04327392578125, -0.03932952880859375, -0.0353851318359375, -0.03144073486328125, -0.027496337890625, -0.02355194091796875, -0.0196075439453125, -0.01566314697265625, -0.01171875, -0.00777435302734375, -0.0038299560546875, 0.00011444091796875, 0.004058837890625, 0.00800323486328125, 0.0119476318359375, 0.01589202880859375, 0.01983642578125, 0.02378082275390625, 0.0277252197265625, 0.03166961669921875, 0.035614013671875, 0.03955841064453125, 0.0435028076171875, 0.04744720458984375, 0.0513916015625, 0.05533599853515625, 0.0592803955078125, 0.06322479248046875, 0.067169189453125, 0.07111358642578125, 0.0750579833984375, 0.07900238037109375, 0.08294677734375, 0.08689117431640625, 0.0908355712890625, 0.09477996826171875, 0.098724365234375, 0.10266876220703125, 0.1066131591796875, 0.11055755615234375, 0.114501953125]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 9.0, 11.0, 11.0, 9.0, 12.0, 26.0, 34.0, 40.0, 72.0, 86.0, 120.0, 145.0, 113.0, 87.0, 56.0, 42.0, 36.0, 20.0, 17.0, 12.0, 7.0, 8.0, 7.0, 3.0, 3.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.930957317352295, -2.8432822227478027, -2.7556071281433105, -2.6679320335388184, -2.580256938934326, -2.492581844329834, -2.404906749725342, -2.3172316551208496, -2.2295565605163574, -2.1418814659118652, -2.054206371307373, -1.9665312767028809, -1.8788561820983887, -1.7911810874938965, -1.7035058736801147, -1.6158307790756226, -1.5281555652618408, -1.4404804706573486, -1.3528053760528564, -1.2651302814483643, -1.177455186843872, -1.0897800922393799, -1.0021048784255981, -0.914429783821106, -0.8267546892166138, -0.7390795946121216, -0.6514045000076294, -0.5637293457984924, -0.47605425119400024, -0.38837915658950806, -0.3007040023803711, -0.2130289077758789, -0.12535405158996582, -0.03767894208431244, 0.04999616742134094, 0.13767129182815552, 0.2253463864326477, 0.3130214810371399, 0.40069663524627686, 0.48837172985076904, 0.5760468244552612, 0.6637219190597534, 0.7513970136642456, 0.8390721678733826, 0.9267472624778748, 1.0144224166870117, 1.102097511291504, 1.189772605895996, 1.2774477005004883, 1.3651227951049805, 1.4527978897094727, 1.5404729843139648, 1.628148078918457, 1.7158231735229492, 1.803498387336731, 1.8911734819412231, 1.9788485765457153, 2.066523790359497, 2.1541988849639893, 2.2418739795684814, 2.3295490741729736, 2.417224168777466, 2.504899263381958, 2.59257435798645, 2.6802494525909424]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 5.0, 0.0, 1.0, 10.0, 3.0, 7.0, 14.0, 15.0, 20.0, 16.0, 24.0, 33.0, 26.0, 43.0, 31.0, 44.0, 41.0, 38.0, 47.0, 45.0, 64.0, 50.0, 49.0, 47.0, 42.0, 40.0, 38.0, 23.0, 31.0, 19.0, 18.0, 27.0, 22.0, 23.0, 13.0, 8.0, 5.0, 10.0, 1.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.7804385423660278, -1.7255982160568237, -1.67075777053833, -1.615917444229126, -1.5610769987106323, -1.5062366724014282, -1.4513962268829346, -1.3965559005737305, -1.3417155742645264, -1.2868752479553223, -1.2320348024368286, -1.1771944761276245, -1.1223540306091309, -1.0675137042999268, -1.0126733779907227, -0.957832932472229, -0.9029924869537354, -0.8481521010398865, -0.7933117151260376, -0.7384713888168335, -0.6836309432983398, -0.6287906169891357, -0.5739502310752869, -0.519109845161438, -0.4642694592475891, -0.40942907333374023, -0.35458868741989136, -0.29974833130836487, -0.244907945394516, -0.19006755948066711, -0.13522720336914062, -0.08038681745529175, -0.02554631233215332, 0.02929406613111496, 0.08413444459438324, 0.13897481560707092, 0.1938152015209198, 0.24865558743476868, 0.30349594354629517, 0.35833632946014404, 0.4131767153739929, 0.4680171012878418, 0.5228574872016907, 0.5776978731155396, 0.6325381994247437, 0.6873786449432373, 0.7422189712524414, 0.7970593571662903, 0.8518997430801392, 0.906740128993988, 0.9615805149078369, 1.016420841217041, 1.0712612867355347, 1.1261016130447388, 1.1809420585632324, 1.2357823848724365, 1.2906227111816406, 1.3454630374908447, 1.4003034830093384, 1.4551438093185425, 1.5099842548370361, 1.5648245811462402, 1.6196649074554443, 1.674505352973938, 1.7293457984924316]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 3.0, 5.0, 6.0, 9.0, 10.0, 17.0, 20.0, 28.0, 56.0, 58.0, 104.0, 147.0, 251.0, 434.0, 601.0, 1047.0, 1671.0, 2732.0, 4621.0, 7970.0, 15159.0, 34077.0, 167967.0, 690710.0, 69267.0, 24022.0, 11784.0, 6347.0, 3722.0, 2156.0, 1356.0, 808.0, 493.0, 323.0, 174.0, 141.0, 101.0, 47.0, 30.0, 22.0, 12.0, 14.0, 10.0, 9.0, 6.0, 3.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.21875, -2.152099609375, -2.08544921875, -2.018798828125, -1.9521484375, -1.885498046875, -1.81884765625, -1.752197265625, -1.685546875, -1.618896484375, -1.55224609375, -1.485595703125, -1.4189453125, -1.352294921875, -1.28564453125, -1.218994140625, -1.15234375, -1.085693359375, -1.01904296875, -0.952392578125, -0.8857421875, -0.819091796875, -0.75244140625, -0.685791015625, -0.619140625, -0.552490234375, -0.48583984375, -0.419189453125, -0.3525390625, -0.285888671875, -0.21923828125, -0.152587890625, -0.0859375, -0.019287109375, 0.04736328125, 0.114013671875, 0.1806640625, 0.247314453125, 0.31396484375, 0.380615234375, 0.447265625, 0.513916015625, 0.58056640625, 0.647216796875, 0.7138671875, 0.780517578125, 0.84716796875, 0.913818359375, 0.98046875, 1.047119140625, 1.11376953125, 1.180419921875, 1.2470703125, 1.313720703125, 1.38037109375, 1.447021484375, 1.513671875, 1.580322265625, 1.64697265625, 1.713623046875, 1.7802734375, 1.846923828125, 1.91357421875, 1.980224609375, 2.046875]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 5.0, 4.0, 2.0, 7.0, 7.0, 5.0, 9.0, 10.0, 12.0, 16.0, 15.0, 23.0, 23.0, 24.0, 17.0, 33.0, 40.0, 25.0, 27.0, 31.0, 54.0, 42.0, 51.0, 41.0, 51.0, 45.0, 37.0, 39.0, 40.0, 28.0, 26.0, 25.0, 24.0, 21.0, 22.0, 13.0, 28.0, 18.0, 16.0, 15.0, 6.0, 11.0, 2.0, 6.0, 5.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0], "bins": [-3.05859375, -2.9703369140625, -2.882080078125, -2.7938232421875, -2.70556640625, -2.6173095703125, -2.529052734375, -2.4407958984375, -2.3525390625, -2.2642822265625, -2.176025390625, -2.0877685546875, -1.99951171875, -1.9112548828125, -1.822998046875, -1.7347412109375, -1.646484375, -1.5582275390625, -1.469970703125, -1.3817138671875, -1.29345703125, -1.2052001953125, -1.116943359375, -1.0286865234375, -0.9404296875, -0.8521728515625, -0.763916015625, -0.6756591796875, -0.58740234375, -0.4991455078125, -0.410888671875, -0.3226318359375, -0.234375, -0.1461181640625, -0.057861328125, 0.0303955078125, 0.11865234375, 0.2069091796875, 0.295166015625, 0.3834228515625, 0.4716796875, 0.5599365234375, 0.648193359375, 0.7364501953125, 0.82470703125, 0.9129638671875, 1.001220703125, 1.0894775390625, 1.177734375, 1.2659912109375, 1.354248046875, 1.4425048828125, 1.53076171875, 1.6190185546875, 1.707275390625, 1.7955322265625, 1.8837890625, 1.9720458984375, 2.060302734375, 2.1485595703125, 2.23681640625, 2.3250732421875, 2.413330078125, 2.5015869140625, 2.58984375]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 7.0, 11.0, 20.0, 16.0, 17.0, 25.0, 38.0, 56.0, 72.0, 100.0, 123.0, 210.0, 323.0, 536.0, 907.0, 1728.0, 3448.0, 7046.0, 16164.0, 47933.0, 506600.0, 390783.0, 43192.0, 15279.0, 6607.0, 3126.0, 1684.0, 955.0, 544.0, 324.0, 219.0, 114.0, 88.0, 68.0, 49.0, 41.0, 23.0, 19.0, 13.0, 11.0, 11.0, 7.0, 3.0, 3.0, 1.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.21875, -2.1470947265625, -2.075439453125, -2.0037841796875, -1.93212890625, -1.8604736328125, -1.788818359375, -1.7171630859375, -1.6455078125, -1.5738525390625, -1.502197265625, -1.4305419921875, -1.35888671875, -1.2872314453125, -1.215576171875, -1.1439208984375, -1.072265625, -1.0006103515625, -0.928955078125, -0.8572998046875, -0.78564453125, -0.7139892578125, -0.642333984375, -0.5706787109375, -0.4990234375, -0.4273681640625, -0.355712890625, -0.2840576171875, -0.21240234375, -0.1407470703125, -0.069091796875, 0.0025634765625, 0.07421875, 0.1458740234375, 0.217529296875, 0.2891845703125, 0.36083984375, 0.4324951171875, 0.504150390625, 0.5758056640625, 0.6474609375, 0.7191162109375, 0.790771484375, 0.8624267578125, 0.93408203125, 1.0057373046875, 1.077392578125, 1.1490478515625, 1.220703125, 1.2923583984375, 1.364013671875, 1.4356689453125, 1.50732421875, 1.5789794921875, 1.650634765625, 1.7222900390625, 1.7939453125, 1.8656005859375, 1.937255859375, 2.0089111328125, 2.08056640625, 2.1522216796875, 2.223876953125, 2.2955322265625, 2.3671875]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 4.0, 6.0, 4.0, 5.0, 7.0, 12.0, 8.0, 13.0, 19.0, 9.0, 20.0, 15.0, 25.0, 37.0, 32.0, 30.0, 30.0, 45.0, 51.0, 35.0, 43.0, 42.0, 41.0, 53.0, 30.0, 36.0, 45.0, 33.0, 32.0, 25.0, 33.0, 22.0, 28.0, 25.0, 24.0, 16.0, 9.0, 7.0, 11.0, 15.0, 5.0, 6.0, 3.0, 4.0, 6.0, 3.0, 4.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.12890625, -3.03497314453125, -2.9410400390625, -2.84710693359375, -2.753173828125, -2.65924072265625, -2.5653076171875, -2.47137451171875, -2.37744140625, -2.28350830078125, -2.1895751953125, -2.09564208984375, -2.001708984375, -1.90777587890625, -1.8138427734375, -1.71990966796875, -1.6259765625, -1.53204345703125, -1.4381103515625, -1.34417724609375, -1.250244140625, -1.15631103515625, -1.0623779296875, -0.96844482421875, -0.87451171875, -0.78057861328125, -0.6866455078125, -0.59271240234375, -0.498779296875, -0.40484619140625, -0.3109130859375, -0.21697998046875, -0.123046875, -0.02911376953125, 0.0648193359375, 0.15875244140625, 0.252685546875, 0.34661865234375, 0.4405517578125, 0.53448486328125, 0.62841796875, 0.72235107421875, 0.8162841796875, 0.91021728515625, 1.004150390625, 1.09808349609375, 1.1920166015625, 1.28594970703125, 1.3798828125, 1.47381591796875, 1.5677490234375, 1.66168212890625, 1.755615234375, 1.84954833984375, 1.9434814453125, 2.03741455078125, 2.13134765625, 2.22528076171875, 2.3192138671875, 2.41314697265625, 2.507080078125, 2.60101318359375, 2.6949462890625, 2.78887939453125, 2.8828125]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 6.0, 5.0, 15.0, 18.0, 14.0, 24.0, 38.0, 58.0, 59.0, 97.0, 151.0, 253.0, 451.0, 800.0, 1596.0, 2942.0, 6542.0, 21353.0, 933773.0, 60981.0, 10562.0, 4107.0, 2112.0, 1085.0, 590.0, 333.0, 187.0, 114.0, 76.0, 54.0, 50.0, 36.0, 23.0, 15.0, 7.0, 7.0, 7.0, 4.0, 2.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.130859375, -2.065765380859375, -2.00067138671875, -1.935577392578125, -1.8704833984375, -1.805389404296875, -1.74029541015625, -1.675201416015625, -1.610107421875, -1.545013427734375, -1.47991943359375, -1.414825439453125, -1.3497314453125, -1.284637451171875, -1.21954345703125, -1.154449462890625, -1.08935546875, -1.024261474609375, -0.95916748046875, -0.894073486328125, -0.8289794921875, -0.763885498046875, -0.69879150390625, -0.633697509765625, -0.568603515625, -0.503509521484375, -0.43841552734375, -0.373321533203125, -0.3082275390625, -0.243133544921875, -0.17803955078125, -0.112945556640625, -0.0478515625, 0.017242431640625, 0.08233642578125, 0.147430419921875, 0.2125244140625, 0.277618408203125, 0.34271240234375, 0.407806396484375, 0.472900390625, 0.537994384765625, 0.60308837890625, 0.668182373046875, 0.7332763671875, 0.798370361328125, 0.86346435546875, 0.928558349609375, 0.99365234375, 1.058746337890625, 1.12384033203125, 1.188934326171875, 1.2540283203125, 1.319122314453125, 1.38421630859375, 1.449310302734375, 1.514404296875, 1.579498291015625, 1.64459228515625, 1.709686279296875, 1.7747802734375, 1.839874267578125, 1.90496826171875, 1.970062255859375, 2.03515625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 8.0, 3.0, 2.0, 8.0, 12.0, 46.0, 333.0, 500.0, 33.0, 16.0, 11.0, 7.0, 7.0, 2.0, 7.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000331878662109375, -0.00031444430351257324, -0.0002970099449157715, -0.0002795755863189697, -0.00026214122772216797, -0.0002447068691253662, -0.00022727251052856445, -0.0002098381519317627, -0.00019240379333496094, -0.00017496943473815918, -0.00015753507614135742, -0.00014010071754455566, -0.0001226663589477539, -0.00010523200035095215, -8.779764175415039e-05, -7.036328315734863e-05, -5.2928924560546875e-05, -3.549456596374512e-05, -1.806020736694336e-05, -6.258487701416016e-07, 1.6808509826660156e-05, 3.4242868423461914e-05, 5.167722702026367e-05, 6.911158561706543e-05, 8.654594421386719e-05, 0.00010398030281066895, 0.0001214146614074707, 0.00013884902000427246, 0.00015628337860107422, 0.00017371773719787598, 0.00019115209579467773, 0.0002085864543914795, 0.00022602081298828125, 0.000243455171585083, 0.00026088953018188477, 0.0002783238887786865, 0.0002957582473754883, 0.00031319260597229004, 0.0003306269645690918, 0.00034806132316589355, 0.0003654956817626953, 0.00038293004035949707, 0.00040036439895629883, 0.0004177987575531006, 0.00043523311614990234, 0.0004526674747467041, 0.00047010183334350586, 0.0004875361919403076, 0.0005049705505371094, 0.0005224049091339111, 0.0005398392677307129, 0.0005572736263275146, 0.0005747079849243164, 0.0005921423435211182, 0.0006095767021179199, 0.0006270110607147217, 0.0006444454193115234, 0.0006618797779083252, 0.000679314136505127, 0.0006967484951019287, 0.0007141828536987305, 0.0007316172122955322, 0.000749051570892334, 0.0007664859294891357, 0.0007839202880859375]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 4.0, 13.0, 12.0, 21.0, 28.0, 47.0, 70.0, 81.0, 141.0, 182.0, 267.0, 414.0, 679.0, 1077.0, 1869.0, 3831.0, 10748.0, 126518.0, 876760.0, 15522.0, 4696.0, 2179.0, 1199.0, 746.0, 488.0, 293.0, 199.0, 145.0, 103.0, 62.0, 55.0, 34.0, 25.0, 20.0, 10.0, 6.0, 4.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.857421875, -1.79364013671875, -1.7298583984375, -1.66607666015625, -1.602294921875, -1.53851318359375, -1.4747314453125, -1.41094970703125, -1.34716796875, -1.28338623046875, -1.2196044921875, -1.15582275390625, -1.092041015625, -1.02825927734375, -0.9644775390625, -0.90069580078125, -0.8369140625, -0.77313232421875, -0.7093505859375, -0.64556884765625, -0.581787109375, -0.51800537109375, -0.4542236328125, -0.39044189453125, -0.32666015625, -0.26287841796875, -0.1990966796875, -0.13531494140625, -0.071533203125, -0.00775146484375, 0.0560302734375, 0.11981201171875, 0.18359375, 0.24737548828125, 0.3111572265625, 0.37493896484375, 0.438720703125, 0.50250244140625, 0.5662841796875, 0.63006591796875, 0.69384765625, 0.75762939453125, 0.8214111328125, 0.88519287109375, 0.948974609375, 1.01275634765625, 1.0765380859375, 1.14031982421875, 1.2041015625, 1.26788330078125, 1.3316650390625, 1.39544677734375, 1.459228515625, 1.52301025390625, 1.5867919921875, 1.65057373046875, 1.71435546875, 1.77813720703125, 1.8419189453125, 1.90570068359375, 1.969482421875, 2.03326416015625, 2.0970458984375, 2.16082763671875, 2.224609375]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 2.0, 3.0, 3.0, 5.0, 5.0, 7.0, 14.0, 24.0, 41.0, 286.0, 473.0, 72.0, 25.0, 16.0, 7.0, 8.0, 6.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.974609375, -0.941131591796875, -0.90765380859375, -0.874176025390625, -0.8406982421875, -0.807220458984375, -0.77374267578125, -0.740264892578125, -0.706787109375, -0.673309326171875, -0.63983154296875, -0.606353759765625, -0.5728759765625, -0.539398193359375, -0.50592041015625, -0.472442626953125, -0.43896484375, -0.405487060546875, -0.37200927734375, -0.338531494140625, -0.3050537109375, -0.271575927734375, -0.23809814453125, -0.204620361328125, -0.171142578125, -0.137664794921875, -0.10418701171875, -0.070709228515625, -0.0372314453125, -0.003753662109375, 0.02972412109375, 0.063201904296875, 0.0966796875, 0.130157470703125, 0.16363525390625, 0.197113037109375, 0.2305908203125, 0.264068603515625, 0.29754638671875, 0.331024169921875, 0.364501953125, 0.397979736328125, 0.43145751953125, 0.464935302734375, 0.4984130859375, 0.531890869140625, 0.56536865234375, 0.598846435546875, 0.63232421875, 0.665802001953125, 0.69927978515625, 0.732757568359375, 0.7662353515625, 0.799713134765625, 0.83319091796875, 0.866668701171875, 0.900146484375, 0.933624267578125, 0.96710205078125, 1.000579833984375, 1.0340576171875, 1.067535400390625, 1.10101318359375, 1.134490966796875, 1.16796875]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 31.0, 811.0, 173.0, 7.0], "bins": [-150.4115753173828, -147.9746856689453, -145.5377960205078, -143.1009063720703, -140.6640167236328, -138.2271270751953, -135.7902374267578, -133.3533477783203, -130.9164581298828, -128.4795684814453, -126.04267883300781, -123.60578918457031, -121.16889953613281, -118.73200988769531, -116.29512023925781, -113.85823059082031, -111.42134094238281, -108.98445129394531, -106.54756164550781, -104.11067199707031, -101.67378234863281, -99.23689270019531, -96.80000305175781, -94.36311340332031, -91.92621612548828, -89.48932647705078, -87.05243682861328, -84.61554718017578, -82.17865753173828, -79.74176788330078, -77.30487823486328, -74.86798858642578, -72.43109130859375, -69.99420166015625, -67.55731201171875, -65.12042236328125, -62.68353271484375, -60.24664306640625, -57.80975341796875, -55.37286376953125, -52.93597412109375, -50.49908447265625, -48.06219482421875, -45.62530517578125, -43.18841552734375, -40.75152587890625, -38.31463623046875, -35.87774658203125, -33.440853118896484, -31.003963470458984, -28.567073822021484, -26.130184173583984, -23.693294525146484, -21.256404876708984, -18.81951332092285, -16.38262367248535, -13.945734977722168, -11.508845329284668, -9.071954727172852, -6.635065078735352, -4.198175430297852, -1.7612857818603516, 0.6756048202514648, 3.112494468688965, 5.549384117126465]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 4.0, 5.0, 0.0, 8.0, 7.0, 12.0, 16.0, 15.0, 20.0, 23.0, 21.0, 25.0, 31.0, 30.0, 33.0, 21.0, 29.0, 40.0, 35.0, 39.0, 46.0, 34.0, 39.0, 51.0, 37.0, 33.0, 34.0, 35.0, 29.0, 39.0, 34.0, 22.0, 25.0, 18.0, 21.0, 15.0, 19.0, 9.0, 18.0, 10.0, 5.0, 6.0, 3.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.3116960525512695, -5.159384727478027, -5.007073402404785, -4.854762554168701, -4.702451229095459, -4.550139904022217, -4.397828578948975, -4.245517253875732, -4.093206405639648, -3.9408950805664062, -3.788583993911743, -3.636272668838501, -3.483961582183838, -3.3316502571105957, -3.1793389320373535, -3.0270276069641113, -2.874716281890869, -2.722404956817627, -2.570093870162964, -2.4177825450897217, -2.2654714584350586, -2.1131601333618164, -1.9608488082885742, -1.8085376024246216, -1.656226396560669, -1.5039151906967163, -1.3516039848327637, -1.1992926597595215, -1.0469814538955688, -0.8946702480316162, -0.7423589825630188, -0.5900477170944214, -0.43773651123046875, -0.2854252755641937, -0.1331140398979187, 0.019197195768356323, 0.17150843143463135, 0.323819637298584, 0.4761309027671814, 0.6284421682357788, 0.7807533740997314, 0.9330645799636841, 1.0853757858276367, 1.237687110900879, 1.3899983167648315, 1.5423095226287842, 1.6946208477020264, 1.846932053565979, 1.9992432594299316, 2.151554584503174, 2.303865671157837, 2.456176996231079, 2.608488082885742, 2.7607994079589844, 2.9131107330322266, 3.0654220581054688, 3.217733144760132, 3.370044469833374, 3.522355556488037, 3.6746668815612793, 3.8269782066345215, 3.9792892932891846, 4.131600379943848, 4.28391170501709, 4.436223030090332]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 3.0, 9.0, 3.0, 14.0, 31.0, 27.0, 37.0, 66.0, 118.0, 232.0, 558.0, 2089.0, 10890.0, 3698554.0, 472496.0, 6517.0, 1563.0, 561.0, 205.0, 119.0, 65.0, 32.0, 29.0, 23.0, 9.0, 15.0, 8.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.4609375, -13.02490234375, -12.5888671875, -12.15283203125, -11.716796875, -11.28076171875, -10.8447265625, -10.40869140625, -9.97265625, -9.53662109375, -9.1005859375, -8.66455078125, -8.228515625, -7.79248046875, -7.3564453125, -6.92041015625, -6.484375, -6.04833984375, -5.6123046875, -5.17626953125, -4.740234375, -4.30419921875, -3.8681640625, -3.43212890625, -2.99609375, -2.56005859375, -2.1240234375, -1.68798828125, -1.251953125, -0.81591796875, -0.3798828125, 0.05615234375, 0.4921875, 0.92822265625, 1.3642578125, 1.80029296875, 2.236328125, 2.67236328125, 3.1083984375, 3.54443359375, 3.98046875, 4.41650390625, 4.8525390625, 5.28857421875, 5.724609375, 6.16064453125, 6.5966796875, 7.03271484375, 7.46875, 7.90478515625, 8.3408203125, 8.77685546875, 9.212890625, 9.64892578125, 10.0849609375, 10.52099609375, 10.95703125, 11.39306640625, 11.8291015625, 12.26513671875, 12.701171875, 13.13720703125, 13.5732421875, 14.00927734375, 14.4453125]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 3.0, 3.0, 5.0, 14.0, 18.0, 13.0, 25.0, 44.0, 47.0, 44.0, 69.0, 57.0, 58.0, 66.0, 83.0, 83.0, 55.0, 66.0, 45.0, 38.0, 37.0, 46.0, 16.0, 16.0, 19.0, 14.0, 8.0, 3.0, 6.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.658203125, -2.57354736328125, -2.4888916015625, -2.40423583984375, -2.319580078125, -2.23492431640625, -2.1502685546875, -2.06561279296875, -1.98095703125, -1.89630126953125, -1.8116455078125, -1.72698974609375, -1.642333984375, -1.55767822265625, -1.4730224609375, -1.38836669921875, -1.3037109375, -1.21905517578125, -1.1343994140625, -1.04974365234375, -0.965087890625, -0.88043212890625, -0.7957763671875, -0.71112060546875, -0.62646484375, -0.54180908203125, -0.4571533203125, -0.37249755859375, -0.287841796875, -0.20318603515625, -0.1185302734375, -0.03387451171875, 0.05078125, 0.13543701171875, 0.2200927734375, 0.30474853515625, 0.389404296875, 0.47406005859375, 0.5587158203125, 0.64337158203125, 0.72802734375, 0.81268310546875, 0.8973388671875, 0.98199462890625, 1.066650390625, 1.15130615234375, 1.2359619140625, 1.32061767578125, 1.4052734375, 1.48992919921875, 1.5745849609375, 1.65924072265625, 1.743896484375, 1.82855224609375, 1.9132080078125, 1.99786376953125, 2.08251953125, 2.16717529296875, 2.2518310546875, 2.33648681640625, 2.421142578125, 2.50579833984375, 2.5904541015625, 2.67510986328125, 2.759765625]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 6.0, 9.0, 10.0, 11.0, 19.0, 28.0, 52.0, 115.0, 481.0, 7503.0, 4175189.0, 10101.0, 490.0, 128.0, 46.0, 32.0, 18.0, 13.0, 10.0, 9.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.578125, -19.7724609375, -18.966796875, -18.1611328125, -17.35546875, -16.5498046875, -15.744140625, -14.9384765625, -14.1328125, -13.3271484375, -12.521484375, -11.7158203125, -10.91015625, -10.1044921875, -9.298828125, -8.4931640625, -7.6875, -6.8818359375, -6.076171875, -5.2705078125, -4.46484375, -3.6591796875, -2.853515625, -2.0478515625, -1.2421875, -0.4365234375, 0.369140625, 1.1748046875, 1.98046875, 2.7861328125, 3.591796875, 4.3974609375, 5.203125, 6.0087890625, 6.814453125, 7.6201171875, 8.42578125, 9.2314453125, 10.037109375, 10.8427734375, 11.6484375, 12.4541015625, 13.259765625, 14.0654296875, 14.87109375, 15.6767578125, 16.482421875, 17.2880859375, 18.09375, 18.8994140625, 19.705078125, 20.5107421875, 21.31640625, 22.1220703125, 22.927734375, 23.7333984375, 24.5390625, 25.3447265625, 26.150390625, 26.9560546875, 27.76171875, 28.5673828125, 29.373046875, 30.1787109375, 30.984375]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 9.0, 9.0, 11.0, 15.0, 32.0, 46.0, 82.0, 292.0, 1887.0, 1341.0, 195.0, 61.0, 28.0, 19.0, 19.0, 5.0, 9.0, 6.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8271484375, -1.7616729736328125, -1.696197509765625, -1.6307220458984375, -1.56524658203125, -1.4997711181640625, -1.434295654296875, -1.3688201904296875, -1.3033447265625, -1.2378692626953125, -1.172393798828125, -1.1069183349609375, -1.04144287109375, -0.9759674072265625, -0.910491943359375, -0.8450164794921875, -0.779541015625, -0.7140655517578125, -0.648590087890625, -0.5831146240234375, -0.51763916015625, -0.4521636962890625, -0.386688232421875, -0.3212127685546875, -0.2557373046875, -0.1902618408203125, -0.124786376953125, -0.0593109130859375, 0.00616455078125, 0.0716400146484375, 0.137115478515625, 0.2025909423828125, 0.26806640625, 0.3335418701171875, 0.399017333984375, 0.4644927978515625, 0.52996826171875, 0.5954437255859375, 0.660919189453125, 0.7263946533203125, 0.7918701171875, 0.8573455810546875, 0.922821044921875, 0.9882965087890625, 1.05377197265625, 1.1192474365234375, 1.184722900390625, 1.2501983642578125, 1.315673828125, 1.3811492919921875, 1.446624755859375, 1.5121002197265625, 1.57757568359375, 1.6430511474609375, 1.708526611328125, 1.7740020751953125, 1.8394775390625, 1.9049530029296875, 1.970428466796875, 2.0359039306640625, 2.10137939453125, 2.1668548583984375, 2.232330322265625, 2.2978057861328125, 2.36328125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 6.0, 5.0, 3.0, 14.0, 19.0, 17.0, 15.0, 34.0, 49.0, 62.0, 73.0, 86.0, 102.0, 92.0, 96.0, 89.0, 53.0, 34.0, 30.0, 29.0, 20.0, 17.0, 13.0, 6.0, 10.0, 9.0, 3.0, 4.0, 3.0, 1.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7544424533843994, -2.671036958694458, -2.5876314640045166, -2.504225969314575, -2.420820713043213, -2.3374152183532715, -2.25400972366333, -2.1706042289733887, -2.0871987342834473, -2.003793239593506, -1.9203877449035645, -1.8369823694229126, -1.7535768747329712, -1.6701713800430298, -1.586766004562378, -1.5033605098724365, -1.4199550151824951, -1.3365495204925537, -1.2531440258026123, -1.1697386503219604, -1.086333155632019, -1.0029276609420776, -0.919522225856781, -0.8361167907714844, -0.752711296081543, -0.6693058013916016, -0.5859003663063049, -0.5024949312210083, -0.4190894365310669, -0.3356839716434479, -0.25227850675582886, -0.16887307167053223, -0.08546781539916992, -0.0020623505115509033, 0.08134311437606812, 0.16474857926368713, 0.24815404415130615, 0.33155950903892517, 0.4149649739265442, 0.4983704090118408, 0.5817759037017822, 0.6651813983917236, 0.7485868334770203, 0.8319922685623169, 0.9153977632522583, 0.9988032579421997, 1.0822086334228516, 1.165614128112793, 1.2490196228027344, 1.3324251174926758, 1.4158306121826172, 1.499235987663269, 1.5826414823532104, 1.6660469770431519, 1.7494523525238037, 1.8328578472137451, 1.9162633419036865, 1.999668836593628, 2.0830743312835693, 2.1664798259735107, 2.249885082244873, 2.3332905769348145, 2.416696071624756, 2.5001015663146973, 2.5835070610046387]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 9.0, 8.0, 11.0, 7.0, 10.0, 11.0, 21.0, 19.0, 16.0, 27.0, 24.0, 32.0, 32.0, 36.0, 32.0, 42.0, 40.0, 56.0, 36.0, 52.0, 44.0, 47.0, 49.0, 35.0, 27.0, 35.0, 32.0, 36.0, 25.0, 29.0, 15.0, 23.0, 13.0, 21.0, 10.0, 6.0, 6.0, 10.0, 5.0, 7.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.1681621074676514, -2.1113107204437256, -2.054459571838379, -1.9976081848144531, -1.9407567977905273, -1.8839055299758911, -1.8270541429519653, -1.770202875137329, -1.7133514881134033, -1.656500220298767, -1.5996488332748413, -1.542797565460205, -1.4859461784362793, -1.429094910621643, -1.3722435235977173, -1.315392255783081, -1.2585408687591553, -1.201689600944519, -1.1448382139205933, -1.087986946105957, -1.0311355590820312, -0.974284291267395, -0.9174329042434692, -0.860581636428833, -0.8037303686141968, -0.7468790411949158, -0.6900277137756348, -0.6331763863563538, -0.5763250589370728, -0.5194737911224365, -0.46262243390083313, -0.4057711064815521, -0.34891974925994873, -0.2920684218406677, -0.23521709442138672, -0.1783657819032669, -0.1215144544839859, -0.06466314196586609, -0.007811814546585083, 0.04903951287269592, 0.10589084029197693, 0.16274216771125793, 0.21959349513053894, 0.27644479274749756, 0.33329612016677856, 0.39014744758605957, 0.4469987750053406, 0.5038501024246216, 0.5607014298439026, 0.6175527572631836, 0.6744040846824646, 0.7312554121017456, 0.7881067395210266, 0.8449580669403076, 0.9018093347549438, 0.9586607217788696, 1.0155119895935059, 1.072363257408142, 1.1292146444320679, 1.186065912246704, 1.2429172992706299, 1.2997685670852661, 1.356619954109192, 1.4134712219238281, 1.470322608947754]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 0.0, 4.0, 4.0, 3.0, 4.0, 8.0, 10.0, 19.0, 28.0, 39.0, 61.0, 153.0, 363.0, 977.0, 2735.0, 9230.0, 40653.0, 384261.0, 541903.0, 51936.0, 11016.0, 3297.0, 1079.0, 405.0, 177.0, 69.0, 37.0, 19.0, 19.0, 10.0, 10.0, 5.0, 8.0, 4.0, 5.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3603515625, -1.3151092529296875, -1.269866943359375, -1.2246246337890625, -1.17938232421875, -1.1341400146484375, -1.088897705078125, -1.0436553955078125, -0.9984130859375, -0.9531707763671875, -0.907928466796875, -0.8626861572265625, -0.81744384765625, -0.7722015380859375, -0.726959228515625, -0.6817169189453125, -0.636474609375, -0.5912322998046875, -0.545989990234375, -0.5007476806640625, -0.45550537109375, -0.4102630615234375, -0.365020751953125, -0.3197784423828125, -0.2745361328125, -0.2292938232421875, -0.184051513671875, -0.1388092041015625, -0.09356689453125, -0.0483245849609375, -0.003082275390625, 0.0421600341796875, 0.08740234375, 0.1326446533203125, 0.177886962890625, 0.2231292724609375, 0.26837158203125, 0.3136138916015625, 0.358856201171875, 0.4040985107421875, 0.4493408203125, 0.4945831298828125, 0.539825439453125, 0.5850677490234375, 0.63031005859375, 0.6755523681640625, 0.720794677734375, 0.7660369873046875, 0.811279296875, 0.8565216064453125, 0.901763916015625, 0.9470062255859375, 0.99224853515625, 1.0374908447265625, 1.082733154296875, 1.1279754638671875, 1.1732177734375, 1.2184600830078125, 1.263702392578125, 1.3089447021484375, 1.35418701171875, 1.3994293212890625, 1.444671630859375, 1.4899139404296875, 1.53515625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 17.0, 14.0, 19.0, 50.0, 29.0, 62.0, 71.0, 92.0, 97.0, 106.0, 102.0, 73.0, 81.0, 61.0, 36.0, 30.0, 26.0, 11.0, 15.0, 10.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6767578125, -1.5949554443359375, -1.513153076171875, -1.4313507080078125, -1.34954833984375, -1.2677459716796875, -1.185943603515625, -1.1041412353515625, -1.0223388671875, -0.9405364990234375, -0.858734130859375, -0.7769317626953125, -0.69512939453125, -0.6133270263671875, -0.531524658203125, -0.4497222900390625, -0.367919921875, -0.2861175537109375, -0.204315185546875, -0.1225128173828125, -0.04071044921875, 0.0410919189453125, 0.122894287109375, 0.2046966552734375, 0.2864990234375, 0.3683013916015625, 0.450103759765625, 0.5319061279296875, 0.61370849609375, 0.6955108642578125, 0.777313232421875, 0.8591156005859375, 0.94091796875, 1.0227203369140625, 1.104522705078125, 1.1863250732421875, 1.26812744140625, 1.3499298095703125, 1.431732177734375, 1.5135345458984375, 1.5953369140625, 1.6771392822265625, 1.758941650390625, 1.8407440185546875, 1.92254638671875, 2.0043487548828125, 2.086151123046875, 2.1679534912109375, 2.249755859375, 2.3315582275390625, 2.413360595703125, 2.4951629638671875, 2.57696533203125, 2.6587677001953125, 2.740570068359375, 2.8223724365234375, 2.9041748046875, 2.9859771728515625, 3.067779541015625, 3.1495819091796875, 3.23138427734375, 3.3131866455078125, 3.394989013671875, 3.4767913818359375, 3.55859375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 7.0, 4.0, 10.0, 10.0, 21.0, 25.0, 32.0, 43.0, 74.0, 105.0, 176.0, 224.0, 399.0, 642.0, 1000.0, 1943.0, 3658.0, 7585.0, 17788.0, 50204.0, 198266.0, 542977.0, 152395.0, 41458.0, 15293.0, 6662.0, 3343.0, 1669.0, 951.0, 568.0, 336.0, 236.0, 145.0, 95.0, 67.0, 41.0, 29.0, 17.0, 13.0, 19.0, 6.0, 5.0, 1.0, 7.0, 5.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.6484375, -0.6284332275390625, -0.608428955078125, -0.5884246826171875, -0.56842041015625, -0.5484161376953125, -0.528411865234375, -0.5084075927734375, -0.4884033203125, -0.4683990478515625, -0.448394775390625, -0.4283905029296875, -0.40838623046875, -0.3883819580078125, -0.368377685546875, -0.3483734130859375, -0.328369140625, -0.3083648681640625, -0.288360595703125, -0.2683563232421875, -0.24835205078125, -0.2283477783203125, -0.208343505859375, -0.1883392333984375, -0.1683349609375, -0.1483306884765625, -0.128326416015625, -0.1083221435546875, -0.08831787109375, -0.0683135986328125, -0.048309326171875, -0.0283050537109375, -0.00830078125, 0.0117034912109375, 0.031707763671875, 0.0517120361328125, 0.07171630859375, 0.0917205810546875, 0.111724853515625, 0.1317291259765625, 0.1517333984375, 0.1717376708984375, 0.191741943359375, 0.2117462158203125, 0.23175048828125, 0.2517547607421875, 0.271759033203125, 0.2917633056640625, 0.311767578125, 0.3317718505859375, 0.351776123046875, 0.3717803955078125, 0.39178466796875, 0.4117889404296875, 0.431793212890625, 0.4517974853515625, 0.4718017578125, 0.4918060302734375, 0.511810302734375, 0.5318145751953125, 0.55181884765625, 0.5718231201171875, 0.591827392578125, 0.6118316650390625, 0.6318359375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 4.0, 3.0, 7.0, 6.0, 20.0, 10.0, 12.0, 11.0, 15.0, 19.0, 20.0, 21.0, 27.0, 35.0, 45.0, 36.0, 44.0, 46.0, 55.0, 48.0, 56.0, 45.0, 42.0, 58.0, 47.0, 45.0, 32.0, 26.0, 27.0, 21.0, 28.0, 22.0, 12.0, 9.0, 8.0, 8.0, 12.0, 5.0, 6.0, 0.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.4453125, -2.367218017578125, -2.28912353515625, -2.211029052734375, -2.1329345703125, -2.054840087890625, -1.97674560546875, -1.898651123046875, -1.820556640625, -1.742462158203125, -1.66436767578125, -1.586273193359375, -1.5081787109375, -1.430084228515625, -1.35198974609375, -1.273895263671875, -1.19580078125, -1.117706298828125, -1.03961181640625, -0.961517333984375, -0.8834228515625, -0.805328369140625, -0.72723388671875, -0.649139404296875, -0.571044921875, -0.492950439453125, -0.41485595703125, -0.336761474609375, -0.2586669921875, -0.180572509765625, -0.10247802734375, -0.024383544921875, 0.0537109375, 0.131805419921875, 0.20989990234375, 0.287994384765625, 0.3660888671875, 0.444183349609375, 0.52227783203125, 0.600372314453125, 0.678466796875, 0.756561279296875, 0.83465576171875, 0.912750244140625, 0.9908447265625, 1.068939208984375, 1.14703369140625, 1.225128173828125, 1.30322265625, 1.381317138671875, 1.45941162109375, 1.537506103515625, 1.6156005859375, 1.693695068359375, 1.77178955078125, 1.849884033203125, 1.927978515625, 2.006072998046875, 2.08416748046875, 2.162261962890625, 2.2403564453125, 2.318450927734375, 2.39654541015625, 2.474639892578125, 2.552734375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 3.0, 2.0, 4.0, 5.0, 7.0, 8.0, 13.0, 23.0, 18.0, 38.0, 53.0, 121.0, 167.0, 276.0, 484.0, 1047.0, 2168.0, 4957.0, 13092.0, 46912.0, 423910.0, 480812.0, 50976.0, 13783.0, 5216.0, 2168.0, 1028.0, 544.0, 298.0, 157.0, 105.0, 58.0, 39.0, 27.0, 13.0, 9.0, 2.0, 4.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1619873046875, -0.1552448272705078, -0.14850234985351562, -0.14175987243652344, -0.13501739501953125, -0.12827491760253906, -0.12153244018554688, -0.11478996276855469, -0.1080474853515625, -0.10130500793457031, -0.09456253051757812, -0.08782005310058594, -0.08107757568359375, -0.07433509826660156, -0.06759262084960938, -0.06085014343261719, -0.054107666015625, -0.04736518859863281, -0.040622711181640625, -0.03388023376464844, -0.02713775634765625, -0.020395278930664062, -0.013652801513671875, -0.0069103240966796875, -0.0001678466796875, 0.0065746307373046875, 0.013317108154296875, 0.020059585571289062, 0.02680206298828125, 0.03354454040527344, 0.040287017822265625, 0.04702949523925781, 0.05377197265625, 0.06051445007324219, 0.06725692749023438, 0.07399940490722656, 0.08074188232421875, 0.08748435974121094, 0.09422683715820312, 0.10096931457519531, 0.1077117919921875, 0.11445426940917969, 0.12119674682617188, 0.12793922424316406, 0.13468170166015625, 0.14142417907714844, 0.14816665649414062, 0.1549091339111328, 0.161651611328125, 0.1683940887451172, 0.17513656616210938, 0.18187904357910156, 0.18862152099609375, 0.19536399841308594, 0.20210647583007812, 0.2088489532470703, 0.2155914306640625, 0.2223339080810547, 0.22907638549804688, 0.23581886291503906, 0.24256134033203125, 0.24930381774902344, 0.2560462951660156, 0.2627887725830078, 0.26953125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 6.0, 2.0, 5.0, 5.0, 6.0, 15.0, 19.0, 13.0, 16.0, 35.0, 54.0, 66.0, 115.0, 160.0, 156.0, 116.0, 64.0, 37.0, 39.0, 22.0, 11.0, 7.0, 7.0, 9.0, 6.0, 4.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00017189979553222656, -0.0001672450453042984, -0.00016259029507637024, -0.00015793554484844208, -0.00015328079462051392, -0.00014862604439258575, -0.0001439712941646576, -0.00013931654393672943, -0.00013466179370880127, -0.0001300070434808731, -0.00012535229325294495, -0.00012069754302501678, -0.00011604279279708862, -0.00011138804256916046, -0.0001067332923412323, -0.00010207854211330414, -9.742379188537598e-05, -9.276904165744781e-05, -8.811429142951965e-05, -8.345954120159149e-05, -7.880479097366333e-05, -7.415004074573517e-05, -6.949529051780701e-05, -6.484054028987885e-05, -6.0185790061950684e-05, -5.553103983402252e-05, -5.087628960609436e-05, -4.62215393781662e-05, -4.156678915023804e-05, -3.6912038922309875e-05, -3.2257288694381714e-05, -2.7602538466453552e-05, -2.294778823852539e-05, -1.829303801059723e-05, -1.3638287782669067e-05, -8.983537554740906e-06, -4.328787326812744e-06, 3.259629011154175e-07, 4.980713129043579e-06, 9.63546335697174e-06, 1.4290213584899902e-05, 1.8944963812828064e-05, 2.3599714040756226e-05, 2.8254464268684387e-05, 3.290921449661255e-05, 3.756396472454071e-05, 4.221871495246887e-05, 4.6873465180397034e-05, 5.1528215408325195e-05, 5.618296563625336e-05, 6.083771586418152e-05, 6.549246609210968e-05, 7.014721632003784e-05, 7.4801966547966e-05, 7.945671677589417e-05, 8.411146700382233e-05, 8.876621723175049e-05, 9.342096745967865e-05, 9.807571768760681e-05, 0.00010273046791553497, 0.00010738521814346313, 0.0001120399683713913, 0.00011669471859931946, 0.00012134946882724762, 0.00012600421905517578]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 5.0, 7.0, 5.0, 17.0, 33.0, 120.0, 533.0, 4067.0, 129270.0, 901820.0, 11190.0, 1136.0, 222.0, 67.0, 27.0, 14.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.65576171875, -0.6297378540039062, -0.6037139892578125, -0.5776901245117188, -0.551666259765625, -0.5256423950195312, -0.4996185302734375, -0.47359466552734375, -0.44757080078125, -0.42154693603515625, -0.3955230712890625, -0.36949920654296875, -0.343475341796875, -0.31745147705078125, -0.2914276123046875, -0.26540374755859375, -0.2393798828125, -0.21335601806640625, -0.1873321533203125, -0.16130828857421875, -0.135284423828125, -0.10926055908203125, -0.0832366943359375, -0.05721282958984375, -0.03118896484375, -0.00516510009765625, 0.0208587646484375, 0.04688262939453125, 0.072906494140625, 0.09893035888671875, 0.1249542236328125, 0.15097808837890625, 0.177001953125, 0.20302581787109375, 0.2290496826171875, 0.25507354736328125, 0.281097412109375, 0.30712127685546875, 0.3331451416015625, 0.35916900634765625, 0.38519287109375, 0.41121673583984375, 0.4372406005859375, 0.46326446533203125, 0.489288330078125, 0.5153121948242188, 0.5413360595703125, 0.5673599243164062, 0.5933837890625, 0.6194076538085938, 0.6454315185546875, 0.6714553833007812, 0.697479248046875, 0.7235031127929688, 0.7495269775390625, 0.7755508422851562, 0.80157470703125, 0.8275985717773438, 0.8536224365234375, 0.8796463012695312, 0.905670166015625, 0.9316940307617188, 0.9577178955078125, 0.9837417602539062, 1.009765625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 6.0, 6.0, 6.0, 5.0, 10.0, 19.0, 17.0, 24.0, 37.0, 41.0, 52.0, 78.0, 85.0, 114.0, 114.0, 78.0, 74.0, 53.0, 41.0, 35.0, 24.0, 21.0, 9.0, 12.0, 11.0, 7.0, 8.0, 6.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.06536865234375, -0.06344318389892578, -0.06151771545410156, -0.059592247009277344, -0.057666778564453125, -0.055741310119628906, -0.05381584167480469, -0.05189037322998047, -0.04996490478515625, -0.04803943634033203, -0.04611396789550781, -0.044188499450683594, -0.042263031005859375, -0.040337562561035156, -0.03841209411621094, -0.03648662567138672, -0.0345611572265625, -0.03263568878173828, -0.030710220336914062, -0.028784751892089844, -0.026859283447265625, -0.024933815002441406, -0.023008346557617188, -0.02108287811279297, -0.01915740966796875, -0.01723194122314453, -0.015306472778320312, -0.013381004333496094, -0.011455535888671875, -0.009530067443847656, -0.0076045989990234375, -0.005679130554199219, -0.003753662109375, -0.0018281936645507812, 9.72747802734375e-05, 0.0020227432250976562, 0.003948211669921875, 0.005873680114746094, 0.0077991485595703125, 0.009724617004394531, 0.01165008544921875, 0.013575553894042969, 0.015501022338867188, 0.017426490783691406, 0.019351959228515625, 0.021277427673339844, 0.023202896118164062, 0.02512836456298828, 0.0270538330078125, 0.02897930145263672, 0.030904769897460938, 0.032830238342285156, 0.034755706787109375, 0.036681175231933594, 0.03860664367675781, 0.04053211212158203, 0.04245758056640625, 0.04438304901123047, 0.04630851745605469, 0.048233985900878906, 0.050159454345703125, 0.052084922790527344, 0.05401039123535156, 0.05593585968017578, 0.057861328125]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 6.0, 14.0, 17.0, 24.0, 60.0, 95.0, 237.0, 215.0, 154.0, 82.0, 47.0, 22.0, 14.0, 10.0, 4.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4313602447509766, -2.3174726963043213, -2.203585147857666, -2.0896973609924316, -1.975809931755066, -1.861922264099121, -1.7480347156524658, -1.6341471672058105, -1.5202596187591553, -1.4063720703125, -1.2924844026565552, -1.1785968542099, -1.0647093057632446, -0.9508216977119446, -0.8369340896606445, -0.7230465412139893, -0.6091588735580444, -0.4952712953090668, -0.3813837170600891, -0.26749610900878906, -0.1536085307598114, -0.03972095251083374, 0.07416665554046631, 0.18805420398712158, 0.30194181203842163, 0.4158293902873993, 0.529716968536377, 0.643604576587677, 0.757492184638977, 0.8713797330856323, 0.9852673411369324, 1.0991549491882324, 1.2130424976348877, 1.326930046081543, 1.4408177137374878, 1.554705262184143, 1.6685928106307983, 1.7824804782867432, 1.8963680267333984, 2.0102555751800537, 2.124143123626709, 2.2380306720733643, 2.3519182205200195, 2.465806007385254, 2.579693555831909, 2.6935811042785645, 2.8074686527252197, 2.921356201171875, 3.0352439880371094, 3.1491315364837646, 3.26301908493042, 3.3769068717956543, 3.4907944202423096, 3.604681968688965, 3.71856951713562, 3.8324570655822754, 3.9463446140289307, 4.060232162475586, 4.17411994934082, 4.2880072593688965, 4.401895046234131, 4.515782356262207, 4.629670143127441, 4.743557929992676, 4.857445240020752]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 14.0, 22.0, 18.0, 35.0, 42.0, 54.0, 61.0, 75.0, 83.0, 106.0, 115.0, 71.0, 77.0, 60.0, 52.0, 40.0, 26.0, 28.0, 12.0, 7.0, 7.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.684027075767517, -1.607417106628418, -1.5308072566986084, -1.4541972875595093, -1.3775873184204102, -1.3009774684906006, -1.2243674993515015, -1.1477575302124023, -1.0711476802825928, -0.9945377707481384, -0.9179278016090393, -0.841317892074585, -0.7647079229354858, -0.6880980134010315, -0.6114881038665771, -0.534878134727478, -0.4582681655883789, -0.3816582262516022, -0.30504828691482544, -0.2284383773803711, -0.15182843804359436, -0.07521849870681763, 0.0013914108276367188, 0.07800137996673584, 0.15461128950119019, 0.23122122883796692, 0.30783116817474365, 0.384441077709198, 0.46105101704597473, 0.5376609563827515, 0.6142708659172058, 0.6908808350563049, 0.7674908638000488, 0.8441007733345032, 0.9207107424736023, 0.9973206520080566, 1.0739306211471558, 1.1505405902862549, 1.2271504402160645, 1.3037604093551636, 1.3803703784942627, 1.4569803476333618, 1.5335901975631714, 1.6102001667022705, 1.6868101358413696, 1.7634201049804688, 1.8400299549102783, 1.9166399240493774, 1.993249773979187, 2.069859743118286, 2.1464695930480957, 2.2230796813964844, 2.299689531326294, 2.3762993812561035, 2.452909469604492, 2.5295193195343018, 2.6061291694641113, 2.682739019393921, 2.7593491077423096, 2.835958957672119, 2.9125688076019287, 2.9891788959503174, 3.065788745880127, 3.1423988342285156, 3.219008684158325]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 8.0, 6.0, 15.0, 32.0, 85.0, 270.0, 739.0, 2174.0, 14801.0, 1011544.0, 15497.0, 2189.0, 765.0, 263.0, 97.0, 41.0, 14.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.2578125, -8.9970703125, -8.736328125, -8.4755859375, -8.21484375, -7.9541015625, -7.693359375, -7.4326171875, -7.171875, -6.9111328125, -6.650390625, -6.3896484375, -6.12890625, -5.8681640625, -5.607421875, -5.3466796875, -5.0859375, -4.8251953125, -4.564453125, -4.3037109375, -4.04296875, -3.7822265625, -3.521484375, -3.2607421875, -3.0, -2.7392578125, -2.478515625, -2.2177734375, -1.95703125, -1.6962890625, -1.435546875, -1.1748046875, -0.9140625, -0.6533203125, -0.392578125, -0.1318359375, 0.12890625, 0.3896484375, 0.650390625, 0.9111328125, 1.171875, 1.4326171875, 1.693359375, 1.9541015625, 2.21484375, 2.4755859375, 2.736328125, 2.9970703125, 3.2578125, 3.5185546875, 3.779296875, 4.0400390625, 4.30078125, 4.5615234375, 4.822265625, 5.0830078125, 5.34375, 5.6044921875, 5.865234375, 6.1259765625, 6.38671875, 6.6474609375, 6.908203125, 7.1689453125, 7.4296875]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 4.0, 3.0, 8.0, 17.0, 26.0, 35.0, 35.0, 55.0, 76.0, 108.0, 117.0, 104.0, 101.0, 94.0, 69.0, 55.0, 27.0, 37.0, 25.0, 8.0, 7.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.70703125, -2.53021240234375, -2.3533935546875, -2.17657470703125, -1.999755859375, -1.82293701171875, -1.6461181640625, -1.46929931640625, -1.29248046875, -1.11566162109375, -0.9388427734375, -0.76202392578125, -0.585205078125, -0.40838623046875, -0.2315673828125, -0.05474853515625, 0.1220703125, 0.29888916015625, 0.4757080078125, 0.65252685546875, 0.829345703125, 1.00616455078125, 1.1829833984375, 1.35980224609375, 1.53662109375, 1.71343994140625, 1.8902587890625, 2.06707763671875, 2.243896484375, 2.42071533203125, 2.5975341796875, 2.77435302734375, 2.951171875, 3.12799072265625, 3.3048095703125, 3.48162841796875, 3.658447265625, 3.83526611328125, 4.0120849609375, 4.18890380859375, 4.36572265625, 4.54254150390625, 4.7193603515625, 4.89617919921875, 5.072998046875, 5.24981689453125, 5.4266357421875, 5.60345458984375, 5.7802734375, 5.95709228515625, 6.1339111328125, 6.31072998046875, 6.487548828125, 6.66436767578125, 6.8411865234375, 7.01800537109375, 7.19482421875, 7.37164306640625, 7.5484619140625, 7.72528076171875, 7.902099609375, 8.07891845703125, 8.2557373046875, 8.43255615234375, 8.609375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 6.0, 0.0, 1.0, 5.0, 3.0, 10.0, 7.0, 11.0, 12.0, 14.0, 31.0, 51.0, 51.0, 92.0, 182.0, 423.0, 1178.0, 4959.0, 971537.0, 65308.0, 3168.0, 821.0, 304.0, 119.0, 70.0, 45.0, 34.0, 24.0, 25.0, 11.0, 14.0, 9.0, 12.0, 3.0, 5.0, 3.0, 2.0, 2.0, 0.0, 5.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.1796875, -7.8861083984375, -7.592529296875, -7.2989501953125, -7.00537109375, -6.7117919921875, -6.418212890625, -6.1246337890625, -5.8310546875, -5.5374755859375, -5.243896484375, -4.9503173828125, -4.65673828125, -4.3631591796875, -4.069580078125, -3.7760009765625, -3.482421875, -3.1888427734375, -2.895263671875, -2.6016845703125, -2.30810546875, -2.0145263671875, -1.720947265625, -1.4273681640625, -1.1337890625, -0.8402099609375, -0.546630859375, -0.2530517578125, 0.04052734375, 0.3341064453125, 0.627685546875, 0.9212646484375, 1.21484375, 1.5084228515625, 1.802001953125, 2.0955810546875, 2.38916015625, 2.6827392578125, 2.976318359375, 3.2698974609375, 3.5634765625, 3.8570556640625, 4.150634765625, 4.4442138671875, 4.73779296875, 5.0313720703125, 5.324951171875, 5.6185302734375, 5.912109375, 6.2056884765625, 6.499267578125, 6.7928466796875, 7.08642578125, 7.3800048828125, 7.673583984375, 7.9671630859375, 8.2607421875, 8.5543212890625, 8.847900390625, 9.1414794921875, 9.43505859375, 9.7286376953125, 10.022216796875, 10.3157958984375, 10.609375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 5.0, 3.0, 4.0, 9.0, 6.0, 9.0, 9.0, 12.0, 15.0, 31.0, 23.0, 36.0, 44.0, 46.0, 53.0, 62.0, 54.0, 66.0, 53.0, 57.0, 58.0, 48.0, 53.0, 55.0, 34.0, 28.0, 25.0, 21.0, 13.0, 21.0, 7.0, 14.0, 8.0, 7.0, 1.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.763671875, -2.658416748046875, -2.55316162109375, -2.447906494140625, -2.3426513671875, -2.237396240234375, -2.13214111328125, -2.026885986328125, -1.921630859375, -1.816375732421875, -1.71112060546875, -1.605865478515625, -1.5006103515625, -1.395355224609375, -1.29010009765625, -1.184844970703125, -1.07958984375, -0.974334716796875, -0.86907958984375, -0.763824462890625, -0.6585693359375, -0.553314208984375, -0.44805908203125, -0.342803955078125, -0.237548828125, -0.132293701171875, -0.02703857421875, 0.078216552734375, 0.1834716796875, 0.288726806640625, 0.39398193359375, 0.499237060546875, 0.6044921875, 0.709747314453125, 0.81500244140625, 0.920257568359375, 1.0255126953125, 1.130767822265625, 1.23602294921875, 1.341278076171875, 1.446533203125, 1.551788330078125, 1.65704345703125, 1.762298583984375, 1.8675537109375, 1.972808837890625, 2.07806396484375, 2.183319091796875, 2.28857421875, 2.393829345703125, 2.49908447265625, 2.604339599609375, 2.7095947265625, 2.814849853515625, 2.92010498046875, 3.025360107421875, 3.130615234375, 3.235870361328125, 3.34112548828125, 3.446380615234375, 3.5516357421875, 3.656890869140625, 3.76214599609375, 3.867401123046875, 3.97265625]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 2.0, 4.0, 7.0, 8.0, 5.0, 12.0, 7.0, 15.0, 20.0, 40.0, 74.0, 244.0, 1425.0, 13914.0, 981718.0, 47442.0, 2943.0, 429.0, 99.0, 47.0, 21.0, 20.0, 8.0, 13.0, 4.0, 5.0, 6.0, 6.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.9833984375, -1.9278106689453125, -1.872222900390625, -1.8166351318359375, -1.76104736328125, -1.7054595947265625, -1.649871826171875, -1.5942840576171875, -1.5386962890625, -1.4831085205078125, -1.427520751953125, -1.3719329833984375, -1.31634521484375, -1.2607574462890625, -1.205169677734375, -1.1495819091796875, -1.093994140625, -1.0384063720703125, -0.982818603515625, -0.9272308349609375, -0.87164306640625, -0.8160552978515625, -0.760467529296875, -0.7048797607421875, -0.6492919921875, -0.5937042236328125, -0.538116455078125, -0.4825286865234375, -0.42694091796875, -0.3713531494140625, -0.315765380859375, -0.2601776123046875, -0.20458984375, -0.1490020751953125, -0.093414306640625, -0.0378265380859375, 0.01776123046875, 0.0733489990234375, 0.128936767578125, 0.1845245361328125, 0.2401123046875, 0.2957000732421875, 0.351287841796875, 0.4068756103515625, 0.46246337890625, 0.5180511474609375, 0.573638916015625, 0.6292266845703125, 0.684814453125, 0.7404022216796875, 0.795989990234375, 0.8515777587890625, 0.90716552734375, 0.9627532958984375, 1.018341064453125, 1.0739288330078125, 1.1295166015625, 1.1851043701171875, 1.240692138671875, 1.2962799072265625, 1.35186767578125, 1.4074554443359375, 1.463043212890625, 1.5186309814453125, 1.57421875]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 1.0, 9.0, 12.0, 10.0, 12.0, 16.0, 23.0, 40.0, 66.0, 210.0, 321.0, 121.0, 57.0, 31.0, 18.0, 14.0, 8.0, 7.0, 4.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.465217590332031e-05, -9.140651673078537e-05, -8.816085755825043e-05, -8.491519838571548e-05, -8.166953921318054e-05, -7.84238800406456e-05, -7.517822086811066e-05, -7.193256169557571e-05, -6.868690252304077e-05, -6.544124335050583e-05, -6.219558417797089e-05, -5.8949925005435944e-05, -5.5704265832901e-05, -5.245860666036606e-05, -4.9212947487831116e-05, -4.596728831529617e-05, -4.272162914276123e-05, -3.947596997022629e-05, -3.6230310797691345e-05, -3.29846516251564e-05, -2.973899245262146e-05, -2.6493333280086517e-05, -2.3247674107551575e-05, -2.0002014935016632e-05, -1.675635576248169e-05, -1.3510696589946747e-05, -1.0265037417411804e-05, -7.0193782448768616e-06, -3.773719072341919e-06, -5.280598998069763e-07, 2.7175992727279663e-06, 5.963258445262909e-06, 9.208917617797852e-06, 1.2454576790332794e-05, 1.5700235962867737e-05, 1.894589513540268e-05, 2.2191554307937622e-05, 2.5437213480472565e-05, 2.8682872653007507e-05, 3.192853182554245e-05, 3.517419099807739e-05, 3.8419850170612335e-05, 4.166550934314728e-05, 4.491116851568222e-05, 4.815682768821716e-05, 5.1402486860752106e-05, 5.464814603328705e-05, 5.789380520582199e-05, 6.113946437835693e-05, 6.438512355089188e-05, 6.763078272342682e-05, 7.087644189596176e-05, 7.41221010684967e-05, 7.736776024103165e-05, 8.061341941356659e-05, 8.385907858610153e-05, 8.710473775863647e-05, 9.035039693117142e-05, 9.359605610370636e-05, 9.68417152762413e-05, 0.00010008737444877625, 0.00010333303362131119, 0.00010657869279384613, 0.00010982435196638107, 0.00011307001113891602]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 2.0, 6.0, 4.0, 12.0, 8.0, 15.0, 20.0, 32.0, 65.0, 150.0, 404.0, 1385.0, 8625.0, 258555.0, 765219.0, 11493.0, 1784.0, 454.0, 137.0, 60.0, 39.0, 23.0, 19.0, 8.0, 6.0, 3.0, 9.0, 2.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0302734375, -0.989166259765625, -0.94805908203125, -0.906951904296875, -0.8658447265625, -0.824737548828125, -0.78363037109375, -0.742523193359375, -0.701416015625, -0.660308837890625, -0.61920166015625, -0.578094482421875, -0.5369873046875, -0.495880126953125, -0.45477294921875, -0.413665771484375, -0.37255859375, -0.331451416015625, -0.29034423828125, -0.249237060546875, -0.2081298828125, -0.167022705078125, -0.12591552734375, -0.084808349609375, -0.043701171875, -0.002593994140625, 0.03851318359375, 0.079620361328125, 0.1207275390625, 0.161834716796875, 0.20294189453125, 0.244049072265625, 0.28515625, 0.326263427734375, 0.36737060546875, 0.408477783203125, 0.4495849609375, 0.490692138671875, 0.53179931640625, 0.572906494140625, 0.614013671875, 0.655120849609375, 0.69622802734375, 0.737335205078125, 0.7784423828125, 0.819549560546875, 0.86065673828125, 0.901763916015625, 0.94287109375, 0.983978271484375, 1.02508544921875, 1.066192626953125, 1.1072998046875, 1.148406982421875, 1.18951416015625, 1.230621337890625, 1.271728515625, 1.312835693359375, 1.35394287109375, 1.395050048828125, 1.4361572265625, 1.477264404296875, 1.51837158203125, 1.559478759765625, 1.6005859375]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 6.0, 5.0, 6.0, 10.0, 12.0, 18.0, 19.0, 22.0, 31.0, 32.0, 53.0, 95.0, 179.0, 201.0, 97.0, 54.0, 31.0, 34.0, 20.0, 18.0, 9.0, 13.0, 7.0, 11.0, 2.0, 5.0, 4.0, 1.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.267822265625, -0.2609672546386719, -0.25411224365234375, -0.24725723266601562, -0.2404022216796875, -0.23354721069335938, -0.22669219970703125, -0.21983718872070312, -0.212982177734375, -0.20612716674804688, -0.19927215576171875, -0.19241714477539062, -0.1855621337890625, -0.17870712280273438, -0.17185211181640625, -0.16499710083007812, -0.15814208984375, -0.15128707885742188, -0.14443206787109375, -0.13757705688476562, -0.1307220458984375, -0.12386703491210938, -0.11701202392578125, -0.11015701293945312, -0.103302001953125, -0.09644699096679688, -0.08959197998046875, -0.08273696899414062, -0.0758819580078125, -0.06902694702148438, -0.06217193603515625, -0.055316925048828125, -0.0484619140625, -0.041606903076171875, -0.03475189208984375, -0.027896881103515625, -0.0210418701171875, -0.014186859130859375, -0.00733184814453125, -0.000476837158203125, 0.006378173828125, 0.013233184814453125, 0.02008819580078125, 0.026943206787109375, 0.0337982177734375, 0.040653228759765625, 0.04750823974609375, 0.054363250732421875, 0.06121826171875, 0.06807327270507812, 0.07492828369140625, 0.08178329467773438, 0.0886383056640625, 0.09549331665039062, 0.10234832763671875, 0.10920333862304688, 0.116058349609375, 0.12291336059570312, 0.12976837158203125, 0.13662338256835938, 0.1434783935546875, 0.15033340454101562, 0.15718841552734375, 0.16404342651367188, 0.1708984375]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [5.0, 34.0, 186.0, 633.0, 135.0, 22.0, 8.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.469989061355591, -1.7525253295898438, -1.0350614786148071, -0.3175976276397705, 0.39986610412597656, 1.1173298358917236, 1.8347938060760498, 2.5522572994232178, 3.269721269607544, 3.987185001373291, 4.704648971557617, 5.422112464904785, 6.139576435089111, 6.8570404052734375, 7.5745038986206055, 8.291967391967773, 9.009431838989258, 9.726895332336426, 10.44435977935791, 11.161823272705078, 11.879286766052246, 12.596750259399414, 13.314214706420898, 14.031678199768066, 14.749141693115234, 15.466605186462402, 16.18406867980957, 16.901533126831055, 17.61899757385254, 18.33646011352539, 19.053924560546875, 19.77138900756836, 20.48885154724121, 21.206315994262695, 21.923778533935547, 22.64124298095703, 23.358707427978516, 24.076169967651367, 24.79363441467285, 25.511096954345703, 26.228561401367188, 26.946025848388672, 27.663488388061523, 28.380952835083008, 29.098417282104492, 29.815879821777344, 30.533344268798828, 31.250808715820312, 31.968273162841797, 32.68573760986328, 33.403202056884766, 34.12066650390625, 34.83812713623047, 35.55559158325195, 36.27305603027344, 36.99052047729492, 37.70798110961914, 38.425445556640625, 39.14291000366211, 39.860374450683594, 40.57783508300781, 41.2952995300293, 42.01276397705078, 42.730228424072266, 43.44769287109375]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 8.0, 13.0, 13.0, 17.0, 16.0, 27.0, 39.0, 42.0, 50.0, 56.0, 41.0, 78.0, 65.0, 58.0, 49.0, 49.0, 56.0, 48.0, 43.0, 46.0, 31.0, 36.0, 43.0, 23.0, 19.0, 14.0, 12.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7473456859588623, -3.5792205333709717, -3.411095142364502, -3.2429699897766113, -3.0748448371887207, -2.90671968460083, -2.7385945320129395, -2.5704691410064697, -2.402343988418579, -2.2342188358306885, -2.0660934448242188, -1.8979682922363281, -1.7298431396484375, -1.5617179870605469, -1.3935927152633667, -1.2254674434661865, -1.057342290878296, -0.8892170786857605, -0.7210918664932251, -0.5529666543006897, -0.3848414421081543, -0.2167162299156189, -0.048591017723083496, 0.11953425407409668, 0.2876594066619873, 0.4557846188545227, 0.6239098310470581, 0.7920350432395935, 0.9601602554321289, 1.1282854080200195, 1.2964106798171997, 1.4645359516143799, 1.6326613426208496, 1.8007864952087402, 1.9689117670059204, 2.1370370388031006, 2.305162191390991, 2.473287343978882, 2.6414127349853516, 2.809537887573242, 2.977663040161133, 3.1457881927490234, 3.313913345336914, 3.482038736343384, 3.6501638889312744, 3.818289041519165, 3.9864144325256348, 4.154539585113525, 4.322664737701416, 4.490789890289307, 4.658915042877197, 4.827040195465088, 4.995165824890137, 5.163290977478027, 5.331416130065918, 5.499541282653809, 5.667666435241699, 5.83579158782959, 6.0039167404174805, 6.172041893005371, 6.340167045593262, 6.5082926750183105, 6.676417827606201, 6.844542980194092, 7.012668132781982]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 7.0, 3.0, 5.0, 8.0, 11.0, 20.0, 31.0, 46.0, 56.0, 83.0, 84.0, 143.0, 220.0, 369.0, 588.0, 1142.0, 3074.0, 12078.0, 847305.0, 3294529.0, 26550.0, 4348.0, 1555.0, 774.0, 394.0, 253.0, 173.0, 129.0, 83.0, 63.0, 41.0, 26.0, 17.0, 18.0, 15.0, 13.0, 6.0, 11.0, 4.0, 2.0, 5.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.48046875, -6.29608154296875, -6.1116943359375, -5.92730712890625, -5.742919921875, -5.55853271484375, -5.3741455078125, -5.18975830078125, -5.00537109375, -4.82098388671875, -4.6365966796875, -4.45220947265625, -4.267822265625, -4.08343505859375, -3.8990478515625, -3.71466064453125, -3.5302734375, -3.34588623046875, -3.1614990234375, -2.97711181640625, -2.792724609375, -2.60833740234375, -2.4239501953125, -2.23956298828125, -2.05517578125, -1.87078857421875, -1.6864013671875, -1.50201416015625, -1.317626953125, -1.13323974609375, -0.9488525390625, -0.76446533203125, -0.580078125, -0.39569091796875, -0.2113037109375, -0.02691650390625, 0.157470703125, 0.34185791015625, 0.5262451171875, 0.71063232421875, 0.89501953125, 1.07940673828125, 1.2637939453125, 1.44818115234375, 1.632568359375, 1.81695556640625, 2.0013427734375, 2.18572998046875, 2.3701171875, 2.55450439453125, 2.7388916015625, 2.92327880859375, 3.107666015625, 3.29205322265625, 3.4764404296875, 3.66082763671875, 3.84521484375, 4.02960205078125, 4.2139892578125, 4.39837646484375, 4.582763671875, 4.76715087890625, 4.9515380859375, 5.13592529296875, 5.3203125]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 4.0, 6.0, 6.0, 12.0, 10.0, 10.0, 30.0, 13.0, 27.0, 31.0, 34.0, 26.0, 40.0, 55.0, 58.0, 55.0, 60.0, 62.0, 67.0, 43.0, 54.0, 47.0, 47.0, 33.0, 25.0, 31.0, 22.0, 28.0, 11.0, 8.0, 12.0, 10.0, 7.0, 7.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.9716796875, -1.9201812744140625, -1.868682861328125, -1.8171844482421875, -1.76568603515625, -1.7141876220703125, -1.662689208984375, -1.6111907958984375, -1.5596923828125, -1.5081939697265625, -1.456695556640625, -1.4051971435546875, -1.35369873046875, -1.3022003173828125, -1.250701904296875, -1.1992034912109375, -1.147705078125, -1.0962066650390625, -1.044708251953125, -0.9932098388671875, -0.94171142578125, -0.8902130126953125, -0.838714599609375, -0.7872161865234375, -0.7357177734375, -0.6842193603515625, -0.632720947265625, -0.5812225341796875, -0.52972412109375, -0.4782257080078125, -0.426727294921875, -0.3752288818359375, -0.32373046875, -0.2722320556640625, -0.220733642578125, -0.1692352294921875, -0.11773681640625, -0.0662384033203125, -0.014739990234375, 0.0367584228515625, 0.0882568359375, 0.1397552490234375, 0.191253662109375, 0.2427520751953125, 0.29425048828125, 0.3457489013671875, 0.397247314453125, 0.4487457275390625, 0.500244140625, 0.5517425537109375, 0.603240966796875, 0.6547393798828125, 0.70623779296875, 0.7577362060546875, 0.809234619140625, 0.8607330322265625, 0.9122314453125, 0.9637298583984375, 1.015228271484375, 1.0667266845703125, 1.11822509765625, 1.1697235107421875, 1.221221923828125, 1.2727203369140625, 1.32421875]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 3.0, 4.0, 1.0, 3.0, 3.0, 2.0, 10.0, 6.0, 15.0, 9.0, 22.0, 28.0, 43.0, 77.0, 162.0, 302.0, 941.0, 3852.0, 35359.0, 4094043.0, 52897.0, 4643.0, 1094.0, 339.0, 158.0, 93.0, 36.0, 34.0, 24.0, 19.0, 15.0, 6.0, 8.0, 9.0, 4.0, 4.0, 3.0, 1.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-7.96484375, -7.7408447265625, -7.516845703125, -7.2928466796875, -7.06884765625, -6.8448486328125, -6.620849609375, -6.3968505859375, -6.1728515625, -5.9488525390625, -5.724853515625, -5.5008544921875, -5.27685546875, -5.0528564453125, -4.828857421875, -4.6048583984375, -4.380859375, -4.1568603515625, -3.932861328125, -3.7088623046875, -3.48486328125, -3.2608642578125, -3.036865234375, -2.8128662109375, -2.5888671875, -2.3648681640625, -2.140869140625, -1.9168701171875, -1.69287109375, -1.4688720703125, -1.244873046875, -1.0208740234375, -0.796875, -0.5728759765625, -0.348876953125, -0.1248779296875, 0.09912109375, 0.3231201171875, 0.547119140625, 0.7711181640625, 0.9951171875, 1.2191162109375, 1.443115234375, 1.6671142578125, 1.89111328125, 2.1151123046875, 2.339111328125, 2.5631103515625, 2.787109375, 3.0111083984375, 3.235107421875, 3.4591064453125, 3.68310546875, 3.9071044921875, 4.131103515625, 4.3551025390625, 4.5791015625, 4.8031005859375, 5.027099609375, 5.2510986328125, 5.47509765625, 5.6990966796875, 5.923095703125, 6.1470947265625, 6.37109375]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 2.0, 6.0, 4.0, 10.0, 13.0, 15.0, 16.0, 33.0, 51.0, 91.0, 182.0, 491.0, 1129.0, 1121.0, 487.0, 174.0, 87.0, 37.0, 33.0, 21.0, 13.0, 8.0, 14.0, 4.0, 4.0, 2.0, 4.0, 2.0, 1.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9853515625, -0.9563369750976562, -0.9273223876953125, -0.8983078002929688, -0.869293212890625, -0.8402786254882812, -0.8112640380859375, -0.7822494506835938, -0.75323486328125, -0.7242202758789062, -0.6952056884765625, -0.6661911010742188, -0.637176513671875, -0.6081619262695312, -0.5791473388671875, -0.5501327514648438, -0.5211181640625, -0.49210357666015625, -0.4630889892578125, -0.43407440185546875, -0.405059814453125, -0.37604522705078125, -0.3470306396484375, -0.31801605224609375, -0.28900146484375, -0.25998687744140625, -0.2309722900390625, -0.20195770263671875, -0.172943115234375, -0.14392852783203125, -0.1149139404296875, -0.08589935302734375, -0.056884765625, -0.02787017822265625, 0.0011444091796875, 0.03015899658203125, 0.059173583984375, 0.08818817138671875, 0.1172027587890625, 0.14621734619140625, 0.17523193359375, 0.20424652099609375, 0.2332611083984375, 0.26227569580078125, 0.291290283203125, 0.32030487060546875, 0.3493194580078125, 0.37833404541015625, 0.4073486328125, 0.43636322021484375, 0.4653778076171875, 0.49439239501953125, 0.523406982421875, 0.5524215698242188, 0.5814361572265625, 0.6104507446289062, 0.63946533203125, 0.6684799194335938, 0.6974945068359375, 0.7265090942382812, 0.755523681640625, 0.7845382690429688, 0.8135528564453125, 0.8425674438476562, 0.87158203125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 3.0, 4.0, 5.0, 7.0, 8.0, 7.0, 22.0, 29.0, 52.0, 91.0, 107.0, 120.0, 165.0, 132.0, 77.0, 62.0, 39.0, 24.0, 18.0, 7.0, 8.0, 3.0, 7.0, 2.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.905581474304199, -3.803659677505493, -3.701737880706787, -3.59981632232666, -3.497894525527954, -3.395972728729248, -3.294050931930542, -3.192129135131836, -3.090207576751709, -2.988285779953003, -2.886363983154297, -2.78444242477417, -2.682520627975464, -2.580598831176758, -2.4786770343780518, -2.3767552375793457, -2.2748334407806396, -2.1729116439819336, -2.0709898471832275, -1.969068169593811, -1.8671464920043945, -1.7652246952056885, -1.6633028984069824, -1.5613811016082764, -1.4594594240188599, -1.3575376272201538, -1.2556159496307373, -1.1536941528320312, -1.0517723560333252, -0.9498506784439087, -0.8479288816452026, -0.7460071444511414, -0.6440856456756592, -0.5421639084815979, -0.44024214148521423, -0.33832037448883057, -0.2363986372947693, -0.134476900100708, -0.03255510330200195, 0.06936663389205933, 0.1712883710861206, 0.2732101082801819, 0.37513187527656555, 0.4770536422729492, 0.5789753794670105, 0.6808971166610718, 0.7828189134597778, 0.8847406506538391, 0.9866623878479004, 1.0885841846466064, 1.190505862236023, 1.292427659034729, 1.3943493366241455, 1.4962711334228516, 1.5981929302215576, 1.7001147270202637, 1.8020364046096802, 1.9039582014083862, 2.0058798789978027, 2.107801675796509, 2.209723472595215, 2.311645030975342, 2.413567066192627, 2.515488624572754, 2.61741042137146]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 4.0, 1.0, 6.0, 14.0, 23.0, 18.0, 22.0, 28.0, 30.0, 38.0, 45.0, 41.0, 51.0, 57.0, 51.0, 62.0, 59.0, 53.0, 61.0, 51.0, 59.0, 42.0, 31.0, 26.0, 28.0, 26.0, 13.0, 9.0, 14.0, 9.0, 8.0, 8.0, 5.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.178774833679199, -2.117802858352661, -2.056831121444702, -1.9958592653274536, -1.934887409210205, -1.873915433883667, -1.8129435777664185, -1.75197172164917, -1.6909998655319214, -1.6300280094146729, -1.5690561532974243, -1.5080842971801758, -1.4471123218536377, -1.3861405849456787, -1.3251686096191406, -1.264196753501892, -1.2032248973846436, -1.142253041267395, -1.0812811851501465, -1.020309329032898, -0.9593374133110046, -0.8983655571937561, -0.8373936414718628, -0.7764217853546143, -0.7154499292373657, -0.6544780731201172, -0.5935062170028687, -0.5325343012809753, -0.4715624451637268, -0.41059058904647827, -0.34961870312690735, -0.2886468172073364, -0.22767508029937744, -0.1667032092809677, -0.10573133826255798, -0.044759467244148254, 0.016212403774261475, 0.07718425989151001, 0.13815614581108093, 0.19912803173065186, 0.2600998878479004, 0.3210717439651489, 0.38204362988471985, 0.44301551580429077, 0.5039873719215393, 0.5649592280387878, 0.6259311437606812, 0.6869029998779297, 0.7478748559951782, 0.8088467121124268, 0.8698185682296753, 0.9307904839515686, 0.9917623400688171, 1.052734136581421, 1.113706111907959, 1.1746779680252075, 1.235649824142456, 1.2966216802597046, 1.3575935363769531, 1.4185653924942017, 1.4795372486114502, 1.5405092239379883, 1.6014810800552368, 1.6624529361724854, 1.7234247922897339]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 0.0, 2.0, 3.0, 1.0, 2.0, 5.0, 7.0, 13.0, 8.0, 7.0, 12.0, 9.0, 14.0, 22.0, 27.0, 61.0, 150.0, 373.0, 1375.0, 6529.0, 45116.0, 869081.0, 110698.0, 11702.0, 2314.0, 575.0, 206.0, 81.0, 34.0, 27.0, 19.0, 19.0, 9.0, 5.0, 13.0, 4.0, 6.0, 4.0, 5.0, 0.0, 1.0, 7.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.169921875, -2.10546875, -2.041015625, -1.9765625, -1.912109375, -1.84765625, -1.783203125, -1.71875, -1.654296875, -1.58984375, -1.525390625, -1.4609375, -1.396484375, -1.33203125, -1.267578125, -1.203125, -1.138671875, -1.07421875, -1.009765625, -0.9453125, -0.880859375, -0.81640625, -0.751953125, -0.6875, -0.623046875, -0.55859375, -0.494140625, -0.4296875, -0.365234375, -0.30078125, -0.236328125, -0.171875, -0.107421875, -0.04296875, 0.021484375, 0.0859375, 0.150390625, 0.21484375, 0.279296875, 0.34375, 0.408203125, 0.47265625, 0.537109375, 0.6015625, 0.666015625, 0.73046875, 0.794921875, 0.859375, 0.923828125, 0.98828125, 1.052734375, 1.1171875, 1.181640625, 1.24609375, 1.310546875, 1.375, 1.439453125, 1.50390625, 1.568359375, 1.6328125, 1.697265625, 1.76171875, 1.826171875, 1.890625, 1.955078125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 5.0, 10.0, 21.0, 50.0, 69.0, 83.0, 109.0, 147.0, 121.0, 139.0, 106.0, 67.0, 32.0, 20.0, 13.0, 11.0, 0.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6845703125, -1.6005096435546875, -1.516448974609375, -1.4323883056640625, -1.34832763671875, -1.2642669677734375, -1.180206298828125, -1.0961456298828125, -1.0120849609375, -0.9280242919921875, -0.843963623046875, -0.7599029541015625, -0.67584228515625, -0.5917816162109375, -0.507720947265625, -0.4236602783203125, -0.339599609375, -0.2555389404296875, -0.171478271484375, -0.0874176025390625, -0.00335693359375, 0.0807037353515625, 0.164764404296875, 0.2488250732421875, 0.3328857421875, 0.4169464111328125, 0.501007080078125, 0.5850677490234375, 0.66912841796875, 0.7531890869140625, 0.837249755859375, 0.9213104248046875, 1.00537109375, 1.0894317626953125, 1.173492431640625, 1.2575531005859375, 1.34161376953125, 1.4256744384765625, 1.509735107421875, 1.5937957763671875, 1.6778564453125, 1.7619171142578125, 1.845977783203125, 1.9300384521484375, 2.01409912109375, 2.0981597900390625, 2.182220458984375, 2.2662811279296875, 2.350341796875, 2.4344024658203125, 2.518463134765625, 2.6025238037109375, 2.68658447265625, 2.7706451416015625, 2.854705810546875, 2.9387664794921875, 3.0228271484375, 3.1068878173828125, 3.190948486328125, 3.2750091552734375, 3.35906982421875, 3.4431304931640625, 3.527191162109375, 3.6112518310546875, 3.6953125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 6.0, 4.0, 8.0, 6.0, 13.0, 26.0, 33.0, 55.0, 108.0, 194.0, 283.0, 467.0, 888.0, 1692.0, 3450.0, 7705.0, 18884.0, 57623.0, 342602.0, 499653.0, 74893.0, 22619.0, 8974.0, 4054.0, 1952.0, 1006.0, 555.0, 311.0, 178.0, 123.0, 76.0, 48.0, 30.0, 14.0, 12.0, 6.0, 5.0, 5.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51318359375, -0.49554443359375, -0.4779052734375, -0.46026611328125, -0.442626953125, -0.42498779296875, -0.4073486328125, -0.38970947265625, -0.3720703125, -0.35443115234375, -0.3367919921875, -0.31915283203125, -0.301513671875, -0.28387451171875, -0.2662353515625, -0.24859619140625, -0.23095703125, -0.21331787109375, -0.1956787109375, -0.17803955078125, -0.160400390625, -0.14276123046875, -0.1251220703125, -0.10748291015625, -0.08984375, -0.07220458984375, -0.0545654296875, -0.03692626953125, -0.019287109375, -0.00164794921875, 0.0159912109375, 0.03363037109375, 0.05126953125, 0.06890869140625, 0.0865478515625, 0.10418701171875, 0.121826171875, 0.13946533203125, 0.1571044921875, 0.17474365234375, 0.1923828125, 0.21002197265625, 0.2276611328125, 0.24530029296875, 0.262939453125, 0.28057861328125, 0.2982177734375, 0.31585693359375, 0.33349609375, 0.35113525390625, 0.3687744140625, 0.38641357421875, 0.404052734375, 0.42169189453125, 0.4393310546875, 0.45697021484375, 0.474609375, 0.49224853515625, 0.5098876953125, 0.52752685546875, 0.545166015625, 0.56280517578125, 0.5804443359375, 0.59808349609375, 0.61572265625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 5.0, 5.0, 3.0, 14.0, 6.0, 8.0, 17.0, 17.0, 20.0, 15.0, 32.0, 40.0, 28.0, 38.0, 41.0, 46.0, 56.0, 48.0, 59.0, 53.0, 63.0, 52.0, 50.0, 44.0, 32.0, 49.0, 35.0, 20.0, 14.0, 19.0, 16.0, 9.0, 13.0, 12.0, 6.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.8896484375, -1.8306121826171875, -1.771575927734375, -1.7125396728515625, -1.65350341796875, -1.5944671630859375, -1.535430908203125, -1.4763946533203125, -1.4173583984375, -1.3583221435546875, -1.299285888671875, -1.2402496337890625, -1.18121337890625, -1.1221771240234375, -1.063140869140625, -1.0041046142578125, -0.945068359375, -0.8860321044921875, -0.826995849609375, -0.7679595947265625, -0.70892333984375, -0.6498870849609375, -0.590850830078125, -0.5318145751953125, -0.4727783203125, -0.4137420654296875, -0.354705810546875, -0.2956695556640625, -0.23663330078125, -0.1775970458984375, -0.118560791015625, -0.0595245361328125, -0.00048828125, 0.0585479736328125, 0.117584228515625, 0.1766204833984375, 0.23565673828125, 0.2946929931640625, 0.353729248046875, 0.4127655029296875, 0.4718017578125, 0.5308380126953125, 0.589874267578125, 0.6489105224609375, 0.70794677734375, 0.7669830322265625, 0.826019287109375, 0.8850555419921875, 0.944091796875, 1.0031280517578125, 1.062164306640625, 1.1212005615234375, 1.18023681640625, 1.2392730712890625, 1.298309326171875, 1.3573455810546875, 1.4163818359375, 1.4754180908203125, 1.534454345703125, 1.5934906005859375, 1.65252685546875, 1.7115631103515625, 1.770599365234375, 1.8296356201171875, 1.888671875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 3.0, 4.0, 8.0, 8.0, 16.0, 31.0, 37.0, 63.0, 106.0, 156.0, 286.0, 596.0, 1201.0, 2601.0, 7436.0, 25906.0, 168115.0, 743987.0, 73165.0, 15769.0, 5096.0, 1961.0, 868.0, 465.0, 243.0, 163.0, 83.0, 53.0, 39.0, 23.0, 23.0, 15.0, 12.0, 5.0, 4.0, 4.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15478515625, -0.149505615234375, -0.14422607421875, -0.138946533203125, -0.1336669921875, -0.128387451171875, -0.12310791015625, -0.117828369140625, -0.112548828125, -0.107269287109375, -0.10198974609375, -0.096710205078125, -0.0914306640625, -0.086151123046875, -0.08087158203125, -0.075592041015625, -0.0703125, -0.065032958984375, -0.05975341796875, -0.054473876953125, -0.0491943359375, -0.043914794921875, -0.03863525390625, -0.033355712890625, -0.028076171875, -0.022796630859375, -0.01751708984375, -0.012237548828125, -0.0069580078125, -0.001678466796875, 0.00360107421875, 0.008880615234375, 0.01416015625, 0.019439697265625, 0.02471923828125, 0.029998779296875, 0.0352783203125, 0.040557861328125, 0.04583740234375, 0.051116943359375, 0.056396484375, 0.061676025390625, 0.06695556640625, 0.072235107421875, 0.0775146484375, 0.082794189453125, 0.08807373046875, 0.093353271484375, 0.0986328125, 0.103912353515625, 0.10919189453125, 0.114471435546875, 0.1197509765625, 0.125030517578125, 0.13031005859375, 0.135589599609375, 0.140869140625, 0.146148681640625, 0.15142822265625, 0.156707763671875, 0.1619873046875, 0.167266845703125, 0.17254638671875, 0.177825927734375, 0.18310546875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 2.0, 5.0, 6.0, 8.0, 8.0, 9.0, 24.0, 36.0, 54.0, 91.0, 203.0, 250.0, 110.0, 73.0, 39.0, 22.0, 17.0, 13.0, 11.0, 4.0, 4.0, 7.0, 3.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001537799835205078, -0.00014941394329071045, -0.00014504790306091309, -0.00014068186283111572, -0.00013631582260131836, -0.000131949782371521, -0.00012758374214172363, -0.00012321770191192627, -0.0001188516616821289, -0.00011448562145233154, -0.00011011958122253418, -0.00010575354099273682, -0.00010138750076293945, -9.702146053314209e-05, -9.265542030334473e-05, -8.828938007354736e-05, -8.392333984375e-05, -7.955729961395264e-05, -7.519125938415527e-05, -7.082521915435791e-05, -6.645917892456055e-05, -6.209313869476318e-05, -5.772709846496582e-05, -5.336105823516846e-05, -4.8995018005371094e-05, -4.462897777557373e-05, -4.026293754577637e-05, -3.5896897315979004e-05, -3.153085708618164e-05, -2.7164816856384277e-05, -2.2798776626586914e-05, -1.843273639678955e-05, -1.4066696166992188e-05, -9.700655937194824e-06, -5.334615707397461e-06, -9.685754776000977e-07, 3.3974647521972656e-06, 7.763504981994629e-06, 1.2129545211791992e-05, 1.6495585441589355e-05, 2.086162567138672e-05, 2.5227665901184082e-05, 2.9593706130981445e-05, 3.395974636077881e-05, 3.832578659057617e-05, 4.2691826820373535e-05, 4.70578670501709e-05, 5.142390727996826e-05, 5.5789947509765625e-05, 6.015598773956299e-05, 6.452202796936035e-05, 6.888806819915771e-05, 7.325410842895508e-05, 7.762014865875244e-05, 8.19861888885498e-05, 8.635222911834717e-05, 9.071826934814453e-05, 9.50843095779419e-05, 9.945034980773926e-05, 0.00010381639003753662, 0.00010818243026733398, 0.00011254847049713135, 0.00011691451072692871, 0.00012128055095672607, 0.00012564659118652344]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 3.0, 2.0, 9.0, 2.0, 10.0, 17.0, 18.0, 24.0, 41.0, 55.0, 102.0, 195.0, 371.0, 846.0, 1875.0, 4724.0, 14013.0, 60315.0, 637229.0, 279206.0, 33879.0, 9400.0, 3490.0, 1362.0, 650.0, 323.0, 156.0, 74.0, 66.0, 32.0, 16.0, 18.0, 12.0, 8.0, 7.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1912841796875, -0.1859455108642578, -0.18060684204101562, -0.17526817321777344, -0.16992950439453125, -0.16459083557128906, -0.15925216674804688, -0.1539134979248047, -0.1485748291015625, -0.1432361602783203, -0.13789749145507812, -0.13255882263183594, -0.12722015380859375, -0.12188148498535156, -0.11654281616210938, -0.11120414733886719, -0.105865478515625, -0.10052680969238281, -0.09518814086914062, -0.08984947204589844, -0.08451080322265625, -0.07917213439941406, -0.07383346557617188, -0.06849479675292969, -0.0631561279296875, -0.05781745910644531, -0.052478790283203125, -0.04714012145996094, -0.04180145263671875, -0.03646278381347656, -0.031124114990234375, -0.025785446166992188, -0.02044677734375, -0.015108108520507812, -0.009769439697265625, -0.0044307708740234375, 0.00090789794921875, 0.0062465667724609375, 0.011585235595703125, 0.016923904418945312, 0.0222625732421875, 0.027601242065429688, 0.032939910888671875, 0.03827857971191406, 0.04361724853515625, 0.04895591735839844, 0.054294586181640625, 0.05963325500488281, 0.064971923828125, 0.07031059265136719, 0.07564926147460938, 0.08098793029785156, 0.08632659912109375, 0.09166526794433594, 0.09700393676757812, 0.10234260559082031, 0.1076812744140625, 0.11301994323730469, 0.11835861206054688, 0.12369728088378906, 0.12903594970703125, 0.13437461853027344, 0.13971328735351562, 0.1450519561767578, 0.150390625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 4.0, 6.0, 1.0, 7.0, 10.0, 5.0, 20.0, 24.0, 41.0, 36.0, 57.0, 67.0, 70.0, 116.0, 144.0, 95.0, 60.0, 61.0, 37.0, 29.0, 18.0, 17.0, 15.0, 9.0, 7.0, 8.0, 7.0, 5.0, 5.0, 4.0, 6.0, 0.0, 0.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0290069580078125, -0.028013944625854492, -0.027020931243896484, -0.026027917861938477, -0.02503490447998047, -0.02404189109802246, -0.023048877716064453, -0.022055864334106445, -0.021062850952148438, -0.02006983757019043, -0.019076824188232422, -0.018083810806274414, -0.017090797424316406, -0.0160977840423584, -0.01510477066040039, -0.014111757278442383, -0.013118743896484375, -0.012125730514526367, -0.01113271713256836, -0.010139703750610352, -0.009146690368652344, -0.008153676986694336, -0.007160663604736328, -0.00616765022277832, -0.0051746368408203125, -0.004181623458862305, -0.003188610076904297, -0.002195596694946289, -0.0012025833129882812, -0.00020956993103027344, 0.0007834434509277344, 0.0017764568328857422, 0.00276947021484375, 0.003762483596801758, 0.004755496978759766, 0.0057485103607177734, 0.006741523742675781, 0.007734537124633789, 0.008727550506591797, 0.009720563888549805, 0.010713577270507812, 0.01170659065246582, 0.012699604034423828, 0.013692617416381836, 0.014685630798339844, 0.01567864418029785, 0.01667165756225586, 0.017664670944213867, 0.018657684326171875, 0.019650697708129883, 0.02064371109008789, 0.0216367244720459, 0.022629737854003906, 0.023622751235961914, 0.024615764617919922, 0.02560877799987793, 0.026601791381835938, 0.027594804763793945, 0.028587818145751953, 0.02958083152770996, 0.03057384490966797, 0.03156685829162598, 0.032559871673583984, 0.03355288505554199, 0.0345458984375]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 8.0, 16.0, 23.0, 63.0, 137.0, 276.0, 243.0, 123.0, 58.0, 29.0, 13.0, 6.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.240875244140625, -4.134738445281982, -4.02860164642334, -3.922464609146118, -3.8163275718688965, -3.710190773010254, -3.6040539741516113, -3.4979169368743896, -3.391779899597168, -3.2856431007385254, -3.1795060634613037, -3.073369264602661, -2.9672322273254395, -2.861095428466797, -2.7549586296081543, -2.6488215923309326, -2.54268479347229, -2.4365479946136475, -2.330410957336426, -2.224274158477783, -2.1181371212005615, -2.012000322341919, -1.9058634042739868, -1.7997264862060547, -1.6935895681381226, -1.5874526500701904, -1.4813157320022583, -1.3751788139343262, -1.2690420150756836, -1.162904977798462, -1.0567681789398193, -0.9506312608718872, -0.8444943428039551, -0.738357424736023, -0.6322205066680908, -0.5260836482048035, -0.41994673013687134, -0.3138098120689392, -0.20767295360565186, -0.10153603553771973, 0.004600882530212402, 0.11073778569698334, 0.21687468886375427, 0.323011577129364, 0.42914849519729614, 0.5352854132652283, 0.6414222717285156, 0.7475591897964478, 0.8536961078643799, 0.959833025932312, 1.0659699440002441, 1.1721067428588867, 1.2782437801361084, 1.384380578994751, 1.490517497062683, 1.5966544151306152, 1.7027913331985474, 1.8089282512664795, 1.9150651693344116, 2.0212020874023438, 2.1273388862609863, 2.233475923538208, 2.3396127223968506, 2.4457497596740723, 2.551886558532715]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 6.0, 12.0, 14.0, 47.0, 55.0, 80.0, 107.0, 117.0, 125.0, 130.0, 111.0, 79.0, 50.0, 28.0, 20.0, 14.0, 10.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5628656148910522, -1.4866338968276978, -1.4104021787643433, -1.3341704607009888, -1.2579387426376343, -1.1817070245742798, -1.1054753065109253, -1.0292435884475708, -0.9530118703842163, -0.8767801523208618, -0.8005484342575073, -0.7243167161941528, -0.6480849981307983, -0.5718532800674438, -0.49562156200408936, -0.41938984394073486, -0.34315812587738037, -0.2669264078140259, -0.1906946897506714, -0.1144629716873169, -0.0382312536239624, 0.03800046443939209, 0.11423218250274658, 0.19046390056610107, 0.26669561862945557, 0.34292733669281006, 0.41915905475616455, 0.49539077281951904, 0.5716224908828735, 0.647854208946228, 0.7240859270095825, 0.800317645072937, 0.876549243927002, 0.9527809619903564, 1.029012680053711, 1.1052443981170654, 1.18147611618042, 1.2577078342437744, 1.333939552307129, 1.4101712703704834, 1.486402988433838, 1.5626347064971924, 1.6388664245605469, 1.7150981426239014, 1.7913298606872559, 1.8675615787506104, 1.9437932968139648, 2.0200250148773193, 2.096256732940674, 2.1724884510040283, 2.248720169067383, 2.3249518871307373, 2.401183605194092, 2.4774153232574463, 2.553647041320801, 2.6298787593841553, 2.7061104774475098, 2.7823421955108643, 2.8585739135742188, 2.9348056316375732, 3.0110373497009277, 3.0872690677642822, 3.1635007858276367, 3.239732503890991, 3.3159642219543457]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 2.0, 3.0, 2.0, 5.0, 3.0, 2.0, 1.0, 0.0, 5.0, 8.0, 16.0, 32.0, 118.0, 469.0, 1653.0, 7448.0, 112744.0, 908152.0, 14005.0, 2856.0, 703.0, 209.0, 54.0, 16.0, 14.0, 8.0, 8.0, 3.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9453125, -4.7916259765625, -4.637939453125, -4.4842529296875, -4.33056640625, -4.1768798828125, -4.023193359375, -3.8695068359375, -3.7158203125, -3.5621337890625, -3.408447265625, -3.2547607421875, -3.10107421875, -2.9473876953125, -2.793701171875, -2.6400146484375, -2.486328125, -2.3326416015625, -2.178955078125, -2.0252685546875, -1.87158203125, -1.7178955078125, -1.564208984375, -1.4105224609375, -1.2568359375, -1.1031494140625, -0.949462890625, -0.7957763671875, -0.64208984375, -0.4884033203125, -0.334716796875, -0.1810302734375, -0.02734375, 0.1263427734375, 0.280029296875, 0.4337158203125, 0.58740234375, 0.7410888671875, 0.894775390625, 1.0484619140625, 1.2021484375, 1.3558349609375, 1.509521484375, 1.6632080078125, 1.81689453125, 1.9705810546875, 2.124267578125, 2.2779541015625, 2.431640625, 2.5853271484375, 2.739013671875, 2.8927001953125, 3.04638671875, 3.2000732421875, 3.353759765625, 3.5074462890625, 3.6611328125, 3.8148193359375, 3.968505859375, 4.1221923828125, 4.27587890625, 4.4295654296875, 4.583251953125, 4.7369384765625, 4.890625]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [7.0, 4.0, 6.0, 9.0, 8.0, 9.0, 29.0, 22.0, 44.0, 58.0, 58.0, 78.0, 90.0, 94.0, 94.0, 88.0, 64.0, 73.0, 55.0, 37.0, 28.0, 19.0, 14.0, 12.0, 10.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.650390625, -1.532684326171875, -1.41497802734375, -1.297271728515625, -1.1795654296875, -1.061859130859375, -0.94415283203125, -0.826446533203125, -0.708740234375, -0.591033935546875, -0.47332763671875, -0.355621337890625, -0.2379150390625, -0.120208740234375, -0.00250244140625, 0.115203857421875, 0.23291015625, 0.350616455078125, 0.46832275390625, 0.586029052734375, 0.7037353515625, 0.821441650390625, 0.93914794921875, 1.056854248046875, 1.174560546875, 1.292266845703125, 1.40997314453125, 1.527679443359375, 1.6453857421875, 1.763092041015625, 1.88079833984375, 1.998504638671875, 2.1162109375, 2.233917236328125, 2.35162353515625, 2.469329833984375, 2.5870361328125, 2.704742431640625, 2.82244873046875, 2.940155029296875, 3.057861328125, 3.175567626953125, 3.29327392578125, 3.410980224609375, 3.5286865234375, 3.646392822265625, 3.76409912109375, 3.881805419921875, 3.99951171875, 4.117218017578125, 4.23492431640625, 4.352630615234375, 4.4703369140625, 4.588043212890625, 4.70574951171875, 4.823455810546875, 4.941162109375, 5.058868408203125, 5.17657470703125, 5.294281005859375, 5.4119873046875, 5.529693603515625, 5.64739990234375, 5.765106201171875, 5.8828125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 7.0, 1.0, 5.0, 2.0, 2.0, 6.0, 6.0, 8.0, 6.0, 9.0, 13.0, 17.0, 11.0, 20.0, 27.0, 27.0, 32.0, 46.0, 41.0, 55.0, 71.0, 189.0, 754.0, 11338.0, 1022694.0, 11897.0, 708.0, 140.0, 76.0, 38.0, 46.0, 38.0, 33.0, 20.0, 30.0, 29.0, 12.0, 16.0, 15.0, 15.0, 12.0, 11.0, 13.0, 4.0, 9.0, 4.0, 2.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.1171875, -6.8839111328125, -6.650634765625, -6.4173583984375, -6.18408203125, -5.9508056640625, -5.717529296875, -5.4842529296875, -5.2509765625, -5.0177001953125, -4.784423828125, -4.5511474609375, -4.31787109375, -4.0845947265625, -3.851318359375, -3.6180419921875, -3.384765625, -3.1514892578125, -2.918212890625, -2.6849365234375, -2.45166015625, -2.2183837890625, -1.985107421875, -1.7518310546875, -1.5185546875, -1.2852783203125, -1.052001953125, -0.8187255859375, -0.58544921875, -0.3521728515625, -0.118896484375, 0.1143798828125, 0.34765625, 0.5809326171875, 0.814208984375, 1.0474853515625, 1.28076171875, 1.5140380859375, 1.747314453125, 1.9805908203125, 2.2138671875, 2.4471435546875, 2.680419921875, 2.9136962890625, 3.14697265625, 3.3802490234375, 3.613525390625, 3.8468017578125, 4.080078125, 4.3133544921875, 4.546630859375, 4.7799072265625, 5.01318359375, 5.2464599609375, 5.479736328125, 5.7130126953125, 5.9462890625, 6.1795654296875, 6.412841796875, 6.6461181640625, 6.87939453125, 7.1126708984375, 7.345947265625, 7.5792236328125, 7.8125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 2.0, 2.0, 6.0, 2.0, 2.0, 8.0, 7.0, 1.0, 10.0, 4.0, 9.0, 14.0, 18.0, 24.0, 15.0, 17.0, 16.0, 22.0, 44.0, 35.0, 25.0, 41.0, 34.0, 32.0, 32.0, 41.0, 39.0, 50.0, 40.0, 35.0, 37.0, 37.0, 28.0, 34.0, 29.0, 22.0, 29.0, 29.0, 17.0, 15.0, 15.0, 14.0, 9.0, 14.0, 16.0, 11.0, 5.0, 8.0, 5.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.615234375, -1.5607757568359375, -1.506317138671875, -1.4518585205078125, -1.39739990234375, -1.3429412841796875, -1.288482666015625, -1.2340240478515625, -1.1795654296875, -1.1251068115234375, -1.070648193359375, -1.0161895751953125, -0.96173095703125, -0.9072723388671875, -0.852813720703125, -0.7983551025390625, -0.743896484375, -0.6894378662109375, -0.634979248046875, -0.5805206298828125, -0.52606201171875, -0.4716033935546875, -0.417144775390625, -0.3626861572265625, -0.3082275390625, -0.2537689208984375, -0.199310302734375, -0.1448516845703125, -0.09039306640625, -0.0359344482421875, 0.018524169921875, 0.0729827880859375, 0.12744140625, 0.1819000244140625, 0.236358642578125, 0.2908172607421875, 0.34527587890625, 0.3997344970703125, 0.454193115234375, 0.5086517333984375, 0.5631103515625, 0.6175689697265625, 0.672027587890625, 0.7264862060546875, 0.78094482421875, 0.8354034423828125, 0.889862060546875, 0.9443206787109375, 0.998779296875, 1.0532379150390625, 1.107696533203125, 1.1621551513671875, 1.21661376953125, 1.2710723876953125, 1.325531005859375, 1.3799896240234375, 1.4344482421875, 1.4889068603515625, 1.543365478515625, 1.5978240966796875, 1.65228271484375, 1.7067413330078125, 1.761199951171875, 1.8156585693359375, 1.8701171875]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 6.0, 2.0, 4.0, 10.0, 12.0, 19.0, 24.0, 26.0, 36.0, 52.0, 58.0, 134.0, 245.0, 435.0, 959.0, 2551.0, 8551.0, 53586.0, 910460.0, 57741.0, 8911.0, 2646.0, 1007.0, 468.0, 220.0, 132.0, 74.0, 46.0, 31.0, 32.0, 17.0, 14.0, 12.0, 5.0, 6.0, 13.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0], "bins": [-0.6025390625, -0.5860366821289062, -0.5695343017578125, -0.5530319213867188, -0.536529541015625, -0.5200271606445312, -0.5035247802734375, -0.48702239990234375, -0.47052001953125, -0.45401763916015625, -0.4375152587890625, -0.42101287841796875, -0.404510498046875, -0.38800811767578125, -0.3715057373046875, -0.35500335693359375, -0.3385009765625, -0.32199859619140625, -0.3054962158203125, -0.28899383544921875, -0.272491455078125, -0.25598907470703125, -0.2394866943359375, -0.22298431396484375, -0.20648193359375, -0.18997955322265625, -0.1734771728515625, -0.15697479248046875, -0.140472412109375, -0.12397003173828125, -0.1074676513671875, -0.09096527099609375, -0.074462890625, -0.05796051025390625, -0.0414581298828125, -0.02495574951171875, -0.008453369140625, 0.00804901123046875, 0.0245513916015625, 0.04105377197265625, 0.05755615234375, 0.07405853271484375, 0.0905609130859375, 0.10706329345703125, 0.123565673828125, 0.14006805419921875, 0.1565704345703125, 0.17307281494140625, 0.1895751953125, 0.20607757568359375, 0.2225799560546875, 0.23908233642578125, 0.255584716796875, 0.27208709716796875, 0.2885894775390625, 0.30509185791015625, 0.32159423828125, 0.33809661865234375, 0.3545989990234375, 0.37110137939453125, 0.387603759765625, 0.40410614013671875, 0.4206085205078125, 0.43711090087890625, 0.45361328125]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 8.0, 6.0, 8.0, 13.0, 12.0, 15.0, 21.0, 44.0, 95.0, 194.0, 307.0, 100.0, 63.0, 29.0, 14.0, 18.0, 17.0, 7.0, 7.0, 6.0, 1.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.296966552734375e-05, -8.079409599304199e-05, -7.861852645874023e-05, -7.644295692443848e-05, -7.426738739013672e-05, -7.209181785583496e-05, -6.99162483215332e-05, -6.774067878723145e-05, -6.556510925292969e-05, -6.338953971862793e-05, -6.121397018432617e-05, -5.9038400650024414e-05, -5.6862831115722656e-05, -5.46872615814209e-05, -5.251169204711914e-05, -5.033612251281738e-05, -4.8160552978515625e-05, -4.598498344421387e-05, -4.380941390991211e-05, -4.163384437561035e-05, -3.9458274841308594e-05, -3.7282705307006836e-05, -3.510713577270508e-05, -3.293156623840332e-05, -3.075599670410156e-05, -2.8580427169799805e-05, -2.6404857635498047e-05, -2.422928810119629e-05, -2.205371856689453e-05, -1.9878149032592773e-05, -1.7702579498291016e-05, -1.5527009963989258e-05, -1.33514404296875e-05, -1.1175870895385742e-05, -9.000301361083984e-06, -6.8247318267822266e-06, -4.649162292480469e-06, -2.473592758178711e-06, -2.980232238769531e-07, 1.8775463104248047e-06, 4.0531158447265625e-06, 6.22868537902832e-06, 8.404254913330078e-06, 1.0579824447631836e-05, 1.2755393981933594e-05, 1.4930963516235352e-05, 1.710653305053711e-05, 1.9282102584838867e-05, 2.1457672119140625e-05, 2.3633241653442383e-05, 2.580881118774414e-05, 2.79843807220459e-05, 3.0159950256347656e-05, 3.2335519790649414e-05, 3.451108932495117e-05, 3.668665885925293e-05, 3.886222839355469e-05, 4.1037797927856445e-05, 4.32133674621582e-05, 4.538893699645996e-05, 4.756450653076172e-05, 4.9740076065063477e-05, 5.1915645599365234e-05, 5.409121513366699e-05, 5.626678466796875e-05]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 2.0, 3.0, 13.0, 10.0, 10.0, 22.0, 24.0, 46.0, 77.0, 175.0, 375.0, 972.0, 3599.0, 20136.0, 871043.0, 138548.0, 10056.0, 2186.0, 690.0, 271.0, 129.0, 64.0, 41.0, 16.0, 9.0, 8.0, 9.0, 7.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.63671875, -0.6153640747070312, -0.5940093994140625, -0.5726547241210938, -0.551300048828125, -0.5299453735351562, -0.5085906982421875, -0.48723602294921875, -0.46588134765625, -0.44452667236328125, -0.4231719970703125, -0.40181732177734375, -0.380462646484375, -0.35910797119140625, -0.3377532958984375, -0.31639862060546875, -0.2950439453125, -0.27368927001953125, -0.2523345947265625, -0.23097991943359375, -0.209625244140625, -0.18827056884765625, -0.1669158935546875, -0.14556121826171875, -0.12420654296875, -0.10285186767578125, -0.0814971923828125, -0.06014251708984375, -0.038787841796875, -0.01743316650390625, 0.0039215087890625, 0.02527618408203125, 0.046630859375, 0.06798553466796875, 0.0893402099609375, 0.11069488525390625, 0.132049560546875, 0.15340423583984375, 0.1747589111328125, 0.19611358642578125, 0.21746826171875, 0.23882293701171875, 0.2601776123046875, 0.28153228759765625, 0.302886962890625, 0.32424163818359375, 0.3455963134765625, 0.36695098876953125, 0.3883056640625, 0.40966033935546875, 0.4310150146484375, 0.45236968994140625, 0.473724365234375, 0.49507904052734375, 0.5164337158203125, 0.5377883911132812, 0.55914306640625, 0.5804977416992188, 0.6018524169921875, 0.6232070922851562, 0.644561767578125, 0.6659164428710938, 0.6872711181640625, 0.7086257934570312, 0.72998046875]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 2.0, 2.0, 3.0, 3.0, 7.0, 6.0, 18.0, 15.0, 18.0, 42.0, 75.0, 156.0, 255.0, 138.0, 76.0, 44.0, 30.0, 22.0, 26.0, 13.0, 7.0, 7.0, 6.0, 6.0, 8.0, 3.0, 1.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2115478515625, -0.2054290771484375, -0.199310302734375, -0.1931915283203125, -0.18707275390625, -0.1809539794921875, -0.174835205078125, -0.1687164306640625, -0.16259765625, -0.1564788818359375, -0.150360107421875, -0.1442413330078125, -0.13812255859375, -0.1320037841796875, -0.125885009765625, -0.1197662353515625, -0.1136474609375, -0.1075286865234375, -0.101409912109375, -0.0952911376953125, -0.08917236328125, -0.0830535888671875, -0.076934814453125, -0.0708160400390625, -0.064697265625, -0.0585784912109375, -0.052459716796875, -0.0463409423828125, -0.04022216796875, -0.0341033935546875, -0.027984619140625, -0.0218658447265625, -0.0157470703125, -0.0096282958984375, -0.003509521484375, 0.0026092529296875, 0.00872802734375, 0.0148468017578125, 0.020965576171875, 0.0270843505859375, 0.033203125, 0.0393218994140625, 0.045440673828125, 0.0515594482421875, 0.05767822265625, 0.0637969970703125, 0.069915771484375, 0.0760345458984375, 0.0821533203125, 0.0882720947265625, 0.094390869140625, 0.1005096435546875, 0.10662841796875, 0.1127471923828125, 0.118865966796875, 0.1249847412109375, 0.131103515625, 0.1372222900390625, 0.143341064453125, 0.1494598388671875, 0.15557861328125, 0.1616973876953125, 0.167816162109375, 0.1739349365234375, 0.1800537109375]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 7.0, 9.0, 16.0, 13.0, 30.0, 45.0, 75.0, 168.0, 215.0, 163.0, 91.0, 64.0, 42.0, 20.0, 11.0, 9.0, 9.0, 8.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.364039421081543, -5.232263565063477, -5.10048770904541, -4.9687113761901855, -4.836935520172119, -4.705159664154053, -4.573383808135986, -4.44160795211792, -4.309831619262695, -4.178055763244629, -4.0462799072265625, -3.914503812789917, -3.7827277183532715, -3.650951862335205, -3.5191760063171387, -3.3874001502990723, -3.255624294281006, -3.1238484382629395, -2.992072343826294, -2.8602964878082275, -2.728520393371582, -2.5967445373535156, -2.464968681335449, -2.333192825317383, -2.2014167308807373, -2.069640874862671, -1.9378647804260254, -1.806088924407959, -1.674312949180603, -1.542536973953247, -1.4107611179351807, -1.2789851427078247, -1.1472094058990479, -1.015433430671692, -0.8836575150489807, -0.7518815994262695, -0.6201056241989136, -0.4883296489715576, -0.35655373334884644, -0.22477781772613525, -0.0930018424987793, 0.03877410292625427, 0.17055004835128784, 0.3023259937763214, 0.434101939201355, 0.5658779144287109, 0.6976538300514221, 0.8294297456741333, 0.9612057209014893, 1.0929816961288452, 1.2247576713562012, 1.3565335273742676, 1.4883095026016235, 1.6200854778289795, 1.751861333847046, 1.8836373090744019, 2.015413284301758, 2.147189140319824, 2.2789652347564697, 2.410741090774536, 2.5425171852111816, 2.674293041229248, 2.8060688972473145, 2.937844753265381, 3.0696208477020264]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 7.0, 3.0, 5.0, 4.0, 8.0, 14.0, 14.0, 16.0, 26.0, 32.0, 33.0, 40.0, 45.0, 51.0, 50.0, 50.0, 64.0, 67.0, 56.0, 45.0, 65.0, 50.0, 47.0, 35.0, 41.0, 33.0, 25.0, 24.0, 18.0, 11.0, 8.0, 5.0, 7.0, 4.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.515451192855835, -2.3930253982543945, -2.270599842071533, -2.148174285888672, -2.0257484912872314, -1.9033228158950806, -1.7808971405029297, -1.6584714651107788, -1.536045789718628, -1.413620114326477, -1.2911944389343262, -1.1687687635421753, -1.0463430881500244, -0.9239174127578735, -0.8014917373657227, -0.6790660619735718, -0.5566403865814209, -0.43421471118927, -0.31178903579711914, -0.18936336040496826, -0.06693768501281738, 0.055487990379333496, 0.17791366577148438, 0.30033934116363525, 0.42276501655578613, 0.545190691947937, 0.6676163673400879, 0.7900420427322388, 0.9124677181243896, 1.0348933935165405, 1.1573190689086914, 1.2797447443008423, 1.402170181274414, 1.524595856666565, 1.6470215320587158, 1.7694472074508667, 1.8918728828430176, 2.014298439025879, 2.1367242336273193, 2.2591500282287598, 2.381575584411621, 2.5040011405944824, 2.626426935195923, 2.7488527297973633, 2.8712782859802246, 2.993703842163086, 3.1161296367645264, 3.238555431365967, 3.360980987548828, 3.4834065437316895, 3.60583233833313, 3.7282581329345703, 3.8506836891174316, 3.973109245300293, 4.0955352783203125, 4.217960834503174, 4.340386390686035, 4.4628119468688965, 4.585237503051758, 4.707663536071777, 4.830089092254639, 4.9525146484375, 5.0749406814575195, 5.197366237640381, 5.319791793823242]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 5.0, 1.0, 5.0, 7.0, 14.0, 10.0, 14.0, 8.0, 16.0, 12.0, 18.0, 33.0, 42.0, 39.0, 79.0, 114.0, 241.0, 461.0, 1210.0, 5910.0, 2078111.0, 2099369.0, 6270.0, 1184.0, 467.0, 220.0, 143.0, 78.0, 41.0, 32.0, 25.0, 19.0, 23.0, 11.0, 10.0, 3.0, 2.0, 10.0, 3.0, 6.0, 5.0, 4.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.359375, -6.14739990234375, -5.9354248046875, -5.72344970703125, -5.511474609375, -5.29949951171875, -5.0875244140625, -4.87554931640625, -4.66357421875, -4.45159912109375, -4.2396240234375, -4.02764892578125, -3.815673828125, -3.60369873046875, -3.3917236328125, -3.17974853515625, -2.9677734375, -2.75579833984375, -2.5438232421875, -2.33184814453125, -2.119873046875, -1.90789794921875, -1.6959228515625, -1.48394775390625, -1.27197265625, -1.05999755859375, -0.8480224609375, -0.63604736328125, -0.424072265625, -0.21209716796875, -0.0001220703125, 0.21185302734375, 0.423828125, 0.63580322265625, 0.8477783203125, 1.05975341796875, 1.271728515625, 1.48370361328125, 1.6956787109375, 1.90765380859375, 2.11962890625, 2.33160400390625, 2.5435791015625, 2.75555419921875, 2.967529296875, 3.17950439453125, 3.3914794921875, 3.60345458984375, 3.8154296875, 4.02740478515625, 4.2393798828125, 4.45135498046875, 4.663330078125, 4.87530517578125, 5.0872802734375, 5.29925537109375, 5.51123046875, 5.72320556640625, 5.9351806640625, 6.14715576171875, 6.359130859375, 6.57110595703125, 6.7830810546875, 6.99505615234375, 7.20703125]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 5.0, 11.0, 8.0, 16.0, 16.0, 18.0, 28.0, 25.0, 41.0, 40.0, 49.0, 53.0, 63.0, 68.0, 68.0, 57.0, 60.0, 64.0, 57.0, 54.0, 34.0, 38.0, 27.0, 23.0, 20.0, 12.0, 11.0, 10.0, 11.0, 6.0, 5.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.880859375, -1.8299560546875, -1.779052734375, -1.7281494140625, -1.67724609375, -1.6263427734375, -1.575439453125, -1.5245361328125, -1.4736328125, -1.4227294921875, -1.371826171875, -1.3209228515625, -1.27001953125, -1.2191162109375, -1.168212890625, -1.1173095703125, -1.06640625, -1.0155029296875, -0.964599609375, -0.9136962890625, -0.86279296875, -0.8118896484375, -0.760986328125, -0.7100830078125, -0.6591796875, -0.6082763671875, -0.557373046875, -0.5064697265625, -0.45556640625, -0.4046630859375, -0.353759765625, -0.3028564453125, -0.251953125, -0.2010498046875, -0.150146484375, -0.0992431640625, -0.04833984375, 0.0025634765625, 0.053466796875, 0.1043701171875, 0.1552734375, 0.2061767578125, 0.257080078125, 0.3079833984375, 0.35888671875, 0.4097900390625, 0.460693359375, 0.5115966796875, 0.5625, 0.6134033203125, 0.664306640625, 0.7152099609375, 0.76611328125, 0.8170166015625, 0.867919921875, 0.9188232421875, 0.9697265625, 1.0206298828125, 1.071533203125, 1.1224365234375, 1.17333984375, 1.2242431640625, 1.275146484375, 1.3260498046875, 1.376953125]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 7.0, 6.0, 9.0, 14.0, 20.0, 66.0, 208.0, 1175.0, 3583173.0, 608237.0, 991.0, 192.0, 71.0, 39.0, 27.0, 9.0, 10.0, 5.0, 8.0, 3.0, 1.0, 1.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.3515625, -13.9027099609375, -13.453857421875, -13.0050048828125, -12.55615234375, -12.1072998046875, -11.658447265625, -11.2095947265625, -10.7607421875, -10.3118896484375, -9.863037109375, -9.4141845703125, -8.96533203125, -8.5164794921875, -8.067626953125, -7.6187744140625, -7.169921875, -6.7210693359375, -6.272216796875, -5.8233642578125, -5.37451171875, -4.9256591796875, -4.476806640625, -4.0279541015625, -3.5791015625, -3.1302490234375, -2.681396484375, -2.2325439453125, -1.78369140625, -1.3348388671875, -0.885986328125, -0.4371337890625, 0.01171875, 0.4605712890625, 0.909423828125, 1.3582763671875, 1.80712890625, 2.2559814453125, 2.704833984375, 3.1536865234375, 3.6025390625, 4.0513916015625, 4.500244140625, 4.9490966796875, 5.39794921875, 5.8468017578125, 6.295654296875, 6.7445068359375, 7.193359375, 7.6422119140625, 8.091064453125, 8.5399169921875, 8.98876953125, 9.4376220703125, 9.886474609375, 10.3353271484375, 10.7841796875, 11.2330322265625, 11.681884765625, 12.1307373046875, 12.57958984375, 13.0284423828125, 13.477294921875, 13.9261474609375, 14.375]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 7.0, 12.0, 23.0, 36.0, 74.0, 260.0, 1573.0, 1606.0, 321.0, 86.0, 35.0, 15.0, 15.0, 6.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.376953125, -1.3364715576171875, -1.295989990234375, -1.2555084228515625, -1.21502685546875, -1.1745452880859375, -1.134063720703125, -1.0935821533203125, -1.0531005859375, -1.0126190185546875, -0.972137451171875, -0.9316558837890625, -0.89117431640625, -0.8506927490234375, -0.810211181640625, -0.7697296142578125, -0.729248046875, -0.6887664794921875, -0.648284912109375, -0.6078033447265625, -0.56732177734375, -0.5268402099609375, -0.486358642578125, -0.4458770751953125, -0.4053955078125, -0.3649139404296875, -0.324432373046875, -0.2839508056640625, -0.24346923828125, -0.2029876708984375, -0.162506103515625, -0.1220245361328125, -0.08154296875, -0.0410614013671875, -0.000579833984375, 0.0399017333984375, 0.08038330078125, 0.1208648681640625, 0.161346435546875, 0.2018280029296875, 0.2423095703125, 0.2827911376953125, 0.323272705078125, 0.3637542724609375, 0.40423583984375, 0.4447174072265625, 0.485198974609375, 0.5256805419921875, 0.566162109375, 0.6066436767578125, 0.647125244140625, 0.6876068115234375, 0.72808837890625, 0.7685699462890625, 0.809051513671875, 0.8495330810546875, 0.8900146484375, 0.9304962158203125, 0.970977783203125, 1.0114593505859375, 1.05194091796875, 1.0924224853515625, 1.132904052734375, 1.1733856201171875, 1.2138671875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 6.0, 2.0, 3.0, 10.0, 17.0, 24.0, 49.0, 77.0, 128.0, 197.0, 177.0, 124.0, 72.0, 48.0, 25.0, 17.0, 13.0, 3.0, 6.0, 8.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.4512486457824707, -3.3520452976226807, -3.2528417110443115, -3.1536383628845215, -3.0544350147247314, -2.9552314281463623, -2.8560280799865723, -2.756824493408203, -2.657621145248413, -2.558417797088623, -2.459214210510254, -2.360010862350464, -2.260807514190674, -2.1616039276123047, -2.0624005794525146, -1.963197112083435, -1.863993763923645, -1.7647902965545654, -1.6655869483947754, -1.5663834810256958, -1.4671800136566162, -1.3679766654968262, -1.2687731981277466, -1.169569730758667, -1.070366382598877, -0.9711629748344421, -0.8719595074653625, -0.7727560997009277, -0.6735526323318481, -0.5743492245674133, -0.4751458168029785, -0.3759423494338989, -0.27673888206481934, -0.17753544449806213, -0.07833202183246613, 0.020871400833129883, 0.12007483839988708, 0.2192782759666443, 0.3184816837310791, 0.4176851511001587, 0.5168885588645935, 0.6160919666290283, 0.7152954339981079, 0.8144988417625427, 0.9137022495269775, 1.0129057168960571, 1.1121091842651367, 1.2113125324249268, 1.3105159997940063, 1.409719467163086, 1.508922815322876, 1.6081262826919556, 1.7073297500610352, 1.8065330982208252, 1.9057365655899048, 2.0049400329589844, 2.1041433811187744, 2.2033467292785645, 2.3025503158569336, 2.4017536640167236, 2.5009570121765137, 2.600160598754883, 2.699363946914673, 2.798567295074463, 2.897770881652832]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 2.0, 5.0, 3.0, 5.0, 9.0, 16.0, 16.0, 19.0, 33.0, 32.0, 32.0, 52.0, 46.0, 42.0, 55.0, 58.0, 61.0, 53.0, 58.0, 61.0, 50.0, 43.0, 53.0, 45.0, 32.0, 25.0, 21.0, 24.0, 20.0, 8.0, 11.0, 5.0, 5.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7910429239273071, -1.7389572858810425, -1.6868716478347778, -1.6347860097885132, -1.5827003717422485, -1.5306147336959839, -1.4785289764404297, -1.426443338394165, -1.3743577003479004, -1.3222720623016357, -1.270186424255371, -1.2181007862091064, -1.1660151481628418, -1.1139295101165771, -1.0618438720703125, -1.0097582340240479, -0.9576725959777832, -0.9055869579315186, -0.8535013198852539, -0.8014156818389893, -0.7493300437927246, -0.69724440574646, -0.6451587080955505, -0.5930730700492859, -0.5409874320030212, -0.4889017939567566, -0.43681615591049194, -0.3847304880619049, -0.33264485001564026, -0.2805592119693756, -0.22847354412078857, -0.17638790607452393, -0.12430238723754883, -0.07221674174070358, -0.020131096243858337, 0.031954556703567505, 0.08404019474983215, 0.1361258327960968, 0.18821150064468384, 0.2402971386909485, 0.29238277673721313, 0.3444684147834778, 0.39655405282974243, 0.44863972067832947, 0.5007253885269165, 0.5528110265731812, 0.6048966646194458, 0.6569823026657104, 0.7090679407119751, 0.7611535787582397, 0.8132392168045044, 0.865324854850769, 0.9174104928970337, 0.9694961309432983, 1.0215818881988525, 1.0736675262451172, 1.1257531642913818, 1.1778388023376465, 1.2299244403839111, 1.2820100784301758, 1.3340957164764404, 1.386181354522705, 1.4382669925689697, 1.4903526306152344, 1.542438268661499]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 7.0, 5.0, 6.0, 7.0, 16.0, 17.0, 34.0, 64.0, 142.0, 350.0, 865.0, 2737.0, 10385.0, 70445.0, 909373.0, 42752.0, 7928.0, 2161.0, 718.0, 278.0, 126.0, 61.0, 30.0, 13.0, 10.0, 4.0, 6.0, 4.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.7236328125, -1.6762847900390625, -1.628936767578125, -1.5815887451171875, -1.53424072265625, -1.4868927001953125, -1.439544677734375, -1.3921966552734375, -1.3448486328125, -1.2975006103515625, -1.250152587890625, -1.2028045654296875, -1.15545654296875, -1.1081085205078125, -1.060760498046875, -1.0134124755859375, -0.966064453125, -0.9187164306640625, -0.871368408203125, -0.8240203857421875, -0.77667236328125, -0.7293243408203125, -0.681976318359375, -0.6346282958984375, -0.5872802734375, -0.5399322509765625, -0.492584228515625, -0.4452362060546875, -0.39788818359375, -0.3505401611328125, -0.303192138671875, -0.2558441162109375, -0.20849609375, -0.1611480712890625, -0.113800048828125, -0.0664520263671875, -0.01910400390625, 0.0282440185546875, 0.075592041015625, 0.1229400634765625, 0.1702880859375, 0.2176361083984375, 0.264984130859375, 0.3123321533203125, 0.35968017578125, 0.4070281982421875, 0.454376220703125, 0.5017242431640625, 0.549072265625, 0.5964202880859375, 0.643768310546875, 0.6911163330078125, 0.73846435546875, 0.7858123779296875, 0.833160400390625, 0.8805084228515625, 0.9278564453125, 0.9752044677734375, 1.022552490234375, 1.0699005126953125, 1.11724853515625, 1.1645965576171875, 1.211944580078125, 1.2592926025390625, 1.306640625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 7.0, 4.0, 6.0, 8.0, 18.0, 22.0, 27.0, 38.0, 53.0, 62.0, 72.0, 81.0, 85.0, 81.0, 92.0, 78.0, 60.0, 56.0, 39.0, 40.0, 19.0, 27.0, 12.0, 12.0, 7.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.74609375, -1.7027130126953125, -1.659332275390625, -1.6159515380859375, -1.57257080078125, -1.5291900634765625, -1.485809326171875, -1.4424285888671875, -1.3990478515625, -1.3556671142578125, -1.312286376953125, -1.2689056396484375, -1.22552490234375, -1.1821441650390625, -1.138763427734375, -1.0953826904296875, -1.052001953125, -1.0086212158203125, -0.965240478515625, -0.9218597412109375, -0.87847900390625, -0.8350982666015625, -0.791717529296875, -0.7483367919921875, -0.7049560546875, -0.6615753173828125, -0.618194580078125, -0.5748138427734375, -0.53143310546875, -0.4880523681640625, -0.444671630859375, -0.4012908935546875, -0.35791015625, -0.3145294189453125, -0.271148681640625, -0.2277679443359375, -0.18438720703125, -0.1410064697265625, -0.097625732421875, -0.0542449951171875, -0.0108642578125, 0.0325164794921875, 0.075897216796875, 0.1192779541015625, 0.16265869140625, 0.2060394287109375, 0.249420166015625, 0.2928009033203125, 0.336181640625, 0.3795623779296875, 0.422943115234375, 0.4663238525390625, 0.50970458984375, 0.5530853271484375, 0.596466064453125, 0.6398468017578125, 0.6832275390625, 0.7266082763671875, 0.769989013671875, 0.8133697509765625, 0.85675048828125, 0.9001312255859375, 0.943511962890625, 0.9868927001953125, 1.0302734375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 1.0, 4.0, 3.0, 13.0, 9.0, 12.0, 18.0, 33.0, 40.0, 88.0, 126.0, 216.0, 459.0, 826.0, 1847.0, 4413.0, 12832.0, 51023.0, 612549.0, 313743.0, 34027.0, 9528.0, 3621.0, 1485.0, 745.0, 383.0, 198.0, 110.0, 80.0, 34.0, 22.0, 24.0, 4.0, 6.0, 8.0, 7.0, 6.0, 1.0, 7.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.515625, -0.49892425537109375, -0.4822235107421875, -0.46552276611328125, -0.448822021484375, -0.43212127685546875, -0.4154205322265625, -0.39871978759765625, -0.38201904296875, -0.36531829833984375, -0.3486175537109375, -0.33191680908203125, -0.315216064453125, -0.29851531982421875, -0.2818145751953125, -0.26511383056640625, -0.2484130859375, -0.23171234130859375, -0.2150115966796875, -0.19831085205078125, -0.181610107421875, -0.16490936279296875, -0.1482086181640625, -0.13150787353515625, -0.11480712890625, -0.09810638427734375, -0.0814056396484375, -0.06470489501953125, -0.048004150390625, -0.03130340576171875, -0.0146026611328125, 0.00209808349609375, 0.018798828125, 0.03549957275390625, 0.0522003173828125, 0.06890106201171875, 0.085601806640625, 0.10230255126953125, 0.1190032958984375, 0.13570404052734375, 0.15240478515625, 0.16910552978515625, 0.1858062744140625, 0.20250701904296875, 0.219207763671875, 0.23590850830078125, 0.2526092529296875, 0.26930999755859375, 0.2860107421875, 0.30271148681640625, 0.3194122314453125, 0.33611297607421875, 0.352813720703125, 0.36951446533203125, 0.3862152099609375, 0.40291595458984375, 0.41961669921875, 0.43631744384765625, 0.4530181884765625, 0.46971893310546875, 0.486419677734375, 0.5031204223632812, 0.5198211669921875, 0.5365219116210938, 0.55322265625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 8.0, 6.0, 1.0, 8.0, 12.0, 16.0, 15.0, 16.0, 21.0, 27.0, 30.0, 44.0, 41.0, 49.0, 49.0, 42.0, 62.0, 55.0, 60.0, 47.0, 40.0, 54.0, 45.0, 47.0, 38.0, 39.0, 24.0, 11.0, 26.0, 15.0, 18.0, 7.0, 7.0, 7.0, 4.0, 7.0, 2.0, 2.0, 0.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.69140625, -1.6441192626953125, -1.596832275390625, -1.5495452880859375, -1.50225830078125, -1.4549713134765625, -1.407684326171875, -1.3603973388671875, -1.3131103515625, -1.2658233642578125, -1.218536376953125, -1.1712493896484375, -1.12396240234375, -1.0766754150390625, -1.029388427734375, -0.9821014404296875, -0.934814453125, -0.8875274658203125, -0.840240478515625, -0.7929534912109375, -0.74566650390625, -0.6983795166015625, -0.651092529296875, -0.6038055419921875, -0.5565185546875, -0.5092315673828125, -0.461944580078125, -0.4146575927734375, -0.36737060546875, -0.3200836181640625, -0.272796630859375, -0.2255096435546875, -0.17822265625, -0.1309356689453125, -0.083648681640625, -0.0363616943359375, 0.01092529296875, 0.0582122802734375, 0.105499267578125, 0.1527862548828125, 0.2000732421875, 0.2473602294921875, 0.294647216796875, 0.3419342041015625, 0.38922119140625, 0.4365081787109375, 0.483795166015625, 0.5310821533203125, 0.578369140625, 0.6256561279296875, 0.672943115234375, 0.7202301025390625, 0.76751708984375, 0.8148040771484375, 0.862091064453125, 0.9093780517578125, 0.9566650390625, 1.0039520263671875, 1.051239013671875, 1.0985260009765625, 1.14581298828125, 1.1930999755859375, 1.240386962890625, 1.2876739501953125, 1.3349609375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 5.0, 5.0, 10.0, 9.0, 18.0, 23.0, 36.0, 41.0, 71.0, 85.0, 136.0, 195.0, 343.0, 552.0, 1033.0, 2053.0, 5045.0, 16951.0, 111584.0, 782196.0, 102506.0, 16211.0, 4873.0, 2016.0, 1029.0, 539.0, 349.0, 185.0, 136.0, 85.0, 71.0, 47.0, 29.0, 27.0, 14.0, 11.0, 14.0, 8.0, 3.0, 5.0, 2.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.10308837890625, -0.09946918487548828, -0.09584999084472656, -0.09223079681396484, -0.08861160278320312, -0.0849924087524414, -0.08137321472167969, -0.07775402069091797, -0.07413482666015625, -0.07051563262939453, -0.06689643859863281, -0.0632772445678711, -0.059658050537109375, -0.056038856506347656, -0.05241966247558594, -0.04880046844482422, -0.0451812744140625, -0.04156208038330078, -0.03794288635253906, -0.034323692321777344, -0.030704498291015625, -0.027085304260253906, -0.023466110229492188, -0.01984691619873047, -0.01622772216796875, -0.012608528137207031, -0.008989334106445312, -0.005370140075683594, -0.001750946044921875, 0.0018682479858398438, 0.0054874420166015625, 0.009106636047363281, 0.012725830078125, 0.01634502410888672, 0.019964218139648438, 0.023583412170410156, 0.027202606201171875, 0.030821800231933594, 0.03444099426269531, 0.03806018829345703, 0.04167938232421875, 0.04529857635498047, 0.04891777038574219, 0.052536964416503906, 0.056156158447265625, 0.059775352478027344, 0.06339454650878906, 0.06701374053955078, 0.0706329345703125, 0.07425212860107422, 0.07787132263183594, 0.08149051666259766, 0.08510971069335938, 0.0887289047241211, 0.09234809875488281, 0.09596729278564453, 0.09958648681640625, 0.10320568084716797, 0.10682487487792969, 0.1104440689086914, 0.11406326293945312, 0.11768245697021484, 0.12130165100097656, 0.12492084503173828, 0.1285400390625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 4.0, 10.0, 10.0, 28.0, 32.0, 67.0, 118.0, 203.0, 184.0, 139.0, 86.0, 43.0, 29.0, 13.0, 8.0, 6.0, 7.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.562471389770508e-05, -6.311200559139252e-05, -6.0599297285079956e-05, -5.8086588978767395e-05, -5.5573880672454834e-05, -5.306117236614227e-05, -5.054846405982971e-05, -4.803575575351715e-05, -4.552304744720459e-05, -4.301033914089203e-05, -4.049763083457947e-05, -3.798492252826691e-05, -3.5472214221954346e-05, -3.2959505915641785e-05, -3.0446797609329224e-05, -2.7934089303016663e-05, -2.54213809967041e-05, -2.290867269039154e-05, -2.039596438407898e-05, -1.788325607776642e-05, -1.5370547771453857e-05, -1.2857839465141296e-05, -1.0345131158828735e-05, -7.832422852516174e-06, -5.319714546203613e-06, -2.8070062398910522e-06, -2.942979335784912e-07, 2.21841037273407e-06, 4.731118679046631e-06, 7.243826985359192e-06, 9.756535291671753e-06, 1.2269243597984314e-05, 1.4781951904296875e-05, 1.7294660210609436e-05, 1.9807368516921997e-05, 2.2320076823234558e-05, 2.483278512954712e-05, 2.734549343585968e-05, 2.985820174217224e-05, 3.23709100484848e-05, 3.488361835479736e-05, 3.7396326661109924e-05, 3.9909034967422485e-05, 4.2421743273735046e-05, 4.493445158004761e-05, 4.744715988636017e-05, 4.995986819267273e-05, 5.247257649898529e-05, 5.498528480529785e-05, 5.749799311161041e-05, 6.0010701417922974e-05, 6.252340972423553e-05, 6.50361180305481e-05, 6.754882633686066e-05, 7.006153464317322e-05, 7.257424294948578e-05, 7.508695125579834e-05, 7.75996595621109e-05, 8.011236786842346e-05, 8.262507617473602e-05, 8.513778448104858e-05, 8.765049278736115e-05, 9.01632010936737e-05, 9.267590939998627e-05, 9.518861770629883e-05]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 3.0, 6.0, 3.0, 10.0, 10.0, 12.0, 14.0, 37.0, 72.0, 245.0, 654.0, 2726.0, 30165.0, 990137.0, 21225.0, 2305.0, 573.0, 196.0, 70.0, 30.0, 17.0, 16.0, 7.0, 5.0, 1.0, 0.0, 4.0, 1.0, 5.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.3935546875, -0.38245391845703125, -0.3713531494140625, -0.36025238037109375, -0.349151611328125, -0.33805084228515625, -0.3269500732421875, -0.31584930419921875, -0.30474853515625, -0.29364776611328125, -0.2825469970703125, -0.27144622802734375, -0.260345458984375, -0.24924468994140625, -0.2381439208984375, -0.22704315185546875, -0.2159423828125, -0.20484161376953125, -0.1937408447265625, -0.18264007568359375, -0.171539306640625, -0.16043853759765625, -0.1493377685546875, -0.13823699951171875, -0.12713623046875, -0.11603546142578125, -0.1049346923828125, -0.09383392333984375, -0.082733154296875, -0.07163238525390625, -0.0605316162109375, -0.04943084716796875, -0.038330078125, -0.02722930908203125, -0.0161285400390625, -0.00502777099609375, 0.006072998046875, 0.01717376708984375, 0.0282745361328125, 0.03937530517578125, 0.05047607421875, 0.06157684326171875, 0.0726776123046875, 0.08377838134765625, 0.094879150390625, 0.10597991943359375, 0.1170806884765625, 0.12818145751953125, 0.1392822265625, 0.15038299560546875, 0.1614837646484375, 0.17258453369140625, 0.183685302734375, 0.19478607177734375, 0.2058868408203125, 0.21698760986328125, 0.22808837890625, 0.23918914794921875, 0.2502899169921875, 0.26139068603515625, 0.272491455078125, 0.28359222412109375, 0.2946929931640625, 0.30579376220703125, 0.31689453125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 3.0, 5.0, 4.0, 6.0, 5.0, 6.0, 7.0, 20.0, 29.0, 34.0, 31.0, 71.0, 103.0, 141.0, 133.0, 118.0, 80.0, 60.0, 35.0, 27.0, 18.0, 20.0, 11.0, 7.0, 6.0, 8.0, 2.0, 4.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0280914306640625, -0.027221202850341797, -0.026350975036621094, -0.02548074722290039, -0.024610519409179688, -0.023740291595458984, -0.02287006378173828, -0.021999835968017578, -0.021129608154296875, -0.020259380340576172, -0.01938915252685547, -0.018518924713134766, -0.017648696899414062, -0.01677846908569336, -0.015908241271972656, -0.015038013458251953, -0.01416778564453125, -0.013297557830810547, -0.012427330017089844, -0.01155710220336914, -0.010686874389648438, -0.009816646575927734, -0.008946418762207031, -0.008076190948486328, -0.007205963134765625, -0.006335735321044922, -0.005465507507324219, -0.004595279693603516, -0.0037250518798828125, -0.0028548240661621094, -0.0019845962524414062, -0.0011143684387207031, -0.000244140625, 0.0006260871887207031, 0.0014963150024414062, 0.0023665428161621094, 0.0032367706298828125, 0.004106998443603516, 0.004977226257324219, 0.005847454071044922, 0.006717681884765625, 0.007587909698486328, 0.008458137512207031, 0.009328365325927734, 0.010198593139648438, 0.01106882095336914, 0.011939048767089844, 0.012809276580810547, 0.01367950439453125, 0.014549732208251953, 0.015419960021972656, 0.01629018783569336, 0.017160415649414062, 0.018030643463134766, 0.01890087127685547, 0.019771099090576172, 0.020641326904296875, 0.021511554718017578, 0.02238178253173828, 0.023252010345458984, 0.024122238159179688, 0.02499246597290039, 0.025862693786621094, 0.026732921600341797, 0.0276031494140625]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 8.0, 16.0, 30.0, 53.0, 102.0, 263.0, 260.0, 140.0, 71.0, 23.0, 10.0, 11.0, 7.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.3868608474731445, -3.309995412826538, -3.2331299781799316, -3.1562647819519043, -3.079399347305298, -3.0025339126586914, -2.925668478012085, -2.8488030433654785, -2.771937847137451, -2.6950724124908447, -2.6182069778442383, -2.541341781616211, -2.4644763469696045, -2.387610912322998, -2.3107454776763916, -2.233880043029785, -2.1570146083831787, -2.0801491737365723, -2.003283739089966, -1.926418423652649, -1.849553108215332, -1.7726876735687256, -1.6958222389221191, -1.6189568042755127, -1.5420914888381958, -1.4652260541915894, -1.3883607387542725, -1.311495304107666, -1.2346298694610596, -1.1577645540237427, -1.0808991193771362, -1.0040338039398193, -0.9271682500839233, -0.8503028750419617, -0.7734375, -0.6965720653533936, -0.6197066903114319, -0.5428413152694702, -0.46597591042518616, -0.3891105055809021, -0.31224513053894043, -0.23537974059581757, -0.1585143506526947, -0.08164896070957184, -0.004783570766448975, 0.0720818042755127, 0.14894720911979675, 0.2258126139640808, 0.3026779890060425, 0.37954336404800415, 0.4564087688922882, 0.5332741737365723, 0.6101395487785339, 0.6870049238204956, 0.763870358467102, 0.8407357335090637, 0.9176011085510254, 0.9944664835929871, 1.0713318586349487, 1.1481972932815552, 1.225062608718872, 1.3019280433654785, 1.378793478012085, 1.4556589126586914, 1.5325242280960083]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 9.0, 6.0, 11.0, 13.0, 28.0, 33.0, 41.0, 57.0, 63.0, 55.0, 72.0, 84.0, 67.0, 90.0, 68.0, 58.0, 64.0, 39.0, 41.0, 35.0, 16.0, 23.0, 15.0, 6.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.5457602739334106, -1.5074880123138428, -1.4692156314849854, -1.430943250656128, -1.39267098903656, -1.3543987274169922, -1.3161263465881348, -1.2778539657592773, -1.2395817041397095, -1.2013094425201416, -1.1630370616912842, -1.1247646808624268, -1.0864924192428589, -1.048220157623291, -1.0099477767944336, -0.971675455570221, -0.9334031343460083, -0.8951308131217957, -0.856858491897583, -0.8185861706733704, -0.7803138494491577, -0.7420415282249451, -0.7037692070007324, -0.6654968857765198, -0.6272245645523071, -0.5889522433280945, -0.5506799221038818, -0.5124076008796692, -0.47413527965545654, -0.4358629584312439, -0.39759063720703125, -0.3593183159828186, -0.32104605436325073, -0.2827737331390381, -0.24450141191482544, -0.2062290906906128, -0.16795676946640015, -0.1296844482421875, -0.09141212701797485, -0.05313980579376221, -0.01486748456954956, 0.023404836654663086, 0.06167715787887573, 0.09994947910308838, 0.13822180032730103, 0.17649412155151367, 0.21476644277572632, 0.25303876399993896, 0.2913110852241516, 0.32958340644836426, 0.3678557276725769, 0.40612804889678955, 0.4444003701210022, 0.48267269134521484, 0.5209450125694275, 0.5592173337936401, 0.5974896550178528, 0.6357619762420654, 0.6740342974662781, 0.7123066186904907, 0.7505789399147034, 0.788851261138916, 0.8271235823631287, 0.8653959035873413, 0.903668224811554]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 7.0, 5.0, 13.0, 18.0, 44.0, 78.0, 140.0, 310.0, 805.0, 2258.0, 7211.0, 28975.0, 857963.0, 127729.0, 15924.0, 4493.0, 1500.0, 601.0, 245.0, 99.0, 41.0, 29.0, 19.0, 5.0, 9.0, 3.0, 4.0, 9.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.76953125, -2.676605224609375, -2.58367919921875, -2.490753173828125, -2.3978271484375, -2.304901123046875, -2.21197509765625, -2.119049072265625, -2.026123046875, -1.933197021484375, -1.84027099609375, -1.747344970703125, -1.6544189453125, -1.561492919921875, -1.46856689453125, -1.375640869140625, -1.28271484375, -1.189788818359375, -1.09686279296875, -1.003936767578125, -0.9110107421875, -0.818084716796875, -0.72515869140625, -0.632232666015625, -0.539306640625, -0.446380615234375, -0.35345458984375, -0.260528564453125, -0.1676025390625, -0.074676513671875, 0.01824951171875, 0.111175537109375, 0.2041015625, 0.297027587890625, 0.38995361328125, 0.482879638671875, 0.5758056640625, 0.668731689453125, 0.76165771484375, 0.854583740234375, 0.947509765625, 1.040435791015625, 1.13336181640625, 1.226287841796875, 1.3192138671875, 1.412139892578125, 1.50506591796875, 1.597991943359375, 1.69091796875, 1.783843994140625, 1.87677001953125, 1.969696044921875, 2.0626220703125, 2.155548095703125, 2.24847412109375, 2.341400146484375, 2.434326171875, 2.527252197265625, 2.62017822265625, 2.713104248046875, 2.8060302734375, 2.898956298828125, 2.99188232421875, 3.084808349609375, 3.177734375]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 0.0, 6.0, 6.0, 6.0, 13.0, 8.0, 15.0, 10.0, 26.0, 25.0, 18.0, 31.0, 33.0, 26.0, 46.0, 50.0, 48.0, 49.0, 47.0, 48.0, 61.0, 59.0, 55.0, 42.0, 42.0, 44.0, 35.0, 20.0, 32.0, 18.0, 11.0, 20.0, 11.0, 9.0, 9.0, 8.0, 5.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.6748046875, -1.6140289306640625, -1.553253173828125, -1.4924774169921875, -1.43170166015625, -1.3709259033203125, -1.310150146484375, -1.2493743896484375, -1.1885986328125, -1.1278228759765625, -1.067047119140625, -1.0062713623046875, -0.94549560546875, -0.8847198486328125, -0.823944091796875, -0.7631683349609375, -0.702392578125, -0.6416168212890625, -0.580841064453125, -0.5200653076171875, -0.45928955078125, -0.3985137939453125, -0.337738037109375, -0.2769622802734375, -0.2161865234375, -0.1554107666015625, -0.094635009765625, -0.0338592529296875, 0.02691650390625, 0.0876922607421875, 0.148468017578125, 0.2092437744140625, 0.27001953125, 0.3307952880859375, 0.391571044921875, 0.4523468017578125, 0.51312255859375, 0.5738983154296875, 0.634674072265625, 0.6954498291015625, 0.7562255859375, 0.8170013427734375, 0.877777099609375, 0.9385528564453125, 0.99932861328125, 1.0601043701171875, 1.120880126953125, 1.1816558837890625, 1.242431640625, 1.3032073974609375, 1.363983154296875, 1.4247589111328125, 1.48553466796875, 1.5463104248046875, 1.607086181640625, 1.6678619384765625, 1.7286376953125, 1.7894134521484375, 1.850189208984375, 1.9109649658203125, 1.97174072265625, 2.0325164794921875, 2.093292236328125, 2.1540679931640625, 2.21484375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 4.0, 2.0, 1.0, 3.0, 4.0, 5.0, 5.0, 7.0, 14.0, 12.0, 13.0, 26.0, 25.0, 15.0, 27.0, 23.0, 33.0, 42.0, 74.0, 86.0, 184.0, 479.0, 2553.0, 36455.0, 994964.0, 11429.0, 1236.0, 325.0, 147.0, 62.0, 57.0, 47.0, 34.0, 34.0, 18.0, 15.0, 17.0, 22.0, 12.0, 8.0, 13.0, 7.0, 8.0, 5.0, 4.0, 5.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.04296875, -5.86163330078125, -5.6802978515625, -5.49896240234375, -5.317626953125, -5.13629150390625, -4.9549560546875, -4.77362060546875, -4.59228515625, -4.41094970703125, -4.2296142578125, -4.04827880859375, -3.866943359375, -3.68560791015625, -3.5042724609375, -3.32293701171875, -3.1416015625, -2.96026611328125, -2.7789306640625, -2.59759521484375, -2.416259765625, -2.23492431640625, -2.0535888671875, -1.87225341796875, -1.69091796875, -1.50958251953125, -1.3282470703125, -1.14691162109375, -0.965576171875, -0.78424072265625, -0.6029052734375, -0.42156982421875, -0.240234375, -0.05889892578125, 0.1224365234375, 0.30377197265625, 0.485107421875, 0.66644287109375, 0.8477783203125, 1.02911376953125, 1.21044921875, 1.39178466796875, 1.5731201171875, 1.75445556640625, 1.935791015625, 2.11712646484375, 2.2984619140625, 2.47979736328125, 2.6611328125, 2.84246826171875, 3.0238037109375, 3.20513916015625, 3.386474609375, 3.56781005859375, 3.7491455078125, 3.93048095703125, 4.11181640625, 4.29315185546875, 4.4744873046875, 4.65582275390625, 4.837158203125, 5.01849365234375, 5.1998291015625, 5.38116455078125, 5.5625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 3.0, 3.0, 6.0, 5.0, 7.0, 6.0, 8.0, 13.0, 13.0, 24.0, 18.0, 21.0, 19.0, 26.0, 31.0, 34.0, 54.0, 44.0, 43.0, 54.0, 43.0, 58.0, 57.0, 56.0, 42.0, 35.0, 39.0, 31.0, 32.0, 30.0, 17.0, 21.0, 18.0, 19.0, 21.0, 10.0, 7.0, 7.0, 7.0, 13.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.708984375, -1.653228759765625, -1.59747314453125, -1.541717529296875, -1.4859619140625, -1.430206298828125, -1.37445068359375, -1.318695068359375, -1.262939453125, -1.207183837890625, -1.15142822265625, -1.095672607421875, -1.0399169921875, -0.984161376953125, -0.92840576171875, -0.872650146484375, -0.81689453125, -0.761138916015625, -0.70538330078125, -0.649627685546875, -0.5938720703125, -0.538116455078125, -0.48236083984375, -0.426605224609375, -0.370849609375, -0.315093994140625, -0.25933837890625, -0.203582763671875, -0.1478271484375, -0.092071533203125, -0.03631591796875, 0.019439697265625, 0.0751953125, 0.130950927734375, 0.18670654296875, 0.242462158203125, 0.2982177734375, 0.353973388671875, 0.40972900390625, 0.465484619140625, 0.521240234375, 0.576995849609375, 0.63275146484375, 0.688507080078125, 0.7442626953125, 0.800018310546875, 0.85577392578125, 0.911529541015625, 0.96728515625, 1.023040771484375, 1.07879638671875, 1.134552001953125, 1.1903076171875, 1.246063232421875, 1.30181884765625, 1.357574462890625, 1.413330078125, 1.469085693359375, 1.52484130859375, 1.580596923828125, 1.6363525390625, 1.692108154296875, 1.74786376953125, 1.803619384765625, 1.859375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 5.0, 4.0, 5.0, 4.0, 3.0, 8.0, 3.0, 8.0, 11.0, 18.0, 26.0, 30.0, 47.0, 94.0, 156.0, 341.0, 899.0, 2617.0, 10008.0, 217973.0, 798886.0, 12419.0, 2960.0, 1029.0, 465.0, 225.0, 97.0, 68.0, 39.0, 28.0, 24.0, 15.0, 11.0, 4.0, 11.0, 4.0, 3.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.99853515625, -0.9715957641601562, -0.9446563720703125, -0.9177169799804688, -0.890777587890625, -0.8638381958007812, -0.8368988037109375, -0.8099594116210938, -0.78302001953125, -0.7560806274414062, -0.7291412353515625, -0.7022018432617188, -0.675262451171875, -0.6483230590820312, -0.6213836669921875, -0.5944442749023438, -0.5675048828125, -0.5405654907226562, -0.5136260986328125, -0.48668670654296875, -0.459747314453125, -0.43280792236328125, -0.4058685302734375, -0.37892913818359375, -0.35198974609375, -0.32505035400390625, -0.2981109619140625, -0.27117156982421875, -0.244232177734375, -0.21729278564453125, -0.1903533935546875, -0.16341400146484375, -0.136474609375, -0.10953521728515625, -0.0825958251953125, -0.05565643310546875, -0.028717041015625, -0.00177764892578125, 0.0251617431640625, 0.05210113525390625, 0.07904052734375, 0.10597991943359375, 0.1329193115234375, 0.15985870361328125, 0.186798095703125, 0.21373748779296875, 0.2406768798828125, 0.26761627197265625, 0.2945556640625, 0.32149505615234375, 0.3484344482421875, 0.37537384033203125, 0.402313232421875, 0.42925262451171875, 0.4561920166015625, 0.48313140869140625, 0.51007080078125, 0.5370101928710938, 0.5639495849609375, 0.5908889770507812, 0.617828369140625, 0.6447677612304688, 0.6717071533203125, 0.6986465454101562, 0.7255859375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 8.0, 4.0, 3.0, 10.0, 9.0, 11.0, 35.0, 54.0, 138.0, 487.0, 109.0, 54.0, 19.0, 11.0, 6.0, 7.0, 5.0, 5.0, 1.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011342763900756836, -0.0001100366935133934, -0.00010664574801921844, -0.00010325480252504349, -9.986385703086853e-05, -9.647291153669357e-05, -9.308196604251862e-05, -8.969102054834366e-05, -8.63000750541687e-05, -8.290912955999374e-05, -7.951818406581879e-05, -7.612723857164383e-05, -7.273629307746887e-05, -6.934534758329391e-05, -6.595440208911896e-05, -6.2563456594944e-05, -5.917251110076904e-05, -5.5781565606594086e-05, -5.239062011241913e-05, -4.899967461824417e-05, -4.5608729124069214e-05, -4.2217783629894257e-05, -3.88268381357193e-05, -3.543589264154434e-05, -3.2044947147369385e-05, -2.8654001653194427e-05, -2.526305615901947e-05, -2.1872110664844513e-05, -1.8481165170669556e-05, -1.5090219676494598e-05, -1.1699274182319641e-05, -8.308328688144684e-06, -4.9173831939697266e-06, -1.5264376997947693e-06, 1.864507794380188e-06, 5.255453288555145e-06, 8.646398782730103e-06, 1.203734427690506e-05, 1.5428289771080017e-05, 1.8819235265254974e-05, 2.221018075942993e-05, 2.560112625360489e-05, 2.8992071747779846e-05, 3.2383017241954803e-05, 3.577396273612976e-05, 3.916490823030472e-05, 4.2555853724479675e-05, 4.594679921865463e-05, 4.933774471282959e-05, 5.272869020700455e-05, 5.6119635701179504e-05, 5.951058119535446e-05, 6.290152668952942e-05, 6.629247218370438e-05, 6.968341767787933e-05, 7.307436317205429e-05, 7.646530866622925e-05, 7.98562541604042e-05, 8.324719965457916e-05, 8.663814514875412e-05, 9.002909064292908e-05, 9.342003613710403e-05, 9.681098163127899e-05, 0.00010020192712545395, 0.0001035928726196289]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 11.0, 5.0, 9.0, 4.0, 17.0, 31.0, 53.0, 67.0, 143.0, 373.0, 974.0, 3387.0, 21421.0, 992084.0, 24486.0, 3724.0, 1029.0, 362.0, 165.0, 73.0, 47.0, 32.0, 19.0, 7.0, 6.0, 5.0, 6.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.96435546875, -0.9280014038085938, -0.8916473388671875, -0.8552932739257812, -0.818939208984375, -0.7825851440429688, -0.7462310791015625, -0.7098770141601562, -0.67352294921875, -0.6371688842773438, -0.6008148193359375, -0.5644607543945312, -0.528106689453125, -0.49175262451171875, -0.4553985595703125, -0.41904449462890625, -0.3826904296875, -0.34633636474609375, -0.3099822998046875, -0.27362823486328125, -0.237274169921875, -0.20092010498046875, -0.1645660400390625, -0.12821197509765625, -0.09185791015625, -0.05550384521484375, -0.0191497802734375, 0.01720428466796875, 0.053558349609375, 0.08991241455078125, 0.1262664794921875, 0.16262054443359375, 0.198974609375, 0.23532867431640625, 0.2716827392578125, 0.30803680419921875, 0.344390869140625, 0.38074493408203125, 0.4170989990234375, 0.45345306396484375, 0.48980712890625, 0.5261611938476562, 0.5625152587890625, 0.5988693237304688, 0.635223388671875, 0.6715774536132812, 0.7079315185546875, 0.7442855834960938, 0.7806396484375, 0.8169937133789062, 0.8533477783203125, 0.8897018432617188, 0.926055908203125, 0.9624099731445312, 0.9987640380859375, 1.0351181030273438, 1.07147216796875, 1.1078262329101562, 1.1441802978515625, 1.1805343627929688, 1.216888427734375, 1.2532424926757812, 1.2895965576171875, 1.3259506225585938, 1.3623046875]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 1.0, 2.0, 4.0, 4.0, 6.0, 8.0, 10.0, 15.0, 20.0, 53.0, 103.0, 380.0, 219.0, 72.0, 40.0, 17.0, 6.0, 6.0, 5.0, 5.0, 5.0, 1.0, 1.0, 3.0, 3.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.339599609375, -0.3306083679199219, -0.32161712646484375, -0.3126258850097656, -0.3036346435546875, -0.2946434020996094, -0.28565216064453125, -0.2766609191894531, -0.267669677734375, -0.2586784362792969, -0.24968719482421875, -0.24069595336914062, -0.2317047119140625, -0.22271347045898438, -0.21372222900390625, -0.20473098754882812, -0.19573974609375, -0.18674850463867188, -0.17775726318359375, -0.16876602172851562, -0.1597747802734375, -0.15078353881835938, -0.14179229736328125, -0.13280105590820312, -0.123809814453125, -0.11481857299804688, -0.10582733154296875, -0.09683609008789062, -0.0878448486328125, -0.07885360717773438, -0.06986236572265625, -0.060871124267578125, -0.0518798828125, -0.042888641357421875, -0.03389739990234375, -0.024906158447265625, -0.0159149169921875, -0.006923675537109375, 0.00206756591796875, 0.011058807373046875, 0.020050048828125, 0.029041290283203125, 0.03803253173828125, 0.047023773193359375, 0.0560150146484375, 0.06500625610351562, 0.07399749755859375, 0.08298873901367188, 0.09197998046875, 0.10097122192382812, 0.10996246337890625, 0.11895370483398438, 0.1279449462890625, 0.13693618774414062, 0.14592742919921875, 0.15491867065429688, 0.163909912109375, 0.17290115356445312, 0.18189239501953125, 0.19088363647460938, 0.1998748779296875, 0.20886611938476562, 0.21785736083984375, 0.22684860229492188, 0.23583984375]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 5.0, 22.0, 131.0, 596.0, 201.0, 45.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-22.348182678222656, -21.938617706298828, -21.529050827026367, -21.11948585510254, -20.709918975830078, -20.30035400390625, -19.89078712463379, -19.48122215270996, -19.0716552734375, -18.662090301513672, -18.25252342224121, -17.842958450317383, -17.433391571044922, -17.023826599121094, -16.614259719848633, -16.204694747924805, -15.795129776000977, -15.385563850402832, -14.975997924804688, -14.566431999206543, -14.156866073608398, -13.74730110168457, -13.33773422241211, -12.928169250488281, -12.51860237121582, -12.109036445617676, -11.699470520019531, -11.289904594421387, -10.880338668823242, -10.470773696899414, -10.061206817626953, -9.651641845703125, -9.242074966430664, -8.83250904083252, -8.422943115234375, -8.01337718963623, -7.603811740875244, -7.1942458152771, -6.784679889678955, -6.375114440917969, -5.965548515319824, -5.55598258972168, -5.146416664123535, -4.736850738525391, -4.327285289764404, -3.9177193641662598, -3.5081534385681152, -3.09858775138855, -2.6890218257904053, -2.2794559001922607, -1.8698902130126953, -1.4603242874145508, -1.0507584810256958, -0.6411926746368408, -0.2316267490386963, 0.17793893814086914, 0.5875048637390137, 0.9970706701278687, 1.4066364765167236, 1.8162024021148682, 2.2257680892944336, 2.635334014892578, 3.0448999404907227, 3.454465627670288, 3.8640315532684326]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 6.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 7.0, 7.0, 5.0, 9.0, 12.0, 12.0, 12.0, 14.0, 13.0, 27.0, 38.0, 23.0, 20.0, 33.0, 30.0, 41.0, 35.0, 52.0, 39.0, 38.0, 54.0, 51.0, 42.0, 34.0, 38.0, 26.0, 32.0, 20.0, 27.0, 30.0, 19.0, 25.0, 24.0, 27.0, 14.0, 16.0, 7.0, 9.0, 5.0, 10.0, 5.0, 2.0, 2.0, 4.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.0938031673431396, -3.0046226978302, -2.9154422283172607, -2.826261520385742, -2.7370810508728027, -2.6479005813598633, -2.558720111846924, -2.4695396423339844, -2.380359172821045, -2.2911787033081055, -2.201998233795166, -2.1128177642822266, -2.023637056350708, -1.9344565868377686, -1.845276117324829, -1.7560956478118896, -1.666914939880371, -1.5777344703674316, -1.4885538816452026, -1.3993734121322632, -1.3101928234100342, -1.2210123538970947, -1.1318318843841553, -1.0426514148712158, -0.9534708261489868, -0.8642902970314026, -0.7751097679138184, -0.6859292984008789, -0.5967487692832947, -0.5075682401657104, -0.418387770652771, -0.32920724153518677, -0.24002671241760254, -0.1508461982011795, -0.06166568398475647, 0.02751481533050537, 0.1166953444480896, 0.20587587356567383, 0.2950563430786133, 0.3842368721961975, 0.47341740131378174, 0.562597930431366, 0.6517784595489502, 0.7409589290618896, 0.8301394581794739, 0.9193199872970581, 1.0085004568099976, 1.0976810455322266, 1.186861515045166, 1.2760419845581055, 1.3652225732803345, 1.454403042793274, 1.543583631515503, 1.6327641010284424, 1.7219445705413818, 1.8111250400543213, 1.9003056287765503, 1.9894860982894897, 2.0786666870117188, 2.167847156524658, 2.2570276260375977, 2.346208095550537, 2.4353885650634766, 2.524569272994995, 2.6137497425079346]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 6.0, 6.0, 9.0, 15.0, 19.0, 34.0, 48.0, 69.0, 117.0, 178.0, 342.0, 609.0, 1176.0, 2565.0, 7696.0, 56772.0, 2193297.0, 1868468.0, 50135.0, 6914.0, 3087.0, 1183.0, 623.0, 354.0, 211.0, 124.0, 86.0, 41.0, 36.0, 20.0, 14.0, 10.0, 10.0, 3.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.60546875, -2.52880859375, -2.4521484375, -2.37548828125, -2.298828125, -2.22216796875, -2.1455078125, -2.06884765625, -1.9921875, -1.91552734375, -1.8388671875, -1.76220703125, -1.685546875, -1.60888671875, -1.5322265625, -1.45556640625, -1.37890625, -1.30224609375, -1.2255859375, -1.14892578125, -1.072265625, -0.99560546875, -0.9189453125, -0.84228515625, -0.765625, -0.68896484375, -0.6123046875, -0.53564453125, -0.458984375, -0.38232421875, -0.3056640625, -0.22900390625, -0.15234375, -0.07568359375, 0.0009765625, 0.07763671875, 0.154296875, 0.23095703125, 0.3076171875, 0.38427734375, 0.4609375, 0.53759765625, 0.6142578125, 0.69091796875, 0.767578125, 0.84423828125, 0.9208984375, 0.99755859375, 1.07421875, 1.15087890625, 1.2275390625, 1.30419921875, 1.380859375, 1.45751953125, 1.5341796875, 1.61083984375, 1.6875, 1.76416015625, 1.8408203125, 1.91748046875, 1.994140625, 2.07080078125, 2.1474609375, 2.22412109375, 2.30078125]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 3.0, 11.0, 9.0, 18.0, 22.0, 24.0, 48.0, 43.0, 45.0, 58.0, 74.0, 49.0, 76.0, 81.0, 63.0, 58.0, 67.0, 52.0, 52.0, 33.0, 28.0, 26.0, 20.0, 15.0, 6.0, 8.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8623046875, -1.8133697509765625, -1.764434814453125, -1.7154998779296875, -1.66656494140625, -1.6176300048828125, -1.568695068359375, -1.5197601318359375, -1.4708251953125, -1.4218902587890625, -1.372955322265625, -1.3240203857421875, -1.27508544921875, -1.2261505126953125, -1.177215576171875, -1.1282806396484375, -1.079345703125, -1.0304107666015625, -0.981475830078125, -0.9325408935546875, -0.88360595703125, -0.8346710205078125, -0.785736083984375, -0.7368011474609375, -0.6878662109375, -0.6389312744140625, -0.589996337890625, -0.5410614013671875, -0.49212646484375, -0.4431915283203125, -0.394256591796875, -0.3453216552734375, -0.29638671875, -0.2474517822265625, -0.198516845703125, -0.1495819091796875, -0.10064697265625, -0.0517120361328125, -0.002777099609375, 0.0461578369140625, 0.0950927734375, 0.1440277099609375, 0.192962646484375, 0.2418975830078125, 0.29083251953125, 0.3397674560546875, 0.388702392578125, 0.4376373291015625, 0.486572265625, 0.5355072021484375, 0.584442138671875, 0.6333770751953125, 0.68231201171875, 0.7312469482421875, 0.780181884765625, 0.8291168212890625, 0.8780517578125, 0.9269866943359375, 0.975921630859375, 1.0248565673828125, 1.07379150390625, 1.1227264404296875, 1.171661376953125, 1.2205963134765625, 1.26953125]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 1.0, 7.0, 12.0, 20.0, 31.0, 104.0, 274.0, 1266.0, 25191.0, 4161344.0, 5151.0, 580.0, 154.0, 59.0, 32.0, 23.0, 7.0, 12.0, 5.0, 0.0, 4.0, 6.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6640625, -10.34375, -10.0234375, -9.703125, -9.3828125, -9.0625, -8.7421875, -8.421875, -8.1015625, -7.78125, -7.4609375, -7.140625, -6.8203125, -6.5, -6.1796875, -5.859375, -5.5390625, -5.21875, -4.8984375, -4.578125, -4.2578125, -3.9375, -3.6171875, -3.296875, -2.9765625, -2.65625, -2.3359375, -2.015625, -1.6953125, -1.375, -1.0546875, -0.734375, -0.4140625, -0.09375, 0.2265625, 0.546875, 0.8671875, 1.1875, 1.5078125, 1.828125, 2.1484375, 2.46875, 2.7890625, 3.109375, 3.4296875, 3.75, 4.0703125, 4.390625, 4.7109375, 5.03125, 5.3515625, 5.671875, 5.9921875, 6.3125, 6.6328125, 6.953125, 7.2734375, 7.59375, 7.9140625, 8.234375, 8.5546875, 8.875, 9.1953125, 9.515625, 9.8359375]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 3.0, 0.0, 7.0, 8.0, 6.0, 12.0, 28.0, 30.0, 64.0, 179.0, 906.0, 2105.0, 512.0, 122.0, 45.0, 18.0, 10.0, 7.0, 1.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9482421875, -0.91796875, -0.8876953125, -0.857421875, -0.8271484375, -0.796875, -0.7666015625, -0.736328125, -0.7060546875, -0.67578125, -0.6455078125, -0.615234375, -0.5849609375, -0.5546875, -0.5244140625, -0.494140625, -0.4638671875, -0.43359375, -0.4033203125, -0.373046875, -0.3427734375, -0.3125, -0.2822265625, -0.251953125, -0.2216796875, -0.19140625, -0.1611328125, -0.130859375, -0.1005859375, -0.0703125, -0.0400390625, -0.009765625, 0.0205078125, 0.05078125, 0.0810546875, 0.111328125, 0.1416015625, 0.171875, 0.2021484375, 0.232421875, 0.2626953125, 0.29296875, 0.3232421875, 0.353515625, 0.3837890625, 0.4140625, 0.4443359375, 0.474609375, 0.5048828125, 0.53515625, 0.5654296875, 0.595703125, 0.6259765625, 0.65625, 0.6865234375, 0.716796875, 0.7470703125, 0.77734375, 0.8076171875, 0.837890625, 0.8681640625, 0.8984375, 0.9287109375, 0.958984375, 0.9892578125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 8.0, 5.0, 23.0, 34.0, 66.0, 143.0, 232.0, 228.0, 111.0, 69.0, 40.0, 11.0, 17.0, 9.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.052628517150879, -3.945894718170166, -3.8391611576080322, -3.7324273586273193, -3.6256935596466064, -3.5189599990844727, -3.4122262001037598, -3.305492401123047, -3.198758602142334, -3.092024803161621, -2.9852912425994873, -2.8785574436187744, -2.7718236446380615, -2.6650900840759277, -2.558356285095215, -2.451622486114502, -2.344888925552368, -2.2381551265716553, -2.1314215660095215, -2.0246877670288086, -1.9179539680480957, -1.8112202882766724, -1.704486608505249, -1.5977528095245361, -1.4910191297531128, -1.3842854499816895, -1.2775516510009766, -1.1708179712295532, -1.0640842914581299, -0.957350492477417, -0.8506168127059937, -0.7438830733299255, -0.6371493339538574, -0.5304155945777893, -0.4236818850040436, -0.31694817543029785, -0.21021443605422974, -0.10348069667816162, 0.0032529830932617188, 0.10998672246932983, 0.21672046184539795, 0.32345420122146606, 0.4301879107952118, 0.5369216203689575, 0.6436553597450256, 0.7503890991210938, 0.8571227788925171, 0.9638565182685852, 1.0705902576446533, 1.1773239374160767, 1.2840577363967896, 1.390791416168213, 1.4975252151489258, 1.6042588949203491, 1.7109925746917725, 1.8177263736724854, 1.9244600534439087, 2.031193733215332, 2.137927532196045, 2.244661331176758, 2.3513948917388916, 2.4581286907196045, 2.5648622512817383, 2.671596050262451, 2.778329849243164]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 3.0, 7.0, 8.0, 15.0, 22.0, 19.0, 30.0, 51.0, 39.0, 59.0, 65.0, 70.0, 64.0, 71.0, 88.0, 70.0, 66.0, 66.0, 48.0, 35.0, 34.0, 25.0, 15.0, 9.0, 10.0, 8.0, 4.0, 3.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.2870242595672607, -2.230461835861206, -2.1738996505737305, -2.117337226867676, -2.060774803161621, -2.0042126178741455, -1.9476501941680908, -1.8910878896713257, -1.8345255851745605, -1.7779632806777954, -1.7214008569717407, -1.6648385524749756, -1.6082762479782104, -1.5517139434814453, -1.4951515197753906, -1.4385892152786255, -1.3820269107818604, -1.3254646062850952, -1.2689021825790405, -1.2123398780822754, -1.1557775735855103, -1.0992152690887451, -1.0426528453826904, -0.9860905408859253, -0.9295281171798706, -0.8729657530784607, -0.8164034485816956, -0.7598410844802856, -0.7032787799835205, -0.6467164158821106, -0.5901540517807007, -0.5335917472839355, -0.4770294427871704, -0.4204671084880829, -0.36390477418899536, -0.30734241008758545, -0.2507801055908203, -0.1942177414894104, -0.13765540719032288, -0.08109307289123535, -0.024530738592147827, 0.032031599432229996, 0.08859393745660782, 0.14515627920627594, 0.20171861350536346, 0.2582809627056122, 0.3148432970046997, 0.37140563130378723, 0.42796796560287476, 0.4845302999019623, 0.5410926342010498, 0.5976549983024597, 0.6542173027992249, 0.7107796669006348, 0.7673419713973999, 0.8239043354988098, 0.8804666996002197, 0.9370290637016296, 0.9935913681983948, 1.0501537322998047, 1.1067160367965698, 1.163278341293335, 1.2198407649993896, 1.2764030694961548, 1.33296537399292]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 5.0, 4.0, 10.0, 10.0, 20.0, 31.0, 44.0, 57.0, 121.0, 219.0, 377.0, 759.0, 1781.0, 4496.0, 14461.0, 75425.0, 680279.0, 228599.0, 29365.0, 7514.0, 2662.0, 1157.0, 484.0, 295.0, 140.0, 73.0, 53.0, 38.0, 19.0, 10.0, 9.0, 7.0, 8.0, 4.0, 3.0, 7.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.336669921875, -0.3240776062011719, -0.31148529052734375, -0.2988929748535156, -0.2863006591796875, -0.2737083435058594, -0.26111602783203125, -0.24852371215820312, -0.235931396484375, -0.22333908081054688, -0.21074676513671875, -0.19815444946289062, -0.1855621337890625, -0.17296981811523438, -0.16037750244140625, -0.14778518676757812, -0.13519287109375, -0.12260055541992188, -0.11000823974609375, -0.09741592407226562, -0.0848236083984375, -0.07223129272460938, -0.05963897705078125, -0.047046661376953125, -0.034454345703125, -0.021862030029296875, -0.00926971435546875, 0.003322601318359375, 0.0159149169921875, 0.028507232666015625, 0.04109954833984375, 0.053691864013671875, 0.0662841796875, 0.07887649536132812, 0.09146881103515625, 0.10406112670898438, 0.1166534423828125, 0.12924575805664062, 0.14183807373046875, 0.15443038940429688, 0.167022705078125, 0.17961502075195312, 0.19220733642578125, 0.20479965209960938, 0.2173919677734375, 0.22998428344726562, 0.24257659912109375, 0.2551689147949219, 0.26776123046875, 0.2803535461425781, 0.29294586181640625, 0.3055381774902344, 0.3181304931640625, 0.3307228088378906, 0.34331512451171875, 0.3559074401855469, 0.368499755859375, 0.3810920715332031, 0.39368438720703125, 0.4062767028808594, 0.4188690185546875, 0.4314613342285156, 0.44405364990234375, 0.4566459655761719, 0.46923828125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 9.0, 17.0, 22.0, 33.0, 55.0, 69.0, 82.0, 99.0, 103.0, 118.0, 106.0, 85.0, 57.0, 54.0, 38.0, 22.0, 10.0, 12.0, 5.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0, -1.947418212890625, -1.89483642578125, -1.842254638671875, -1.7896728515625, -1.737091064453125, -1.68450927734375, -1.631927490234375, -1.579345703125, -1.526763916015625, -1.47418212890625, -1.421600341796875, -1.3690185546875, -1.316436767578125, -1.26385498046875, -1.211273193359375, -1.15869140625, -1.106109619140625, -1.05352783203125, -1.000946044921875, -0.9483642578125, -0.895782470703125, -0.84320068359375, -0.790618896484375, -0.738037109375, -0.685455322265625, -0.63287353515625, -0.580291748046875, -0.5277099609375, -0.475128173828125, -0.42254638671875, -0.369964599609375, -0.3173828125, -0.264801025390625, -0.21221923828125, -0.159637451171875, -0.1070556640625, -0.054473876953125, -0.00189208984375, 0.050689697265625, 0.103271484375, 0.155853271484375, 0.20843505859375, 0.261016845703125, 0.3135986328125, 0.366180419921875, 0.41876220703125, 0.471343994140625, 0.52392578125, 0.576507568359375, 0.62908935546875, 0.681671142578125, 0.7342529296875, 0.786834716796875, 0.83941650390625, 0.891998291015625, 0.944580078125, 0.997161865234375, 1.04974365234375, 1.102325439453125, 1.1549072265625, 1.207489013671875, 1.26007080078125, 1.312652587890625, 1.365234375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 9.0, 6.0, 7.0, 11.0, 10.0, 17.0, 34.0, 41.0, 63.0, 87.0, 123.0, 203.0, 263.0, 423.0, 633.0, 968.0, 1684.0, 3043.0, 6238.0, 13890.0, 35238.0, 108347.0, 406200.0, 329752.0, 87505.0, 29454.0, 11821.0, 5435.0, 2831.0, 1522.0, 887.0, 549.0, 389.0, 274.0, 174.0, 128.0, 109.0, 54.0, 40.0, 34.0, 22.0, 15.0, 11.0, 6.0, 3.0, 1.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.180419921875, -0.17476463317871094, -0.16910934448242188, -0.1634540557861328, -0.15779876708984375, -0.1521434783935547, -0.14648818969726562, -0.14083290100097656, -0.1351776123046875, -0.12952232360839844, -0.12386703491210938, -0.11821174621582031, -0.11255645751953125, -0.10690116882324219, -0.10124588012695312, -0.09559059143066406, -0.089935302734375, -0.08428001403808594, -0.07862472534179688, -0.07296943664550781, -0.06731414794921875, -0.06165885925292969, -0.056003570556640625, -0.05034828186035156, -0.0446929931640625, -0.03903770446777344, -0.033382415771484375, -0.027727127075195312, -0.02207183837890625, -0.016416549682617188, -0.010761260986328125, -0.0051059722900390625, 0.00054931640625, 0.0062046051025390625, 0.011859893798828125, 0.017515182495117188, 0.02317047119140625, 0.028825759887695312, 0.034481048583984375, 0.04013633728027344, 0.0457916259765625, 0.05144691467285156, 0.057102203369140625, 0.06275749206542969, 0.06841278076171875, 0.07406806945800781, 0.07972335815429688, 0.08537864685058594, 0.091033935546875, 0.09668922424316406, 0.10234451293945312, 0.10799980163574219, 0.11365509033203125, 0.11931037902832031, 0.12496566772460938, 0.13062095642089844, 0.1362762451171875, 0.14193153381347656, 0.14758682250976562, 0.1532421112060547, 0.15889739990234375, 0.1645526885986328, 0.17020797729492188, 0.17586326599121094, 0.1815185546875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 4.0, 6.0, 12.0, 9.0, 9.0, 17.0, 22.0, 20.0, 28.0, 40.0, 53.0, 52.0, 54.0, 42.0, 55.0, 71.0, 52.0, 65.0, 68.0, 52.0, 48.0, 42.0, 36.0, 24.0, 26.0, 20.0, 21.0, 20.0, 8.0, 12.0, 8.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.654296875, -1.5984344482421875, -1.542572021484375, -1.4867095947265625, -1.43084716796875, -1.3749847412109375, -1.319122314453125, -1.2632598876953125, -1.2073974609375, -1.1515350341796875, -1.095672607421875, -1.0398101806640625, -0.98394775390625, -0.9280853271484375, -0.872222900390625, -0.8163604736328125, -0.760498046875, -0.7046356201171875, -0.648773193359375, -0.5929107666015625, -0.53704833984375, -0.4811859130859375, -0.425323486328125, -0.3694610595703125, -0.3135986328125, -0.2577362060546875, -0.201873779296875, -0.1460113525390625, -0.09014892578125, -0.0342864990234375, 0.021575927734375, 0.0774383544921875, 0.13330078125, 0.1891632080078125, 0.245025634765625, 0.3008880615234375, 0.35675048828125, 0.4126129150390625, 0.468475341796875, 0.5243377685546875, 0.5802001953125, 0.6360626220703125, 0.691925048828125, 0.7477874755859375, 0.80364990234375, 0.8595123291015625, 0.915374755859375, 0.9712371826171875, 1.027099609375, 1.0829620361328125, 1.138824462890625, 1.1946868896484375, 1.25054931640625, 1.3064117431640625, 1.362274169921875, 1.4181365966796875, 1.4739990234375, 1.5298614501953125, 1.585723876953125, 1.6415863037109375, 1.69744873046875, 1.7533111572265625, 1.809173583984375, 1.8650360107421875, 1.9208984375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 6.0, 5.0, 13.0, 8.0, 21.0, 28.0, 29.0, 58.0, 78.0, 126.0, 193.0, 339.0, 772.0, 1447.0, 3128.0, 7886.0, 24737.0, 117379.0, 649130.0, 191485.0, 34275.0, 10130.0, 3816.0, 1645.0, 791.0, 419.0, 236.0, 122.0, 84.0, 51.0, 33.0, 24.0, 20.0, 9.0, 6.0, 7.0, 5.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.07354736328125, -0.07122135162353516, -0.06889533996582031, -0.06656932830810547, -0.06424331665039062, -0.06191730499267578, -0.05959129333496094, -0.057265281677246094, -0.05493927001953125, -0.052613258361816406, -0.05028724670410156, -0.04796123504638672, -0.045635223388671875, -0.04330921173095703, -0.04098320007324219, -0.038657188415527344, -0.0363311767578125, -0.034005165100097656, -0.03167915344238281, -0.02935314178466797, -0.027027130126953125, -0.02470111846923828, -0.022375106811523438, -0.020049095153808594, -0.01772308349609375, -0.015397071838378906, -0.013071060180664062, -0.010745048522949219, -0.008419036865234375, -0.006093025207519531, -0.0037670135498046875, -0.0014410018920898438, 0.000885009765625, 0.0032110214233398438, 0.0055370330810546875, 0.007863044738769531, 0.010189056396484375, 0.012515068054199219, 0.014841079711914062, 0.017167091369628906, 0.01949310302734375, 0.021819114685058594, 0.024145126342773438, 0.02647113800048828, 0.028797149658203125, 0.03112316131591797, 0.03344917297363281, 0.035775184631347656, 0.0381011962890625, 0.040427207946777344, 0.04275321960449219, 0.04507923126220703, 0.047405242919921875, 0.04973125457763672, 0.05205726623535156, 0.054383277893066406, 0.05670928955078125, 0.059035301208496094, 0.06136131286621094, 0.06368732452392578, 0.06601333618164062, 0.06833934783935547, 0.07066535949707031, 0.07299137115478516, 0.0753173828125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 3.0, 3.0, 14.0, 6.0, 14.0, 27.0, 21.0, 30.0, 45.0, 81.0, 84.0, 116.0, 147.0, 101.0, 82.0, 61.0, 38.0, 32.0, 20.0, 13.0, 13.0, 14.0, 11.0, 3.0, 6.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.707408905029297e-05, -3.5713426768779755e-05, -3.435276448726654e-05, -3.2992102205753326e-05, -3.163143992424011e-05, -3.0270777642726898e-05, -2.8910115361213684e-05, -2.754945307970047e-05, -2.6188790798187256e-05, -2.4828128516674042e-05, -2.3467466235160828e-05, -2.2106803953647614e-05, -2.07461416721344e-05, -1.9385479390621185e-05, -1.802481710910797e-05, -1.6664154827594757e-05, -1.5303492546081543e-05, -1.3942830264568329e-05, -1.2582167983055115e-05, -1.12215057015419e-05, -9.860843420028687e-06, -8.500181138515472e-06, -7.139518857002258e-06, -5.778856575489044e-06, -4.41819429397583e-06, -3.057532012462616e-06, -1.6968697309494019e-06, -3.3620744943618774e-07, 1.0244548320770264e-06, 2.3851171135902405e-06, 3.7457793951034546e-06, 5.106441676616669e-06, 6.467103958129883e-06, 7.827766239643097e-06, 9.188428521156311e-06, 1.0549090802669525e-05, 1.190975308418274e-05, 1.3270415365695953e-05, 1.4631077647209167e-05, 1.599173992872238e-05, 1.7352402210235596e-05, 1.871306449174881e-05, 2.0073726773262024e-05, 2.1434389054775238e-05, 2.2795051336288452e-05, 2.4155713617801666e-05, 2.551637589931488e-05, 2.6877038180828094e-05, 2.823770046234131e-05, 2.9598362743854523e-05, 3.095902502536774e-05, 3.231968730688095e-05, 3.3680349588394165e-05, 3.504101186990738e-05, 3.640167415142059e-05, 3.776233643293381e-05, 3.912299871444702e-05, 4.0483660995960236e-05, 4.184432327747345e-05, 4.3204985558986664e-05, 4.456564784049988e-05, 4.592631012201309e-05, 4.7286972403526306e-05, 4.864763468503952e-05, 5.0008296966552734e-05]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 3.0, 10.0, 9.0, 13.0, 25.0, 36.0, 46.0, 82.0, 168.0, 410.0, 966.0, 2814.0, 10819.0, 61322.0, 626469.0, 303313.0, 32262.0, 6591.0, 1906.0, 654.0, 296.0, 133.0, 72.0, 44.0, 25.0, 22.0, 15.0, 7.0, 7.0, 5.0, 7.0, 3.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.10919189453125, -0.10605716705322266, -0.10292243957519531, -0.09978771209716797, -0.09665298461914062, -0.09351825714111328, -0.09038352966308594, -0.0872488021850586, -0.08411407470703125, -0.0809793472290039, -0.07784461975097656, -0.07470989227294922, -0.07157516479492188, -0.06844043731689453, -0.06530570983886719, -0.062170982360839844, -0.0590362548828125, -0.055901527404785156, -0.05276679992675781, -0.04963207244873047, -0.046497344970703125, -0.04336261749267578, -0.04022789001464844, -0.037093162536621094, -0.03395843505859375, -0.030823707580566406, -0.027688980102539062, -0.02455425262451172, -0.021419525146484375, -0.01828479766845703, -0.015150070190429688, -0.012015342712402344, -0.008880615234375, -0.005745887756347656, -0.0026111602783203125, 0.0005235671997070312, 0.003658294677734375, 0.006793022155761719, 0.009927749633789062, 0.013062477111816406, 0.01619720458984375, 0.019331932067871094, 0.022466659545898438, 0.02560138702392578, 0.028736114501953125, 0.03187084197998047, 0.03500556945800781, 0.038140296936035156, 0.0412750244140625, 0.044409751892089844, 0.04754447937011719, 0.05067920684814453, 0.053813934326171875, 0.05694866180419922, 0.06008338928222656, 0.0632181167602539, 0.06635284423828125, 0.0694875717163086, 0.07262229919433594, 0.07575702667236328, 0.07889175415039062, 0.08202648162841797, 0.08516120910644531, 0.08829593658447266, 0.0914306640625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 6.0, 6.0, 8.0, 9.0, 10.0, 7.0, 21.0, 22.0, 16.0, 33.0, 33.0, 60.0, 49.0, 59.0, 88.0, 66.0, 67.0, 76.0, 73.0, 64.0, 65.0, 38.0, 27.0, 26.0, 16.0, 13.0, 17.0, 10.0, 5.0, 7.0, 1.0, 1.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01541900634765625, -0.014920353889465332, -0.014421701431274414, -0.013923048973083496, -0.013424396514892578, -0.01292574405670166, -0.012427091598510742, -0.011928439140319824, -0.011429786682128906, -0.010931134223937988, -0.01043248176574707, -0.009933829307556152, -0.009435176849365234, -0.008936524391174316, -0.008437871932983398, -0.00793921947479248, -0.0074405670166015625, -0.0069419145584106445, -0.0064432621002197266, -0.005944609642028809, -0.005445957183837891, -0.004947304725646973, -0.004448652267456055, -0.003949999809265137, -0.0034513473510742188, -0.0029526948928833008, -0.002454042434692383, -0.001955389976501465, -0.0014567375183105469, -0.0009580850601196289, -0.00045943260192871094, 3.921985626220703e-05, 0.000537872314453125, 0.001036524772644043, 0.001535177230834961, 0.002033829689025879, 0.002532482147216797, 0.003031134605407715, 0.003529787063598633, 0.004028439521789551, 0.004527091979980469, 0.005025744438171387, 0.005524396896362305, 0.006023049354553223, 0.006521701812744141, 0.007020354270935059, 0.0075190067291259766, 0.008017659187316895, 0.008516311645507812, 0.00901496410369873, 0.009513616561889648, 0.010012269020080566, 0.010510921478271484, 0.011009573936462402, 0.01150822639465332, 0.012006878852844238, 0.012505531311035156, 0.013004183769226074, 0.013502836227416992, 0.01400148868560791, 0.014500141143798828, 0.014998793601989746, 0.015497446060180664, 0.015996098518371582, 0.0164947509765625]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 3.0, 11.0, 17.0, 51.0, 143.0, 376.0, 252.0, 98.0, 23.0, 18.0, 7.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.140503406524658, -4.036479473114014, -3.932455062866211, -3.8284311294555664, -3.7244069576263428, -3.620382785797119, -3.5163586139678955, -3.412334442138672, -3.3083105087280273, -3.2042863368988037, -3.10026216506958, -2.9962382316589355, -2.892214059829712, -2.7881898880004883, -2.6841657161712646, -2.580141544342041, -2.4761176109313965, -2.372093439102173, -2.268069267272949, -2.1640453338623047, -2.060021162033081, -1.9559969902038574, -1.8519728183746338, -1.7479487657546997, -1.6439244747161865, -1.539900302886963, -1.4358762502670288, -1.3318520784378052, -1.227828025817871, -1.1238038539886475, -1.0197796821594238, -0.9157556295394897, -0.8117315769195557, -0.7077074646949768, -0.603683352470398, -0.4996592104434967, -0.39563509821891785, -0.2916109561920166, -0.18758684396743774, -0.08356273174285889, 0.02046138048171997, 0.12448550015687943, 0.22850961983203888, 0.33253374695777893, 0.4365578591823578, 0.540582001209259, 0.6446061134338379, 0.7486302256584167, 0.8526543378829956, 0.9566784501075745, 1.0607025623321533, 1.164726734161377, 1.268750786781311, 1.3727749586105347, 1.4767990112304688, 1.5808231830596924, 1.684847354888916, 1.7888715267181396, 1.8928955793380737, 1.9969197511672974, 2.1009438037872314, 2.204967975616455, 2.3089921474456787, 2.4130163192749023, 2.517040252685547]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 5.0, 2.0, 10.0, 9.0, 24.0, 32.0, 40.0, 54.0, 80.0, 87.0, 96.0, 97.0, 121.0, 82.0, 76.0, 64.0, 47.0, 32.0, 17.0, 12.0, 7.0, 7.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8105216026306152, -1.762357234954834, -1.7141928672790527, -1.6660284996032715, -1.6178641319274902, -1.569699764251709, -1.5215353965759277, -1.4733710289001465, -1.4252066612243652, -1.377042293548584, -1.3288779258728027, -1.2807135581970215, -1.2325491905212402, -1.184384822845459, -1.1362204551696777, -1.0880560874938965, -1.0398917198181152, -0.991727352142334, -0.9435629844665527, -0.8953986167907715, -0.8472342491149902, -0.799069881439209, -0.7509055137634277, -0.7027411460876465, -0.6545767784118652, -0.606412410736084, -0.5582480430603027, -0.5100836753845215, -0.46191930770874023, -0.413754940032959, -0.36559057235717773, -0.3174262046813965, -0.26926183700561523, -0.22109746932983398, -0.17293310165405273, -0.12476873397827148, -0.07660436630249023, -0.028439998626708984, 0.019724369049072266, 0.06788873672485352, 0.11605310440063477, 0.16421747207641602, 0.21238183975219727, 0.2605462074279785, 0.30871057510375977, 0.356874942779541, 0.40503931045532227, 0.4532036781311035, 0.5013680458068848, 0.549532413482666, 0.5976967811584473, 0.6458611488342285, 0.6940255165100098, 0.742189884185791, 0.7903542518615723, 0.8385186195373535, 0.8866829872131348, 0.934847354888916, 0.9830117225646973, 1.0311760902404785, 1.0793404579162598, 1.127504825592041, 1.1756691932678223, 1.2238335609436035, 1.2719979286193848]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 7.0, 8.0, 6.0, 19.0, 46.0, 182.0, 635.0, 3850.0, 153918.0, 883016.0, 5693.0, 869.0, 188.0, 54.0, 33.0, 9.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.55078125, -5.401123046875, -5.25146484375, -5.101806640625, -4.9521484375, -4.802490234375, -4.65283203125, -4.503173828125, -4.353515625, -4.203857421875, -4.05419921875, -3.904541015625, -3.7548828125, -3.605224609375, -3.45556640625, -3.305908203125, -3.15625, -3.006591796875, -2.85693359375, -2.707275390625, -2.5576171875, -2.407958984375, -2.25830078125, -2.108642578125, -1.958984375, -1.809326171875, -1.65966796875, -1.510009765625, -1.3603515625, -1.210693359375, -1.06103515625, -0.911376953125, -0.76171875, -0.612060546875, -0.46240234375, -0.312744140625, -0.1630859375, -0.013427734375, 0.13623046875, 0.285888671875, 0.435546875, 0.585205078125, 0.73486328125, 0.884521484375, 1.0341796875, 1.183837890625, 1.33349609375, 1.483154296875, 1.6328125, 1.782470703125, 1.93212890625, 2.081787109375, 2.2314453125, 2.381103515625, 2.53076171875, 2.680419921875, 2.830078125, 2.979736328125, 3.12939453125, 3.279052734375, 3.4287109375, 3.578369140625, 3.72802734375, 3.877685546875, 4.02734375]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 7.0, 18.0, 41.0, 52.0, 87.0, 148.0, 146.0, 184.0, 122.0, 85.0, 61.0, 23.0, 13.0, 10.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.560546875, -2.409027099609375, -2.25750732421875, -2.105987548828125, -1.9544677734375, -1.802947998046875, -1.65142822265625, -1.499908447265625, -1.348388671875, -1.196868896484375, -1.04534912109375, -0.893829345703125, -0.7423095703125, -0.590789794921875, -0.43927001953125, -0.287750244140625, -0.13623046875, 0.015289306640625, 0.16680908203125, 0.318328857421875, 0.4698486328125, 0.621368408203125, 0.77288818359375, 0.924407958984375, 1.075927734375, 1.227447509765625, 1.37896728515625, 1.530487060546875, 1.6820068359375, 1.833526611328125, 1.98504638671875, 2.136566162109375, 2.2880859375, 2.439605712890625, 2.59112548828125, 2.742645263671875, 2.8941650390625, 3.045684814453125, 3.19720458984375, 3.348724365234375, 3.500244140625, 3.651763916015625, 3.80328369140625, 3.954803466796875, 4.1063232421875, 4.257843017578125, 4.40936279296875, 4.560882568359375, 4.71240234375, 4.863922119140625, 5.01544189453125, 5.166961669921875, 5.3184814453125, 5.470001220703125, 5.62152099609375, 5.773040771484375, 5.924560546875, 6.076080322265625, 6.22760009765625, 6.379119873046875, 6.5306396484375, 6.682159423828125, 6.83367919921875, 6.985198974609375, 7.13671875]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 2.0, 0.0, 6.0, 5.0, 6.0, 7.0, 8.0, 21.0, 7.0, 19.0, 24.0, 36.0, 48.0, 48.0, 62.0, 82.0, 120.0, 193.0, 285.0, 536.0, 1225.0, 3680.0, 18013.0, 880941.0, 129064.0, 9440.0, 2419.0, 902.0, 449.0, 265.0, 141.0, 115.0, 96.0, 56.0, 55.0, 41.0, 32.0, 20.0, 18.0, 18.0, 15.0, 8.0, 7.0, 8.0, 5.0, 7.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.60546875, -2.532745361328125, -2.46002197265625, -2.387298583984375, -2.3145751953125, -2.241851806640625, -2.16912841796875, -2.096405029296875, -2.023681640625, -1.950958251953125, -1.87823486328125, -1.805511474609375, -1.7327880859375, -1.660064697265625, -1.58734130859375, -1.514617919921875, -1.44189453125, -1.369171142578125, -1.29644775390625, -1.223724365234375, -1.1510009765625, -1.078277587890625, -1.00555419921875, -0.932830810546875, -0.860107421875, -0.787384033203125, -0.71466064453125, -0.641937255859375, -0.5692138671875, -0.496490478515625, -0.42376708984375, -0.351043701171875, -0.2783203125, -0.205596923828125, -0.13287353515625, -0.060150146484375, 0.0125732421875, 0.085296630859375, 0.15802001953125, 0.230743408203125, 0.303466796875, 0.376190185546875, 0.44891357421875, 0.521636962890625, 0.5943603515625, 0.667083740234375, 0.73980712890625, 0.812530517578125, 0.88525390625, 0.957977294921875, 1.03070068359375, 1.103424072265625, 1.1761474609375, 1.248870849609375, 1.32159423828125, 1.394317626953125, 1.467041015625, 1.539764404296875, 1.61248779296875, 1.685211181640625, 1.7579345703125, 1.830657958984375, 1.90338134765625, 1.976104736328125, 2.048828125]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 5.0, 2.0, 3.0, 9.0, 10.0, 13.0, 8.0, 10.0, 18.0, 21.0, 23.0, 21.0, 24.0, 21.0, 28.0, 36.0, 47.0, 40.0, 49.0, 35.0, 38.0, 60.0, 40.0, 53.0, 36.0, 40.0, 32.0, 24.0, 33.0, 28.0, 24.0, 31.0, 22.0, 17.0, 19.0, 21.0, 9.0, 18.0, 7.0, 7.0, 5.0, 3.0, 4.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.4453125, -1.4024200439453125, -1.359527587890625, -1.3166351318359375, -1.27374267578125, -1.2308502197265625, -1.187957763671875, -1.1450653076171875, -1.1021728515625, -1.0592803955078125, -1.016387939453125, -0.9734954833984375, -0.93060302734375, -0.8877105712890625, -0.844818115234375, -0.8019256591796875, -0.759033203125, -0.7161407470703125, -0.673248291015625, -0.6303558349609375, -0.58746337890625, -0.5445709228515625, -0.501678466796875, -0.4587860107421875, -0.4158935546875, -0.3730010986328125, -0.330108642578125, -0.2872161865234375, -0.24432373046875, -0.2014312744140625, -0.158538818359375, -0.1156463623046875, -0.07275390625, -0.0298614501953125, 0.013031005859375, 0.0559234619140625, 0.09881591796875, 0.1417083740234375, 0.184600830078125, 0.2274932861328125, 0.2703857421875, 0.3132781982421875, 0.356170654296875, 0.3990631103515625, 0.44195556640625, 0.4848480224609375, 0.527740478515625, 0.5706329345703125, 0.613525390625, 0.6564178466796875, 0.699310302734375, 0.7422027587890625, 0.78509521484375, 0.8279876708984375, 0.870880126953125, 0.9137725830078125, 0.9566650390625, 0.9995574951171875, 1.042449951171875, 1.0853424072265625, 1.12823486328125, 1.1711273193359375, 1.214019775390625, 1.2569122314453125, 1.2998046875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 4.0, 1.0, 7.0, 7.0, 9.0, 13.0, 24.0, 29.0, 44.0, 72.0, 146.0, 268.0, 602.0, 1745.0, 7381.0, 64764.0, 913148.0, 51111.0, 6590.0, 1501.0, 551.0, 245.0, 105.0, 74.0, 37.0, 21.0, 21.0, 13.0, 5.0, 7.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29638671875, -0.2847442626953125, -0.273101806640625, -0.2614593505859375, -0.24981689453125, -0.2381744384765625, -0.226531982421875, -0.2148895263671875, -0.2032470703125, -0.1916046142578125, -0.179962158203125, -0.1683197021484375, -0.15667724609375, -0.1450347900390625, -0.133392333984375, -0.1217498779296875, -0.110107421875, -0.0984649658203125, -0.086822509765625, -0.0751800537109375, -0.06353759765625, -0.0518951416015625, -0.040252685546875, -0.0286102294921875, -0.0169677734375, -0.0053253173828125, 0.006317138671875, 0.0179595947265625, 0.02960205078125, 0.0412445068359375, 0.052886962890625, 0.0645294189453125, 0.076171875, 0.0878143310546875, 0.099456787109375, 0.1110992431640625, 0.12274169921875, 0.1343841552734375, 0.146026611328125, 0.1576690673828125, 0.1693115234375, 0.1809539794921875, 0.192596435546875, 0.2042388916015625, 0.21588134765625, 0.2275238037109375, 0.239166259765625, 0.2508087158203125, 0.262451171875, 0.2740936279296875, 0.285736083984375, 0.2973785400390625, 0.30902099609375, 0.3206634521484375, 0.332305908203125, 0.3439483642578125, 0.3555908203125, 0.3672332763671875, 0.378875732421875, 0.3905181884765625, 0.40216064453125, 0.4138031005859375, 0.425445556640625, 0.4370880126953125, 0.44873046875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 5.0, 11.0, 5.0, 12.0, 26.0, 25.0, 44.0, 93.0, 149.0, 207.0, 153.0, 100.0, 57.0, 28.0, 20.0, 11.0, 11.0, 10.0, 5.0, 8.0, 3.0, 3.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.082918167114258e-05, -3.9686448872089386e-05, -3.8543716073036194e-05, -3.7400983273983e-05, -3.625825047492981e-05, -3.511551767587662e-05, -3.3972784876823425e-05, -3.283005207777023e-05, -3.168731927871704e-05, -3.054458647966385e-05, -2.9401853680610657e-05, -2.8259120881557465e-05, -2.7116388082504272e-05, -2.597365528345108e-05, -2.4830922484397888e-05, -2.3688189685344696e-05, -2.2545456886291504e-05, -2.1402724087238312e-05, -2.025999128818512e-05, -1.9117258489131927e-05, -1.7974525690078735e-05, -1.6831792891025543e-05, -1.568906009197235e-05, -1.4546327292919159e-05, -1.3403594493865967e-05, -1.2260861694812775e-05, -1.1118128895759583e-05, -9.97539609670639e-06, -8.832663297653198e-06, -7.689930498600006e-06, -6.547197699546814e-06, -5.404464900493622e-06, -4.26173210144043e-06, -3.1189993023872375e-06, -1.9762665033340454e-06, -8.335337042808533e-07, 3.0919909477233887e-07, 1.451931893825531e-06, 2.594664692878723e-06, 3.7373974919319153e-06, 4.880130290985107e-06, 6.0228630900382996e-06, 7.165595889091492e-06, 8.308328688144684e-06, 9.451061487197876e-06, 1.0593794286251068e-05, 1.173652708530426e-05, 1.2879259884357452e-05, 1.4021992683410645e-05, 1.5164725482463837e-05, 1.630745828151703e-05, 1.745019108057022e-05, 1.8592923879623413e-05, 1.9735656678676605e-05, 2.0878389477729797e-05, 2.202112227678299e-05, 2.316385507583618e-05, 2.4306587874889374e-05, 2.5449320673942566e-05, 2.6592053472995758e-05, 2.773478627204895e-05, 2.8877519071102142e-05, 3.0020251870155334e-05, 3.1162984669208527e-05, 3.230571746826172e-05]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 12.0, 11.0, 15.0, 20.0, 35.0, 57.0, 77.0, 135.0, 204.0, 436.0, 952.0, 2307.0, 7574.0, 44677.0, 872694.0, 101725.0, 11885.0, 3242.0, 1199.0, 532.0, 290.0, 169.0, 95.0, 64.0, 41.0, 30.0, 18.0, 11.0, 10.0, 4.0, 8.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.343017578125, -0.3321800231933594, -0.32134246826171875, -0.3105049133300781, -0.2996673583984375, -0.2888298034667969, -0.27799224853515625, -0.2671546936035156, -0.256317138671875, -0.24547958374023438, -0.23464202880859375, -0.22380447387695312, -0.2129669189453125, -0.20212936401367188, -0.19129180908203125, -0.18045425415039062, -0.16961669921875, -0.15877914428710938, -0.14794158935546875, -0.13710403442382812, -0.1262664794921875, -0.11542892456054688, -0.10459136962890625, -0.09375381469726562, -0.082916259765625, -0.07207870483398438, -0.06124114990234375, -0.050403594970703125, -0.0395660400390625, -0.028728485107421875, -0.01789093017578125, -0.007053375244140625, 0.0037841796875, 0.014621734619140625, 0.02545928955078125, 0.036296844482421875, 0.0471343994140625, 0.057971954345703125, 0.06880950927734375, 0.07964706420898438, 0.090484619140625, 0.10132217407226562, 0.11215972900390625, 0.12299728393554688, 0.1338348388671875, 0.14467239379882812, 0.15550994873046875, 0.16634750366210938, 0.17718505859375, 0.18802261352539062, 0.19886016845703125, 0.20969772338867188, 0.2205352783203125, 0.23137283325195312, 0.24221038818359375, 0.2530479431152344, 0.263885498046875, 0.2747230529785156, 0.28556060791015625, 0.2963981628417969, 0.3072357177734375, 0.3180732727050781, 0.32891082763671875, 0.3397483825683594, 0.3505859375]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 8.0, 7.0, 6.0, 13.0, 14.0, 15.0, 29.0, 36.0, 57.0, 107.0, 169.0, 206.0, 144.0, 60.0, 34.0, 26.0, 20.0, 10.0, 12.0, 7.0, 7.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1260986328125, -0.12218761444091797, -0.11827659606933594, -0.1143655776977539, -0.11045455932617188, -0.10654354095458984, -0.10263252258300781, -0.09872150421142578, -0.09481048583984375, -0.09089946746826172, -0.08698844909667969, -0.08307743072509766, -0.07916641235351562, -0.0752553939819336, -0.07134437561035156, -0.06743335723876953, -0.0635223388671875, -0.05961132049560547, -0.05570030212402344, -0.051789283752441406, -0.047878265380859375, -0.043967247009277344, -0.04005622863769531, -0.03614521026611328, -0.03223419189453125, -0.02832317352294922, -0.024412155151367188, -0.020501136779785156, -0.016590118408203125, -0.012679100036621094, -0.008768081665039062, -0.004857063293457031, -0.000946044921875, 0.0029649734497070312, 0.0068759918212890625, 0.010787010192871094, 0.014698028564453125, 0.018609046936035156, 0.022520065307617188, 0.02643108367919922, 0.03034210205078125, 0.03425312042236328, 0.03816413879394531, 0.042075157165527344, 0.045986175537109375, 0.049897193908691406, 0.05380821228027344, 0.05771923065185547, 0.0616302490234375, 0.06554126739501953, 0.06945228576660156, 0.0733633041381836, 0.07727432250976562, 0.08118534088134766, 0.08509635925292969, 0.08900737762451172, 0.09291839599609375, 0.09682941436767578, 0.10074043273925781, 0.10465145111083984, 0.10856246948242188, 0.1124734878540039, 0.11638450622558594, 0.12029552459716797, 0.12420654296875]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 8.0, 10.0, 28.0, 79.0, 204.0, 351.0, 197.0, 66.0, 33.0, 12.0, 7.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.962121963500977, -7.778932094573975, -7.5957417488098145, -7.4125518798828125, -7.2293620109558105, -7.046172142028809, -6.862981796264648, -6.6797919273376465, -6.4966020584106445, -6.313412189483643, -6.130221843719482, -5.9470319747924805, -5.7638421058654785, -5.580652236938477, -5.397461891174316, -5.2142720222473145, -5.031081676483154, -4.847891807556152, -4.664701461791992, -4.48151159286499, -4.298321723937988, -4.115131378173828, -3.931941509246826, -3.748751640319824, -3.565561532974243, -3.382371425628662, -3.19918155670166, -3.015991449356079, -2.832801342010498, -2.649611473083496, -2.466421365737915, -2.283231258392334, -2.100041389465332, -1.9168514013290405, -1.733661413192749, -1.550471305847168, -1.3672813177108765, -1.184091329574585, -1.000901222229004, -0.8177112340927124, -0.6345212459564209, -0.451331228017807, -0.2681412100791931, -0.08495116233825684, 0.09823882579803467, 0.28142881393432617, 0.4646189212799072, 0.6478089094161987, 0.8309988975524902, 1.0141888856887817, 1.1973788738250732, 1.3805689811706543, 1.5637589693069458, 1.7469489574432373, 1.9301390647888184, 2.1133289337158203, 2.2965190410614014, 2.4797091484069824, 2.6628990173339844, 2.8460891246795654, 3.0292792320251465, 3.2124691009521484, 3.3956592082977295, 3.5788493156433105, 3.7620391845703125]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 2.0, 6.0, 5.0, 15.0, 23.0, 19.0, 32.0, 44.0, 52.0, 59.0, 59.0, 74.0, 82.0, 63.0, 73.0, 72.0, 68.0, 64.0, 44.0, 36.0, 41.0, 21.0, 21.0, 10.0, 8.0, 9.0, 3.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.457720994949341, -2.319880962371826, -2.1820411682128906, -2.044201374053955, -1.9063613414764404, -1.7685214281082153, -1.6306815147399902, -1.4928416013717651, -1.35500168800354, -1.217161774635315, -1.0793218612670898, -0.9414819478988647, -0.8036420345306396, -0.6658021211624146, -0.5279622077941895, -0.39012229442596436, -0.25228238105773926, -0.11444246768951416, 0.023397445678710938, 0.16123735904693604, 0.29907727241516113, 0.43691718578338623, 0.5747570991516113, 0.7125970125198364, 0.8504369258880615, 0.9882768392562866, 1.1261167526245117, 1.2639566659927368, 1.401796579360962, 1.539636492729187, 1.677476406097412, 1.8153163194656372, 1.9531564712524414, 2.090996265411377, 2.2288362979888916, 2.3666763305664062, 2.504516124725342, 2.6423559188842773, 2.780195951461792, 2.9180359840393066, 3.055875778198242, 3.1937155723571777, 3.3315556049346924, 3.469395637512207, 3.6072354316711426, 3.745075225830078, 3.8829152584075928, 4.020755290985107, 4.158595085144043, 4.2964348793029785, 4.434274673461914, 4.572114944458008, 4.709954738616943, 4.847794532775879, 4.985634803771973, 5.123474597930908, 5.261314392089844, 5.399154186248779, 5.536993980407715, 5.674834251403809, 5.812674045562744, 5.95051383972168, 6.088354110717773, 6.226193904876709, 6.3640336990356445]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 3.0, 4.0, 4.0, 2.0, 4.0, 3.0, 12.0, 16.0, 32.0, 32.0, 52.0, 112.0, 165.0, 290.0, 513.0, 1064.0, 2546.0, 7845.0, 82427.0, 3549404.0, 519146.0, 22727.0, 4165.0, 2004.0, 843.0, 373.0, 194.0, 102.0, 76.0, 47.0, 31.0, 21.0, 6.0, 7.0, 6.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.056640625, -2.975677490234375, -2.89471435546875, -2.813751220703125, -2.7327880859375, -2.651824951171875, -2.57086181640625, -2.489898681640625, -2.408935546875, -2.327972412109375, -2.24700927734375, -2.166046142578125, -2.0850830078125, -2.004119873046875, -1.92315673828125, -1.842193603515625, -1.76123046875, -1.680267333984375, -1.59930419921875, -1.518341064453125, -1.4373779296875, -1.356414794921875, -1.27545166015625, -1.194488525390625, -1.113525390625, -1.032562255859375, -0.95159912109375, -0.870635986328125, -0.7896728515625, -0.708709716796875, -0.62774658203125, -0.546783447265625, -0.4658203125, -0.384857177734375, -0.30389404296875, -0.222930908203125, -0.1419677734375, -0.061004638671875, 0.01995849609375, 0.100921630859375, 0.181884765625, 0.262847900390625, 0.34381103515625, 0.424774169921875, 0.5057373046875, 0.586700439453125, 0.66766357421875, 0.748626708984375, 0.82958984375, 0.910552978515625, 0.99151611328125, 1.072479248046875, 1.1534423828125, 1.234405517578125, 1.31536865234375, 1.396331787109375, 1.477294921875, 1.558258056640625, 1.63922119140625, 1.720184326171875, 1.8011474609375, 1.882110595703125, 1.96307373046875, 2.044036865234375, 2.125]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 7.0, 4.0, 6.0, 6.0, 10.0, 14.0, 18.0, 17.0, 34.0, 51.0, 59.0, 75.0, 78.0, 85.0, 106.0, 104.0, 81.0, 61.0, 64.0, 43.0, 29.0, 13.0, 14.0, 13.0, 4.0, 5.0, 6.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1796875, -2.12109375, -2.0625, -2.00390625, -1.9453125, -1.88671875, -1.828125, -1.76953125, -1.7109375, -1.65234375, -1.59375, -1.53515625, -1.4765625, -1.41796875, -1.359375, -1.30078125, -1.2421875, -1.18359375, -1.125, -1.06640625, -1.0078125, -0.94921875, -0.890625, -0.83203125, -0.7734375, -0.71484375, -0.65625, -0.59765625, -0.5390625, -0.48046875, -0.421875, -0.36328125, -0.3046875, -0.24609375, -0.1875, -0.12890625, -0.0703125, -0.01171875, 0.046875, 0.10546875, 0.1640625, 0.22265625, 0.28125, 0.33984375, 0.3984375, 0.45703125, 0.515625, 0.57421875, 0.6328125, 0.69140625, 0.75, 0.80859375, 0.8671875, 0.92578125, 0.984375, 1.04296875, 1.1015625, 1.16015625, 1.21875, 1.27734375, 1.3359375, 1.39453125, 1.453125, 1.51171875, 1.5703125]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 4.0, 13.0, 26.0, 55.0, 163.0, 632.0, 9759.0, 4178438.0, 4553.0, 441.0, 117.0, 32.0, 24.0, 12.0, 6.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.7734375, -15.4014892578125, -15.029541015625, -14.6575927734375, -14.28564453125, -13.9136962890625, -13.541748046875, -13.1697998046875, -12.7978515625, -12.4259033203125, -12.053955078125, -11.6820068359375, -11.31005859375, -10.9381103515625, -10.566162109375, -10.1942138671875, -9.822265625, -9.4503173828125, -9.078369140625, -8.7064208984375, -8.33447265625, -7.9625244140625, -7.590576171875, -7.2186279296875, -6.8466796875, -6.4747314453125, -6.102783203125, -5.7308349609375, -5.35888671875, -4.9869384765625, -4.614990234375, -4.2430419921875, -3.87109375, -3.4991455078125, -3.127197265625, -2.7552490234375, -2.38330078125, -2.0113525390625, -1.639404296875, -1.2674560546875, -0.8955078125, -0.5235595703125, -0.151611328125, 0.2203369140625, 0.59228515625, 0.9642333984375, 1.336181640625, 1.7081298828125, 2.080078125, 2.4520263671875, 2.823974609375, 3.1959228515625, 3.56787109375, 3.9398193359375, 4.311767578125, 4.6837158203125, 5.0556640625, 5.4276123046875, 5.799560546875, 6.1715087890625, 6.54345703125, 6.9154052734375, 7.287353515625, 7.6593017578125, 8.03125]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 13.0, 12.0, 31.0, 78.0, 422.0, 2589.0, 742.0, 99.0, 39.0, 21.0, 16.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8359375, -0.7972564697265625, -0.758575439453125, -0.7198944091796875, -0.68121337890625, -0.6425323486328125, -0.603851318359375, -0.5651702880859375, -0.5264892578125, -0.4878082275390625, -0.449127197265625, -0.4104461669921875, -0.37176513671875, -0.3330841064453125, -0.294403076171875, -0.2557220458984375, -0.217041015625, -0.1783599853515625, -0.139678955078125, -0.1009979248046875, -0.06231689453125, -0.0236358642578125, 0.015045166015625, 0.0537261962890625, 0.0924072265625, 0.1310882568359375, 0.169769287109375, 0.2084503173828125, 0.24713134765625, 0.2858123779296875, 0.324493408203125, 0.3631744384765625, 0.40185546875, 0.4405364990234375, 0.479217529296875, 0.5178985595703125, 0.55657958984375, 0.5952606201171875, 0.633941650390625, 0.6726226806640625, 0.7113037109375, 0.7499847412109375, 0.788665771484375, 0.8273468017578125, 0.86602783203125, 0.9047088623046875, 0.943389892578125, 0.9820709228515625, 1.020751953125, 1.0594329833984375, 1.098114013671875, 1.1367950439453125, 1.17547607421875, 1.2141571044921875, 1.252838134765625, 1.2915191650390625, 1.3302001953125, 1.3688812255859375, 1.407562255859375, 1.4462432861328125, 1.48492431640625, 1.5236053466796875, 1.562286376953125, 1.6009674072265625, 1.6396484375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 3.0, 7.0, 10.0, 19.0, 39.0, 74.0, 173.0, 277.0, 184.0, 105.0, 47.0, 34.0, 13.0, 7.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.185263633728027, -4.067671775817871, -3.9500796794891357, -3.8324875831604004, -3.714895486831665, -3.5973033905029297, -3.4797115325927734, -3.362119436264038, -3.2445273399353027, -3.1269352436065674, -3.009343385696411, -2.891751289367676, -2.7741591930389404, -2.656567096710205, -2.538975238800049, -2.4213831424713135, -2.3037912845611572, -2.186199188232422, -2.0686073303222656, -1.9510152339935303, -1.833423137664795, -1.7158311605453491, -1.5982391834259033, -1.480647087097168, -1.3630551099777222, -1.2454631328582764, -1.127871036529541, -1.0102790594100952, -0.8926870226860046, -0.7750949859619141, -0.6575030088424683, -0.5399109721183777, -0.4223191738128662, -0.30472713708877563, -0.18713513016700745, -0.06954312324523926, 0.04804891347885132, 0.1656409502029419, 0.2832329273223877, 0.40082496404647827, 0.5184170007705688, 0.6360090374946594, 0.75360107421875, 0.8711930513381958, 0.9887850880622864, 1.106377124786377, 1.2239691019058228, 1.3415610790252686, 1.459153175354004, 1.5767451524734497, 1.694337248802185, 1.8119292259216309, 1.9295213222503662, 2.0471134185791016, 2.164705276489258, 2.282297372817993, 2.3998894691467285, 2.517481565475464, 2.63507342338562, 2.7526655197143555, 2.870257616043091, 2.987849712371826, 3.1054415702819824, 3.2230336666107178, 3.340625524520874]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 8.0, 14.0, 8.0, 15.0, 18.0, 34.0, 38.0, 39.0, 51.0, 66.0, 67.0, 77.0, 76.0, 68.0, 75.0, 58.0, 65.0, 55.0, 49.0, 33.0, 24.0, 21.0, 11.0, 11.0, 6.0, 4.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0943245887756348, -2.038926124572754, -1.9835278987884521, -1.9281295537948608, -1.8727312088012695, -1.8173328638076782, -1.761934518814087, -1.7065361738204956, -1.6511378288269043, -1.595739483833313, -1.5403411388397217, -1.4849427938461304, -1.429544448852539, -1.3741461038589478, -1.3187477588653564, -1.2633494138717651, -1.2079510688781738, -1.1525527238845825, -1.0971543788909912, -1.0417560338974, -0.9863576889038086, -0.9309593439102173, -0.875560998916626, -0.8201626539230347, -0.7647643089294434, -0.709365963935852, -0.6539676189422607, -0.5985692739486694, -0.5431709289550781, -0.4877725839614868, -0.4323742389678955, -0.3769758939743042, -0.32157766819000244, -0.26617932319641113, -0.21078097820281982, -0.15538263320922852, -0.09998428821563721, -0.0445859432220459, 0.01081240177154541, 0.06621074676513672, 0.12160909175872803, 0.17700743675231934, 0.23240578174591064, 0.28780412673950195, 0.34320247173309326, 0.39860081672668457, 0.4539991617202759, 0.5093975067138672, 0.5647958517074585, 0.6201941967010498, 0.6755925416946411, 0.7309908866882324, 0.7863892316818237, 0.841787576675415, 0.8971859216690063, 0.9525842666625977, 1.007982611656189, 1.0633809566497803, 1.1187793016433716, 1.174177646636963, 1.2295759916305542, 1.2849743366241455, 1.3403726816177368, 1.3957710266113281, 1.4511693716049194]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 5.0, 3.0, 1.0, 2.0, 7.0, 6.0, 6.0, 14.0, 19.0, 30.0, 54.0, 78.0, 164.0, 301.0, 589.0, 1272.0, 2850.0, 7962.0, 33878.0, 671775.0, 296371.0, 22463.0, 6190.0, 2353.0, 1077.0, 495.0, 254.0, 137.0, 77.0, 41.0, 30.0, 18.0, 12.0, 5.0, 13.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.69091796875, -0.671112060546875, -0.65130615234375, -0.631500244140625, -0.6116943359375, -0.591888427734375, -0.57208251953125, -0.552276611328125, -0.532470703125, -0.512664794921875, -0.49285888671875, -0.473052978515625, -0.4532470703125, -0.433441162109375, -0.41363525390625, -0.393829345703125, -0.3740234375, -0.354217529296875, -0.33441162109375, -0.314605712890625, -0.2947998046875, -0.274993896484375, -0.25518798828125, -0.235382080078125, -0.215576171875, -0.195770263671875, -0.17596435546875, -0.156158447265625, -0.1363525390625, -0.116546630859375, -0.09674072265625, -0.076934814453125, -0.05712890625, -0.037322998046875, -0.01751708984375, 0.002288818359375, 0.0220947265625, 0.041900634765625, 0.06170654296875, 0.081512451171875, 0.101318359375, 0.121124267578125, 0.14093017578125, 0.160736083984375, 0.1805419921875, 0.200347900390625, 0.22015380859375, 0.239959716796875, 0.259765625, 0.279571533203125, 0.29937744140625, 0.319183349609375, 0.3389892578125, 0.358795166015625, 0.37860107421875, 0.398406982421875, 0.418212890625, 0.438018798828125, 0.45782470703125, 0.477630615234375, 0.4974365234375, 0.517242431640625, 0.53704833984375, 0.556854248046875, 0.57666015625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 6.0, 12.0, 11.0, 15.0, 23.0, 35.0, 38.0, 56.0, 86.0, 91.0, 108.0, 98.0, 86.0, 85.0, 66.0, 56.0, 46.0, 26.0, 19.0, 14.0, 11.0, 3.0, 6.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.07421875, -2.0261688232421875, -1.978118896484375, -1.9300689697265625, -1.88201904296875, -1.8339691162109375, -1.785919189453125, -1.7378692626953125, -1.6898193359375, -1.6417694091796875, -1.593719482421875, -1.5456695556640625, -1.49761962890625, -1.4495697021484375, -1.401519775390625, -1.3534698486328125, -1.305419921875, -1.2573699951171875, -1.209320068359375, -1.1612701416015625, -1.11322021484375, -1.0651702880859375, -1.017120361328125, -0.9690704345703125, -0.9210205078125, -0.8729705810546875, -0.824920654296875, -0.7768707275390625, -0.72882080078125, -0.6807708740234375, -0.632720947265625, -0.5846710205078125, -0.53662109375, -0.4885711669921875, -0.440521240234375, -0.3924713134765625, -0.34442138671875, -0.2963714599609375, -0.248321533203125, -0.2002716064453125, -0.1522216796875, -0.1041717529296875, -0.056121826171875, -0.0080718994140625, 0.03997802734375, 0.0880279541015625, 0.136077880859375, 0.1841278076171875, 0.232177734375, 0.2802276611328125, 0.328277587890625, 0.3763275146484375, 0.42437744140625, 0.4724273681640625, 0.520477294921875, 0.5685272216796875, 0.6165771484375, 0.6646270751953125, 0.712677001953125, 0.7607269287109375, 0.80877685546875, 0.8568267822265625, 0.904876708984375, 0.9529266357421875, 1.0009765625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 9.0, 8.0, 13.0, 12.0, 36.0, 40.0, 45.0, 57.0, 79.0, 124.0, 184.0, 283.0, 459.0, 649.0, 1008.0, 1651.0, 3000.0, 5629.0, 12389.0, 33426.0, 133220.0, 572796.0, 206510.0, 45924.0, 15471.0, 6828.0, 3461.0, 1925.0, 1170.0, 719.0, 486.0, 271.0, 198.0, 165.0, 79.0, 64.0, 42.0, 39.0, 21.0, 22.0, 17.0, 7.0, 10.0, 9.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2578125, -0.2499103546142578, -0.24200820922851562, -0.23410606384277344, -0.22620391845703125, -0.21830177307128906, -0.21039962768554688, -0.2024974822998047, -0.1945953369140625, -0.1866931915283203, -0.17879104614257812, -0.17088890075683594, -0.16298675537109375, -0.15508460998535156, -0.14718246459960938, -0.1392803192138672, -0.131378173828125, -0.12347602844238281, -0.11557388305664062, -0.10767173767089844, -0.09976959228515625, -0.09186744689941406, -0.08396530151367188, -0.07606315612792969, -0.0681610107421875, -0.06025886535644531, -0.052356719970703125, -0.04445457458496094, -0.03655242919921875, -0.028650283813476562, -0.020748138427734375, -0.012845993041992188, -0.00494384765625, 0.0029582977294921875, 0.010860443115234375, 0.018762588500976562, 0.02666473388671875, 0.03456687927246094, 0.042469024658203125, 0.05037117004394531, 0.0582733154296875, 0.06617546081542969, 0.07407760620117188, 0.08197975158691406, 0.08988189697265625, 0.09778404235839844, 0.10568618774414062, 0.11358833312988281, 0.121490478515625, 0.1293926239013672, 0.13729476928710938, 0.14519691467285156, 0.15309906005859375, 0.16100120544433594, 0.16890335083007812, 0.1768054962158203, 0.1847076416015625, 0.1926097869873047, 0.20051193237304688, 0.20841407775878906, 0.21631622314453125, 0.22421836853027344, 0.23212051391601562, 0.2400226593017578, 0.2479248046875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 6.0, 4.0, 9.0, 7.0, 11.0, 10.0, 17.0, 17.0, 22.0, 28.0, 27.0, 36.0, 34.0, 38.0, 45.0, 34.0, 54.0, 46.0, 56.0, 58.0, 57.0, 40.0, 33.0, 38.0, 39.0, 38.0, 30.0, 35.0, 23.0, 18.0, 13.0, 18.0, 9.0, 12.0, 9.0, 7.0, 6.0, 7.0, 7.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.708984375, -1.6570587158203125, -1.605133056640625, -1.5532073974609375, -1.50128173828125, -1.4493560791015625, -1.397430419921875, -1.3455047607421875, -1.2935791015625, -1.2416534423828125, -1.189727783203125, -1.1378021240234375, -1.08587646484375, -1.0339508056640625, -0.982025146484375, -0.9300994873046875, -0.878173828125, -0.8262481689453125, -0.774322509765625, -0.7223968505859375, -0.67047119140625, -0.6185455322265625, -0.566619873046875, -0.5146942138671875, -0.4627685546875, -0.4108428955078125, -0.358917236328125, -0.3069915771484375, -0.25506591796875, -0.2031402587890625, -0.151214599609375, -0.0992889404296875, -0.04736328125, 0.0045623779296875, 0.056488037109375, 0.1084136962890625, 0.16033935546875, 0.2122650146484375, 0.264190673828125, 0.3161163330078125, 0.3680419921875, 0.4199676513671875, 0.471893310546875, 0.5238189697265625, 0.57574462890625, 0.6276702880859375, 0.679595947265625, 0.7315216064453125, 0.783447265625, 0.8353729248046875, 0.887298583984375, 0.9392242431640625, 0.99114990234375, 1.0430755615234375, 1.095001220703125, 1.1469268798828125, 1.1988525390625, 1.2507781982421875, 1.302703857421875, 1.3546295166015625, 1.40655517578125, 1.4584808349609375, 1.510406494140625, 1.5623321533203125, 1.6142578125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 1.0, 2.0, 8.0, 12.0, 16.0, 14.0, 13.0, 29.0, 38.0, 65.0, 84.0, 113.0, 194.0, 318.0, 480.0, 866.0, 1527.0, 2990.0, 7101.0, 19018.0, 69654.0, 501464.0, 360428.0, 55683.0, 16161.0, 6054.0, 2779.0, 1413.0, 755.0, 426.0, 288.0, 172.0, 107.0, 81.0, 63.0, 46.0, 25.0, 16.0, 22.0, 8.0, 9.0, 3.0, 4.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.09039306640625, -0.08780479431152344, -0.08521652221679688, -0.08262825012207031, -0.08003997802734375, -0.07745170593261719, -0.07486343383789062, -0.07227516174316406, -0.0696868896484375, -0.06709861755371094, -0.06451034545898438, -0.06192207336425781, -0.05933380126953125, -0.05674552917480469, -0.054157257080078125, -0.05156898498535156, -0.048980712890625, -0.04639244079589844, -0.043804168701171875, -0.04121589660644531, -0.03862762451171875, -0.03603935241699219, -0.033451080322265625, -0.030862808227539062, -0.0282745361328125, -0.025686264038085938, -0.023097991943359375, -0.020509719848632812, -0.01792144775390625, -0.015333175659179688, -0.012744903564453125, -0.010156631469726562, -0.007568359375, -0.0049800872802734375, -0.002391815185546875, 0.0001964569091796875, 0.00278472900390625, 0.0053730010986328125, 0.007961273193359375, 0.010549545288085938, 0.0131378173828125, 0.015726089477539062, 0.018314361572265625, 0.020902633666992188, 0.02349090576171875, 0.026079177856445312, 0.028667449951171875, 0.03125572204589844, 0.033843994140625, 0.03643226623535156, 0.039020538330078125, 0.04160881042480469, 0.04419708251953125, 0.04678535461425781, 0.049373626708984375, 0.05196189880371094, 0.0545501708984375, 0.05713844299316406, 0.059726715087890625, 0.06231498718261719, 0.06490325927734375, 0.06749153137207031, 0.07007980346679688, 0.07266807556152344, 0.07525634765625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 2.0, 6.0, 5.0, 12.0, 9.0, 8.0, 17.0, 26.0, 44.0, 56.0, 94.0, 136.0, 187.0, 133.0, 75.0, 36.0, 42.0, 23.0, 23.0, 7.0, 10.0, 10.0, 3.0, 7.0, 6.0, 5.0, 2.0, 3.0, 6.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.227327346801758e-05, -5.043204873800278e-05, -4.8590824007987976e-05, -4.6749599277973175e-05, -4.4908374547958374e-05, -4.306714981794357e-05, -4.122592508792877e-05, -3.938470035791397e-05, -3.754347562789917e-05, -3.570225089788437e-05, -3.386102616786957e-05, -3.201980143785477e-05, -3.0178576707839966e-05, -2.8337351977825165e-05, -2.6496127247810364e-05, -2.4654902517795563e-05, -2.2813677787780762e-05, -2.097245305776596e-05, -1.913122832775116e-05, -1.729000359773636e-05, -1.5448778867721558e-05, -1.3607554137706757e-05, -1.1766329407691956e-05, -9.925104677677155e-06, -8.083879947662354e-06, -6.2426552176475525e-06, -4.4014304876327515e-06, -2.5602057576179504e-06, -7.189810276031494e-07, 1.1222437024116516e-06, 2.9634684324264526e-06, 4.804693162441254e-06, 6.645917892456055e-06, 8.487142622470856e-06, 1.0328367352485657e-05, 1.2169592082500458e-05, 1.4010816812515259e-05, 1.585204154253006e-05, 1.769326627254486e-05, 1.9534491002559662e-05, 2.1375715732574463e-05, 2.3216940462589264e-05, 2.5058165192604065e-05, 2.6899389922618866e-05, 2.8740614652633667e-05, 3.058183938264847e-05, 3.242306411266327e-05, 3.426428884267807e-05, 3.610551357269287e-05, 3.794673830270767e-05, 3.978796303272247e-05, 4.1629187762737274e-05, 4.3470412492752075e-05, 4.5311637222766876e-05, 4.715286195278168e-05, 4.899408668279648e-05, 5.083531141281128e-05, 5.267653614282608e-05, 5.451776087284088e-05, 5.635898560285568e-05, 5.8200210332870483e-05, 6.0041435062885284e-05, 6.188265979290009e-05, 6.372388452291489e-05, 6.556510925292969e-05]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 2.0, 4.0, 16.0, 14.0, 24.0, 32.0, 59.0, 97.0, 185.0, 349.0, 591.0, 1360.0, 3029.0, 8969.0, 41416.0, 623962.0, 328696.0, 28016.0, 6883.0, 2524.0, 1120.0, 544.0, 283.0, 145.0, 76.0, 56.0, 25.0, 25.0, 12.0, 13.0, 7.0, 2.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11419677734375, -0.11010265350341797, -0.10600852966308594, -0.1019144058227539, -0.09782028198242188, -0.09372615814208984, -0.08963203430175781, -0.08553791046142578, -0.08144378662109375, -0.07734966278076172, -0.07325553894042969, -0.06916141510009766, -0.06506729125976562, -0.060973167419433594, -0.05687904357910156, -0.05278491973876953, -0.0486907958984375, -0.04459667205810547, -0.04050254821777344, -0.036408424377441406, -0.032314300537109375, -0.028220176696777344, -0.024126052856445312, -0.02003192901611328, -0.01593780517578125, -0.011843681335449219, -0.0077495574951171875, -0.0036554336547851562, 0.000438690185546875, 0.004532814025878906, 0.008626937866210938, 0.012721061706542969, 0.016815185546875, 0.02090930938720703, 0.025003433227539062, 0.029097557067871094, 0.033191680908203125, 0.037285804748535156, 0.04137992858886719, 0.04547405242919922, 0.04956817626953125, 0.05366230010986328, 0.05775642395019531, 0.061850547790527344, 0.06594467163085938, 0.0700387954711914, 0.07413291931152344, 0.07822704315185547, 0.0823211669921875, 0.08641529083251953, 0.09050941467285156, 0.0946035385131836, 0.09869766235351562, 0.10279178619384766, 0.10688591003417969, 0.11098003387451172, 0.11507415771484375, 0.11916828155517578, 0.12326240539550781, 0.12735652923583984, 0.13145065307617188, 0.1355447769165039, 0.13963890075683594, 0.14373302459716797, 0.1478271484375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 6.0, 3.0, 5.0, 7.0, 4.0, 8.0, 12.0, 13.0, 18.0, 23.0, 35.0, 51.0, 65.0, 77.0, 100.0, 140.0, 98.0, 89.0, 64.0, 37.0, 31.0, 35.0, 17.0, 19.0, 9.0, 8.0, 9.0, 4.0, 7.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.024383544921875, -0.023694276809692383, -0.023005008697509766, -0.02231574058532715, -0.02162647247314453, -0.020937204360961914, -0.020247936248779297, -0.01955866813659668, -0.018869400024414062, -0.018180131912231445, -0.017490863800048828, -0.01680159568786621, -0.016112327575683594, -0.015423059463500977, -0.01473379135131836, -0.014044523239135742, -0.013355255126953125, -0.012665987014770508, -0.01197671890258789, -0.011287450790405273, -0.010598182678222656, -0.009908914566040039, -0.009219646453857422, -0.008530378341674805, -0.007841110229492188, -0.00715184211730957, -0.006462574005126953, -0.005773305892944336, -0.005084037780761719, -0.0043947696685791016, -0.0037055015563964844, -0.003016233444213867, -0.00232696533203125, -0.0016376972198486328, -0.0009484291076660156, -0.00025916099548339844, 0.00043010711669921875, 0.001119375228881836, 0.0018086433410644531, 0.0024979114532470703, 0.0031871795654296875, 0.0038764476776123047, 0.004565715789794922, 0.005254983901977539, 0.005944252014160156, 0.0066335201263427734, 0.007322788238525391, 0.008012056350708008, 0.008701324462890625, 0.009390592575073242, 0.01007986068725586, 0.010769128799438477, 0.011458396911621094, 0.012147665023803711, 0.012836933135986328, 0.013526201248168945, 0.014215469360351562, 0.01490473747253418, 0.015594005584716797, 0.016283273696899414, 0.01697254180908203, 0.01766180992126465, 0.018351078033447266, 0.019040346145629883, 0.0197296142578125]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 4.0, 5.0, 26.0, 48.0, 204.0, 433.0, 192.0, 55.0, 24.0, 4.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-5.729193687438965, -5.6084513664245605, -5.4877095222473145, -5.36696720123291, -5.246224880218506, -5.125482559204102, -5.0047407150268555, -4.883998394012451, -4.763256072998047, -4.642513751983643, -4.5217719078063965, -4.401029586791992, -4.280287265777588, -4.159544944763184, -4.0388031005859375, -3.918060779571533, -3.797318696975708, -3.676576614379883, -3.5558342933654785, -3.4350922107696533, -3.314349889755249, -3.193607807159424, -3.0728654861450195, -2.9521234035491943, -2.831381320953369, -2.710639238357544, -2.5898969173431396, -2.4691548347473145, -2.34841251373291, -2.227670431137085, -2.1069283485412598, -1.9861860275268555, -1.8654435873031616, -1.7447013854980469, -1.6239591836929321, -1.5032169818878174, -1.3824748992919922, -1.261732578277588, -1.1409904956817627, -1.020248293876648, -0.8995060920715332, -0.7787638902664185, -0.6580216884613037, -0.5372795462608337, -0.416537344455719, -0.29579514265060425, -0.17505300045013428, -0.05431079864501953, 0.06643140316009521, 0.18717359006404877, 0.3079157769680023, 0.4286579489707947, 0.5494001507759094, 0.6701423525810242, 0.7908844947814941, 0.9116266965866089, 1.0323688983917236, 1.1531111001968384, 1.2738533020019531, 1.3945953845977783, 1.5153377056121826, 1.6360797882080078, 1.7568219900131226, 1.8775641918182373, 1.998306393623352]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 4.0, 3.0, 2.0, 13.0, 11.0, 17.0, 21.0, 39.0, 49.0, 53.0, 83.0, 86.0, 102.0, 95.0, 82.0, 89.0, 56.0, 68.0, 47.0, 31.0, 19.0, 13.0, 9.0, 8.0, 3.0, 2.0, 4.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.9014041423797607, -1.8563053607940674, -1.811206579208374, -1.7661077976226807, -1.7210090160369873, -1.675910234451294, -1.6308114528656006, -1.5857127904891968, -1.5406140089035034, -1.49551522731781, -1.4504164457321167, -1.4053176641464233, -1.36021888256073, -1.3151202201843262, -1.2700214385986328, -1.2249226570129395, -1.179823875427246, -1.1347250938415527, -1.0896263122558594, -1.044527530670166, -0.9994288086891174, -0.9543300271034241, -0.9092312455177307, -0.8641325235366821, -0.8190336227416992, -0.7739348411560059, -0.7288360595703125, -0.6837372779846191, -0.6386385560035706, -0.5935397744178772, -0.5484409928321838, -0.5033422708511353, -0.4582434892654419, -0.41314470767974854, -0.36804595589637756, -0.3229471743106842, -0.27784842252731323, -0.23274964094161987, -0.1876508593559265, -0.14255210757255554, -0.09745332598686218, -0.05235455557703972, -0.007255785167217255, 0.03784298896789551, 0.08294175565242767, 0.12804052233695984, 0.1731393039226532, 0.21823805570602417, 0.26333683729171753, 0.3084356188774109, 0.35353437066078186, 0.3986331522464752, 0.4437319040298462, 0.48883068561553955, 0.5339294672012329, 0.5790282487869263, 0.6241270303726196, 0.669225811958313, 0.7143245935440063, 0.7594233751296997, 0.8045220971107483, 0.8496208786964417, 0.894719660282135, 0.9398183822631836, 0.984917163848877]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 7.0, 0.0, 4.0, 15.0, 15.0, 17.0, 37.0, 49.0, 107.0, 176.0, 421.0, 793.0, 1890.0, 5246.0, 23085.0, 703177.0, 290624.0, 15727.0, 4199.0, 1560.0, 678.0, 310.0, 182.0, 74.0, 56.0, 34.0, 21.0, 23.0, 12.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.892578125, -1.8426361083984375, -1.792694091796875, -1.7427520751953125, -1.69281005859375, -1.6428680419921875, -1.592926025390625, -1.5429840087890625, -1.4930419921875, -1.4430999755859375, -1.393157958984375, -1.3432159423828125, -1.29327392578125, -1.2433319091796875, -1.193389892578125, -1.1434478759765625, -1.093505859375, -1.0435638427734375, -0.993621826171875, -0.9436798095703125, -0.89373779296875, -0.8437957763671875, -0.793853759765625, -0.7439117431640625, -0.6939697265625, -0.6440277099609375, -0.594085693359375, -0.5441436767578125, -0.49420166015625, -0.4442596435546875, -0.394317626953125, -0.3443756103515625, -0.29443359375, -0.2444915771484375, -0.194549560546875, -0.1446075439453125, -0.09466552734375, -0.0447235107421875, 0.005218505859375, 0.0551605224609375, 0.1051025390625, 0.1550445556640625, 0.204986572265625, 0.2549285888671875, 0.30487060546875, 0.3548126220703125, 0.404754638671875, 0.4546966552734375, 0.504638671875, 0.5545806884765625, 0.604522705078125, 0.6544647216796875, 0.70440673828125, 0.7543487548828125, 0.804290771484375, 0.8542327880859375, 0.9041748046875, 0.9541168212890625, 1.004058837890625, 1.0540008544921875, 1.10394287109375, 1.1538848876953125, 1.203826904296875, 1.2537689208984375, 1.3037109375]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 6.0, 3.0, 11.0, 15.0, 21.0, 33.0, 55.0, 75.0, 118.0, 123.0, 139.0, 129.0, 93.0, 57.0, 56.0, 37.0, 11.0, 13.0, 7.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.576171875, -2.449005126953125, -2.32183837890625, -2.194671630859375, -2.0675048828125, -1.940338134765625, -1.81317138671875, -1.686004638671875, -1.558837890625, -1.431671142578125, -1.30450439453125, -1.177337646484375, -1.0501708984375, -0.923004150390625, -0.79583740234375, -0.668670654296875, -0.54150390625, -0.414337158203125, -0.28717041015625, -0.160003662109375, -0.0328369140625, 0.094329833984375, 0.22149658203125, 0.348663330078125, 0.475830078125, 0.602996826171875, 0.73016357421875, 0.857330322265625, 0.9844970703125, 1.111663818359375, 1.23883056640625, 1.365997314453125, 1.4931640625, 1.620330810546875, 1.74749755859375, 1.874664306640625, 2.0018310546875, 2.128997802734375, 2.25616455078125, 2.383331298828125, 2.510498046875, 2.637664794921875, 2.76483154296875, 2.891998291015625, 3.0191650390625, 3.146331787109375, 3.27349853515625, 3.400665283203125, 3.52783203125, 3.654998779296875, 3.78216552734375, 3.909332275390625, 4.0364990234375, 4.163665771484375, 4.29083251953125, 4.417999267578125, 4.545166015625, 4.672332763671875, 4.79949951171875, 4.926666259765625, 5.0538330078125, 5.180999755859375, 5.30816650390625, 5.435333251953125, 5.5625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 4.0, 1.0, 7.0, 4.0, 6.0, 10.0, 15.0, 13.0, 23.0, 44.0, 67.0, 69.0, 116.0, 202.0, 342.0, 598.0, 1440.0, 4065.0, 17497.0, 621294.0, 381574.0, 14793.0, 3621.0, 1311.0, 629.0, 322.0, 169.0, 116.0, 55.0, 38.0, 33.0, 25.0, 11.0, 13.0, 11.0, 6.0, 3.0, 5.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.5927734375, -1.54443359375, -1.49609375, -1.44775390625, -1.3994140625, -1.35107421875, -1.302734375, -1.25439453125, -1.2060546875, -1.15771484375, -1.109375, -1.06103515625, -1.0126953125, -0.96435546875, -0.916015625, -0.86767578125, -0.8193359375, -0.77099609375, -0.72265625, -0.67431640625, -0.6259765625, -0.57763671875, -0.529296875, -0.48095703125, -0.4326171875, -0.38427734375, -0.3359375, -0.28759765625, -0.2392578125, -0.19091796875, -0.142578125, -0.09423828125, -0.0458984375, 0.00244140625, 0.05078125, 0.09912109375, 0.1474609375, 0.19580078125, 0.244140625, 0.29248046875, 0.3408203125, 0.38916015625, 0.4375, 0.48583984375, 0.5341796875, 0.58251953125, 0.630859375, 0.67919921875, 0.7275390625, 0.77587890625, 0.82421875, 0.87255859375, 0.9208984375, 0.96923828125, 1.017578125, 1.06591796875, 1.1142578125, 1.16259765625, 1.2109375, 1.25927734375, 1.3076171875, 1.35595703125, 1.404296875, 1.45263671875, 1.5009765625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 5.0, 4.0, 5.0, 6.0, 4.0, 14.0, 11.0, 15.0, 15.0, 10.0, 21.0, 18.0, 17.0, 23.0, 31.0, 27.0, 28.0, 15.0, 34.0, 40.0, 53.0, 41.0, 36.0, 43.0, 34.0, 41.0, 39.0, 33.0, 41.0, 27.0, 29.0, 30.0, 19.0, 38.0, 22.0, 20.0, 19.0, 18.0, 13.0, 7.0, 10.0, 9.0, 9.0, 3.0, 4.0, 5.0, 4.0, 4.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0], "bins": [-1.505859375, -1.4591217041015625, -1.412384033203125, -1.3656463623046875, -1.31890869140625, -1.2721710205078125, -1.225433349609375, -1.1786956787109375, -1.1319580078125, -1.0852203369140625, -1.038482666015625, -0.9917449951171875, -0.94500732421875, -0.8982696533203125, -0.851531982421875, -0.8047943115234375, -0.758056640625, -0.7113189697265625, -0.664581298828125, -0.6178436279296875, -0.57110595703125, -0.5243682861328125, -0.477630615234375, -0.4308929443359375, -0.3841552734375, -0.3374176025390625, -0.290679931640625, -0.2439422607421875, -0.19720458984375, -0.1504669189453125, -0.103729248046875, -0.0569915771484375, -0.01025390625, 0.0364837646484375, 0.083221435546875, 0.1299591064453125, 0.17669677734375, 0.2234344482421875, 0.270172119140625, 0.3169097900390625, 0.3636474609375, 0.4103851318359375, 0.457122802734375, 0.5038604736328125, 0.55059814453125, 0.5973358154296875, 0.644073486328125, 0.6908111572265625, 0.737548828125, 0.7842864990234375, 0.831024169921875, 0.8777618408203125, 0.92449951171875, 0.9712371826171875, 1.017974853515625, 1.0647125244140625, 1.1114501953125, 1.1581878662109375, 1.204925537109375, 1.2516632080078125, 1.29840087890625, 1.3451385498046875, 1.391876220703125, 1.4386138916015625, 1.4853515625]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 7.0, 5.0, 6.0, 11.0, 11.0, 19.0, 32.0, 49.0, 61.0, 68.0, 125.0, 209.0, 328.0, 520.0, 1078.0, 2222.0, 5485.0, 19302.0, 253061.0, 724926.0, 28389.0, 7054.0, 2698.0, 1233.0, 630.0, 367.0, 208.0, 129.0, 108.0, 60.0, 39.0, 26.0, 28.0, 11.0, 6.0, 8.0, 8.0, 7.0, 4.0, 3.0, 4.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4541015625, -0.4403877258300781, -0.42667388916015625, -0.4129600524902344, -0.3992462158203125, -0.3855323791503906, -0.37181854248046875, -0.3581047058105469, -0.344390869140625, -0.3306770324707031, -0.31696319580078125, -0.3032493591308594, -0.2895355224609375, -0.2758216857910156, -0.26210784912109375, -0.24839401245117188, -0.23468017578125, -0.22096633911132812, -0.20725250244140625, -0.19353866577148438, -0.1798248291015625, -0.16611099243164062, -0.15239715576171875, -0.13868331909179688, -0.124969482421875, -0.11125564575195312, -0.09754180908203125, -0.08382797241210938, -0.0701141357421875, -0.056400299072265625, -0.04268646240234375, -0.028972625732421875, -0.0152587890625, -0.001544952392578125, 0.01216888427734375, 0.025882720947265625, 0.0395965576171875, 0.053310394287109375, 0.06702423095703125, 0.08073806762695312, 0.094451904296875, 0.10816574096679688, 0.12187957763671875, 0.13559341430664062, 0.1493072509765625, 0.16302108764648438, 0.17673492431640625, 0.19044876098632812, 0.20416259765625, 0.21787643432617188, 0.23159027099609375, 0.24530410766601562, 0.2590179443359375, 0.2727317810058594, 0.28644561767578125, 0.3001594543457031, 0.313873291015625, 0.3275871276855469, 0.34130096435546875, 0.3550148010253906, 0.3687286376953125, 0.3824424743652344, 0.39615631103515625, 0.4098701477050781, 0.423583984375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 6.0, 10.0, 15.0, 22.0, 38.0, 76.0, 153.0, 283.0, 174.0, 86.0, 49.0, 36.0, 14.0, 6.0, 6.0, 8.0, 4.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.4849853515625e-05, -6.266124546527863e-05, -6.047263741493225e-05, -5.8284029364585876e-05, -5.60954213142395e-05, -5.390681326389313e-05, -5.171820521354675e-05, -4.952959716320038e-05, -4.7340989112854004e-05, -4.515238106250763e-05, -4.2963773012161255e-05, -4.077516496181488e-05, -3.8586556911468506e-05, -3.639794886112213e-05, -3.420934081077576e-05, -3.202073276042938e-05, -2.9832124710083008e-05, -2.7643516659736633e-05, -2.545490860939026e-05, -2.3266300559043884e-05, -2.107769250869751e-05, -1.8889084458351135e-05, -1.670047640800476e-05, -1.4511868357658386e-05, -1.2323260307312012e-05, -1.0134652256965637e-05, -7.946044206619263e-06, -5.757436156272888e-06, -3.5688281059265137e-06, -1.3802200555801392e-06, 8.083879947662354e-07, 2.99699604511261e-06, 5.185604095458984e-06, 7.374212145805359e-06, 9.562820196151733e-06, 1.1751428246498108e-05, 1.3940036296844482e-05, 1.6128644347190857e-05, 1.831725239753723e-05, 2.0505860447883606e-05, 2.269446849822998e-05, 2.4883076548576355e-05, 2.707168459892273e-05, 2.9260292649269104e-05, 3.144890069961548e-05, 3.363750874996185e-05, 3.582611680030823e-05, 3.80147248506546e-05, 4.0203332901000977e-05, 4.239194095134735e-05, 4.4580549001693726e-05, 4.67691570520401e-05, 4.8957765102386475e-05, 5.114637315273285e-05, 5.3334981203079224e-05, 5.55235892534256e-05, 5.771219730377197e-05, 5.990080535411835e-05, 6.208941340446472e-05, 6.42780214548111e-05, 6.646662950515747e-05, 6.865523755550385e-05, 7.084384560585022e-05, 7.30324536561966e-05, 7.522106170654297e-05]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 8.0, 5.0, 8.0, 13.0, 6.0, 16.0, 22.0, 22.0, 62.0, 81.0, 147.0, 314.0, 679.0, 1864.0, 5856.0, 31259.0, 913260.0, 80837.0, 9608.0, 2692.0, 909.0, 411.0, 197.0, 100.0, 56.0, 27.0, 29.0, 16.0, 12.0, 7.0, 8.0, 4.0, 2.0, 5.0, 2.0, 5.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.6728515625, -0.6545028686523438, -0.6361541748046875, -0.6178054809570312, -0.599456787109375, -0.5811080932617188, -0.5627593994140625, -0.5444107055664062, -0.52606201171875, -0.5077133178710938, -0.4893646240234375, -0.47101593017578125, -0.452667236328125, -0.43431854248046875, -0.4159698486328125, -0.39762115478515625, -0.3792724609375, -0.36092376708984375, -0.3425750732421875, -0.32422637939453125, -0.305877685546875, -0.28752899169921875, -0.2691802978515625, -0.25083160400390625, -0.23248291015625, -0.21413421630859375, -0.1957855224609375, -0.17743682861328125, -0.159088134765625, -0.14073944091796875, -0.1223907470703125, -0.10404205322265625, -0.085693359375, -0.06734466552734375, -0.0489959716796875, -0.03064727783203125, -0.012298583984375, 0.00605010986328125, 0.0243988037109375, 0.04274749755859375, 0.06109619140625, 0.07944488525390625, 0.0977935791015625, 0.11614227294921875, 0.134490966796875, 0.15283966064453125, 0.1711883544921875, 0.18953704833984375, 0.2078857421875, 0.22623443603515625, 0.2445831298828125, 0.26293182373046875, 0.281280517578125, 0.29962921142578125, 0.3179779052734375, 0.33632659912109375, 0.35467529296875, 0.37302398681640625, 0.3913726806640625, 0.40972137451171875, 0.428070068359375, 0.44641876220703125, 0.4647674560546875, 0.48311614990234375, 0.50146484375]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 3.0, 4.0, 0.0, 2.0, 9.0, 12.0, 17.0, 24.0, 13.0, 32.0, 75.0, 137.0, 245.0, 188.0, 86.0, 42.0, 27.0, 18.0, 14.0, 15.0, 6.0, 8.0, 4.0, 6.0, 1.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.174072265625, -0.16821861267089844, -0.16236495971679688, -0.1565113067626953, -0.15065765380859375, -0.1448040008544922, -0.13895034790039062, -0.13309669494628906, -0.1272430419921875, -0.12138938903808594, -0.11553573608398438, -0.10968208312988281, -0.10382843017578125, -0.09797477722167969, -0.09212112426757812, -0.08626747131347656, -0.080413818359375, -0.07456016540527344, -0.06870651245117188, -0.06285285949707031, -0.05699920654296875, -0.05114555358886719, -0.045291900634765625, -0.03943824768066406, -0.0335845947265625, -0.027730941772460938, -0.021877288818359375, -0.016023635864257812, -0.01016998291015625, -0.0043163299560546875, 0.001537322998046875, 0.0073909759521484375, 0.01324462890625, 0.019098281860351562, 0.024951934814453125, 0.030805587768554688, 0.03665924072265625, 0.04251289367675781, 0.048366546630859375, 0.05422019958496094, 0.0600738525390625, 0.06592750549316406, 0.07178115844726562, 0.07763481140136719, 0.08348846435546875, 0.08934211730957031, 0.09519577026367188, 0.10104942321777344, 0.106903076171875, 0.11275672912597656, 0.11861038208007812, 0.12446403503417969, 0.13031768798828125, 0.1361713409423828, 0.14202499389648438, 0.14787864685058594, 0.1537322998046875, 0.15958595275878906, 0.16543960571289062, 0.1712932586669922, 0.17714691162109375, 0.1830005645751953, 0.18885421752929688, 0.19470787048339844, 0.2005615234375]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 6.0, 3.0, 8.0, 17.0, 29.0, 47.0, 96.0, 216.0, 258.0, 149.0, 87.0, 42.0, 19.0, 12.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.628633975982666, -4.489284515380859, -4.349935054779053, -4.210585594177246, -4.0712361335754395, -3.931886672973633, -3.792536973953247, -3.6531875133514404, -3.513838052749634, -3.374488592147827, -3.2351391315460205, -3.095789670944214, -2.956439971923828, -2.8170905113220215, -2.677741050720215, -2.538391590118408, -2.3990421295166016, -2.259692668914795, -2.1203432083129883, -1.980993628501892, -1.8416441679000854, -1.7022947072982788, -1.5629451274871826, -1.423595666885376, -1.2842462062835693, -1.1448967456817627, -1.005547285079956, -0.8661977052688599, -0.7268482446670532, -0.5874987840652466, -0.44814926385879517, -0.30879974365234375, -0.1694507598876953, -0.030101269483566284, 0.10924822092056274, 0.24859771132469177, 0.3879472017288208, 0.5272966623306274, 0.6666461825370789, 0.8059957027435303, 0.9453451633453369, 1.0846946239471436, 1.2240440845489502, 1.3633936643600464, 1.502743124961853, 1.6420925855636597, 1.7814421653747559, 1.9207916259765625, 2.060141086578369, 2.199490547180176, 2.3388400077819824, 2.478189468383789, 2.6175389289855957, 2.7568883895874023, 2.896238088607788, 3.0355875492095947, 3.1749370098114014, 3.314286470413208, 3.4536359310150146, 3.5929853916168213, 3.732335090637207, 3.8716845512390137, 4.01103401184082, 4.150383472442627, 4.289732933044434]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 4.0, 10.0, 11.0, 15.0, 20.0, 18.0, 24.0, 32.0, 22.0, 37.0, 41.0, 49.0, 62.0, 52.0, 50.0, 64.0, 78.0, 53.0, 68.0, 31.0, 50.0, 36.0, 32.0, 35.0, 33.0, 23.0, 21.0, 9.0, 5.0, 5.0, 3.0, 7.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9645183086395264, -2.838589668273926, -2.7126612663269043, -2.5867326259613037, -2.4608042240142822, -2.3348755836486816, -2.20894718170166, -2.0830185413360596, -1.9570900201797485, -1.8311614990234375, -1.7052329778671265, -1.5793044567108154, -1.4533758163452148, -1.3274474143981934, -1.2015187740325928, -1.0755902528762817, -0.9496617317199707, -0.8237332105636597, -0.6978046894073486, -0.5718761086463928, -0.4459475874900818, -0.32001906633377075, -0.19409048557281494, -0.0681619644165039, 0.05776655673980713, 0.18369509279727936, 0.3096236288547516, 0.435552179813385, 0.561480700969696, 0.6874092221260071, 0.8133378028869629, 0.9392663240432739, 1.065195083618164, 1.191123604774475, 1.3170521259307861, 1.4429807662963867, 1.5689091682434082, 1.6948378086090088, 1.8207663297653198, 1.9466948509216309, 2.0726232528686523, 2.198551893234253, 2.3244802951812744, 2.450408935546875, 2.5763373374938965, 2.702265977859497, 2.8281946182250977, 2.954123020172119, 3.0800516605377197, 3.2059803009033203, 3.331908702850342, 3.4578373432159424, 3.583765745162964, 3.7096943855285645, 3.835622787475586, 3.9615514278411865, 4.087480068206787, 4.213408470153809, 4.339337348937988, 4.46526575088501, 4.591194152832031, 4.717122554779053, 4.843051433563232, 4.968979835510254, 5.094908237457275]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 5.0, 9.0, 8.0, 11.0, 28.0, 29.0, 47.0, 79.0, 174.0, 269.0, 567.0, 1381.0, 5354.0, 120878.0, 3994405.0, 63151.0, 4865.0, 1897.0, 537.0, 245.0, 136.0, 80.0, 46.0, 30.0, 21.0, 12.0, 8.0, 2.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-5.203125, -5.08331298828125, -4.9635009765625, -4.84368896484375, -4.723876953125, -4.60406494140625, -4.4842529296875, -4.36444091796875, -4.24462890625, -4.12481689453125, -4.0050048828125, -3.88519287109375, -3.765380859375, -3.64556884765625, -3.5257568359375, -3.40594482421875, -3.2861328125, -3.16632080078125, -3.0465087890625, -2.92669677734375, -2.806884765625, -2.68707275390625, -2.5672607421875, -2.44744873046875, -2.32763671875, -2.20782470703125, -2.0880126953125, -1.96820068359375, -1.848388671875, -1.72857666015625, -1.6087646484375, -1.48895263671875, -1.369140625, -1.24932861328125, -1.1295166015625, -1.00970458984375, -0.889892578125, -0.77008056640625, -0.6502685546875, -0.53045654296875, -0.41064453125, -0.29083251953125, -0.1710205078125, -0.05120849609375, 0.068603515625, 0.18841552734375, 0.3082275390625, 0.42803955078125, 0.5478515625, 0.66766357421875, 0.7874755859375, 0.90728759765625, 1.027099609375, 1.14691162109375, 1.2667236328125, 1.38653564453125, 1.50634765625, 1.62615966796875, 1.7459716796875, 1.86578369140625, 1.985595703125, 2.10540771484375, 2.2252197265625, 2.34503173828125, 2.46484375]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 3.0, 8.0, 8.0, 7.0, 15.0, 24.0, 46.0, 50.0, 56.0, 84.0, 90.0, 109.0, 100.0, 87.0, 87.0, 62.0, 56.0, 35.0, 23.0, 12.0, 17.0, 7.0, 6.0, 4.0, 0.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.322265625, -2.2640838623046875, -2.205902099609375, -2.1477203369140625, -2.08953857421875, -2.0313568115234375, -1.973175048828125, -1.9149932861328125, -1.8568115234375, -1.7986297607421875, -1.740447998046875, -1.6822662353515625, -1.62408447265625, -1.5659027099609375, -1.507720947265625, -1.4495391845703125, -1.391357421875, -1.3331756591796875, -1.274993896484375, -1.2168121337890625, -1.15863037109375, -1.1004486083984375, -1.042266845703125, -0.9840850830078125, -0.9259033203125, -0.8677215576171875, -0.809539794921875, -0.7513580322265625, -0.69317626953125, -0.6349945068359375, -0.576812744140625, -0.5186309814453125, -0.46044921875, -0.4022674560546875, -0.344085693359375, -0.2859039306640625, -0.22772216796875, -0.1695404052734375, -0.111358642578125, -0.0531768798828125, 0.0050048828125, 0.0631866455078125, 0.121368408203125, 0.1795501708984375, 0.23773193359375, 0.2959136962890625, 0.354095458984375, 0.4122772216796875, 0.470458984375, 0.5286407470703125, 0.586822509765625, 0.6450042724609375, 0.70318603515625, 0.7613677978515625, 0.819549560546875, 0.8777313232421875, 0.9359130859375, 0.9940948486328125, 1.052276611328125, 1.1104583740234375, 1.16864013671875, 1.2268218994140625, 1.285003662109375, 1.3431854248046875, 1.4013671875]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 4.0, 7.0, 15.0, 9.0, 18.0, 35.0, 75.0, 116.0, 259.0, 594.0, 1912.0, 8790.0, 271441.0, 3890439.0, 16413.0, 2678.0, 808.0, 311.0, 143.0, 85.0, 48.0, 23.0, 19.0, 11.0, 12.0, 2.0, 5.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.06640625, -4.936981201171875, -4.80755615234375, -4.678131103515625, -4.5487060546875, -4.419281005859375, -4.28985595703125, -4.160430908203125, -4.031005859375, -3.901580810546875, -3.77215576171875, -3.642730712890625, -3.5133056640625, -3.383880615234375, -3.25445556640625, -3.125030517578125, -2.99560546875, -2.866180419921875, -2.73675537109375, -2.607330322265625, -2.4779052734375, -2.348480224609375, -2.21905517578125, -2.089630126953125, -1.960205078125, -1.830780029296875, -1.70135498046875, -1.571929931640625, -1.4425048828125, -1.313079833984375, -1.18365478515625, -1.054229736328125, -0.9248046875, -0.795379638671875, -0.66595458984375, -0.536529541015625, -0.4071044921875, -0.277679443359375, -0.14825439453125, -0.018829345703125, 0.110595703125, 0.240020751953125, 0.36944580078125, 0.498870849609375, 0.6282958984375, 0.757720947265625, 0.88714599609375, 1.016571044921875, 1.14599609375, 1.275421142578125, 1.40484619140625, 1.534271240234375, 1.6636962890625, 1.793121337890625, 1.92254638671875, 2.051971435546875, 2.181396484375, 2.310821533203125, 2.44024658203125, 2.569671630859375, 2.6990966796875, 2.828521728515625, 2.95794677734375, 3.087371826171875, 3.216796875]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 10.0, 3.0, 16.0, 19.0, 14.0, 34.0, 73.0, 307.0, 1480.0, 1544.0, 376.0, 97.0, 44.0, 14.0, 13.0, 8.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69873046875, -0.6707687377929688, -0.6428070068359375, -0.6148452758789062, -0.586883544921875, -0.5589218139648438, -0.5309600830078125, -0.5029983520507812, -0.47503662109375, -0.44707489013671875, -0.4191131591796875, -0.39115142822265625, -0.363189697265625, -0.33522796630859375, -0.3072662353515625, -0.27930450439453125, -0.2513427734375, -0.22338104248046875, -0.1954193115234375, -0.16745758056640625, -0.139495849609375, -0.11153411865234375, -0.0835723876953125, -0.05561065673828125, -0.02764892578125, 0.00031280517578125, 0.0282745361328125, 0.05623626708984375, 0.084197998046875, 0.11215972900390625, 0.1401214599609375, 0.16808319091796875, 0.196044921875, 0.22400665283203125, 0.2519683837890625, 0.27993011474609375, 0.307891845703125, 0.33585357666015625, 0.3638153076171875, 0.39177703857421875, 0.41973876953125, 0.44770050048828125, 0.4756622314453125, 0.5036239624023438, 0.531585693359375, 0.5595474243164062, 0.5875091552734375, 0.6154708862304688, 0.6434326171875, 0.6713943481445312, 0.6993560791015625, 0.7273178100585938, 0.755279541015625, 0.7832412719726562, 0.8112030029296875, 0.8391647338867188, 0.86712646484375, 0.8950881958007812, 0.9230499267578125, 0.9510116577148438, 0.978973388671875, 1.0069351196289062, 1.0348968505859375, 1.0628585815429688, 1.0908203125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 6.0, 3.0, 4.0, 12.0, 16.0, 39.0, 62.0, 142.0, 231.0, 237.0, 126.0, 50.0, 28.0, 21.0, 10.0, 11.0, 1.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.6737101078033447, -3.565480947494507, -3.457251787185669, -3.349022626876831, -3.2407937049865723, -3.1325645446777344, -3.0243353843688965, -2.9161062240600586, -2.8078770637512207, -2.699647903442383, -2.591418743133545, -2.483189582824707, -2.374960422515869, -2.2667312622070312, -2.1585023403167725, -2.0502731800079346, -1.9420440196990967, -1.8338148593902588, -1.725585699081421, -1.6173566579818726, -1.5091274976730347, -1.4008983373641968, -1.2926692962646484, -1.1844401359558105, -1.0762109756469727, -0.9679818153381348, -0.8597527146339417, -0.7515236139297485, -0.6432944536209106, -0.5350652933120728, -0.42683619260787964, -0.3186070919036865, -0.21037769317626953, -0.10214856266975403, 0.006080567836761475, 0.11430969834327698, 0.22253882884979248, 0.33076798915863037, 0.4389970898628235, 0.5472261905670166, 0.6554553508758545, 0.7636845111846924, 0.8719136118888855, 0.9801427125930786, 1.0883718729019165, 1.1966010332107544, 1.3048300743103027, 1.4130592346191406, 1.5212883949279785, 1.6295175552368164, 1.7377467155456543, 1.8459757566452026, 1.9542049169540405, 2.062434196472168, 2.1706631183624268, 2.2788922786712646, 2.3871214389801025, 2.4953505992889404, 2.6035797595977783, 2.711808919906616, 2.820037841796875, 2.928267002105713, 3.036496162414551, 3.1447253227233887, 3.2529544830322266]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 4.0, 6.0, 17.0, 12.0, 21.0, 29.0, 32.0, 41.0, 70.0, 62.0, 66.0, 82.0, 80.0, 88.0, 66.0, 73.0, 63.0, 56.0, 37.0, 37.0, 16.0, 14.0, 9.0, 5.0, 6.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9855552911758423, -1.9296249151229858, -1.8736945390701294, -1.817764163017273, -1.7618337869644165, -1.70590341091156, -1.6499730348587036, -1.5940426588058472, -1.5381122827529907, -1.4821819067001343, -1.4262515306472778, -1.3703211545944214, -1.314390778541565, -1.2584604024887085, -1.202530026435852, -1.1465996503829956, -1.0906693935394287, -1.0347390174865723, -0.9788086414337158, -0.9228782653808594, -0.8669478893280029, -0.8110175132751465, -0.75508713722229, -0.6991567611694336, -0.6432263851165771, -0.5872960090637207, -0.5313656330108643, -0.4754352569580078, -0.41950488090515137, -0.3635745346546173, -0.30764415860176086, -0.2517137825489044, -0.19578337669372559, -0.13985300064086914, -0.08392263203859329, -0.027992263436317444, 0.027938112616539, 0.08386847376823425, 0.1397988498210907, 0.19572922587394714, 0.2516596019268036, 0.30758997797966003, 0.3635203540325165, 0.41945070028305054, 0.475381076335907, 0.5313114523887634, 0.5872418284416199, 0.6431722044944763, 0.6991025805473328, 0.7550329566001892, 0.8109633326530457, 0.8668937087059021, 0.9228240847587585, 0.9787544012069702, 1.0346847772598267, 1.090615153312683, 1.1465455293655396, 1.202475905418396, 1.2584062814712524, 1.3143366575241089, 1.3702670335769653, 1.4261974096298218, 1.4821277856826782, 1.5380581617355347, 1.5939885377883911]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 11.0, 5.0, 9.0, 12.0, 10.0, 17.0, 27.0, 41.0, 55.0, 66.0, 128.0, 223.0, 491.0, 1025.0, 2941.0, 8834.0, 33302.0, 193004.0, 658880.0, 116154.0, 22947.0, 6427.0, 2202.0, 843.0, 400.0, 183.0, 119.0, 61.0, 47.0, 28.0, 15.0, 11.0, 12.0, 8.0, 9.0, 6.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.240478515625, -0.23200225830078125, -0.2235260009765625, -0.21504974365234375, -0.206573486328125, -0.19809722900390625, -0.1896209716796875, -0.18114471435546875, -0.17266845703125, -0.16419219970703125, -0.1557159423828125, -0.14723968505859375, -0.138763427734375, -0.13028717041015625, -0.1218109130859375, -0.11333465576171875, -0.1048583984375, -0.09638214111328125, -0.0879058837890625, -0.07942962646484375, -0.070953369140625, -0.06247711181640625, -0.0540008544921875, -0.04552459716796875, -0.03704833984375, -0.02857208251953125, -0.0200958251953125, -0.01161956787109375, -0.003143310546875, 0.00533294677734375, 0.0138092041015625, 0.02228546142578125, 0.03076171875, 0.03923797607421875, 0.0477142333984375, 0.05619049072265625, 0.064666748046875, 0.07314300537109375, 0.0816192626953125, 0.09009552001953125, 0.09857177734375, 0.10704803466796875, 0.1155242919921875, 0.12400054931640625, 0.132476806640625, 0.14095306396484375, 0.1494293212890625, 0.15790557861328125, 0.1663818359375, 0.17485809326171875, 0.1833343505859375, 0.19181060791015625, 0.200286865234375, 0.20876312255859375, 0.2172393798828125, 0.22571563720703125, 0.23419189453125, 0.24266815185546875, 0.2511444091796875, 0.25962066650390625, 0.268096923828125, 0.27657318115234375, 0.2850494384765625, 0.29352569580078125, 0.302001953125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 11.0, 7.0, 8.0, 20.0, 23.0, 36.0, 49.0, 70.0, 79.0, 97.0, 120.0, 98.0, 113.0, 84.0, 69.0, 42.0, 33.0, 17.0, 10.0, 10.0, 6.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.060546875, -2.0111541748046875, -1.961761474609375, -1.9123687744140625, -1.86297607421875, -1.8135833740234375, -1.764190673828125, -1.7147979736328125, -1.6654052734375, -1.6160125732421875, -1.566619873046875, -1.5172271728515625, -1.46783447265625, -1.4184417724609375, -1.369049072265625, -1.3196563720703125, -1.270263671875, -1.2208709716796875, -1.171478271484375, -1.1220855712890625, -1.07269287109375, -1.0233001708984375, -0.973907470703125, -0.9245147705078125, -0.8751220703125, -0.8257293701171875, -0.776336669921875, -0.7269439697265625, -0.67755126953125, -0.6281585693359375, -0.578765869140625, -0.5293731689453125, -0.47998046875, -0.4305877685546875, -0.381195068359375, -0.3318023681640625, -0.28240966796875, -0.2330169677734375, -0.183624267578125, -0.1342315673828125, -0.0848388671875, -0.0354461669921875, 0.013946533203125, 0.0633392333984375, 0.11273193359375, 0.1621246337890625, 0.211517333984375, 0.2609100341796875, 0.310302734375, 0.3596954345703125, 0.409088134765625, 0.4584808349609375, 0.50787353515625, 0.5572662353515625, 0.606658935546875, 0.6560516357421875, 0.7054443359375, 0.7548370361328125, 0.804229736328125, 0.8536224365234375, 0.90301513671875, 0.9524078369140625, 1.001800537109375, 1.0511932373046875, 1.1005859375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 4.0, 5.0, 11.0, 11.0, 17.0, 17.0, 34.0, 36.0, 49.0, 78.0, 114.0, 184.0, 265.0, 418.0, 681.0, 1276.0, 2469.0, 5341.0, 12929.0, 36642.0, 124762.0, 505197.0, 257423.0, 64055.0, 20859.0, 7931.0, 3522.0, 1780.0, 876.0, 546.0, 326.0, 224.0, 142.0, 96.0, 61.0, 47.0, 37.0, 25.0, 16.0, 17.0, 8.0, 8.0, 2.0, 7.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1485595703125, -0.1433887481689453, -0.13821792602539062, -0.13304710388183594, -0.12787628173828125, -0.12270545959472656, -0.11753463745117188, -0.11236381530761719, -0.1071929931640625, -0.10202217102050781, -0.09685134887695312, -0.09168052673339844, -0.08650970458984375, -0.08133888244628906, -0.07616806030273438, -0.07099723815917969, -0.065826416015625, -0.06065559387207031, -0.055484771728515625, -0.05031394958496094, -0.04514312744140625, -0.03997230529785156, -0.034801483154296875, -0.029630661010742188, -0.0244598388671875, -0.019289016723632812, -0.014118194580078125, -0.008947372436523438, -0.00377655029296875, 0.0013942718505859375, 0.006565093994140625, 0.011735916137695312, 0.01690673828125, 0.022077560424804688, 0.027248382568359375, 0.03241920471191406, 0.03759002685546875, 0.04276084899902344, 0.047931671142578125, 0.05310249328613281, 0.0582733154296875, 0.06344413757324219, 0.06861495971679688, 0.07378578186035156, 0.07895660400390625, 0.08412742614746094, 0.08929824829101562, 0.09446907043457031, 0.099639892578125, 0.10481071472167969, 0.10998153686523438, 0.11515235900878906, 0.12032318115234375, 0.12549400329589844, 0.13066482543945312, 0.1358356475830078, 0.1410064697265625, 0.1461772918701172, 0.15134811401367188, 0.15651893615722656, 0.16168975830078125, 0.16686058044433594, 0.17203140258789062, 0.1772022247314453, 0.182373046875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 4.0, 7.0, 11.0, 11.0, 14.0, 14.0, 10.0, 21.0, 12.0, 26.0, 25.0, 24.0, 31.0, 29.0, 27.0, 33.0, 44.0, 50.0, 63.0, 59.0, 50.0, 56.0, 55.0, 41.0, 30.0, 40.0, 43.0, 28.0, 29.0, 22.0, 15.0, 17.0, 13.0, 14.0, 6.0, 4.0, 9.0, 3.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2197265625, -1.1776580810546875, -1.135589599609375, -1.0935211181640625, -1.05145263671875, -1.0093841552734375, -0.967315673828125, -0.9252471923828125, -0.8831787109375, -0.8411102294921875, -0.799041748046875, -0.7569732666015625, -0.71490478515625, -0.6728363037109375, -0.630767822265625, -0.5886993408203125, -0.546630859375, -0.5045623779296875, -0.462493896484375, -0.4204254150390625, -0.37835693359375, -0.3362884521484375, -0.294219970703125, -0.2521514892578125, -0.2100830078125, -0.1680145263671875, -0.125946044921875, -0.0838775634765625, -0.04180908203125, 0.0002593994140625, 0.042327880859375, 0.0843963623046875, 0.12646484375, 0.1685333251953125, 0.210601806640625, 0.2526702880859375, 0.29473876953125, 0.3368072509765625, 0.378875732421875, 0.4209442138671875, 0.4630126953125, 0.5050811767578125, 0.547149658203125, 0.5892181396484375, 0.63128662109375, 0.6733551025390625, 0.715423583984375, 0.7574920654296875, 0.799560546875, 0.8416290283203125, 0.883697509765625, 0.9257659912109375, 0.96783447265625, 1.0099029541015625, 1.051971435546875, 1.0940399169921875, 1.1361083984375, 1.1781768798828125, 1.220245361328125, 1.2623138427734375, 1.30438232421875, 1.3464508056640625, 1.388519287109375, 1.4305877685546875, 1.47265625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 9.0, 6.0, 14.0, 13.0, 16.0, 29.0, 51.0, 53.0, 89.0, 191.0, 265.0, 478.0, 985.0, 2166.0, 5905.0, 20534.0, 123271.0, 733148.0, 129521.0, 21549.0, 5891.0, 2161.0, 1016.0, 460.0, 301.0, 143.0, 92.0, 66.0, 39.0, 27.0, 15.0, 19.0, 15.0, 5.0, 7.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0618896484375, -0.059861183166503906, -0.05783271789550781, -0.05580425262451172, -0.053775787353515625, -0.05174732208251953, -0.04971885681152344, -0.047690391540527344, -0.04566192626953125, -0.043633460998535156, -0.04160499572753906, -0.03957653045654297, -0.037548065185546875, -0.03551959991455078, -0.03349113464355469, -0.031462669372558594, -0.0294342041015625, -0.027405738830566406, -0.025377273559570312, -0.02334880828857422, -0.021320343017578125, -0.01929187774658203, -0.017263412475585938, -0.015234947204589844, -0.01320648193359375, -0.011178016662597656, -0.009149551391601562, -0.007121086120605469, -0.005092620849609375, -0.0030641555786132812, -0.0010356903076171875, 0.0009927749633789062, 0.003021240234375, 0.005049705505371094, 0.0070781707763671875, 0.009106636047363281, 0.011135101318359375, 0.013163566589355469, 0.015192031860351562, 0.017220497131347656, 0.01924896240234375, 0.021277427673339844, 0.023305892944335938, 0.02533435821533203, 0.027362823486328125, 0.02939128875732422, 0.03141975402832031, 0.033448219299316406, 0.0354766845703125, 0.037505149841308594, 0.03953361511230469, 0.04156208038330078, 0.043590545654296875, 0.04561901092529297, 0.04764747619628906, 0.049675941467285156, 0.05170440673828125, 0.053732872009277344, 0.05576133728027344, 0.05778980255126953, 0.059818267822265625, 0.06184673309326172, 0.06387519836425781, 0.0659036636352539, 0.06793212890625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 2.0, 9.0, 11.0, 16.0, 22.0, 37.0, 62.0, 122.0, 170.0, 214.0, 147.0, 88.0, 44.0, 27.0, 11.0, 9.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.574392318725586e-05, -6.418582051992416e-05, -6.262771785259247e-05, -6.106961518526077e-05, -5.951151251792908e-05, -5.795340985059738e-05, -5.6395307183265686e-05, -5.483720451593399e-05, -5.3279101848602295e-05, -5.17209991812706e-05, -5.0162896513938904e-05, -4.860479384660721e-05, -4.704669117927551e-05, -4.548858851194382e-05, -4.393048584461212e-05, -4.2372383177280426e-05, -4.081428050994873e-05, -3.9256177842617035e-05, -3.769807517528534e-05, -3.6139972507953644e-05, -3.458186984062195e-05, -3.302376717329025e-05, -3.146566450595856e-05, -2.990756183862686e-05, -2.8349459171295166e-05, -2.679135650396347e-05, -2.5233253836631775e-05, -2.367515116930008e-05, -2.2117048501968384e-05, -2.0558945834636688e-05, -1.9000843167304993e-05, -1.7442740499973297e-05, -1.58846378326416e-05, -1.4326535165309906e-05, -1.276843249797821e-05, -1.1210329830646515e-05, -9.65222716331482e-06, -8.094124495983124e-06, -6.536021828651428e-06, -4.977919161319733e-06, -3.419816493988037e-06, -1.8617138266563416e-06, -3.03611159324646e-07, 1.2544915080070496e-06, 2.812594175338745e-06, 4.370696842670441e-06, 5.928799510002136e-06, 7.486902177333832e-06, 9.045004844665527e-06, 1.0603107511997223e-05, 1.2161210179328918e-05, 1.3719312846660614e-05, 1.527741551399231e-05, 1.6835518181324005e-05, 1.83936208486557e-05, 1.9951723515987396e-05, 2.1509826183319092e-05, 2.3067928850650787e-05, 2.4626031517982483e-05, 2.618413418531418e-05, 2.7742236852645874e-05, 2.930033951997757e-05, 3.0858442187309265e-05, 3.241654485464096e-05, 3.3974647521972656e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 6.0, 3.0, 10.0, 12.0, 21.0, 21.0, 32.0, 37.0, 62.0, 105.0, 165.0, 249.0, 422.0, 701.0, 1285.0, 2485.0, 5369.0, 13566.0, 40479.0, 169521.0, 561103.0, 184145.0, 43317.0, 14034.0, 5588.0, 2537.0, 1419.0, 727.0, 413.0, 262.0, 164.0, 91.0, 66.0, 38.0, 21.0, 23.0, 22.0, 5.0, 4.0, 6.0, 5.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.046112060546875, -0.0446014404296875, -0.0430908203125, -0.0415802001953125, -0.040069580078125, -0.0385589599609375, -0.03704833984375, -0.0355377197265625, -0.034027099609375, -0.0325164794921875, -0.031005859375, -0.0294952392578125, -0.027984619140625, -0.0264739990234375, -0.02496337890625, -0.0234527587890625, -0.021942138671875, -0.0204315185546875, -0.0189208984375, -0.0174102783203125, -0.015899658203125, -0.0143890380859375, -0.01287841796875, -0.0113677978515625, -0.009857177734375, -0.0083465576171875, -0.0068359375, -0.0053253173828125, -0.003814697265625, -0.0023040771484375, -0.00079345703125, 0.0007171630859375, 0.002227783203125, 0.0037384033203125, 0.0052490234375, 0.0067596435546875, 0.008270263671875, 0.0097808837890625, 0.01129150390625, 0.0128021240234375, 0.014312744140625, 0.0158233642578125, 0.017333984375, 0.0188446044921875, 0.020355224609375, 0.0218658447265625, 0.02337646484375, 0.0248870849609375, 0.026397705078125, 0.0279083251953125, 0.0294189453125, 0.0309295654296875, 0.032440185546875, 0.0339508056640625, 0.03546142578125, 0.0369720458984375, 0.038482666015625, 0.0399932861328125, 0.04150390625, 0.0430145263671875, 0.044525146484375, 0.0460357666015625, 0.04754638671875, 0.0490570068359375, 0.050567626953125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 3.0, 3.0, 4.0, 5.0, 6.0, 4.0, 8.0, 15.0, 12.0, 25.0, 29.0, 41.0, 46.0, 56.0, 58.0, 81.0, 84.0, 87.0, 73.0, 66.0, 56.0, 58.0, 27.0, 32.0, 24.0, 30.0, 16.0, 9.0, 7.0, 10.0, 7.0, 3.0, 4.0, 3.0, 5.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.013031005859375, -0.012640237808227539, -0.012249469757080078, -0.011858701705932617, -0.011467933654785156, -0.011077165603637695, -0.010686397552490234, -0.010295629501342773, -0.009904861450195312, -0.009514093399047852, -0.00912332534790039, -0.00873255729675293, -0.008341789245605469, -0.007951021194458008, -0.007560253143310547, -0.007169485092163086, -0.006778717041015625, -0.006387948989868164, -0.005997180938720703, -0.005606412887573242, -0.005215644836425781, -0.00482487678527832, -0.004434108734130859, -0.0040433406829833984, -0.0036525726318359375, -0.0032618045806884766, -0.0028710365295410156, -0.0024802684783935547, -0.0020895004272460938, -0.0016987323760986328, -0.0013079643249511719, -0.0009171962738037109, -0.00052642822265625, -0.00013566017150878906, 0.0002551078796386719, 0.0006458759307861328, 0.0010366439819335938, 0.0014274120330810547, 0.0018181800842285156, 0.0022089481353759766, 0.0025997161865234375, 0.0029904842376708984, 0.0033812522888183594, 0.0037720203399658203, 0.004162788391113281, 0.004553556442260742, 0.004944324493408203, 0.005335092544555664, 0.005725860595703125, 0.006116628646850586, 0.006507396697998047, 0.006898164749145508, 0.007288932800292969, 0.00767970085144043, 0.00807046890258789, 0.008461236953735352, 0.008852005004882812, 0.009242773056030273, 0.009633541107177734, 0.010024309158325195, 0.010415077209472656, 0.010805845260620117, 0.011196613311767578, 0.011587381362915039, 0.0119781494140625]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 8.0, 11.0, 20.0, 76.0, 219.0, 443.0, 151.0, 42.0, 17.0, 11.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-5.538624286651611, -5.421570777893066, -5.3045172691345215, -5.187463760375977, -5.070409774780273, -4.9533562660217285, -4.836302757263184, -4.719249248504639, -4.602195739746094, -4.485142230987549, -4.368088722229004, -4.251034736633301, -4.133981227874756, -4.016927719116211, -3.899874210357666, -3.782820701599121, -3.665766716003418, -3.548713207244873, -3.431659460067749, -3.314605951309204, -3.197552442550659, -3.080498695373535, -2.9634451866149902, -2.8463916778564453, -2.7293381690979004, -2.6122846603393555, -2.4952309131622314, -2.3781774044036865, -2.2611238956451416, -2.1440701484680176, -2.0270166397094727, -1.9099630117416382, -1.7929093837738037, -1.6758557558059692, -1.5588022470474243, -1.4417486190795898, -1.3246949911117554, -1.207641363143921, -1.090587854385376, -0.9735342264175415, -0.8564806580543518, -0.7394270896911621, -0.6223734617233276, -0.5053198933601379, -0.38826629519462585, -0.27121269702911377, -0.15415912866592407, -0.0371055006980896, 0.0799480676651001, 0.19700166583061218, 0.31405526399612427, 0.43110883235931396, 0.5481624603271484, 0.6652160286903381, 0.7822695970535278, 0.8993232250213623, 1.0163767337799072, 1.1334303617477417, 1.2504838705062866, 1.367537498474121, 1.4845911264419556, 1.60164475440979, 1.718698263168335, 1.8357518911361694, 1.952805519104004]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 12.0, 10.0, 11.0, 26.0, 33.0, 39.0, 61.0, 84.0, 87.0, 101.0, 103.0, 105.0, 81.0, 74.0, 63.0, 37.0, 25.0, 16.0, 11.0, 8.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8379266262054443, -1.7933305501937866, -1.7487343549728394, -1.7041382789611816, -1.6595420837402344, -1.6149460077285767, -1.570349931716919, -1.5257537364959717, -1.4811575412750244, -1.4365614652633667, -1.3919652700424194, -1.3473691940307617, -1.3027729988098145, -1.2581769227981567, -1.213580846786499, -1.1689846515655518, -1.124388575553894, -1.0797924995422363, -1.035196304321289, -0.9906002283096313, -0.9460040330886841, -0.9014079570770264, -0.8568118214607239, -0.8122156858444214, -0.7676195502281189, -0.7230234146118164, -0.6784272789955139, -0.6338311433792114, -0.5892350673675537, -0.5446388721466064, -0.5000427961349487, -0.45544666051864624, -0.41085052490234375, -0.36625438928604126, -0.32165825366973877, -0.27706214785575867, -0.23246601223945618, -0.1878698766231537, -0.14327377080917358, -0.0986776351928711, -0.054081499576568604, -0.00948537141084671, 0.03511075675487518, 0.07970687747001648, 0.12430301308631897, 0.16889914870262146, 0.21349525451660156, 0.25809139013290405, 0.30268752574920654, 0.34728366136550903, 0.3918797969818115, 0.4364759027957916, 0.4810720384120941, 0.5256681442260742, 0.5702642798423767, 0.6148604154586792, 0.6594565510749817, 0.7040526866912842, 0.7486488223075867, 0.7932449579238892, 0.8378410339355469, 0.8824372291564941, 0.9270333051681519, 0.9716294407844543, 1.0162255764007568]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 4.0, 5.0, 7.0, 14.0, 16.0, 23.0, 35.0, 35.0, 57.0, 76.0, 106.0, 171.0, 255.0, 391.0, 586.0, 967.0, 1604.0, 2866.0, 5421.0, 11688.0, 31004.0, 206334.0, 692358.0, 60578.0, 17201.0, 7445.0, 3817.0, 2066.0, 1245.0, 767.0, 448.0, 285.0, 211.0, 135.0, 100.0, 57.0, 53.0, 33.0, 28.0, 18.0, 10.0, 8.0, 8.0, 9.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.17578125, -1.1403961181640625, -1.105010986328125, -1.0696258544921875, -1.03424072265625, -0.9988555908203125, -0.963470458984375, -0.9280853271484375, -0.8927001953125, -0.8573150634765625, -0.821929931640625, -0.7865447998046875, -0.75115966796875, -0.7157745361328125, -0.680389404296875, -0.6450042724609375, -0.609619140625, -0.5742340087890625, -0.538848876953125, -0.5034637451171875, -0.46807861328125, -0.4326934814453125, -0.397308349609375, -0.3619232177734375, -0.3265380859375, -0.2911529541015625, -0.255767822265625, -0.2203826904296875, -0.18499755859375, -0.1496124267578125, -0.114227294921875, -0.0788421630859375, -0.04345703125, -0.0080718994140625, 0.027313232421875, 0.0626983642578125, 0.09808349609375, 0.1334686279296875, 0.168853759765625, 0.2042388916015625, 0.2396240234375, 0.2750091552734375, 0.310394287109375, 0.3457794189453125, 0.38116455078125, 0.4165496826171875, 0.451934814453125, 0.4873199462890625, 0.522705078125, 0.5580902099609375, 0.593475341796875, 0.6288604736328125, 0.66424560546875, 0.6996307373046875, 0.735015869140625, 0.7704010009765625, 0.8057861328125, 0.8411712646484375, 0.876556396484375, 0.9119415283203125, 0.94732666015625, 0.9827117919921875, 1.018096923828125, 1.0534820556640625, 1.0888671875]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 6.0, 7.0, 6.0, 8.0, 12.0, 19.0, 17.0, 34.0, 28.0, 50.0, 57.0, 51.0, 70.0, 77.0, 89.0, 83.0, 80.0, 64.0, 46.0, 43.0, 50.0, 27.0, 21.0, 14.0, 14.0, 5.0, 7.0, 9.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.19140625, -2.117218017578125, -2.04302978515625, -1.968841552734375, -1.8946533203125, -1.820465087890625, -1.74627685546875, -1.672088623046875, -1.597900390625, -1.523712158203125, -1.44952392578125, -1.375335693359375, -1.3011474609375, -1.226959228515625, -1.15277099609375, -1.078582763671875, -1.00439453125, -0.930206298828125, -0.85601806640625, -0.781829833984375, -0.7076416015625, -0.633453369140625, -0.55926513671875, -0.485076904296875, -0.410888671875, -0.336700439453125, -0.26251220703125, -0.188323974609375, -0.1141357421875, -0.039947509765625, 0.03424072265625, 0.108428955078125, 0.1826171875, 0.256805419921875, 0.33099365234375, 0.405181884765625, 0.4793701171875, 0.553558349609375, 0.62774658203125, 0.701934814453125, 0.776123046875, 0.850311279296875, 0.92449951171875, 0.998687744140625, 1.0728759765625, 1.147064208984375, 1.22125244140625, 1.295440673828125, 1.36962890625, 1.443817138671875, 1.51800537109375, 1.592193603515625, 1.6663818359375, 1.740570068359375, 1.81475830078125, 1.888946533203125, 1.963134765625, 2.037322998046875, 2.11151123046875, 2.185699462890625, 2.2598876953125, 2.334075927734375, 2.40826416015625, 2.482452392578125, 2.556640625]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 8.0, 8.0, 10.0, 11.0, 12.0, 16.0, 29.0, 38.0, 43.0, 59.0, 98.0, 141.0, 241.0, 427.0, 845.0, 1945.0, 5255.0, 18788.0, 142750.0, 808032.0, 52579.0, 10753.0, 3432.0, 1420.0, 646.0, 342.0, 196.0, 117.0, 100.0, 57.0, 42.0, 31.0, 16.0, 16.0, 19.0, 10.0, 7.0, 5.0, 6.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.396484375, -1.35577392578125, -1.3150634765625, -1.27435302734375, -1.233642578125, -1.19293212890625, -1.1522216796875, -1.11151123046875, -1.07080078125, -1.03009033203125, -0.9893798828125, -0.94866943359375, -0.907958984375, -0.86724853515625, -0.8265380859375, -0.78582763671875, -0.7451171875, -0.70440673828125, -0.6636962890625, -0.62298583984375, -0.582275390625, -0.54156494140625, -0.5008544921875, -0.46014404296875, -0.41943359375, -0.37872314453125, -0.3380126953125, -0.29730224609375, -0.256591796875, -0.21588134765625, -0.1751708984375, -0.13446044921875, -0.09375, -0.05303955078125, -0.0123291015625, 0.02838134765625, 0.069091796875, 0.10980224609375, 0.1505126953125, 0.19122314453125, 0.23193359375, 0.27264404296875, 0.3133544921875, 0.35406494140625, 0.394775390625, 0.43548583984375, 0.4761962890625, 0.51690673828125, 0.5576171875, 0.59832763671875, 0.6390380859375, 0.67974853515625, 0.720458984375, 0.76116943359375, 0.8018798828125, 0.84259033203125, 0.88330078125, 0.92401123046875, 0.9647216796875, 1.00543212890625, 1.046142578125, 1.08685302734375, 1.1275634765625, 1.16827392578125, 1.208984375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 3.0, 2.0, 9.0, 4.0, 9.0, 10.0, 16.0, 11.0, 13.0, 16.0, 16.0, 19.0, 21.0, 24.0, 29.0, 19.0, 27.0, 35.0, 33.0, 40.0, 34.0, 39.0, 57.0, 45.0, 47.0, 48.0, 32.0, 29.0, 30.0, 27.0, 27.0, 24.0, 28.0, 18.0, 23.0, 27.0, 28.0, 13.0, 10.0, 12.0, 9.0, 8.0, 7.0, 8.0, 4.0, 9.0, 4.0, 1.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.4931640625, -1.447998046875, -1.40283203125, -1.357666015625, -1.3125, -1.267333984375, -1.22216796875, -1.177001953125, -1.1318359375, -1.086669921875, -1.04150390625, -0.996337890625, -0.951171875, -0.906005859375, -0.86083984375, -0.815673828125, -0.7705078125, -0.725341796875, -0.68017578125, -0.635009765625, -0.58984375, -0.544677734375, -0.49951171875, -0.454345703125, -0.4091796875, -0.364013671875, -0.31884765625, -0.273681640625, -0.228515625, -0.183349609375, -0.13818359375, -0.093017578125, -0.0478515625, -0.002685546875, 0.04248046875, 0.087646484375, 0.1328125, 0.177978515625, 0.22314453125, 0.268310546875, 0.3134765625, 0.358642578125, 0.40380859375, 0.448974609375, 0.494140625, 0.539306640625, 0.58447265625, 0.629638671875, 0.6748046875, 0.719970703125, 0.76513671875, 0.810302734375, 0.85546875, 0.900634765625, 0.94580078125, 0.990966796875, 1.0361328125, 1.081298828125, 1.12646484375, 1.171630859375, 1.216796875, 1.261962890625, 1.30712890625, 1.352294921875, 1.3974609375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 5.0, 4.0, 9.0, 13.0, 17.0, 15.0, 27.0, 33.0, 47.0, 104.0, 183.0, 345.0, 679.0, 1735.0, 5620.0, 28669.0, 892448.0, 102019.0, 11429.0, 3060.0, 1013.0, 465.0, 237.0, 128.0, 83.0, 65.0, 34.0, 18.0, 11.0, 14.0, 7.0, 2.0, 2.0, 6.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.765625, -0.7358856201171875, -0.706146240234375, -0.6764068603515625, -0.64666748046875, -0.6169281005859375, -0.587188720703125, -0.5574493408203125, -0.5277099609375, -0.4979705810546875, -0.468231201171875, -0.4384918212890625, -0.40875244140625, -0.3790130615234375, -0.349273681640625, -0.3195343017578125, -0.289794921875, -0.2600555419921875, -0.230316162109375, -0.2005767822265625, -0.17083740234375, -0.1410980224609375, -0.111358642578125, -0.0816192626953125, -0.0518798828125, -0.0221405029296875, 0.007598876953125, 0.0373382568359375, 0.06707763671875, 0.0968170166015625, 0.126556396484375, 0.1562957763671875, 0.18603515625, 0.2157745361328125, 0.245513916015625, 0.2752532958984375, 0.30499267578125, 0.3347320556640625, 0.364471435546875, 0.3942108154296875, 0.4239501953125, 0.4536895751953125, 0.483428955078125, 0.5131683349609375, 0.54290771484375, 0.5726470947265625, 0.602386474609375, 0.6321258544921875, 0.661865234375, 0.6916046142578125, 0.721343994140625, 0.7510833740234375, 0.78082275390625, 0.8105621337890625, 0.840301513671875, 0.8700408935546875, 0.8997802734375, 0.9295196533203125, 0.959259033203125, 0.9889984130859375, 1.01873779296875, 1.0484771728515625, 1.078216552734375, 1.1079559326171875, 1.1376953125]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 8.0, 15.0, 27.0, 29.0, 66.0, 241.0, 414.0, 85.0, 42.0, 27.0, 16.0, 12.0, 5.0, 5.0, 6.0, 0.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0002275705337524414, -0.00022274907678365707, -0.00021792761981487274, -0.0002131061628460884, -0.00020828470587730408, -0.00020346324890851974, -0.0001986417919397354, -0.00019382033497095108, -0.00018899887800216675, -0.00018417742103338242, -0.00017935596406459808, -0.00017453450709581375, -0.00016971305012702942, -0.0001648915931582451, -0.00016007013618946075, -0.00015524867922067642, -0.0001504272222518921, -0.00014560576528310776, -0.00014078430831432343, -0.0001359628513455391, -0.00013114139437675476, -0.00012631993740797043, -0.0001214984804391861, -0.00011667702347040176, -0.00011185556650161743, -0.0001070341095328331, -0.00010221265256404877, -9.739119559526443e-05, -9.25697386264801e-05, -8.774828165769577e-05, -8.292682468891144e-05, -7.81053677201271e-05, -7.328391075134277e-05, -6.846245378255844e-05, -6.364099681377411e-05, -5.8819539844989777e-05, -5.3998082876205444e-05, -4.917662590742111e-05, -4.435516893863678e-05, -3.953371196985245e-05, -3.4712255001068115e-05, -2.9890798032283783e-05, -2.506934106349945e-05, -2.024788409471512e-05, -1.5426427125930786e-05, -1.0604970157146454e-05, -5.783513188362122e-06, -9.620562195777893e-07, 3.859400749206543e-06, 8.680857717990875e-06, 1.3502314686775208e-05, 1.832377165555954e-05, 2.3145228624343872e-05, 2.7966685593128204e-05, 3.278814256191254e-05, 3.760959953069687e-05, 4.24310564994812e-05, 4.7252513468265533e-05, 5.2073970437049866e-05, 5.68954274058342e-05, 6.171688437461853e-05, 6.653834134340286e-05, 7.13597983121872e-05, 7.618125528097153e-05, 8.100271224975586e-05]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 0.0, 4.0, 4.0, 5.0, 6.0, 3.0, 5.0, 5.0, 7.0, 11.0, 20.0, 31.0, 48.0, 92.0, 156.0, 260.0, 512.0, 1051.0, 2506.0, 6495.0, 24248.0, 479521.0, 497582.0, 24652.0, 6736.0, 2417.0, 1052.0, 473.0, 232.0, 130.0, 75.0, 65.0, 40.0, 20.0, 21.0, 18.0, 8.0, 10.0, 8.0, 8.0, 6.0, 3.0, 5.0, 0.0, 3.0, 3.0, 4.0, 0.0, 1.0], "bins": [-0.83251953125, -0.8100204467773438, -0.7875213623046875, -0.7650222778320312, -0.742523193359375, -0.7200241088867188, -0.6975250244140625, -0.6750259399414062, -0.65252685546875, -0.6300277709960938, -0.6075286865234375, -0.5850296020507812, -0.562530517578125, -0.5400314331054688, -0.5175323486328125, -0.49503326416015625, -0.4725341796875, -0.45003509521484375, -0.4275360107421875, -0.40503692626953125, -0.382537841796875, -0.36003875732421875, -0.3375396728515625, -0.31504058837890625, -0.29254150390625, -0.27004241943359375, -0.2475433349609375, -0.22504425048828125, -0.202545166015625, -0.18004608154296875, -0.1575469970703125, -0.13504791259765625, -0.112548828125, -0.09004974365234375, -0.0675506591796875, -0.04505157470703125, -0.022552490234375, -5.340576171875e-05, 0.0224456787109375, 0.04494476318359375, 0.06744384765625, 0.08994293212890625, 0.1124420166015625, 0.13494110107421875, 0.157440185546875, 0.17993927001953125, 0.2024383544921875, 0.22493743896484375, 0.2474365234375, 0.26993560791015625, 0.2924346923828125, 0.31493377685546875, 0.337432861328125, 0.35993194580078125, 0.3824310302734375, 0.40493011474609375, 0.42742919921875, 0.44992828369140625, 0.4724273681640625, 0.49492645263671875, 0.517425537109375, 0.5399246215820312, 0.5624237060546875, 0.5849227905273438, 0.607421875]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 6.0, 0.0, 9.0, 7.0, 8.0, 6.0, 7.0, 23.0, 15.0, 19.0, 30.0, 57.0, 95.0, 278.0, 185.0, 78.0, 33.0, 38.0, 19.0, 20.0, 8.0, 10.0, 12.0, 12.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.23193359375, -0.22328567504882812, -0.21463775634765625, -0.20598983764648438, -0.1973419189453125, -0.18869400024414062, -0.18004608154296875, -0.17139816284179688, -0.162750244140625, -0.15410232543945312, -0.14545440673828125, -0.13680648803710938, -0.1281585693359375, -0.11951065063476562, -0.11086273193359375, -0.10221481323242188, -0.09356689453125, -0.08491897583007812, -0.07627105712890625, -0.06762313842773438, -0.0589752197265625, -0.050327301025390625, -0.04167938232421875, -0.033031463623046875, -0.024383544921875, -0.015735626220703125, -0.00708770751953125, 0.001560211181640625, 0.0102081298828125, 0.018856048583984375, 0.02750396728515625, 0.036151885986328125, 0.0447998046875, 0.053447723388671875, 0.06209564208984375, 0.07074356079101562, 0.0793914794921875, 0.08803939819335938, 0.09668731689453125, 0.10533523559570312, 0.113983154296875, 0.12263107299804688, 0.13127899169921875, 0.13992691040039062, 0.1485748291015625, 0.15722274780273438, 0.16587066650390625, 0.17451858520507812, 0.18316650390625, 0.19181442260742188, 0.20046234130859375, 0.20911026000976562, 0.2177581787109375, 0.22640609741210938, 0.23505401611328125, 0.24370193481445312, 0.252349853515625, 0.2609977722167969, 0.26964569091796875, 0.2782936096191406, 0.2869415283203125, 0.2955894470214844, 0.30423736572265625, 0.3128852844238281, 0.321533203125]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 8.0, 37.0, 166.0, 544.0, 175.0, 46.0, 18.0, 5.0, 1.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5871992111206055, -5.2689971923828125, -4.9507951736450195, -4.632593631744385, -4.314391613006592, -3.996189594268799, -3.677987813949585, -3.359786033630371, -3.041584014892578, -2.723381996154785, -2.4051802158355713, -2.0869784355163574, -1.7687764167785645, -1.450574517250061, -1.1323726177215576, -0.8141708374023438, -0.4959688186645508, -0.17776691913604736, 0.14043498039245605, 0.4586368799209595, 0.7768387794494629, 1.0950406789779663, 1.4132425785064697, 1.7314443588256836, 2.0496463775634766, 2.3678483963012695, 2.6860501766204834, 3.0042519569396973, 3.3224539756774902, 3.640655994415283, 3.958857774734497, 4.277059555053711, 4.5952606201171875, 4.9134626388549805, 5.231664657592773, 5.549866199493408, 5.868068218231201, 6.186270236968994, 6.504471778869629, 6.822673797607422, 7.140875816345215, 7.459077835083008, 7.777279853820801, 8.095481872558594, 8.41368293762207, 8.731884956359863, 9.050086975097656, 9.36828899383545, 9.686491012573242, 10.004693031311035, 10.322895050048828, 10.641097068786621, 10.959299087524414, 11.27750015258789, 11.595702171325684, 11.913904190063477, 12.23210620880127, 12.550308227539062, 12.868510246276855, 13.186712265014648, 13.504913330078125, 13.823115348815918, 14.141317367553711, 14.459519386291504, 14.777721405029297]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 4.0, 4.0, 5.0, 8.0, 8.0, 9.0, 22.0, 20.0, 15.0, 21.0, 25.0, 34.0, 31.0, 22.0, 37.0, 32.0, 42.0, 45.0, 40.0, 45.0, 50.0, 48.0, 55.0, 51.0, 48.0, 31.0, 29.0, 39.0, 21.0, 23.0, 28.0, 27.0, 18.0, 15.0, 17.0, 9.0, 6.0, 4.0, 6.0, 4.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.7176430225372314, -2.6250250339508057, -2.53240704536438, -2.439789295196533, -2.3471713066101074, -2.2545533180236816, -2.161935329437256, -2.06931734085083, -1.9766995906829834, -1.8840816020965576, -1.7914637327194214, -1.6988457441329956, -1.6062278747558594, -1.5136098861694336, -1.4209918975830078, -1.3283740282058716, -1.2357560396194458, -1.14313805103302, -1.0505201816558838, -0.957902193069458, -0.8652843236923218, -0.772666335105896, -0.680048406124115, -0.587430477142334, -0.494812548160553, -0.402194619178772, -0.30957669019699097, -0.21695873141288757, -0.12434080243110657, -0.03172287344932556, 0.06089508533477783, 0.15351301431655884, 0.24613094329833984, 0.33874887228012085, 0.43136680126190186, 0.5239847898483276, 0.6166026592254639, 0.7092206478118896, 0.8018385767936707, 0.8944565057754517, 0.9870744347572327, 1.0796923637390137, 1.1723103523254395, 1.2649282217025757, 1.3575462102890015, 1.4501640796661377, 1.5427820682525635, 1.6354000568389893, 1.7280179262161255, 1.8206359148025513, 1.9132537841796875, 2.0058717727661133, 2.098489761352539, 2.1911075115203857, 2.2837255001068115, 2.3763434886932373, 2.468961477279663, 2.561579465866089, 2.6541974544525146, 2.7468152046203613, 2.839433193206787, 2.932051181793213, 3.0246691703796387, 3.1172871589660645, 3.209904909133911]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 6.0, 8.0, 15.0, 21.0, 35.0, 53.0, 78.0, 146.0, 248.0, 621.0, 2846.0, 79248.0, 4097327.0, 11391.0, 1447.0, 404.0, 141.0, 97.0, 43.0, 43.0, 16.0, 13.0, 14.0, 8.0, 4.0, 5.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.6953125, -8.4847412109375, -8.274169921875, -8.0635986328125, -7.85302734375, -7.6424560546875, -7.431884765625, -7.2213134765625, -7.0107421875, -6.8001708984375, -6.589599609375, -6.3790283203125, -6.16845703125, -5.9578857421875, -5.747314453125, -5.5367431640625, -5.326171875, -5.1156005859375, -4.905029296875, -4.6944580078125, -4.48388671875, -4.2733154296875, -4.062744140625, -3.8521728515625, -3.6416015625, -3.4310302734375, -3.220458984375, -3.0098876953125, -2.79931640625, -2.5887451171875, -2.378173828125, -2.1676025390625, -1.95703125, -1.7464599609375, -1.535888671875, -1.3253173828125, -1.11474609375, -0.9041748046875, -0.693603515625, -0.4830322265625, -0.2724609375, -0.0618896484375, 0.148681640625, 0.3592529296875, 0.56982421875, 0.7803955078125, 0.990966796875, 1.2015380859375, 1.412109375, 1.6226806640625, 1.833251953125, 2.0438232421875, 2.25439453125, 2.4649658203125, 2.675537109375, 2.8861083984375, 3.0966796875, 3.3072509765625, 3.517822265625, 3.7283935546875, 3.93896484375, 4.1495361328125, 4.360107421875, 4.5706787109375, 4.78125]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 6.0, 9.0, 15.0, 20.0, 26.0, 36.0, 49.0, 57.0, 79.0, 89.0, 113.0, 126.0, 86.0, 80.0, 64.0, 46.0, 34.0, 23.0, 18.0, 11.0, 5.0, 5.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.294921875, -2.2374420166015625, -2.179962158203125, -2.1224822998046875, -2.06500244140625, -2.0075225830078125, -1.950042724609375, -1.8925628662109375, -1.8350830078125, -1.7776031494140625, -1.720123291015625, -1.6626434326171875, -1.60516357421875, -1.5476837158203125, -1.490203857421875, -1.4327239990234375, -1.375244140625, -1.3177642822265625, -1.260284423828125, -1.2028045654296875, -1.14532470703125, -1.0878448486328125, -1.030364990234375, -0.9728851318359375, -0.9154052734375, -0.8579254150390625, -0.800445556640625, -0.7429656982421875, -0.68548583984375, -0.6280059814453125, -0.570526123046875, -0.5130462646484375, -0.45556640625, -0.3980865478515625, -0.340606689453125, -0.2831268310546875, -0.22564697265625, -0.1681671142578125, -0.110687255859375, -0.0532073974609375, 0.0042724609375, 0.0617523193359375, 0.119232177734375, 0.1767120361328125, 0.23419189453125, 0.2916717529296875, 0.349151611328125, 0.4066314697265625, 0.464111328125, 0.5215911865234375, 0.579071044921875, 0.6365509033203125, 0.69403076171875, 0.7515106201171875, 0.808990478515625, 0.8664703369140625, 0.9239501953125, 0.9814300537109375, 1.038909912109375, 1.0963897705078125, 1.15386962890625, 1.2113494873046875, 1.268829345703125, 1.3263092041015625, 1.3837890625]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 1.0, 4.0, 6.0, 3.0, 5.0, 8.0, 10.0, 10.0, 21.0, 30.0, 35.0, 73.0, 101.0, 158.0, 314.0, 554.0, 1172.0, 2778.0, 7993.0, 35155.0, 2764463.0, 1340196.0, 29375.0, 7044.0, 2490.0, 1096.0, 515.0, 255.0, 150.0, 84.0, 62.0, 41.0, 24.0, 16.0, 14.0, 9.0, 4.0, 10.0, 0.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0], "bins": [-2.84375, -2.7725830078125, -2.701416015625, -2.6302490234375, -2.55908203125, -2.4879150390625, -2.416748046875, -2.3455810546875, -2.2744140625, -2.2032470703125, -2.132080078125, -2.0609130859375, -1.98974609375, -1.9185791015625, -1.847412109375, -1.7762451171875, -1.705078125, -1.6339111328125, -1.562744140625, -1.4915771484375, -1.42041015625, -1.3492431640625, -1.278076171875, -1.2069091796875, -1.1357421875, -1.0645751953125, -0.993408203125, -0.9222412109375, -0.85107421875, -0.7799072265625, -0.708740234375, -0.6375732421875, -0.56640625, -0.4952392578125, -0.424072265625, -0.3529052734375, -0.28173828125, -0.2105712890625, -0.139404296875, -0.0682373046875, 0.0029296875, 0.0740966796875, 0.145263671875, 0.2164306640625, 0.28759765625, 0.3587646484375, 0.429931640625, 0.5010986328125, 0.572265625, 0.6434326171875, 0.714599609375, 0.7857666015625, 0.85693359375, 0.9281005859375, 0.999267578125, 1.0704345703125, 1.1416015625, 1.2127685546875, 1.283935546875, 1.3551025390625, 1.42626953125, 1.4974365234375, 1.568603515625, 1.6397705078125, 1.7109375]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 6.0, 7.0, 9.0, 11.0, 11.0, 18.0, 19.0, 54.0, 111.0, 310.0, 900.0, 1506.0, 613.0, 236.0, 91.0, 46.0, 26.0, 23.0, 19.0, 13.0, 13.0, 4.0, 4.0, 7.0, 2.0, 6.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45556640625, -0.4361114501953125, -0.416656494140625, -0.3972015380859375, -0.37774658203125, -0.3582916259765625, -0.338836669921875, -0.3193817138671875, -0.2999267578125, -0.2804718017578125, -0.261016845703125, -0.2415618896484375, -0.22210693359375, -0.2026519775390625, -0.183197021484375, -0.1637420654296875, -0.144287109375, -0.1248321533203125, -0.105377197265625, -0.0859222412109375, -0.06646728515625, -0.0470123291015625, -0.027557373046875, -0.0081024169921875, 0.0113525390625, 0.0308074951171875, 0.050262451171875, 0.0697174072265625, 0.08917236328125, 0.1086273193359375, 0.128082275390625, 0.1475372314453125, 0.1669921875, 0.1864471435546875, 0.205902099609375, 0.2253570556640625, 0.24481201171875, 0.2642669677734375, 0.283721923828125, 0.3031768798828125, 0.3226318359375, 0.3420867919921875, 0.361541748046875, 0.3809967041015625, 0.40045166015625, 0.4199066162109375, 0.439361572265625, 0.4588165283203125, 0.478271484375, 0.4977264404296875, 0.517181396484375, 0.5366363525390625, 0.55609130859375, 0.5755462646484375, 0.595001220703125, 0.6144561767578125, 0.6339111328125, 0.6533660888671875, 0.672821044921875, 0.6922760009765625, 0.71173095703125, 0.7311859130859375, 0.750640869140625, 0.7700958251953125, 0.78955078125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 16.0, 6.0, 13.0, 16.0, 30.0, 68.0, 112.0, 182.0, 240.0, 133.0, 74.0, 36.0, 24.0, 20.0, 12.0, 3.0, 5.0, 7.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-2.897313117980957, -2.8127846717834473, -2.7282562255859375, -2.6437277793884277, -2.559199571609497, -2.4746711254119873, -2.3901426792144775, -2.3056142330169678, -2.221086025238037, -2.1365575790405273, -2.0520291328430176, -1.9675008058547974, -1.8829724788665771, -1.7984440326690674, -1.7139155864715576, -1.6293871402740479, -1.544858694076538, -1.4603302478790283, -1.375801920890808, -1.2912734746932983, -1.2067451477050781, -1.1222167015075684, -1.0376882553100586, -0.9531598687171936, -0.8686314821243286, -0.7841030955314636, -0.6995747089385986, -0.6150462627410889, -0.5305178761482239, -0.4459894895553589, -0.3614610433578491, -0.27693265676498413, -0.19240450859069824, -0.10787610709667206, -0.023347705602645874, 0.061180710792541504, 0.1457090973854065, 0.23023748397827148, 0.31476593017578125, 0.39929431676864624, 0.48382270336151123, 0.5683510899543762, 0.6528794765472412, 0.737407922744751, 0.821936309337616, 0.906464695930481, 0.9909931421279907, 1.075521469116211, 1.1600499153137207, 1.2445783615112305, 1.3291066884994507, 1.4136351346969604, 1.4981634616851807, 1.5826919078826904, 1.6672203540802002, 1.75174880027771, 1.8362771272659302, 1.92080557346344, 2.00533390045166, 2.08986234664917, 2.1743907928466797, 2.2589192390441895, 2.343447685241699, 2.42797589302063, 2.5125043392181396]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 5.0, 4.0, 13.0, 18.0, 27.0, 34.0, 35.0, 57.0, 51.0, 66.0, 78.0, 85.0, 74.0, 69.0, 76.0, 71.0, 48.0, 42.0, 36.0, 35.0, 31.0, 20.0, 7.0, 7.0, 7.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.907869815826416, -1.8558416366577148, -1.8038134574890137, -1.7517852783203125, -1.6997569799423218, -1.6477288007736206, -1.5957006216049194, -1.5436724424362183, -1.491644263267517, -1.439616084098816, -1.3875879049301147, -1.335559606552124, -1.2835314273834229, -1.2315032482147217, -1.1794750690460205, -1.1274468898773193, -1.0754187107086182, -1.023390531539917, -0.971362292766571, -0.9193341135978699, -0.8673059344291687, -0.8152776956558228, -0.7632495164871216, -0.7112213373184204, -0.6591930389404297, -0.6071648597717285, -0.5551366209983826, -0.5031084418296814, -0.4510802626609802, -0.39905205368995667, -0.3470238447189331, -0.29499566555023193, -0.24296748638153076, -0.1909392923116684, -0.13891109824180603, -0.08688288927078247, -0.034854695200920105, 0.01717349886894226, 0.06920170783996582, 0.12122988700866699, 0.17325809597969055, 0.22528629004955292, 0.2773144841194153, 0.32934269309043884, 0.3813709020614624, 0.4333990812301636, 0.48542729020118713, 0.5374554395675659, 0.5894836783409119, 0.641511857509613, 0.693540096282959, 0.7455682754516602, 0.7975964546203613, 0.8496246337890625, 0.9016528725624084, 0.9536810517311096, 1.0057092905044556, 1.0577374696731567, 1.109765648841858, 1.1617939472198486, 1.2138221263885498, 1.265850305557251, 1.3178784847259521, 1.3699066638946533, 1.4219348430633545]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 9.0, 13.0, 11.0, 29.0, 44.0, 73.0, 90.0, 170.0, 293.0, 606.0, 1302.0, 3725.0, 15752.0, 146734.0, 784529.0, 79224.0, 10818.0, 2946.0, 1075.0, 502.0, 263.0, 141.0, 79.0, 46.0, 21.0, 19.0, 9.0, 5.0, 7.0, 7.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31005859375, -0.2967987060546875, -0.283538818359375, -0.2702789306640625, -0.25701904296875, -0.2437591552734375, -0.230499267578125, -0.2172393798828125, -0.2039794921875, -0.1907196044921875, -0.177459716796875, -0.1641998291015625, -0.15093994140625, -0.1376800537109375, -0.124420166015625, -0.1111602783203125, -0.097900390625, -0.0846405029296875, -0.071380615234375, -0.0581207275390625, -0.04486083984375, -0.0316009521484375, -0.018341064453125, -0.0050811767578125, 0.0081787109375, 0.0214385986328125, 0.034698486328125, 0.0479583740234375, 0.06121826171875, 0.0744781494140625, 0.087738037109375, 0.1009979248046875, 0.1142578125, 0.1275177001953125, 0.140777587890625, 0.1540374755859375, 0.16729736328125, 0.1805572509765625, 0.193817138671875, 0.2070770263671875, 0.2203369140625, 0.2335968017578125, 0.246856689453125, 0.2601165771484375, 0.27337646484375, 0.2866363525390625, 0.299896240234375, 0.3131561279296875, 0.326416015625, 0.3396759033203125, 0.352935791015625, 0.3661956787109375, 0.37945556640625, 0.3927154541015625, 0.405975341796875, 0.4192352294921875, 0.4324951171875, 0.4457550048828125, 0.459014892578125, 0.4722747802734375, 0.48553466796875, 0.4987945556640625, 0.512054443359375, 0.5253143310546875, 0.53857421875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 6.0, 11.0, 13.0, 15.0, 39.0, 28.0, 56.0, 59.0, 75.0, 106.0, 103.0, 100.0, 83.0, 85.0, 56.0, 49.0, 39.0, 29.0, 25.0, 4.0, 4.0, 10.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.763671875, -1.7196197509765625, -1.675567626953125, -1.6315155029296875, -1.58746337890625, -1.5434112548828125, -1.499359130859375, -1.4553070068359375, -1.4112548828125, -1.3672027587890625, -1.323150634765625, -1.2790985107421875, -1.23504638671875, -1.1909942626953125, -1.146942138671875, -1.1028900146484375, -1.058837890625, -1.0147857666015625, -0.970733642578125, -0.9266815185546875, -0.88262939453125, -0.8385772705078125, -0.794525146484375, -0.7504730224609375, -0.7064208984375, -0.6623687744140625, -0.618316650390625, -0.5742645263671875, -0.53021240234375, -0.4861602783203125, -0.442108154296875, -0.3980560302734375, -0.35400390625, -0.3099517822265625, -0.265899658203125, -0.2218475341796875, -0.17779541015625, -0.1337432861328125, -0.089691162109375, -0.0456390380859375, -0.0015869140625, 0.0424652099609375, 0.086517333984375, 0.1305694580078125, 0.17462158203125, 0.2186737060546875, 0.262725830078125, 0.3067779541015625, 0.350830078125, 0.3948822021484375, 0.438934326171875, 0.4829864501953125, 0.52703857421875, 0.5710906982421875, 0.615142822265625, 0.6591949462890625, 0.7032470703125, 0.7472991943359375, 0.791351318359375, 0.8354034423828125, 0.87945556640625, 0.9235076904296875, 0.967559814453125, 1.0116119384765625, 1.0556640625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 4.0, 7.0, 2.0, 16.0, 15.0, 11.0, 18.0, 30.0, 56.0, 63.0, 102.0, 161.0, 192.0, 328.0, 447.0, 740.0, 1143.0, 1885.0, 3493.0, 7001.0, 16099.0, 42615.0, 144353.0, 472674.0, 247016.0, 66114.0, 23128.0, 9718.0, 4658.0, 2493.0, 1371.0, 893.0, 523.0, 382.0, 223.0, 152.0, 126.0, 83.0, 68.0, 49.0, 20.0, 19.0, 20.0, 18.0, 11.0, 6.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.16162109375, -0.15652084350585938, -0.15142059326171875, -0.14632034301757812, -0.1412200927734375, -0.13611984252929688, -0.13101959228515625, -0.12591934204101562, -0.120819091796875, -0.11571884155273438, -0.11061859130859375, -0.10551834106445312, -0.1004180908203125, -0.09531784057617188, -0.09021759033203125, -0.08511734008789062, -0.08001708984375, -0.07491683959960938, -0.06981658935546875, -0.06471633911132812, -0.0596160888671875, -0.054515838623046875, -0.04941558837890625, -0.044315338134765625, -0.039215087890625, -0.034114837646484375, -0.02901458740234375, -0.023914337158203125, -0.0188140869140625, -0.013713836669921875, -0.00861358642578125, -0.003513336181640625, 0.0015869140625, 0.006687164306640625, 0.01178741455078125, 0.016887664794921875, 0.0219879150390625, 0.027088165283203125, 0.03218841552734375, 0.037288665771484375, 0.042388916015625, 0.047489166259765625, 0.05258941650390625, 0.057689666748046875, 0.0627899169921875, 0.06789016723632812, 0.07299041748046875, 0.07809066772460938, 0.08319091796875, 0.08829116821289062, 0.09339141845703125, 0.09849166870117188, 0.1035919189453125, 0.10869216918945312, 0.11379241943359375, 0.11889266967773438, 0.123992919921875, 0.12909317016601562, 0.13419342041015625, 0.13929367065429688, 0.1443939208984375, 0.14949417114257812, 0.15459442138671875, 0.15969467163085938, 0.164794921875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 5.0, 8.0, 5.0, 7.0, 9.0, 13.0, 8.0, 12.0, 13.0, 23.0, 28.0, 25.0, 32.0, 35.0, 33.0, 31.0, 43.0, 52.0, 38.0, 53.0, 38.0, 42.0, 52.0, 51.0, 34.0, 39.0, 33.0, 33.0, 24.0, 29.0, 22.0, 17.0, 17.0, 18.0, 17.0, 11.0, 12.0, 9.0, 9.0, 8.0, 3.0, 5.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1953125, -1.15576171875, -1.1162109375, -1.07666015625, -1.037109375, -0.99755859375, -0.9580078125, -0.91845703125, -0.87890625, -0.83935546875, -0.7998046875, -0.76025390625, -0.720703125, -0.68115234375, -0.6416015625, -0.60205078125, -0.5625, -0.52294921875, -0.4833984375, -0.44384765625, -0.404296875, -0.36474609375, -0.3251953125, -0.28564453125, -0.24609375, -0.20654296875, -0.1669921875, -0.12744140625, -0.087890625, -0.04833984375, -0.0087890625, 0.03076171875, 0.0703125, 0.10986328125, 0.1494140625, 0.18896484375, 0.228515625, 0.26806640625, 0.3076171875, 0.34716796875, 0.38671875, 0.42626953125, 0.4658203125, 0.50537109375, 0.544921875, 0.58447265625, 0.6240234375, 0.66357421875, 0.703125, 0.74267578125, 0.7822265625, 0.82177734375, 0.861328125, 0.90087890625, 0.9404296875, 0.97998046875, 1.01953125, 1.05908203125, 1.0986328125, 1.13818359375, 1.177734375, 1.21728515625, 1.2568359375, 1.29638671875, 1.3359375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 8.0, 5.0, 3.0, 7.0, 12.0, 16.0, 18.0, 16.0, 20.0, 39.0, 50.0, 84.0, 109.0, 167.0, 244.0, 440.0, 701.0, 1223.0, 2083.0, 4150.0, 9221.0, 25285.0, 101484.0, 531550.0, 289017.0, 52666.0, 16187.0, 6436.0, 3086.0, 1655.0, 958.0, 542.0, 349.0, 220.0, 159.0, 101.0, 56.0, 49.0, 36.0, 27.0, 30.0, 17.0, 8.0, 6.0, 8.0, 6.0, 8.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.051971435546875, -0.05038642883300781, -0.048801422119140625, -0.04721641540527344, -0.04563140869140625, -0.04404640197753906, -0.042461395263671875, -0.04087638854980469, -0.0392913818359375, -0.03770637512207031, -0.036121368408203125, -0.03453636169433594, -0.03295135498046875, -0.03136634826660156, -0.029781341552734375, -0.028196334838867188, -0.026611328125, -0.025026321411132812, -0.023441314697265625, -0.021856307983398438, -0.02027130126953125, -0.018686294555664062, -0.017101287841796875, -0.015516281127929688, -0.0139312744140625, -0.012346267700195312, -0.010761260986328125, -0.009176254272460938, -0.00759124755859375, -0.0060062408447265625, -0.004421234130859375, -0.0028362274169921875, -0.001251220703125, 0.0003337860107421875, 0.001918792724609375, 0.0035037994384765625, 0.00508880615234375, 0.0066738128662109375, 0.008258819580078125, 0.009843826293945312, 0.0114288330078125, 0.013013839721679688, 0.014598846435546875, 0.016183853149414062, 0.01776885986328125, 0.019353866577148438, 0.020938873291015625, 0.022523880004882812, 0.02410888671875, 0.025693893432617188, 0.027278900146484375, 0.028863906860351562, 0.03044891357421875, 0.03203392028808594, 0.033618927001953125, 0.03520393371582031, 0.0367889404296875, 0.03837394714355469, 0.039958953857421875, 0.04154396057128906, 0.04312896728515625, 0.04471397399902344, 0.046298980712890625, 0.04788398742675781, 0.049468994140625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 5.0, 8.0, 11.0, 11.0, 18.0, 26.0, 49.0, 94.0, 118.0, 154.0, 163.0, 113.0, 80.0, 46.0, 32.0, 30.0, 13.0, 7.0, 3.0, 4.0, 4.0, 5.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.2988529205322266e-05, -5.137734115123749e-05, -4.976615309715271e-05, -4.815496504306793e-05, -4.6543776988983154e-05, -4.4932588934898376e-05, -4.33214008808136e-05, -4.171021282672882e-05, -4.009902477264404e-05, -3.8487836718559265e-05, -3.687664866447449e-05, -3.526546061038971e-05, -3.365427255630493e-05, -3.2043084502220154e-05, -3.0431896448135376e-05, -2.8820708394050598e-05, -2.720952033996582e-05, -2.5598332285881042e-05, -2.3987144231796265e-05, -2.2375956177711487e-05, -2.076476812362671e-05, -1.915358006954193e-05, -1.7542392015457153e-05, -1.5931203961372375e-05, -1.4320015907287598e-05, -1.270882785320282e-05, -1.1097639799118042e-05, -9.486451745033264e-06, -7.875263690948486e-06, -6.2640756368637085e-06, -4.652887582778931e-06, -3.041699528694153e-06, -1.430511474609375e-06, 1.8067657947540283e-07, 1.7918646335601807e-06, 3.4030526876449585e-06, 5.014240741729736e-06, 6.625428795814514e-06, 8.236616849899292e-06, 9.84780490398407e-06, 1.1458992958068848e-05, 1.3070181012153625e-05, 1.4681369066238403e-05, 1.629255712032318e-05, 1.790374517440796e-05, 1.9514933228492737e-05, 2.1126121282577515e-05, 2.2737309336662292e-05, 2.434849739074707e-05, 2.5959685444831848e-05, 2.7570873498916626e-05, 2.9182061553001404e-05, 3.079324960708618e-05, 3.240443766117096e-05, 3.401562571525574e-05, 3.5626813769340515e-05, 3.723800182342529e-05, 3.884918987751007e-05, 4.046037793159485e-05, 4.2071565985679626e-05, 4.3682754039764404e-05, 4.529394209384918e-05, 4.690513014793396e-05, 4.851631820201874e-05, 5.0127506256103516e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 6.0, 13.0, 13.0, 20.0, 20.0, 40.0, 57.0, 68.0, 114.0, 129.0, 227.0, 351.0, 586.0, 925.0, 1762.0, 3307.0, 6981.0, 16810.0, 49474.0, 189472.0, 495007.0, 198672.0, 51857.0, 17590.0, 7307.0, 3398.0, 1762.0, 961.0, 569.0, 374.0, 210.0, 144.0, 94.0, 76.0, 42.0, 35.0, 20.0, 17.0, 11.0, 11.0, 4.0, 7.0, 5.0, 2.0, 3.0, 3.0, 1.0, 0.0, 3.0, 2.0], "bins": [-0.04522705078125, -0.04391670227050781, -0.042606353759765625, -0.04129600524902344, -0.03998565673828125, -0.03867530822753906, -0.037364959716796875, -0.03605461120605469, -0.0347442626953125, -0.03343391418457031, -0.032123565673828125, -0.030813217163085938, -0.02950286865234375, -0.028192520141601562, -0.026882171630859375, -0.025571823120117188, -0.024261474609375, -0.022951126098632812, -0.021640777587890625, -0.020330429077148438, -0.01902008056640625, -0.017709732055664062, -0.016399383544921875, -0.015089035034179688, -0.0137786865234375, -0.012468338012695312, -0.011157989501953125, -0.009847640991210938, -0.00853729248046875, -0.0072269439697265625, -0.005916595458984375, -0.0046062469482421875, -0.0032958984375, -0.0019855499267578125, -0.000675201416015625, 0.0006351470947265625, 0.00194549560546875, 0.0032558441162109375, 0.004566192626953125, 0.0058765411376953125, 0.0071868896484375, 0.008497238159179688, 0.009807586669921875, 0.011117935180664062, 0.01242828369140625, 0.013738632202148438, 0.015048980712890625, 0.016359329223632812, 0.017669677734375, 0.018980026245117188, 0.020290374755859375, 0.021600723266601562, 0.02291107177734375, 0.024221420288085938, 0.025531768798828125, 0.026842117309570312, 0.0281524658203125, 0.029462814331054688, 0.030773162841796875, 0.03208351135253906, 0.03339385986328125, 0.03470420837402344, 0.036014556884765625, 0.03732490539550781, 0.03863525390625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 5.0, 3.0, 7.0, 8.0, 12.0, 2.0, 13.0, 17.0, 28.0, 27.0, 46.0, 37.0, 52.0, 64.0, 70.0, 69.0, 78.0, 90.0, 62.0, 74.0, 38.0, 42.0, 29.0, 24.0, 25.0, 22.0, 10.0, 17.0, 10.0, 6.0, 6.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.010894775390625, -0.010493159294128418, -0.010091543197631836, -0.009689927101135254, -0.009288311004638672, -0.00888669490814209, -0.008485078811645508, -0.008083462715148926, -0.007681846618652344, -0.007280230522155762, -0.00687861442565918, -0.006476998329162598, -0.006075382232666016, -0.005673766136169434, -0.0052721500396728516, -0.0048705339431762695, -0.0044689178466796875, -0.0040673017501831055, -0.0036656856536865234, -0.0032640695571899414, -0.0028624534606933594, -0.0024608373641967773, -0.0020592212677001953, -0.0016576051712036133, -0.0012559890747070312, -0.0008543729782104492, -0.0004527568817138672, -5.1140785217285156e-05, 0.0003504753112792969, 0.0007520914077758789, 0.001153707504272461, 0.001555323600769043, 0.001956939697265625, 0.002358555793762207, 0.002760171890258789, 0.003161787986755371, 0.003563404083251953, 0.003965020179748535, 0.004366636276245117, 0.004768252372741699, 0.005169868469238281, 0.005571484565734863, 0.005973100662231445, 0.006374716758728027, 0.006776332855224609, 0.007177948951721191, 0.0075795650482177734, 0.007981181144714355, 0.008382797241210938, 0.00878441333770752, 0.009186029434204102, 0.009587645530700684, 0.009989261627197266, 0.010390877723693848, 0.01079249382019043, 0.011194109916687012, 0.011595726013183594, 0.011997342109680176, 0.012398958206176758, 0.01280057430267334, 0.013202190399169922, 0.013603806495666504, 0.014005422592163086, 0.014407038688659668, 0.01480865478515625]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 6.0, 31.0, 54.0, 267.0, 478.0, 112.0, 37.0, 9.0, 4.0, 5.0, 2.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.457675933837891, -4.319665431976318, -4.181655406951904, -4.043644905090332, -3.905634641647339, -3.7676243782043457, -3.6296138763427734, -3.4916036128997803, -3.353593349456787, -3.215583086013794, -3.077572822570801, -2.9395623207092285, -2.8015520572662354, -2.663541793823242, -2.52553129196167, -2.3875210285186768, -2.2495107650756836, -2.1115005016326904, -1.9734901189804077, -1.835479736328125, -1.6974694728851318, -1.5594592094421387, -1.421448826789856, -1.2834384441375732, -1.14542818069458, -1.007417917251587, -0.8694075345993042, -0.7313972115516663, -0.5933868885040283, -0.4553765654563904, -0.31736624240875244, -0.1793559193611145, -0.04134511947631836, 0.09666520357131958, 0.23467552661895752, 0.37268584966659546, 0.5106961727142334, 0.6487064957618713, 0.7867168188095093, 0.9247271418571472, 1.0627374649047852, 1.2007477283477783, 1.338758111000061, 1.4767684936523438, 1.614778757095337, 1.75278902053833, 1.8907994031906128, 2.0288097858428955, 2.1668200492858887, 2.304830312728882, 2.442840576171875, 2.5808510780334473, 2.7188613414764404, 2.8568716049194336, 2.994882106781006, 3.132892370223999, 3.270902633666992, 3.4089128971099854, 3.5469231605529785, 3.684933662414551, 3.822943925857544, 3.960954189300537, 4.098964691162109, 4.236974716186523, 4.374985218048096]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 8.0, 13.0, 19.0, 24.0, 51.0, 44.0, 75.0, 80.0, 102.0, 99.0, 104.0, 95.0, 78.0, 65.0, 43.0, 34.0, 35.0, 10.0, 6.0, 10.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8624941110610962, -1.8180227279663086, -1.7735512256622314, -1.7290798425674438, -1.6846084594726562, -1.640136957168579, -1.5956655740737915, -1.551194190979004, -1.5067226886749268, -1.4622513055801392, -1.417779803276062, -1.3733084201812744, -1.3288370370864868, -1.2843656539916992, -1.239894151687622, -1.1954227685928345, -1.1509513854980469, -1.1064800024032593, -1.0620085000991821, -1.0175371170043945, -0.9730657339096069, -0.9285942912101746, -0.8841228485107422, -0.8396514654159546, -0.7951800227165222, -0.7507085800170898, -0.7062371969223022, -0.6617657542228699, -0.6172943115234375, -0.5728229284286499, -0.5283514857292175, -0.48388007283210754, -0.4394086003303528, -0.3949371874332428, -0.3504657745361328, -0.30599433183670044, -0.26152291893959045, -0.21705150604248047, -0.1725800633430481, -0.1281086504459381, -0.08363723754882812, -0.03916581720113754, 0.0053056031465530396, 0.04977703094482422, 0.0942484438419342, 0.1387198567390442, 0.18319129943847656, 0.22766271233558655, 0.27213412523269653, 0.3166055381298065, 0.3610769510269165, 0.4055483937263489, 0.45001980662345886, 0.49449121952056885, 0.5389626622200012, 0.5834341049194336, 0.6279054880142212, 0.6723769307136536, 0.7168483138084412, 0.7613197565078735, 0.8057911396026611, 0.8502625823020935, 0.8947340250015259, 0.9392054080963135, 0.9836768507957458]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 4.0, 4.0, 12.0, 9.0, 17.0, 28.0, 39.0, 71.0, 125.0, 198.0, 386.0, 860.0, 2464.0, 11431.0, 390462.0, 624198.0, 13527.0, 2881.0, 949.0, 369.0, 200.0, 115.0, 76.0, 47.0, 31.0, 18.0, 14.0, 3.0, 4.0, 2.0, 2.0, 0.0, 3.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7783203125, -1.727569580078125, -1.67681884765625, -1.626068115234375, -1.5753173828125, -1.524566650390625, -1.47381591796875, -1.423065185546875, -1.372314453125, -1.321563720703125, -1.27081298828125, -1.220062255859375, -1.1693115234375, -1.118560791015625, -1.06781005859375, -1.017059326171875, -0.96630859375, -0.915557861328125, -0.86480712890625, -0.814056396484375, -0.7633056640625, -0.712554931640625, -0.66180419921875, -0.611053466796875, -0.560302734375, -0.509552001953125, -0.45880126953125, -0.408050537109375, -0.3572998046875, -0.306549072265625, -0.25579833984375, -0.205047607421875, -0.154296875, -0.103546142578125, -0.05279541015625, -0.002044677734375, 0.0487060546875, 0.099456787109375, 0.15020751953125, 0.200958251953125, 0.251708984375, 0.302459716796875, 0.35321044921875, 0.403961181640625, 0.4547119140625, 0.505462646484375, 0.55621337890625, 0.606964111328125, 0.65771484375, 0.708465576171875, 0.75921630859375, 0.809967041015625, 0.8607177734375, 0.911468505859375, 0.96221923828125, 1.012969970703125, 1.063720703125, 1.114471435546875, 1.16522216796875, 1.215972900390625, 1.2667236328125, 1.317474365234375, 1.36822509765625, 1.418975830078125, 1.4697265625]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 7.0, 6.0, 15.0, 18.0, 28.0, 39.0, 38.0, 56.0, 69.0, 89.0, 83.0, 95.0, 91.0, 75.0, 67.0, 60.0, 47.0, 31.0, 25.0, 25.0, 15.0, 3.0, 5.0, 6.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.640625, -2.56219482421875, -2.4837646484375, -2.40533447265625, -2.326904296875, -2.24847412109375, -2.1700439453125, -2.09161376953125, -2.01318359375, -1.93475341796875, -1.8563232421875, -1.77789306640625, -1.699462890625, -1.62103271484375, -1.5426025390625, -1.46417236328125, -1.3857421875, -1.30731201171875, -1.2288818359375, -1.15045166015625, -1.072021484375, -0.99359130859375, -0.9151611328125, -0.83673095703125, -0.75830078125, -0.67987060546875, -0.6014404296875, -0.52301025390625, -0.444580078125, -0.36614990234375, -0.2877197265625, -0.20928955078125, -0.130859375, -0.05242919921875, 0.0260009765625, 0.10443115234375, 0.182861328125, 0.26129150390625, 0.3397216796875, 0.41815185546875, 0.49658203125, 0.57501220703125, 0.6534423828125, 0.73187255859375, 0.810302734375, 0.88873291015625, 0.9671630859375, 1.04559326171875, 1.1240234375, 1.20245361328125, 1.2808837890625, 1.35931396484375, 1.437744140625, 1.51617431640625, 1.5946044921875, 1.67303466796875, 1.75146484375, 1.82989501953125, 1.9083251953125, 1.98675537109375, 2.065185546875, 2.14361572265625, 2.2220458984375, 2.30047607421875, 2.37890625]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 10.0, 3.0, 10.0, 4.0, 16.0, 13.0, 21.0, 25.0, 31.0, 66.0, 92.0, 125.0, 220.0, 314.0, 591.0, 975.0, 1654.0, 3594.0, 10190.0, 99596.0, 873907.0, 43284.0, 7294.0, 2893.0, 1432.0, 794.0, 486.0, 283.0, 189.0, 133.0, 77.0, 62.0, 44.0, 34.0, 20.0, 13.0, 10.0, 16.0, 9.0, 5.0, 4.0, 1.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0], "bins": [-1.0166015625, -0.9870223999023438, -0.9574432373046875, -0.9278640747070312, -0.898284912109375, -0.8687057495117188, -0.8391265869140625, -0.8095474243164062, -0.77996826171875, -0.7503890991210938, -0.7208099365234375, -0.6912307739257812, -0.661651611328125, -0.6320724487304688, -0.6024932861328125, -0.5729141235351562, -0.5433349609375, -0.5137557983398438, -0.4841766357421875, -0.45459747314453125, -0.425018310546875, -0.39543914794921875, -0.3658599853515625, -0.33628082275390625, -0.30670166015625, -0.27712249755859375, -0.2475433349609375, -0.21796417236328125, -0.188385009765625, -0.15880584716796875, -0.1292266845703125, -0.09964752197265625, -0.070068359375, -0.04048919677734375, -0.0109100341796875, 0.01866912841796875, 0.048248291015625, 0.07782745361328125, 0.1074066162109375, 0.13698577880859375, 0.16656494140625, 0.19614410400390625, 0.2257232666015625, 0.25530242919921875, 0.284881591796875, 0.31446075439453125, 0.3440399169921875, 0.37361907958984375, 0.4031982421875, 0.43277740478515625, 0.4623565673828125, 0.49193572998046875, 0.521514892578125, 0.5510940551757812, 0.5806732177734375, 0.6102523803710938, 0.63983154296875, 0.6694107055664062, 0.6989898681640625, 0.7285690307617188, 0.758148193359375, 0.7877273559570312, 0.8173065185546875, 0.8468856811523438, 0.87646484375]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 1.0, 4.0, 5.0, 5.0, 7.0, 10.0, 12.0, 23.0, 10.0, 14.0, 15.0, 25.0, 26.0, 28.0, 41.0, 37.0, 44.0, 42.0, 43.0, 47.0, 38.0, 36.0, 38.0, 35.0, 41.0, 46.0, 34.0, 52.0, 34.0, 16.0, 25.0, 30.0, 25.0, 16.0, 17.0, 13.0, 14.0, 17.0, 7.0, 9.0, 7.0, 4.0, 5.0, 1.0, 1.0, 3.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.47265625, -1.4248809814453125, -1.377105712890625, -1.3293304443359375, -1.28155517578125, -1.2337799072265625, -1.186004638671875, -1.1382293701171875, -1.0904541015625, -1.0426788330078125, -0.994903564453125, -0.9471282958984375, -0.89935302734375, -0.8515777587890625, -0.803802490234375, -0.7560272216796875, -0.708251953125, -0.6604766845703125, -0.612701416015625, -0.5649261474609375, -0.51715087890625, -0.4693756103515625, -0.421600341796875, -0.3738250732421875, -0.3260498046875, -0.2782745361328125, -0.230499267578125, -0.1827239990234375, -0.13494873046875, -0.0871734619140625, -0.039398193359375, 0.0083770751953125, 0.05615234375, 0.1039276123046875, 0.151702880859375, 0.1994781494140625, 0.24725341796875, 0.2950286865234375, 0.342803955078125, 0.3905792236328125, 0.4383544921875, 0.4861297607421875, 0.533905029296875, 0.5816802978515625, 0.62945556640625, 0.6772308349609375, 0.725006103515625, 0.7727813720703125, 0.820556640625, 0.8683319091796875, 0.916107177734375, 0.9638824462890625, 1.01165771484375, 1.0594329833984375, 1.107208251953125, 1.1549835205078125, 1.2027587890625, 1.2505340576171875, 1.298309326171875, 1.3460845947265625, 1.39385986328125, 1.4416351318359375, 1.489410400390625, 1.5371856689453125, 1.5849609375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 7.0, 5.0, 12.0, 16.0, 14.0, 25.0, 51.0, 58.0, 96.0, 222.0, 423.0, 1072.0, 3416.0, 21238.0, 895455.0, 115656.0, 7585.0, 1873.0, 647.0, 307.0, 139.0, 108.0, 43.0, 27.0, 19.0, 12.0, 12.0, 4.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.67431640625, -0.6549148559570312, -0.6355133056640625, -0.6161117553710938, -0.596710205078125, -0.5773086547851562, -0.5579071044921875, -0.5385055541992188, -0.51910400390625, -0.49970245361328125, -0.4803009033203125, -0.46089935302734375, -0.441497802734375, -0.42209625244140625, -0.4026947021484375, -0.38329315185546875, -0.3638916015625, -0.34449005126953125, -0.3250885009765625, -0.30568695068359375, -0.286285400390625, -0.26688385009765625, -0.2474822998046875, -0.22808074951171875, -0.20867919921875, -0.18927764892578125, -0.1698760986328125, -0.15047454833984375, -0.131072998046875, -0.11167144775390625, -0.0922698974609375, -0.07286834716796875, -0.053466796875, -0.03406524658203125, -0.0146636962890625, 0.00473785400390625, 0.024139404296875, 0.04354095458984375, 0.0629425048828125, 0.08234405517578125, 0.10174560546875, 0.12114715576171875, 0.1405487060546875, 0.15995025634765625, 0.179351806640625, 0.19875335693359375, 0.2181549072265625, 0.23755645751953125, 0.2569580078125, 0.27635955810546875, 0.2957611083984375, 0.31516265869140625, 0.334564208984375, 0.35396575927734375, 0.3733673095703125, 0.39276885986328125, 0.41217041015625, 0.43157196044921875, 0.4509735107421875, 0.47037506103515625, 0.489776611328125, 0.5091781616210938, 0.5285797119140625, 0.5479812622070312, 0.5673828125]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 5.0, 12.0, 20.0, 28.0, 46.0, 130.0, 386.0, 215.0, 72.0, 45.0, 15.0, 16.0, 8.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00018095970153808594, -0.00017732474952936172, -0.0001736897975206375, -0.0001700548455119133, -0.0001664198935031891, -0.00016278494149446487, -0.00015914998948574066, -0.00015551503747701645, -0.00015188008546829224, -0.00014824513345956802, -0.0001446101814508438, -0.0001409752294421196, -0.00013734027743339539, -0.00013370532542467117, -0.00013007037341594696, -0.00012643542140722275, -0.00012280046939849854, -0.00011916551738977432, -0.00011553056538105011, -0.0001118956133723259, -0.00010826066136360168, -0.00010462570935487747, -0.00010099075734615326, -9.735580533742905e-05, -9.372085332870483e-05, -9.008590131998062e-05, -8.645094931125641e-05, -8.28159973025322e-05, -7.918104529380798e-05, -7.554609328508377e-05, -7.191114127635956e-05, -6.827618926763535e-05, -6.464123725891113e-05, -6.100628525018692e-05, -5.737133324146271e-05, -5.3736381232738495e-05, -5.010142922401428e-05, -4.646647721529007e-05, -4.283152520656586e-05, -3.9196573197841644e-05, -3.556162118911743e-05, -3.192666918039322e-05, -2.8291717171669006e-05, -2.4656765162944794e-05, -2.102181315422058e-05, -1.738686114549637e-05, -1.3751909136772156e-05, -1.0116957128047943e-05, -6.4820051193237305e-06, -2.847053110599518e-06, 7.878988981246948e-07, 4.4228509068489075e-06, 8.05780291557312e-06, 1.1692754924297333e-05, 1.5327706933021545e-05, 1.8962658941745758e-05, 2.259761095046997e-05, 2.6232562959194183e-05, 2.9867514967918396e-05, 3.350246697664261e-05, 3.713741898536682e-05, 4.0772370994091034e-05, 4.4407323002815247e-05, 4.804227501153946e-05, 5.167722702026367e-05]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 3.0, 5.0, 12.0, 23.0, 26.0, 37.0, 80.0, 142.0, 299.0, 616.0, 1531.0, 4692.0, 23567.0, 858957.0, 142973.0, 10695.0, 3024.0, 944.0, 447.0, 216.0, 92.0, 54.0, 34.0, 24.0, 13.0, 9.0, 6.0, 9.0, 6.0, 4.0, 2.0, 6.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.483154296875, -0.4651222229003906, -0.44709014892578125, -0.4290580749511719, -0.4110260009765625, -0.3929939270019531, -0.37496185302734375, -0.3569297790527344, -0.338897705078125, -0.3208656311035156, -0.30283355712890625, -0.2848014831542969, -0.2667694091796875, -0.24873733520507812, -0.23070526123046875, -0.21267318725585938, -0.19464111328125, -0.17660903930664062, -0.15857696533203125, -0.14054489135742188, -0.1225128173828125, -0.10448074340820312, -0.08644866943359375, -0.06841659545898438, -0.050384521484375, -0.032352447509765625, -0.01432037353515625, 0.003711700439453125, 0.0217437744140625, 0.039775848388671875, 0.05780792236328125, 0.07583999633789062, 0.0938720703125, 0.11190414428710938, 0.12993621826171875, 0.14796829223632812, 0.1660003662109375, 0.18403244018554688, 0.20206451416015625, 0.22009658813476562, 0.238128662109375, 0.2561607360839844, 0.27419281005859375, 0.2922248840332031, 0.3102569580078125, 0.3282890319824219, 0.34632110595703125, 0.3643531799316406, 0.38238525390625, 0.4004173278808594, 0.41844940185546875, 0.4364814758300781, 0.4545135498046875, 0.4725456237792969, 0.49057769775390625, 0.5086097717285156, 0.526641845703125, 0.5446739196777344, 0.5627059936523438, 0.5807380676269531, 0.5987701416015625, 0.6168022155761719, 0.6348342895507812, 0.6528663635253906, 0.6708984375]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 5.0, 3.0, 1.0, 1.0, 7.0, 5.0, 5.0, 20.0, 13.0, 29.0, 38.0, 57.0, 112.0, 171.0, 228.0, 97.0, 67.0, 51.0, 22.0, 14.0, 15.0, 9.0, 6.0, 4.0, 3.0, 2.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.2041015625, -0.19887542724609375, -0.1936492919921875, -0.18842315673828125, -0.183197021484375, -0.17797088623046875, -0.1727447509765625, -0.16751861572265625, -0.16229248046875, -0.15706634521484375, -0.1518402099609375, -0.14661407470703125, -0.141387939453125, -0.13616180419921875, -0.1309356689453125, -0.12570953369140625, -0.1204833984375, -0.11525726318359375, -0.1100311279296875, -0.10480499267578125, -0.099578857421875, -0.09435272216796875, -0.0891265869140625, -0.08390045166015625, -0.07867431640625, -0.07344818115234375, -0.0682220458984375, -0.06299591064453125, -0.057769775390625, -0.05254364013671875, -0.0473175048828125, -0.04209136962890625, -0.036865234375, -0.03163909912109375, -0.0264129638671875, -0.02118682861328125, -0.015960693359375, -0.01073455810546875, -0.0055084228515625, -0.00028228759765625, 0.00494384765625, 0.01016998291015625, 0.0153961181640625, 0.02062225341796875, 0.025848388671875, 0.03107452392578125, 0.0363006591796875, 0.04152679443359375, 0.0467529296875, 0.05197906494140625, 0.0572052001953125, 0.06243133544921875, 0.067657470703125, 0.07288360595703125, 0.0781097412109375, 0.08333587646484375, 0.08856201171875, 0.09378814697265625, 0.0990142822265625, 0.10424041748046875, 0.109466552734375, 0.11469268798828125, 0.1199188232421875, 0.12514495849609375, 0.13037109375]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 9.0, 16.0, 25.0, 46.0, 101.0, 196.0, 310.0, 149.0, 66.0, 34.0, 24.0, 6.0, 5.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.903681993484497, -2.7609798908233643, -2.6182777881622314, -2.4755756855010986, -2.3328733444213867, -2.190171241760254, -2.047469139099121, -1.9047670364379883, -1.7620649337768555, -1.6193628311157227, -1.4766607284545898, -1.3339585065841675, -1.1912564039230347, -1.0485543012619019, -0.9058521389961243, -0.7631499767303467, -0.6204478740692139, -0.47774574160575867, -0.33504360914230347, -0.19234147667884827, -0.049639344215393066, 0.09306275844573975, 0.23576492071151733, 0.3784670829772949, 0.5211691856384277, 0.6638712882995605, 0.8065734505653381, 0.9492756128311157, 1.0919777154922485, 1.2346798181533813, 1.3773820400238037, 1.5200841426849365, 1.6627860069274902, 1.805488109588623, 1.9481902122497559, 2.0908923149108887, 2.2335944175720215, 2.3762965202331543, 2.518998861312866, 2.661700963973999, 2.804403066635132, 2.9471051692962646, 3.0898072719573975, 3.2325093746185303, 3.375211715698242, 3.517913818359375, 3.660615921020508, 3.8033180236816406, 3.9460201263427734, 4.088722229003906, 4.231424331665039, 4.374126434326172, 4.516828536987305, 4.6595306396484375, 4.80223274230957, 4.944934844970703, 5.087636947631836, 5.230339050292969, 5.373041152954102, 5.515743255615234, 5.658445358276367, 5.8011474609375, 5.943849563598633, 6.086551666259766, 6.229254245758057]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 6.0, 10.0, 6.0, 5.0, 19.0, 17.0, 17.0, 24.0, 33.0, 29.0, 34.0, 51.0, 49.0, 44.0, 60.0, 47.0, 62.0, 52.0, 45.0, 58.0, 40.0, 51.0, 36.0, 42.0, 36.0, 27.0, 26.0, 23.0, 15.0, 15.0, 8.0, 5.0, 4.0, 5.0, 3.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0103719234466553, -2.907381772994995, -2.804391384124756, -2.7014012336730957, -2.5984108448028564, -2.4954206943511963, -2.392430305480957, -2.289440155029297, -2.1864500045776367, -2.0834598541259766, -1.9804694652557373, -1.8774793148040771, -1.7744890451431274, -1.6714987754821777, -1.568508505821228, -1.4655182361602783, -1.3625279664993286, -1.259537696838379, -1.1565474271774292, -1.0535571575164795, -0.9505670070648193, -0.8475767374038696, -0.7445864677429199, -0.641596257686615, -0.5386059880256653, -0.43561574816703796, -0.33262550830841064, -0.22963523864746094, -0.12664499878883362, -0.0236547589302063, 0.07933551073074341, 0.18232572078704834, 0.28531599044799805, 0.38830623030662537, 0.4912964701652527, 0.5942867398262024, 0.6972769498825073, 0.800267219543457, 0.9032574892044067, 1.0062477588653564, 1.1092379093170166, 1.2122281789779663, 1.315218448638916, 1.4182085990905762, 1.5211988687515259, 1.6241891384124756, 1.7271794080734253, 1.830169677734375, 1.9331599473953247, 2.0361502170562744, 2.1391403675079346, 2.242130756378174, 2.345120906829834, 2.448111057281494, 2.5511014461517334, 2.6540915966033936, 2.757081985473633, 2.860072135925293, 2.9630625247955322, 3.0660526752471924, 3.1690430641174316, 3.272033214569092, 3.375023365020752, 3.478013753890991, 3.5810039043426514]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 8.0, 5.0, 3.0, 2.0, 5.0, 9.0, 11.0, 11.0, 9.0, 12.0, 23.0, 34.0, 45.0, 68.0, 98.0, 160.0, 296.0, 461.0, 778.0, 1639.0, 3986.0, 15256.0, 213345.0, 3794245.0, 140270.0, 14421.0, 4736.0, 2041.0, 918.0, 490.0, 292.0, 203.0, 111.0, 88.0, 62.0, 39.0, 40.0, 25.0, 11.0, 8.0, 9.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-3.111328125, -3.0324859619140625, -2.953643798828125, -2.8748016357421875, -2.79595947265625, -2.7171173095703125, -2.638275146484375, -2.5594329833984375, -2.4805908203125, -2.4017486572265625, -2.322906494140625, -2.2440643310546875, -2.16522216796875, -2.0863800048828125, -2.007537841796875, -1.9286956787109375, -1.849853515625, -1.7710113525390625, -1.692169189453125, -1.6133270263671875, -1.53448486328125, -1.4556427001953125, -1.376800537109375, -1.2979583740234375, -1.2191162109375, -1.1402740478515625, -1.061431884765625, -0.9825897216796875, -0.90374755859375, -0.8249053955078125, -0.746063232421875, -0.6672210693359375, -0.58837890625, -0.5095367431640625, -0.430694580078125, -0.3518524169921875, -0.27301025390625, -0.1941680908203125, -0.115325927734375, -0.0364837646484375, 0.0423583984375, 0.1212005615234375, 0.200042724609375, 0.2788848876953125, 0.35772705078125, 0.4365692138671875, 0.515411376953125, 0.5942535400390625, 0.673095703125, 0.7519378662109375, 0.830780029296875, 0.9096221923828125, 0.98846435546875, 1.0673065185546875, 1.146148681640625, 1.2249908447265625, 1.3038330078125, 1.3826751708984375, 1.461517333984375, 1.5403594970703125, 1.61920166015625, 1.6980438232421875, 1.776885986328125, 1.8557281494140625, 1.9345703125]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 2.0, 10.0, 6.0, 14.0, 22.0, 30.0, 42.0, 54.0, 65.0, 95.0, 110.0, 94.0, 93.0, 85.0, 71.0, 61.0, 38.0, 26.0, 26.0, 24.0, 13.0, 5.0, 9.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8837890625, -1.833709716796875, -1.78363037109375, -1.733551025390625, -1.6834716796875, -1.633392333984375, -1.58331298828125, -1.533233642578125, -1.483154296875, -1.433074951171875, -1.38299560546875, -1.332916259765625, -1.2828369140625, -1.232757568359375, -1.18267822265625, -1.132598876953125, -1.08251953125, -1.032440185546875, -0.98236083984375, -0.932281494140625, -0.8822021484375, -0.832122802734375, -0.78204345703125, -0.731964111328125, -0.681884765625, -0.631805419921875, -0.58172607421875, -0.531646728515625, -0.4815673828125, -0.431488037109375, -0.38140869140625, -0.331329345703125, -0.28125, -0.231170654296875, -0.18109130859375, -0.131011962890625, -0.0809326171875, -0.030853271484375, 0.01922607421875, 0.069305419921875, 0.119384765625, 0.169464111328125, 0.21954345703125, 0.269622802734375, 0.3197021484375, 0.369781494140625, 0.41986083984375, 0.469940185546875, 0.52001953125, 0.570098876953125, 0.62017822265625, 0.670257568359375, 0.7203369140625, 0.770416259765625, 0.82049560546875, 0.870574951171875, 0.920654296875, 0.970733642578125, 1.02081298828125, 1.070892333984375, 1.1209716796875, 1.171051025390625, 1.22113037109375, 1.271209716796875, 1.3212890625]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 9.0, 7.0, 5.0, 13.0, 16.0, 18.0, 31.0, 43.0, 55.0, 70.0, 112.0, 193.0, 336.0, 555.0, 1086.0, 2335.0, 5272.0, 15379.0, 82500.0, 3821435.0, 227651.0, 23966.0, 7162.0, 2847.0, 1383.0, 765.0, 379.0, 231.0, 149.0, 88.0, 56.0, 43.0, 22.0, 17.0, 12.0, 15.0, 7.0, 7.0, 5.0, 4.0, 2.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.923828125, -1.861083984375, -1.79833984375, -1.735595703125, -1.6728515625, -1.610107421875, -1.54736328125, -1.484619140625, -1.421875, -1.359130859375, -1.29638671875, -1.233642578125, -1.1708984375, -1.108154296875, -1.04541015625, -0.982666015625, -0.919921875, -0.857177734375, -0.79443359375, -0.731689453125, -0.6689453125, -0.606201171875, -0.54345703125, -0.480712890625, -0.41796875, -0.355224609375, -0.29248046875, -0.229736328125, -0.1669921875, -0.104248046875, -0.04150390625, 0.021240234375, 0.083984375, 0.146728515625, 0.20947265625, 0.272216796875, 0.3349609375, 0.397705078125, 0.46044921875, 0.523193359375, 0.5859375, 0.648681640625, 0.71142578125, 0.774169921875, 0.8369140625, 0.899658203125, 0.96240234375, 1.025146484375, 1.087890625, 1.150634765625, 1.21337890625, 1.276123046875, 1.3388671875, 1.401611328125, 1.46435546875, 1.527099609375, 1.58984375, 1.652587890625, 1.71533203125, 1.778076171875, 1.8408203125, 1.903564453125, 1.96630859375, 2.029052734375, 2.091796875]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 7.0, 3.0, 3.0, 10.0, 5.0, 8.0, 17.0, 12.0, 18.0, 29.0, 36.0, 83.0, 191.0, 476.0, 1287.0, 1072.0, 434.0, 161.0, 70.0, 43.0, 24.0, 17.0, 16.0, 10.0, 7.0, 4.0, 6.0, 4.0, 2.0, 2.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.61767578125, -0.5994491577148438, -0.5812225341796875, -0.5629959106445312, -0.544769287109375, -0.5265426635742188, -0.5083160400390625, -0.49008941650390625, -0.47186279296875, -0.45363616943359375, -0.4354095458984375, -0.41718292236328125, -0.398956298828125, -0.38072967529296875, -0.3625030517578125, -0.34427642822265625, -0.3260498046875, -0.30782318115234375, -0.2895965576171875, -0.27136993408203125, -0.253143310546875, -0.23491668701171875, -0.2166900634765625, -0.19846343994140625, -0.18023681640625, -0.16201019287109375, -0.1437835693359375, -0.12555694580078125, -0.107330322265625, -0.08910369873046875, -0.0708770751953125, -0.05265045166015625, -0.034423828125, -0.01619720458984375, 0.0020294189453125, 0.02025604248046875, 0.038482666015625, 0.05670928955078125, 0.0749359130859375, 0.09316253662109375, 0.11138916015625, 0.12961578369140625, 0.1478424072265625, 0.16606903076171875, 0.184295654296875, 0.20252227783203125, 0.2207489013671875, 0.23897552490234375, 0.2572021484375, 0.27542877197265625, 0.2936553955078125, 0.31188201904296875, 0.330108642578125, 0.34833526611328125, 0.3665618896484375, 0.38478851318359375, 0.40301513671875, 0.42124176025390625, 0.4394683837890625, 0.45769500732421875, 0.475921630859375, 0.49414825439453125, 0.5123748779296875, 0.5306015014648438, 0.548828125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 7.0, 4.0, 2.0, 1.0, 4.0, 5.0, 8.0, 19.0, 17.0, 52.0, 51.0, 103.0, 130.0, 176.0, 158.0, 100.0, 59.0, 34.0, 29.0, 16.0, 8.0, 7.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7705849409103394, -1.701843023300171, -1.6331011056900024, -1.564359188079834, -1.495617151260376, -1.4268752336502075, -1.358133316040039, -1.2893913984298706, -1.2206494808197021, -1.1519075632095337, -1.0831656455993652, -1.0144236087799072, -0.9456816911697388, -0.8769397735595703, -0.8081978559494019, -0.7394559383392334, -0.6707139015197754, -0.6019719839096069, -0.5332300066947937, -0.46448808908462524, -0.3957461416721344, -0.32700419425964355, -0.2582622766494751, -0.18952032923698425, -0.12077838182449341, -0.05203644186258316, 0.016705498099327087, 0.08544743061065674, 0.15418937802314758, 0.22293132543563843, 0.2916732430458069, 0.36041519045829773, 0.4291572570800781, 0.49789920449256897, 0.5666411519050598, 0.6353830695152283, 0.7041250467300415, 0.77286696434021, 0.8416088819503784, 0.9103507995605469, 0.9790927767753601, 1.0478347539901733, 1.1165766716003418, 1.1853185892105103, 1.2540605068206787, 1.3228025436401367, 1.3915443420410156, 1.4602863788604736, 1.529028296470642, 1.5977702140808105, 1.666512131690979, 1.7352540493011475, 1.8039960861206055, 1.872738003730774, 1.9414799213409424, 2.0102219581604004, 2.0789637565612793, 2.1477057933807373, 2.216447591781616, 2.285189628601074, 2.353931427001953, 2.422673463821411, 2.491415500640869, 2.560157299041748, 2.628899335861206]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 4.0, 3.0, 9.0, 1.0, 12.0, 13.0, 20.0, 22.0, 30.0, 42.0, 36.0, 41.0, 52.0, 69.0, 67.0, 65.0, 61.0, 55.0, 57.0, 61.0, 41.0, 53.0, 32.0, 43.0, 24.0, 27.0, 23.0, 9.0, 16.0, 12.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4072253704071045, -1.364511489868164, -1.3217976093292236, -1.2790837287902832, -1.2363698482513428, -1.1936559677124023, -1.150942087173462, -1.1082282066345215, -1.065514326095581, -1.0228004455566406, -0.9800865650177002, -0.9373726844787598, -0.8946588039398193, -0.8519449234008789, -0.8092310428619385, -0.766517162322998, -0.7238032817840576, -0.6810894012451172, -0.6383755207061768, -0.5956616401672363, -0.5529477596282959, -0.5102338790893555, -0.46751999855041504, -0.4248061180114746, -0.3820922374725342, -0.33937835693359375, -0.2966644763946533, -0.2539505958557129, -0.21123671531677246, -0.16852283477783203, -0.1258089542388916, -0.08309507369995117, -0.04038119316101074, 0.0023326873779296875, 0.04504656791687012, 0.08776044845581055, 0.13047432899475098, 0.1731882095336914, 0.21590209007263184, 0.25861597061157227, 0.3013298511505127, 0.3440437316894531, 0.38675761222839355, 0.429471492767334, 0.4721853733062744, 0.5148992538452148, 0.5576131343841553, 0.6003270149230957, 0.6430408954620361, 0.6857547760009766, 0.728468656539917, 0.7711825370788574, 0.8138964176177979, 0.8566102981567383, 0.8993241786956787, 0.9420380592346191, 0.9847519397735596, 1.0274658203125, 1.0701797008514404, 1.1128935813903809, 1.1556074619293213, 1.1983213424682617, 1.2410352230072021, 1.2837491035461426, 1.326462984085083]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [4.0, 3.0, 0.0, 3.0, 1.0, 1.0, 5.0, 3.0, 3.0, 5.0, 2.0, 4.0, 13.0, 17.0, 23.0, 56.0, 82.0, 151.0, 290.0, 519.0, 1208.0, 3037.0, 9980.0, 69193.0, 847330.0, 98462.0, 12087.0, 3389.0, 1388.0, 643.0, 299.0, 150.0, 65.0, 40.0, 36.0, 33.0, 11.0, 13.0, 6.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45068359375, -0.43233489990234375, -0.4139862060546875, -0.39563751220703125, -0.377288818359375, -0.35894012451171875, -0.3405914306640625, -0.32224273681640625, -0.30389404296875, -0.28554534912109375, -0.2671966552734375, -0.24884796142578125, -0.230499267578125, -0.21215057373046875, -0.1938018798828125, -0.17545318603515625, -0.1571044921875, -0.13875579833984375, -0.1204071044921875, -0.10205841064453125, -0.083709716796875, -0.06536102294921875, -0.0470123291015625, -0.02866363525390625, -0.01031494140625, 0.00803375244140625, 0.0263824462890625, 0.04473114013671875, 0.063079833984375, 0.08142852783203125, 0.0997772216796875, 0.11812591552734375, 0.136474609375, 0.15482330322265625, 0.1731719970703125, 0.19152069091796875, 0.209869384765625, 0.22821807861328125, 0.2465667724609375, 0.26491546630859375, 0.28326416015625, 0.30161285400390625, 0.3199615478515625, 0.33831024169921875, 0.356658935546875, 0.37500762939453125, 0.3933563232421875, 0.41170501708984375, 0.4300537109375, 0.44840240478515625, 0.4667510986328125, 0.48509979248046875, 0.503448486328125, 0.5217971801757812, 0.5401458740234375, 0.5584945678710938, 0.57684326171875, 0.5951919555664062, 0.6135406494140625, 0.6318893432617188, 0.650238037109375, 0.6685867309570312, 0.6869354248046875, 0.7052841186523438, 0.7236328125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 6.0, 4.0, 2.0, 4.0, 8.0, 11.0, 16.0, 23.0, 43.0, 51.0, 48.0, 73.0, 87.0, 105.0, 103.0, 87.0, 80.0, 73.0, 50.0, 42.0, 28.0, 24.0, 23.0, 14.0, 8.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.6376953125, -1.5970611572265625, -1.556427001953125, -1.5157928466796875, -1.47515869140625, -1.4345245361328125, -1.393890380859375, -1.3532562255859375, -1.3126220703125, -1.2719879150390625, -1.231353759765625, -1.1907196044921875, -1.15008544921875, -1.1094512939453125, -1.068817138671875, -1.0281829833984375, -0.987548828125, -0.9469146728515625, -0.906280517578125, -0.8656463623046875, -0.82501220703125, -0.7843780517578125, -0.743743896484375, -0.7031097412109375, -0.6624755859375, -0.6218414306640625, -0.581207275390625, -0.5405731201171875, -0.49993896484375, -0.4593048095703125, -0.418670654296875, -0.3780364990234375, -0.33740234375, -0.2967681884765625, -0.256134033203125, -0.2154998779296875, -0.17486572265625, -0.1342315673828125, -0.093597412109375, -0.0529632568359375, -0.0123291015625, 0.0283050537109375, 0.068939208984375, 0.1095733642578125, 0.15020751953125, 0.1908416748046875, 0.231475830078125, 0.2721099853515625, 0.312744140625, 0.3533782958984375, 0.394012451171875, 0.4346466064453125, 0.47528076171875, 0.5159149169921875, 0.556549072265625, 0.5971832275390625, 0.6378173828125, 0.6784515380859375, 0.719085693359375, 0.7597198486328125, 0.80035400390625, 0.8409881591796875, 0.881622314453125, 0.9222564697265625, 0.962890625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 3.0, 5.0, 7.0, 5.0, 5.0, 8.0, 20.0, 22.0, 27.0, 56.0, 73.0, 144.0, 220.0, 299.0, 552.0, 942.0, 1705.0, 3222.0, 7259.0, 21659.0, 112437.0, 694756.0, 161212.0, 27231.0, 8364.0, 3823.0, 1815.0, 1053.0, 620.0, 343.0, 217.0, 149.0, 98.0, 64.0, 42.0, 23.0, 24.0, 14.0, 13.0, 6.0, 3.0, 2.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.281982421875, -0.2727622985839844, -0.26354217529296875, -0.2543220520019531, -0.2451019287109375, -0.23588180541992188, -0.22666168212890625, -0.21744155883789062, -0.208221435546875, -0.19900131225585938, -0.18978118896484375, -0.18056106567382812, -0.1713409423828125, -0.16212081909179688, -0.15290069580078125, -0.14368057250976562, -0.13446044921875, -0.12524032592773438, -0.11602020263671875, -0.10680007934570312, -0.0975799560546875, -0.08835983276367188, -0.07913970947265625, -0.06991958618164062, -0.060699462890625, -0.051479339599609375, -0.04225921630859375, -0.033039093017578125, -0.0238189697265625, -0.014598846435546875, -0.00537872314453125, 0.003841400146484375, 0.0130615234375, 0.022281646728515625, 0.03150177001953125, 0.040721893310546875, 0.0499420166015625, 0.059162139892578125, 0.06838226318359375, 0.07760238647460938, 0.086822509765625, 0.09604263305664062, 0.10526275634765625, 0.11448287963867188, 0.1237030029296875, 0.13292312622070312, 0.14214324951171875, 0.15136337280273438, 0.16058349609375, 0.16980361938476562, 0.17902374267578125, 0.18824386596679688, 0.1974639892578125, 0.20668411254882812, 0.21590423583984375, 0.22512435913085938, 0.234344482421875, 0.24356460571289062, 0.25278472900390625, 0.2620048522949219, 0.2712249755859375, 0.2804450988769531, 0.28966522216796875, 0.2988853454589844, 0.30810546875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 1.0, 6.0, 3.0, 10.0, 4.0, 11.0, 7.0, 10.0, 14.0, 15.0, 29.0, 18.0, 25.0, 31.0, 38.0, 34.0, 35.0, 52.0, 40.0, 46.0, 56.0, 38.0, 49.0, 35.0, 47.0, 40.0, 38.0, 48.0, 30.0, 29.0, 30.0, 19.0, 23.0, 20.0, 9.0, 8.0, 7.0, 10.0, 12.0, 3.0, 9.0, 6.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0634765625, -1.0264739990234375, -0.989471435546875, -0.9524688720703125, -0.91546630859375, -0.8784637451171875, -0.841461181640625, -0.8044586181640625, -0.7674560546875, -0.7304534912109375, -0.693450927734375, -0.6564483642578125, -0.61944580078125, -0.5824432373046875, -0.545440673828125, -0.5084381103515625, -0.471435546875, -0.4344329833984375, -0.397430419921875, -0.3604278564453125, -0.32342529296875, -0.2864227294921875, -0.249420166015625, -0.2124176025390625, -0.1754150390625, -0.1384124755859375, -0.101409912109375, -0.0644073486328125, -0.02740478515625, 0.0095977783203125, 0.046600341796875, 0.0836029052734375, 0.12060546875, 0.1576080322265625, 0.194610595703125, 0.2316131591796875, 0.26861572265625, 0.3056182861328125, 0.342620849609375, 0.3796234130859375, 0.4166259765625, 0.4536285400390625, 0.490631103515625, 0.5276336669921875, 0.56463623046875, 0.6016387939453125, 0.638641357421875, 0.6756439208984375, 0.712646484375, 0.7496490478515625, 0.786651611328125, 0.8236541748046875, 0.86065673828125, 0.8976593017578125, 0.934661865234375, 0.9716644287109375, 1.0086669921875, 1.0456695556640625, 1.082672119140625, 1.1196746826171875, 1.15667724609375, 1.1936798095703125, 1.230682373046875, 1.2676849365234375, 1.3046875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 5.0, 10.0, 13.0, 15.0, 23.0, 31.0, 71.0, 130.0, 241.0, 640.0, 1949.0, 8591.0, 86737.0, 883729.0, 56718.0, 6816.0, 1680.0, 605.0, 234.0, 116.0, 77.0, 38.0, 39.0, 16.0, 12.0, 7.0, 2.0, 3.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13232421875, -0.1275005340576172, -0.12267684936523438, -0.11785316467285156, -0.11302947998046875, -0.10820579528808594, -0.10338211059570312, -0.09855842590332031, -0.0937347412109375, -0.08891105651855469, -0.08408737182617188, -0.07926368713378906, -0.07444000244140625, -0.06961631774902344, -0.06479263305664062, -0.05996894836425781, -0.055145263671875, -0.05032157897949219, -0.045497894287109375, -0.04067420959472656, -0.03585052490234375, -0.031026840209960938, -0.026203155517578125, -0.021379470825195312, -0.0165557861328125, -0.011732101440429688, -0.006908416748046875, -0.0020847320556640625, 0.00273895263671875, 0.0075626373291015625, 0.012386322021484375, 0.017210006713867188, 0.02203369140625, 0.026857376098632812, 0.031681060791015625, 0.03650474548339844, 0.04132843017578125, 0.04615211486816406, 0.050975799560546875, 0.05579948425292969, 0.0606231689453125, 0.06544685363769531, 0.07027053833007812, 0.07509422302246094, 0.07991790771484375, 0.08474159240722656, 0.08956527709960938, 0.09438896179199219, 0.099212646484375, 0.10403633117675781, 0.10886001586914062, 0.11368370056152344, 0.11850738525390625, 0.12333106994628906, 0.12815475463867188, 0.1329784393310547, 0.1378021240234375, 0.1426258087158203, 0.14744949340820312, 0.15227317810058594, 0.15709686279296875, 0.16192054748535156, 0.16674423217773438, 0.1715679168701172, 0.1763916015625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 5.0, 5.0, 5.0, 9.0, 9.0, 32.0, 57.0, 148.0, 276.0, 254.0, 115.0, 41.0, 12.0, 13.0, 10.0, 6.0, 1.0, 2.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011628866195678711, -0.00011304859071969986, -0.00010980851948261261, -0.00010656844824552536, -0.00010332837700843811, -0.00010008830577135086, -9.684823453426361e-05, -9.360816329717636e-05, -9.036809206008911e-05, -8.712802082300186e-05, -8.388794958591461e-05, -8.064787834882736e-05, -7.740780711174011e-05, -7.416773587465286e-05, -7.092766463756561e-05, -6.768759340047836e-05, -6.444752216339111e-05, -6.120745092630386e-05, -5.7967379689216614e-05, -5.4727308452129364e-05, -5.1487237215042114e-05, -4.8247165977954865e-05, -4.5007094740867615e-05, -4.1767023503780365e-05, -3.8526952266693115e-05, -3.5286881029605865e-05, -3.2046809792518616e-05, -2.8806738555431366e-05, -2.5566667318344116e-05, -2.2326596081256866e-05, -1.9086524844169617e-05, -1.5846453607082367e-05, -1.2606382369995117e-05, -9.366311132907867e-06, -6.126239895820618e-06, -2.886168658733368e-06, 3.5390257835388184e-07, 3.5939738154411316e-06, 6.834045052528381e-06, 1.0074116289615631e-05, 1.3314187526702881e-05, 1.655425876379013e-05, 1.979433000087738e-05, 2.303440123796463e-05, 2.627447247505188e-05, 2.951454371213913e-05, 3.275461494922638e-05, 3.599468618631363e-05, 3.923475742340088e-05, 4.247482866048813e-05, 4.571489989757538e-05, 4.895497113466263e-05, 5.219504237174988e-05, 5.543511360883713e-05, 5.867518484592438e-05, 6.191525608301163e-05, 6.515532732009888e-05, 6.839539855718613e-05, 7.163546979427338e-05, 7.487554103136063e-05, 7.811561226844788e-05, 8.135568350553513e-05, 8.459575474262238e-05, 8.783582597970963e-05, 9.107589721679688e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 0.0, 3.0, 7.0, 4.0, 8.0, 8.0, 8.0, 13.0, 18.0, 35.0, 40.0, 52.0, 74.0, 107.0, 169.0, 240.0, 379.0, 580.0, 980.0, 1519.0, 2935.0, 5630.0, 13212.0, 41811.0, 213342.0, 585486.0, 130760.0, 29874.0, 10464.0, 4631.0, 2353.0, 1390.0, 813.0, 537.0, 345.0, 209.0, 138.0, 112.0, 78.0, 44.0, 44.0, 28.0, 19.0, 10.0, 23.0, 6.0, 5.0, 3.0, 5.0, 5.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.07244873046875, -0.07021045684814453, -0.06797218322753906, -0.0657339096069336, -0.06349563598632812, -0.061257362365722656, -0.05901908874511719, -0.05678081512451172, -0.05454254150390625, -0.05230426788330078, -0.05006599426269531, -0.047827720642089844, -0.045589447021484375, -0.043351173400878906, -0.04111289978027344, -0.03887462615966797, -0.0366363525390625, -0.03439807891845703, -0.03215980529785156, -0.029921531677246094, -0.027683258056640625, -0.025444984436035156, -0.023206710815429688, -0.02096843719482422, -0.01873016357421875, -0.01649188995361328, -0.014253616333007812, -0.012015342712402344, -0.009777069091796875, -0.007538795471191406, -0.0053005218505859375, -0.0030622482299804688, -0.000823974609375, 0.0014142990112304688, 0.0036525726318359375, 0.005890846252441406, 0.008129119873046875, 0.010367393493652344, 0.012605667114257812, 0.014843940734863281, 0.01708221435546875, 0.01932048797607422, 0.021558761596679688, 0.023797035217285156, 0.026035308837890625, 0.028273582458496094, 0.030511856079101562, 0.03275012969970703, 0.0349884033203125, 0.03722667694091797, 0.03946495056152344, 0.041703224182128906, 0.043941497802734375, 0.046179771423339844, 0.04841804504394531, 0.05065631866455078, 0.05289459228515625, 0.05513286590576172, 0.05737113952636719, 0.059609413146972656, 0.061847686767578125, 0.0640859603881836, 0.06632423400878906, 0.06856250762939453, 0.07080078125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 6.0, 9.0, 9.0, 18.0, 14.0, 26.0, 41.0, 51.0, 94.0, 117.0, 140.0, 123.0, 89.0, 77.0, 56.0, 43.0, 25.0, 17.0, 10.0, 8.0, 5.0, 4.0, 2.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.024139404296875, -0.02335071563720703, -0.022562026977539062, -0.021773338317871094, -0.020984649658203125, -0.020195960998535156, -0.019407272338867188, -0.01861858367919922, -0.01782989501953125, -0.01704120635986328, -0.016252517700195312, -0.015463829040527344, -0.014675140380859375, -0.013886451721191406, -0.013097763061523438, -0.012309074401855469, -0.0115203857421875, -0.010731697082519531, -0.009943008422851562, -0.009154319763183594, -0.008365631103515625, -0.007576942443847656, -0.0067882537841796875, -0.005999565124511719, -0.00521087646484375, -0.004422187805175781, -0.0036334991455078125, -0.0028448104858398438, -0.002056121826171875, -0.0012674331665039062, -0.0004787445068359375, 0.00030994415283203125, 0.0010986328125, 0.0018873214721679688, 0.0026760101318359375, 0.0034646987915039062, 0.004253387451171875, 0.005042076110839844, 0.0058307647705078125, 0.006619453430175781, 0.00740814208984375, 0.008196830749511719, 0.008985519409179688, 0.009774208068847656, 0.010562896728515625, 0.011351585388183594, 0.012140274047851562, 0.012928962707519531, 0.0137176513671875, 0.014506340026855469, 0.015295028686523438, 0.016083717346191406, 0.016872406005859375, 0.017661094665527344, 0.018449783325195312, 0.01923847198486328, 0.02002716064453125, 0.02081584930419922, 0.021604537963867188, 0.022393226623535156, 0.023181915283203125, 0.023970603942871094, 0.024759292602539062, 0.02554798126220703, 0.026336669921875]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 6.0, 4.0, 16.0, 50.0, 109.0, 299.0, 309.0, 125.0, 47.0, 13.0, 13.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.703280448913574, -3.613175392150879, -3.5230703353881836, -3.4329652786254883, -3.342860221862793, -3.2527554035186768, -3.1626503467559814, -3.072545289993286, -2.982440233230591, -2.8923351764678955, -2.8022301197052, -2.712125062942505, -2.6220202445983887, -2.5319151878356934, -2.441810131072998, -2.3517050743103027, -2.2616000175476074, -2.171494960784912, -2.081389904022217, -1.991284966468811, -1.9011799097061157, -1.8110748529434204, -1.7209699153900146, -1.6308648586273193, -1.540759801864624, -1.4506547451019287, -1.3605496883392334, -1.2704447507858276, -1.1803396940231323, -1.090234637260437, -1.0001296997070312, -0.9100246429443359, -0.8199193477630615, -0.7298142910003662, -0.6397092938423157, -0.5496042966842651, -0.4594992399215698, -0.3693942129611969, -0.279289186000824, -0.18918418884277344, -0.09907913208007812, -0.0089741051197052, 0.08113092184066772, 0.17123594880104065, 0.2613409757614136, 0.3514460027217865, 0.4415510296821594, 0.53165602684021, 0.6217610836029053, 0.7118661403656006, 0.8019711375236511, 0.8920761346817017, 0.982181191444397, 1.0722862482070923, 1.162391185760498, 1.2524962425231934, 1.3426012992858887, 1.432706356048584, 1.5228114128112793, 1.612916350364685, 1.7030214071273804, 1.7931264638900757, 1.8832314014434814, 1.9733364582061768, 2.063441514968872]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 7.0, 6.0, 17.0, 19.0, 26.0, 41.0, 52.0, 55.0, 64.0, 102.0, 96.0, 78.0, 81.0, 78.0, 66.0, 55.0, 41.0, 36.0, 29.0, 23.0, 16.0, 9.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.436684250831604, -1.4001200199127197, -1.3635557889938354, -1.3269915580749512, -1.2904272079467773, -1.253862977027893, -1.2172987461090088, -1.1807345151901245, -1.1441702842712402, -1.107606053352356, -1.0710418224334717, -1.0344775915145874, -0.9979133009910583, -0.9613490700721741, -0.924784779548645, -0.8882205486297607, -0.8516563177108765, -0.8150920867919922, -0.7785278558731079, -0.7419635653495789, -0.7053993344306946, -0.6688351035118103, -0.6322708129882812, -0.595706582069397, -0.5591423511505127, -0.5225781202316284, -0.48601385951042175, -0.4494495987892151, -0.4128853678703308, -0.37632113695144653, -0.33975687623023987, -0.3031926155090332, -0.2666285037994385, -0.230064257979393, -0.19350001215934753, -0.15693576633930206, -0.12037152051925659, -0.08380727469921112, -0.04724302887916565, -0.010678768157958984, 0.025885462760925293, 0.062449708580970764, 0.09901395440101624, 0.1355782002210617, 0.17214244604110718, 0.20870669186115265, 0.24527093768119812, 0.2818351984024048, 0.31839942932128906, 0.35496366024017334, 0.39152792096138, 0.42809218168258667, 0.46465641260147095, 0.5012206435203552, 0.5377849340438843, 0.5743491649627686, 0.6109133958816528, 0.6474776268005371, 0.6840418577194214, 0.7206061482429504, 0.7571703791618347, 0.793734610080719, 0.830298900604248, 0.8668631315231323, 0.9034273624420166]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 3.0, 5.0, 17.0, 21.0, 32.0, 36.0, 54.0, 101.0, 137.0, 227.0, 414.0, 719.0, 1419.0, 3575.0, 9913.0, 41643.0, 758965.0, 196415.0, 23149.0, 6718.0, 2482.0, 1082.0, 561.0, 301.0, 207.0, 113.0, 83.0, 50.0, 34.0, 22.0, 11.0, 13.0, 5.0, 8.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.802734375, -0.7775039672851562, -0.7522735595703125, -0.7270431518554688, -0.701812744140625, -0.6765823364257812, -0.6513519287109375, -0.6261215209960938, -0.60089111328125, -0.5756607055664062, -0.5504302978515625, -0.5251998901367188, -0.499969482421875, -0.47473907470703125, -0.4495086669921875, -0.42427825927734375, -0.3990478515625, -0.37381744384765625, -0.3485870361328125, -0.32335662841796875, -0.298126220703125, -0.27289581298828125, -0.2476654052734375, -0.22243499755859375, -0.19720458984375, -0.17197418212890625, -0.1467437744140625, -0.12151336669921875, -0.096282958984375, -0.07105255126953125, -0.0458221435546875, -0.02059173583984375, 0.004638671875, 0.02986907958984375, 0.0550994873046875, 0.08032989501953125, 0.105560302734375, 0.13079071044921875, 0.1560211181640625, 0.18125152587890625, 0.20648193359375, 0.23171234130859375, 0.2569427490234375, 0.28217315673828125, 0.307403564453125, 0.33263397216796875, 0.3578643798828125, 0.38309478759765625, 0.4083251953125, 0.43355560302734375, 0.4587860107421875, 0.48401641845703125, 0.509246826171875, 0.5344772338867188, 0.5597076416015625, 0.5849380493164062, 0.61016845703125, 0.6353988647460938, 0.6606292724609375, 0.6858596801757812, 0.711090087890625, 0.7363204956054688, 0.7615509033203125, 0.7867813110351562, 0.81201171875]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 6.0, 5.0, 6.0, 5.0, 8.0, 24.0, 19.0, 29.0, 31.0, 44.0, 46.0, 61.0, 80.0, 81.0, 87.0, 72.0, 76.0, 68.0, 52.0, 48.0, 32.0, 24.0, 26.0, 25.0, 14.0, 16.0, 10.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.048828125, -1.984466552734375, -1.92010498046875, -1.855743408203125, -1.7913818359375, -1.727020263671875, -1.66265869140625, -1.598297119140625, -1.533935546875, -1.469573974609375, -1.40521240234375, -1.340850830078125, -1.2764892578125, -1.212127685546875, -1.14776611328125, -1.083404541015625, -1.01904296875, -0.954681396484375, -0.89031982421875, -0.825958251953125, -0.7615966796875, -0.697235107421875, -0.63287353515625, -0.568511962890625, -0.504150390625, -0.439788818359375, -0.37542724609375, -0.311065673828125, -0.2467041015625, -0.182342529296875, -0.11798095703125, -0.053619384765625, 0.0107421875, 0.075103759765625, 0.13946533203125, 0.203826904296875, 0.2681884765625, 0.332550048828125, 0.39691162109375, 0.461273193359375, 0.525634765625, 0.589996337890625, 0.65435791015625, 0.718719482421875, 0.7830810546875, 0.847442626953125, 0.91180419921875, 0.976165771484375, 1.04052734375, 1.104888916015625, 1.16925048828125, 1.233612060546875, 1.2979736328125, 1.362335205078125, 1.42669677734375, 1.491058349609375, 1.555419921875, 1.619781494140625, 1.68414306640625, 1.748504638671875, 1.8128662109375, 1.877227783203125, 1.94158935546875, 2.005950927734375, 2.0703125]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 4.0, 4.0, 8.0, 7.0, 10.0, 16.0, 24.0, 30.0, 31.0, 46.0, 54.0, 77.0, 237.0, 1648.0, 75516.0, 966168.0, 3843.0, 398.0, 126.0, 81.0, 49.0, 37.0, 35.0, 26.0, 19.0, 14.0, 22.0, 10.0, 3.0, 5.0, 7.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.87890625, -1.8011474609375, -1.723388671875, -1.6456298828125, -1.56787109375, -1.4901123046875, -1.412353515625, -1.3345947265625, -1.2568359375, -1.1790771484375, -1.101318359375, -1.0235595703125, -0.94580078125, -0.8680419921875, -0.790283203125, -0.7125244140625, -0.634765625, -0.5570068359375, -0.479248046875, -0.4014892578125, -0.32373046875, -0.2459716796875, -0.168212890625, -0.0904541015625, -0.0126953125, 0.0650634765625, 0.142822265625, 0.2205810546875, 0.29833984375, 0.3760986328125, 0.453857421875, 0.5316162109375, 0.609375, 0.6871337890625, 0.764892578125, 0.8426513671875, 0.92041015625, 0.9981689453125, 1.075927734375, 1.1536865234375, 1.2314453125, 1.3092041015625, 1.386962890625, 1.4647216796875, 1.54248046875, 1.6202392578125, 1.697998046875, 1.7757568359375, 1.853515625, 1.9312744140625, 2.009033203125, 2.0867919921875, 2.16455078125, 2.2423095703125, 2.320068359375, 2.3978271484375, 2.4755859375, 2.5533447265625, 2.631103515625, 2.7088623046875, 2.78662109375, 2.8643798828125, 2.942138671875, 3.0198974609375, 3.09765625]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 5.0, 2.0, 6.0, 8.0, 7.0, 14.0, 16.0, 27.0, 29.0, 32.0, 53.0, 41.0, 58.0, 49.0, 50.0, 57.0, 72.0, 65.0, 48.0, 78.0, 52.0, 42.0, 36.0, 32.0, 24.0, 25.0, 21.0, 17.0, 9.0, 11.0, 7.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.404296875, -1.34649658203125, -1.2886962890625, -1.23089599609375, -1.173095703125, -1.11529541015625, -1.0574951171875, -0.99969482421875, -0.94189453125, -0.88409423828125, -0.8262939453125, -0.76849365234375, -0.710693359375, -0.65289306640625, -0.5950927734375, -0.53729248046875, -0.4794921875, -0.42169189453125, -0.3638916015625, -0.30609130859375, -0.248291015625, -0.19049072265625, -0.1326904296875, -0.07489013671875, -0.01708984375, 0.04071044921875, 0.0985107421875, 0.15631103515625, 0.214111328125, 0.27191162109375, 0.3297119140625, 0.38751220703125, 0.4453125, 0.50311279296875, 0.5609130859375, 0.61871337890625, 0.676513671875, 0.73431396484375, 0.7921142578125, 0.84991455078125, 0.90771484375, 0.96551513671875, 1.0233154296875, 1.08111572265625, 1.138916015625, 1.19671630859375, 1.2545166015625, 1.31231689453125, 1.3701171875, 1.42791748046875, 1.4857177734375, 1.54351806640625, 1.601318359375, 1.65911865234375, 1.7169189453125, 1.77471923828125, 1.83251953125, 1.89031982421875, 1.9481201171875, 2.00592041015625, 2.063720703125, 2.12152099609375, 2.1793212890625, 2.23712158203125, 2.294921875]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 7.0, 2.0, 5.0, 4.0, 6.0, 14.0, 11.0, 17.0, 25.0, 41.0, 65.0, 108.0, 184.0, 371.0, 775.0, 1686.0, 4969.0, 26331.0, 921795.0, 79576.0, 7987.0, 2447.0, 1020.0, 491.0, 241.0, 141.0, 79.0, 43.0, 32.0, 21.0, 24.0, 7.0, 10.0, 4.0, 11.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 1.0], "bins": [-0.55810546875, -0.5432968139648438, -0.5284881591796875, -0.5136795043945312, -0.498870849609375, -0.48406219482421875, -0.4692535400390625, -0.45444488525390625, -0.43963623046875, -0.42482757568359375, -0.4100189208984375, -0.39521026611328125, -0.380401611328125, -0.36559295654296875, -0.3507843017578125, -0.33597564697265625, -0.3211669921875, -0.30635833740234375, -0.2915496826171875, -0.27674102783203125, -0.261932373046875, -0.24712371826171875, -0.2323150634765625, -0.21750640869140625, -0.20269775390625, -0.18788909912109375, -0.1730804443359375, -0.15827178955078125, -0.143463134765625, -0.12865447998046875, -0.1138458251953125, -0.09903717041015625, -0.084228515625, -0.06941986083984375, -0.0546112060546875, -0.03980255126953125, -0.024993896484375, -0.01018524169921875, 0.0046234130859375, 0.01943206787109375, 0.03424072265625, 0.04904937744140625, 0.0638580322265625, 0.07866668701171875, 0.093475341796875, 0.10828399658203125, 0.1230926513671875, 0.13790130615234375, 0.1527099609375, 0.16751861572265625, 0.1823272705078125, 0.19713592529296875, 0.211944580078125, 0.22675323486328125, 0.2415618896484375, 0.25637054443359375, 0.27117919921875, 0.28598785400390625, 0.3007965087890625, 0.31560516357421875, 0.330413818359375, 0.34522247314453125, 0.3600311279296875, 0.37483978271484375, 0.3896484375]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 7.0, 6.0, 5.0, 11.0, 21.0, 24.0, 45.0, 96.0, 381.0, 216.0, 83.0, 38.0, 24.0, 17.0, 15.0, 3.0, 1.0, 3.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.599592208862305e-05, -7.368717342615128e-05, -7.13784247636795e-05, -6.906967610120773e-05, -6.676092743873596e-05, -6.445217877626419e-05, -6.214343011379242e-05, -5.983468145132065e-05, -5.752593278884888e-05, -5.5217184126377106e-05, -5.2908435463905334e-05, -5.059968680143356e-05, -4.829093813896179e-05, -4.598218947649002e-05, -4.367344081401825e-05, -4.136469215154648e-05, -3.905594348907471e-05, -3.6747194826602936e-05, -3.4438446164131165e-05, -3.212969750165939e-05, -2.9820948839187622e-05, -2.751220017671585e-05, -2.520345151424408e-05, -2.289470285177231e-05, -2.0585954189300537e-05, -1.8277205526828766e-05, -1.5968456864356995e-05, -1.3659708201885223e-05, -1.1350959539413452e-05, -9.042210876941681e-06, -6.73346221446991e-06, -4.4247135519981384e-06, -2.115964889526367e-06, 1.9278377294540405e-07, 2.5015324354171753e-06, 4.8102810978889465e-06, 7.119029760360718e-06, 9.427778422832489e-06, 1.173652708530426e-05, 1.4045275747776031e-05, 1.6354024410247803e-05, 1.8662773072719574e-05, 2.0971521735191345e-05, 2.3280270397663116e-05, 2.5589019060134888e-05, 2.789776772260666e-05, 3.020651638507843e-05, 3.25152650475502e-05, 3.482401371002197e-05, 3.7132762372493744e-05, 3.9441511034965515e-05, 4.1750259697437286e-05, 4.405900835990906e-05, 4.636775702238083e-05, 4.86765056848526e-05, 5.098525434732437e-05, 5.329400300979614e-05, 5.5602751672267914e-05, 5.7911500334739685e-05, 6.0220248997211456e-05, 6.252899765968323e-05, 6.4837746322155e-05, 6.714649498462677e-05, 6.945524364709854e-05, 7.176399230957031e-05]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 4.0, 7.0, 10.0, 11.0, 19.0, 21.0, 35.0, 42.0, 78.0, 98.0, 145.0, 222.0, 385.0, 721.0, 1488.0, 4754.0, 26597.0, 925338.0, 76092.0, 8075.0, 2232.0, 906.0, 491.0, 249.0, 180.0, 110.0, 80.0, 49.0, 35.0, 29.0, 18.0, 8.0, 7.0, 7.0, 3.0, 1.0, 4.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.438232421875, -0.4211692810058594, -0.40410614013671875, -0.3870429992675781, -0.3699798583984375, -0.3529167175292969, -0.33585357666015625, -0.3187904357910156, -0.301727294921875, -0.2846641540527344, -0.26760101318359375, -0.2505378723144531, -0.2334747314453125, -0.21641159057617188, -0.19934844970703125, -0.18228530883789062, -0.16522216796875, -0.14815902709960938, -0.13109588623046875, -0.11403274536132812, -0.0969696044921875, -0.07990646362304688, -0.06284332275390625, -0.045780181884765625, -0.028717041015625, -0.011653900146484375, 0.00540924072265625, 0.022472381591796875, 0.0395355224609375, 0.056598663330078125, 0.07366180419921875, 0.09072494506835938, 0.1077880859375, 0.12485122680664062, 0.14191436767578125, 0.15897750854492188, 0.1760406494140625, 0.19310379028320312, 0.21016693115234375, 0.22723007202148438, 0.244293212890625, 0.2613563537597656, 0.27841949462890625, 0.2954826354980469, 0.3125457763671875, 0.3296089172363281, 0.34667205810546875, 0.3637351989746094, 0.38079833984375, 0.3978614807128906, 0.41492462158203125, 0.4319877624511719, 0.4490509033203125, 0.4661140441894531, 0.48317718505859375, 0.5002403259277344, 0.517303466796875, 0.5343666076660156, 0.5514297485351562, 0.5684928894042969, 0.5855560302734375, 0.6026191711425781, 0.6196823120117188, 0.6367454528808594, 0.65380859375]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 3.0, 6.0, 5.0, 18.0, 31.0, 50.0, 137.0, 531.0, 109.0, 40.0, 32.0, 11.0, 7.0, 12.0, 6.0, 4.0, 4.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.333251953125, -0.3245868682861328, -0.3159217834472656, -0.30725669860839844, -0.29859161376953125, -0.28992652893066406, -0.2812614440917969, -0.2725963592529297, -0.2639312744140625, -0.2552661895751953, -0.24660110473632812, -0.23793601989746094, -0.22927093505859375, -0.22060585021972656, -0.21194076538085938, -0.2032756805419922, -0.194610595703125, -0.1859455108642578, -0.17728042602539062, -0.16861534118652344, -0.15995025634765625, -0.15128517150878906, -0.14262008666992188, -0.1339550018310547, -0.1252899169921875, -0.11662483215332031, -0.10795974731445312, -0.09929466247558594, -0.09062957763671875, -0.08196449279785156, -0.07329940795898438, -0.06463432312011719, -0.05596923828125, -0.04730415344238281, -0.038639068603515625, -0.029973983764648438, -0.02130889892578125, -0.012643814086914062, -0.003978729248046875, 0.0046863555908203125, 0.0133514404296875, 0.022016525268554688, 0.030681610107421875, 0.03934669494628906, 0.04801177978515625, 0.05667686462402344, 0.06534194946289062, 0.07400703430175781, 0.082672119140625, 0.09133720397949219, 0.10000228881835938, 0.10866737365722656, 0.11733245849609375, 0.12599754333496094, 0.13466262817382812, 0.1433277130126953, 0.1519927978515625, 0.1606578826904297, 0.16932296752929688, 0.17798805236816406, 0.18665313720703125, 0.19531822204589844, 0.20398330688476562, 0.2126483917236328, 0.2213134765625]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 7.0, 10.0, 16.0, 42.0, 108.0, 314.0, 312.0, 121.0, 42.0, 18.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-9.555488586425781, -9.352388381958008, -9.149288177490234, -8.946187019348145, -8.743086814880371, -8.539986610412598, -8.336885452270508, -8.133785247802734, -7.930685043334961, -7.7275848388671875, -7.524484157562256, -7.321383476257324, -7.118283271789551, -6.915183067321777, -6.712082386016846, -6.508981704711914, -6.305881500244141, -6.102781295776367, -5.8996806144714355, -5.696579933166504, -5.4934797286987305, -5.290379524230957, -5.087278842926025, -4.884178161621094, -4.68107795715332, -4.477977752685547, -4.274877071380615, -4.071776390075684, -3.86867618560791, -3.6655757427215576, -3.462475299835205, -3.2593748569488525, -3.056274890899658, -2.8531744480133057, -2.650074005126953, -2.4469735622406006, -2.243873119354248, -2.0407726764678955, -1.837672233581543, -1.6345717906951904, -1.431471347808838, -1.2283709049224854, -1.0252704620361328, -0.8221700191497803, -0.6190695762634277, -0.4159691333770752, -0.21286869049072266, -0.009768247604370117, 0.19333219528198242, 0.39643263816833496, 0.5995330810546875, 0.80263352394104, 1.0057339668273926, 1.2088344097137451, 1.4119348526000977, 1.6150352954864502, 1.8181357383728027, 2.0212361812591553, 2.224336624145508, 2.4274370670318604, 2.630537509918213, 2.8336379528045654, 3.036738395690918, 3.2398388385772705, 3.442939281463623]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 4.0, 12.0, 3.0, 7.0, 7.0, 19.0, 9.0, 16.0, 18.0, 24.0, 27.0, 26.0, 31.0, 32.0, 21.0, 41.0, 36.0, 47.0, 41.0, 54.0, 34.0, 40.0, 47.0, 43.0, 40.0, 32.0, 39.0, 37.0, 27.0, 27.0, 19.0, 19.0, 22.0, 12.0, 20.0, 13.0, 7.0, 8.0, 9.0, 8.0, 6.0, 3.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.3098936080932617, -2.2411890029907227, -2.1724843978881836, -2.1037797927856445, -2.0350751876831055, -1.9663704633712769, -1.8976657390594482, -1.8289611339569092, -1.7602565288543701, -1.691551923751831, -1.622847318649292, -1.5541425943374634, -1.4854379892349243, -1.4167333841323853, -1.3480286598205566, -1.2793240547180176, -1.2106194496154785, -1.1419148445129395, -1.0732102394104004, -1.0045055150985718, -0.9358009099960327, -0.8670963048934937, -0.7983916401863098, -0.729686975479126, -0.6609823703765869, -0.5922777652740479, -0.523573100566864, -0.45486846566200256, -0.3861638307571411, -0.31745919585227966, -0.2487545609474182, -0.18004992604255676, -0.11134552955627441, -0.042640894651412964, 0.026063740253448486, 0.09476837515830994, 0.1634730100631714, 0.23217764496803284, 0.3008822798728943, 0.36958691477775574, 0.4382915496826172, 0.5069961547851562, 0.5757008194923401, 0.6444054841995239, 0.713110089302063, 0.781814694404602, 0.8505193591117859, 0.9192240238189697, 0.9879286289215088, 1.0566332340240479, 1.125337839126587, 1.1940425634384155, 1.2627471685409546, 1.3314517736434937, 1.4001564979553223, 1.4688611030578613, 1.5375657081604004, 1.6062703132629395, 1.6749749183654785, 1.7436796426773071, 1.8123842477798462, 1.8810888528823853, 1.9497935771942139, 2.018498182296753, 2.087202787399292]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 6.0, 2.0, 0.0, 9.0, 7.0, 8.0, 10.0, 17.0, 38.0, 48.0, 69.0, 119.0, 167.0, 263.0, 523.0, 918.0, 2076.0, 6992.0, 67754.0, 3995969.0, 105785.0, 8640.0, 2476.0, 1033.0, 532.0, 309.0, 178.0, 103.0, 76.0, 52.0, 29.0, 23.0, 21.0, 10.0, 2.0, 7.0, 4.0, 4.0, 7.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.35546875, -3.255462646484375, -3.15545654296875, -3.055450439453125, -2.9554443359375, -2.855438232421875, -2.75543212890625, -2.655426025390625, -2.555419921875, -2.455413818359375, -2.35540771484375, -2.255401611328125, -2.1553955078125, -2.055389404296875, -1.95538330078125, -1.855377197265625, -1.75537109375, -1.655364990234375, -1.55535888671875, -1.455352783203125, -1.3553466796875, -1.255340576171875, -1.15533447265625, -1.055328369140625, -0.955322265625, -0.855316162109375, -0.75531005859375, -0.655303955078125, -0.5552978515625, -0.455291748046875, -0.35528564453125, -0.255279541015625, -0.1552734375, -0.055267333984375, 0.04473876953125, 0.144744873046875, 0.2447509765625, 0.344757080078125, 0.44476318359375, 0.544769287109375, 0.644775390625, 0.744781494140625, 0.84478759765625, 0.944793701171875, 1.0447998046875, 1.144805908203125, 1.24481201171875, 1.344818115234375, 1.44482421875, 1.544830322265625, 1.64483642578125, 1.744842529296875, 1.8448486328125, 1.944854736328125, 2.04486083984375, 2.144866943359375, 2.244873046875, 2.344879150390625, 2.44488525390625, 2.544891357421875, 2.6448974609375, 2.744903564453125, 2.84490966796875, 2.944915771484375, 3.044921875]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 4.0, 11.0, 3.0, 6.0, 12.0, 17.0, 29.0, 30.0, 48.0, 47.0, 57.0, 77.0, 92.0, 98.0, 76.0, 95.0, 66.0, 50.0, 39.0, 38.0, 38.0, 22.0, 24.0, 9.0, 8.0, 5.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2275390625, -1.1889190673828125, -1.150299072265625, -1.1116790771484375, -1.07305908203125, -1.0344390869140625, -0.995819091796875, -0.9571990966796875, -0.9185791015625, -0.8799591064453125, -0.841339111328125, -0.8027191162109375, -0.76409912109375, -0.7254791259765625, -0.686859130859375, -0.6482391357421875, -0.609619140625, -0.5709991455078125, -0.532379150390625, -0.4937591552734375, -0.45513916015625, -0.4165191650390625, -0.377899169921875, -0.3392791748046875, -0.3006591796875, -0.2620391845703125, -0.223419189453125, -0.1847991943359375, -0.14617919921875, -0.1075592041015625, -0.068939208984375, -0.0303192138671875, 0.00830078125, 0.0469207763671875, 0.085540771484375, 0.1241607666015625, 0.16278076171875, 0.2014007568359375, 0.240020751953125, 0.2786407470703125, 0.3172607421875, 0.3558807373046875, 0.394500732421875, 0.4331207275390625, 0.47174072265625, 0.5103607177734375, 0.548980712890625, 0.5876007080078125, 0.626220703125, 0.6648406982421875, 0.703460693359375, 0.7420806884765625, 0.78070068359375, 0.8193206787109375, 0.857940673828125, 0.8965606689453125, 0.9351806640625, 0.9738006591796875, 1.012420654296875, 1.0510406494140625, 1.08966064453125, 1.1282806396484375, 1.166900634765625, 1.2055206298828125, 1.244140625]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 9.0, 7.0, 6.0, 12.0, 9.0, 24.0, 41.0, 66.0, 145.0, 261.0, 585.0, 1511.0, 4606.0, 22111.0, 741533.0, 3382705.0, 31462.0, 6049.0, 1757.0, 732.0, 311.0, 151.0, 70.0, 49.0, 23.0, 21.0, 8.0, 5.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.16015625, -3.074951171875, -2.98974609375, -2.904541015625, -2.8193359375, -2.734130859375, -2.64892578125, -2.563720703125, -2.478515625, -2.393310546875, -2.30810546875, -2.222900390625, -2.1376953125, -2.052490234375, -1.96728515625, -1.882080078125, -1.796875, -1.711669921875, -1.62646484375, -1.541259765625, -1.4560546875, -1.370849609375, -1.28564453125, -1.200439453125, -1.115234375, -1.030029296875, -0.94482421875, -0.859619140625, -0.7744140625, -0.689208984375, -0.60400390625, -0.518798828125, -0.43359375, -0.348388671875, -0.26318359375, -0.177978515625, -0.0927734375, -0.007568359375, 0.07763671875, 0.162841796875, 0.248046875, 0.333251953125, 0.41845703125, 0.503662109375, 0.5888671875, 0.674072265625, 0.75927734375, 0.844482421875, 0.9296875, 1.014892578125, 1.10009765625, 1.185302734375, 1.2705078125, 1.355712890625, 1.44091796875, 1.526123046875, 1.611328125, 1.696533203125, 1.78173828125, 1.866943359375, 1.9521484375, 2.037353515625, 2.12255859375, 2.207763671875, 2.29296875]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 2.0, 2.0, 2.0, 8.0, 8.0, 12.0, 9.0, 19.0, 24.0, 25.0, 60.0, 122.0, 305.0, 953.0, 1550.0, 536.0, 207.0, 86.0, 43.0, 31.0, 19.0, 17.0, 7.0, 9.0, 5.0, 4.0, 4.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5546875, -0.5350570678710938, -0.5154266357421875, -0.49579620361328125, -0.476165771484375, -0.45653533935546875, -0.4369049072265625, -0.41727447509765625, -0.39764404296875, -0.37801361083984375, -0.3583831787109375, -0.33875274658203125, -0.319122314453125, -0.29949188232421875, -0.2798614501953125, -0.26023101806640625, -0.2406005859375, -0.22097015380859375, -0.2013397216796875, -0.18170928955078125, -0.162078857421875, -0.14244842529296875, -0.1228179931640625, -0.10318756103515625, -0.08355712890625, -0.06392669677734375, -0.0442962646484375, -0.02466583251953125, -0.005035400390625, 0.01459503173828125, 0.0342254638671875, 0.05385589599609375, 0.073486328125, 0.09311676025390625, 0.1127471923828125, 0.13237762451171875, 0.152008056640625, 0.17163848876953125, 0.1912689208984375, 0.21089935302734375, 0.23052978515625, 0.25016021728515625, 0.2697906494140625, 0.28942108154296875, 0.309051513671875, 0.32868194580078125, 0.3483123779296875, 0.36794281005859375, 0.3875732421875, 0.40720367431640625, 0.4268341064453125, 0.44646453857421875, 0.466094970703125, 0.48572540283203125, 0.5053558349609375, 0.5249862670898438, 0.54461669921875, 0.5642471313476562, 0.5838775634765625, 0.6035079956054688, 0.623138427734375, 0.6427688598632812, 0.6623992919921875, 0.6820297241210938, 0.70166015625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 8.0, 4.0, 10.0, 19.0, 32.0, 47.0, 89.0, 143.0, 198.0, 194.0, 97.0, 59.0, 38.0, 23.0, 15.0, 15.0, 3.0, 7.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3228342533111572, -3.2410762310028076, -3.159317970275879, -3.0775599479675293, -2.9958016872406006, -2.914043664932251, -2.8322854042053223, -2.7505273818969727, -2.668769359588623, -2.5870113372802734, -2.5052530765533447, -2.423495054244995, -2.3417367935180664, -2.259978771209717, -2.178220748901367, -2.0964624881744385, -2.0147042274475098, -1.9329460859298706, -1.8511879444122314, -1.7694299221038818, -1.6876717805862427, -1.6059136390686035, -1.5241554975509644, -1.4423973560333252, -1.3606393337249756, -1.2788811922073364, -1.1971230506896973, -1.1153650283813477, -1.0336068868637085, -0.9518487453460693, -0.8700906038284302, -0.7883325219154358, -0.7065744400024414, -0.6248162984848022, -0.5430582165718079, -0.4613000750541687, -0.37954196333885193, -0.29778385162353516, -0.216025710105896, -0.1342676281929016, -0.05250948667526245, 0.029248632490634918, 0.11100675165653229, 0.19276487827301025, 0.274522989988327, 0.3562811017036438, 0.43803924322128296, 0.5197973251342773, 0.6015554666519165, 0.6833136081695557, 0.76507169008255, 0.8468298316001892, 0.9285879135131836, 1.0103460550308228, 1.092104196548462, 1.1738622188568115, 1.2556204795837402, 1.3373786211013794, 1.4191367626190186, 1.5008947849273682, 1.5826529264450073, 1.6644110679626465, 1.7461692094802856, 1.8279273509979248, 1.9096853733062744]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 6.0, 3.0, 7.0, 3.0, 11.0, 15.0, 15.0, 15.0, 28.0, 29.0, 27.0, 41.0, 29.0, 49.0, 56.0, 60.0, 44.0, 53.0, 50.0, 53.0, 61.0, 48.0, 46.0, 45.0, 38.0, 34.0, 32.0, 22.0, 15.0, 14.0, 13.0, 8.0, 12.0, 11.0, 4.0, 3.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0057085752487183, -0.9715639352798462, -0.9374192357063293, -0.9032745957374573, -0.8691298961639404, -0.8349852561950684, -0.8008406162261963, -0.7666959762573242, -0.7325512766838074, -0.6984066367149353, -0.6642619371414185, -0.6301172971725464, -0.5959726572036743, -0.5618279576301575, -0.5276833176612854, -0.49353864789009094, -0.4593939781188965, -0.425249308347702, -0.39110463857650757, -0.3569599986076355, -0.32281532883644104, -0.2886706590652466, -0.2545260190963745, -0.22038134932518005, -0.1862366795539856, -0.15209200978279114, -0.11794735491275787, -0.08380269259214401, -0.04965803027153015, -0.015513360500335693, 0.01863129436969757, 0.052775949239730835, 0.08692061901092529, 0.12106528133153915, 0.15520994365215302, 0.18935459852218628, 0.22349926829338074, 0.2576439380645752, 0.29178857803344727, 0.3259332478046417, 0.3600779175758362, 0.39422258734703064, 0.4283672571182251, 0.46251189708709717, 0.4966565668582916, 0.5308012366294861, 0.5649458765983582, 0.599090576171875, 0.6332352161407471, 0.6673798561096191, 0.701524555683136, 0.7356691956520081, 0.7698138952255249, 0.803958535194397, 0.838103175163269, 0.8722478151321411, 0.906392514705658, 0.94053715467453, 0.9746818542480469, 1.008826494216919, 1.042971134185791, 1.077115774154663, 1.1112605333328247, 1.1454051733016968, 1.1795498132705688]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 2.0, 6.0, 1.0, 8.0, 8.0, 18.0, 27.0, 38.0, 51.0, 125.0, 188.0, 320.0, 610.0, 1244.0, 2685.0, 7043.0, 25783.0, 331371.0, 629034.0, 35328.0, 8512.0, 3169.0, 1397.0, 681.0, 358.0, 229.0, 115.0, 68.0, 50.0, 24.0, 23.0, 16.0, 7.0, 6.0, 7.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7705078125, -0.747222900390625, -0.72393798828125, -0.700653076171875, -0.6773681640625, -0.654083251953125, -0.63079833984375, -0.607513427734375, -0.584228515625, -0.560943603515625, -0.53765869140625, -0.514373779296875, -0.4910888671875, -0.467803955078125, -0.44451904296875, -0.421234130859375, -0.39794921875, -0.374664306640625, -0.35137939453125, -0.328094482421875, -0.3048095703125, -0.281524658203125, -0.25823974609375, -0.234954833984375, -0.211669921875, -0.188385009765625, -0.16510009765625, -0.141815185546875, -0.1185302734375, -0.095245361328125, -0.07196044921875, -0.048675537109375, -0.025390625, -0.002105712890625, 0.02117919921875, 0.044464111328125, 0.0677490234375, 0.091033935546875, 0.11431884765625, 0.137603759765625, 0.160888671875, 0.184173583984375, 0.20745849609375, 0.230743408203125, 0.2540283203125, 0.277313232421875, 0.30059814453125, 0.323883056640625, 0.34716796875, 0.370452880859375, 0.39373779296875, 0.417022705078125, 0.4403076171875, 0.463592529296875, 0.48687744140625, 0.510162353515625, 0.533447265625, 0.556732177734375, 0.58001708984375, 0.603302001953125, 0.6265869140625, 0.649871826171875, 0.67315673828125, 0.696441650390625, 0.7197265625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 6.0, 6.0, 7.0, 11.0, 13.0, 11.0, 27.0, 27.0, 45.0, 40.0, 36.0, 69.0, 75.0, 69.0, 69.0, 65.0, 72.0, 61.0, 62.0, 56.0, 47.0, 32.0, 25.0, 15.0, 10.0, 17.0, 14.0, 9.0, 5.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0458984375, -1.0159378051757812, -0.9859771728515625, -0.9560165405273438, -0.926055908203125, -0.8960952758789062, -0.8661346435546875, -0.8361740112304688, -0.80621337890625, -0.7762527465820312, -0.7462921142578125, -0.7163314819335938, -0.686370849609375, -0.6564102172851562, -0.6264495849609375, -0.5964889526367188, -0.5665283203125, -0.5365676879882812, -0.5066070556640625, -0.47664642333984375, -0.446685791015625, -0.41672515869140625, -0.3867645263671875, -0.35680389404296875, -0.32684326171875, -0.29688262939453125, -0.2669219970703125, -0.23696136474609375, -0.207000732421875, -0.17704010009765625, -0.1470794677734375, -0.11711883544921875, -0.087158203125, -0.05719757080078125, -0.0272369384765625, 0.00272369384765625, 0.032684326171875, 0.06264495849609375, 0.0926055908203125, 0.12256622314453125, 0.15252685546875, 0.18248748779296875, 0.2124481201171875, 0.24240875244140625, 0.272369384765625, 0.30233001708984375, 0.3322906494140625, 0.36225128173828125, 0.3922119140625, 0.42217254638671875, 0.4521331787109375, 0.48209381103515625, 0.512054443359375, 0.5420150756835938, 0.5719757080078125, 0.6019363403320312, 0.63189697265625, 0.6618576049804688, 0.6918182373046875, 0.7217788696289062, 0.751739501953125, 0.7817001342773438, 0.8116607666015625, 0.8416213989257812, 0.87158203125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 1.0, 6.0, 4.0, 7.0, 6.0, 4.0, 10.0, 13.0, 26.0, 29.0, 46.0, 78.0, 130.0, 210.0, 355.0, 686.0, 1357.0, 3040.0, 7381.0, 23880.0, 174959.0, 726814.0, 83043.0, 16053.0, 5517.0, 2391.0, 1089.0, 612.0, 326.0, 157.0, 97.0, 66.0, 42.0, 23.0, 29.0, 9.0, 17.0, 8.0, 5.0, 5.0, 3.0, 4.0, 3.0, 4.0, 3.0, 1.0, 1.0, 4.0, 3.0, 0.0, 1.0], "bins": [-0.46728515625, -0.45368194580078125, -0.4400787353515625, -0.42647552490234375, -0.412872314453125, -0.39926910400390625, -0.3856658935546875, -0.37206268310546875, -0.35845947265625, -0.34485626220703125, -0.3312530517578125, -0.31764984130859375, -0.304046630859375, -0.29044342041015625, -0.2768402099609375, -0.26323699951171875, -0.2496337890625, -0.23603057861328125, -0.2224273681640625, -0.20882415771484375, -0.195220947265625, -0.18161773681640625, -0.1680145263671875, -0.15441131591796875, -0.14080810546875, -0.12720489501953125, -0.1136016845703125, -0.09999847412109375, -0.086395263671875, -0.07279205322265625, -0.0591888427734375, -0.04558563232421875, -0.031982421875, -0.01837921142578125, -0.0047760009765625, 0.00882720947265625, 0.022430419921875, 0.03603363037109375, 0.0496368408203125, 0.06324005126953125, 0.07684326171875, 0.09044647216796875, 0.1040496826171875, 0.11765289306640625, 0.131256103515625, 0.14485931396484375, 0.1584625244140625, 0.17206573486328125, 0.1856689453125, 0.19927215576171875, 0.2128753662109375, 0.22647857666015625, 0.240081787109375, 0.25368499755859375, 0.2672882080078125, 0.28089141845703125, 0.29449462890625, 0.30809783935546875, 0.3217010498046875, 0.33530426025390625, 0.348907470703125, 0.36251068115234375, 0.3761138916015625, 0.38971710205078125, 0.4033203125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 10.0, 6.0, 7.0, 7.0, 10.0, 8.0, 19.0, 24.0, 20.0, 18.0, 32.0, 29.0, 29.0, 37.0, 44.0, 47.0, 44.0, 39.0, 46.0, 46.0, 58.0, 34.0, 42.0, 45.0, 27.0, 49.0, 46.0, 27.0, 30.0, 26.0, 24.0, 13.0, 13.0, 8.0, 12.0, 9.0, 8.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.212890625, -1.1720123291015625, -1.131134033203125, -1.0902557373046875, -1.04937744140625, -1.0084991455078125, -0.967620849609375, -0.9267425537109375, -0.8858642578125, -0.8449859619140625, -0.804107666015625, -0.7632293701171875, -0.72235107421875, -0.6814727783203125, -0.640594482421875, -0.5997161865234375, -0.558837890625, -0.5179595947265625, -0.477081298828125, -0.4362030029296875, -0.39532470703125, -0.3544464111328125, -0.313568115234375, -0.2726898193359375, -0.2318115234375, -0.1909332275390625, -0.150054931640625, -0.1091766357421875, -0.06829833984375, -0.0274200439453125, 0.013458251953125, 0.0543365478515625, 0.09521484375, 0.1360931396484375, 0.176971435546875, 0.2178497314453125, 0.25872802734375, 0.2996063232421875, 0.340484619140625, 0.3813629150390625, 0.4222412109375, 0.4631195068359375, 0.503997802734375, 0.5448760986328125, 0.58575439453125, 0.6266326904296875, 0.667510986328125, 0.7083892822265625, 0.749267578125, 0.7901458740234375, 0.831024169921875, 0.8719024658203125, 0.91278076171875, 0.9536590576171875, 0.994537353515625, 1.0354156494140625, 1.0762939453125, 1.1171722412109375, 1.158050537109375, 1.1989288330078125, 1.23980712890625, 1.2806854248046875, 1.321563720703125, 1.3624420166015625, 1.4033203125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 5.0, 3.0, 7.0, 10.0, 8.0, 14.0, 18.0, 41.0, 43.0, 78.0, 94.0, 165.0, 232.0, 332.0, 567.0, 945.0, 1649.0, 3130.0, 6716.0, 19275.0, 84589.0, 621443.0, 248304.0, 39653.0, 11095.0, 4596.0, 2179.0, 1256.0, 768.0, 430.0, 314.0, 197.0, 106.0, 88.0, 61.0, 47.0, 30.0, 22.0, 12.0, 12.0, 10.0, 5.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07757568359375, -0.07505416870117188, -0.07253265380859375, -0.07001113891601562, -0.0674896240234375, -0.06496810913085938, -0.06244659423828125, -0.059925079345703125, -0.057403564453125, -0.054882049560546875, -0.05236053466796875, -0.049839019775390625, -0.0473175048828125, -0.044795989990234375, -0.04227447509765625, -0.039752960205078125, -0.0372314453125, -0.034709930419921875, -0.03218841552734375, -0.029666900634765625, -0.0271453857421875, -0.024623870849609375, -0.02210235595703125, -0.019580841064453125, -0.017059326171875, -0.014537811279296875, -0.01201629638671875, -0.009494781494140625, -0.0069732666015625, -0.004451751708984375, -0.00193023681640625, 0.000591278076171875, 0.00311279296875, 0.005634307861328125, 0.00815582275390625, 0.010677337646484375, 0.0131988525390625, 0.015720367431640625, 0.01824188232421875, 0.020763397216796875, 0.023284912109375, 0.025806427001953125, 0.02832794189453125, 0.030849456787109375, 0.0333709716796875, 0.035892486572265625, 0.03841400146484375, 0.040935516357421875, 0.04345703125, 0.045978546142578125, 0.04850006103515625, 0.051021575927734375, 0.0535430908203125, 0.056064605712890625, 0.05858612060546875, 0.061107635498046875, 0.063629150390625, 0.06615066528320312, 0.06867218017578125, 0.07119369506835938, 0.0737152099609375, 0.07623672485351562, 0.07875823974609375, 0.08127975463867188, 0.08380126953125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 3.0, 2.0, 3.0, 8.0, 5.0, 7.0, 20.0, 33.0, 54.0, 79.0, 107.0, 198.0, 174.0, 126.0, 62.0, 35.0, 30.0, 13.0, 11.0, 13.0, 4.0, 7.0, 1.0, 4.0, 0.0, 4.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.97834587097168e-05, -5.797017365694046e-05, -5.6156888604164124e-05, -5.434360355138779e-05, -5.253031849861145e-05, -5.0717033445835114e-05, -4.890374839305878e-05, -4.709046334028244e-05, -4.5277178287506104e-05, -4.346389323472977e-05, -4.165060818195343e-05, -3.9837323129177094e-05, -3.802403807640076e-05, -3.621075302362442e-05, -3.4397467970848083e-05, -3.258418291807175e-05, -3.077089786529541e-05, -2.8957612812519073e-05, -2.7144327759742737e-05, -2.53310427069664e-05, -2.3517757654190063e-05, -2.1704472601413727e-05, -1.989118754863739e-05, -1.8077902495861053e-05, -1.6264617443084717e-05, -1.445133239030838e-05, -1.2638047337532043e-05, -1.0824762284755707e-05, -9.01147723197937e-06, -7.1981921792030334e-06, -5.384907126426697e-06, -3.57162207365036e-06, -1.7583370208740234e-06, 5.494803190231323e-08, 1.86823308467865e-06, 3.6815181374549866e-06, 5.494803190231323e-06, 7.30808824300766e-06, 9.121373295783997e-06, 1.0934658348560333e-05, 1.274794340133667e-05, 1.4561228454113007e-05, 1.6374513506889343e-05, 1.818779855966568e-05, 2.0001083612442017e-05, 2.1814368665218353e-05, 2.362765371799469e-05, 2.5440938770771027e-05, 2.7254223823547363e-05, 2.90675088763237e-05, 3.088079392910004e-05, 3.269407898187637e-05, 3.450736403465271e-05, 3.632064908742905e-05, 3.813393414020538e-05, 3.994721919298172e-05, 4.176050424575806e-05, 4.357378929853439e-05, 4.538707435131073e-05, 4.720035940408707e-05, 4.90136444568634e-05, 5.082692950963974e-05, 5.264021456241608e-05, 5.445349961519241e-05, 5.626678466796875e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 8.0, 10.0, 13.0, 15.0, 29.0, 25.0, 33.0, 55.0, 92.0, 151.0, 218.0, 341.0, 528.0, 986.0, 1756.0, 3372.0, 6967.0, 16221.0, 44395.0, 156668.0, 530194.0, 198350.0, 53153.0, 18460.0, 7972.0, 3808.0, 1944.0, 1099.0, 610.0, 373.0, 232.0, 152.0, 98.0, 70.0, 53.0, 28.0, 23.0, 16.0, 4.0, 7.0, 6.0, 5.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.07537841796875, -0.07325983047485352, -0.07114124298095703, -0.06902265548706055, -0.06690406799316406, -0.06478548049926758, -0.0626668930053711, -0.06054830551147461, -0.058429718017578125, -0.05631113052368164, -0.054192543029785156, -0.05207395553588867, -0.04995536804199219, -0.0478367805480957, -0.04571819305419922, -0.043599605560302734, -0.04148101806640625, -0.039362430572509766, -0.03724384307861328, -0.0351252555847168, -0.03300666809082031, -0.030888080596923828, -0.028769493103027344, -0.02665090560913086, -0.024532318115234375, -0.02241373062133789, -0.020295143127441406, -0.018176555633544922, -0.016057968139648438, -0.013939380645751953, -0.011820793151855469, -0.009702205657958984, -0.0075836181640625, -0.005465030670166016, -0.0033464431762695312, -0.0012278556823730469, 0.0008907318115234375, 0.003009319305419922, 0.005127906799316406, 0.007246494293212891, 0.009365081787109375, 0.01148366928100586, 0.013602256774902344, 0.015720844268798828, 0.017839431762695312, 0.019958019256591797, 0.02207660675048828, 0.024195194244384766, 0.02631378173828125, 0.028432369232177734, 0.03055095672607422, 0.0326695442199707, 0.03478813171386719, 0.03690671920776367, 0.039025306701660156, 0.04114389419555664, 0.043262481689453125, 0.04538106918334961, 0.047499656677246094, 0.04961824417114258, 0.05173683166503906, 0.05385541915893555, 0.05597400665283203, 0.058092594146728516, 0.060211181640625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 6.0, 6.0, 3.0, 6.0, 16.0, 19.0, 11.0, 18.0, 37.0, 39.0, 44.0, 54.0, 57.0, 88.0, 104.0, 120.0, 75.0, 60.0, 49.0, 30.0, 31.0, 20.0, 21.0, 20.0, 11.0, 7.0, 10.0, 10.0, 8.0, 2.0, 2.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0186614990234375, -0.018013715744018555, -0.01736593246459961, -0.016718149185180664, -0.01607036590576172, -0.015422582626342773, -0.014774799346923828, -0.014127016067504883, -0.013479232788085938, -0.012831449508666992, -0.012183666229248047, -0.011535882949829102, -0.010888099670410156, -0.010240316390991211, -0.009592533111572266, -0.00894474983215332, -0.008296966552734375, -0.00764918327331543, -0.007001399993896484, -0.006353616714477539, -0.005705833435058594, -0.0050580501556396484, -0.004410266876220703, -0.003762483596801758, -0.0031147003173828125, -0.002466917037963867, -0.0018191337585449219, -0.0011713504791259766, -0.0005235671997070312, 0.00012421607971191406, 0.0007719993591308594, 0.0014197826385498047, 0.00206756591796875, 0.0027153491973876953, 0.0033631324768066406, 0.004010915756225586, 0.004658699035644531, 0.0053064823150634766, 0.005954265594482422, 0.006602048873901367, 0.0072498321533203125, 0.007897615432739258, 0.008545398712158203, 0.009193181991577148, 0.009840965270996094, 0.010488748550415039, 0.011136531829833984, 0.01178431510925293, 0.012432098388671875, 0.01307988166809082, 0.013727664947509766, 0.014375448226928711, 0.015023231506347656, 0.0156710147857666, 0.016318798065185547, 0.016966581344604492, 0.017614364624023438, 0.018262147903442383, 0.018909931182861328, 0.019557714462280273, 0.02020549774169922, 0.020853281021118164, 0.02150106430053711, 0.022148847579956055, 0.022796630859375]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 6.0, 8.0, 13.0, 10.0, 27.0, 41.0, 52.0, 81.0, 124.0, 143.0, 146.0, 111.0, 73.0, 49.0, 30.0, 17.0, 19.0, 10.0, 12.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.304758071899414, -1.2662726640701294, -1.2277873754501343, -1.1893019676208496, -1.150816559791565, -1.1123311519622803, -1.0738458633422852, -1.0353604555130005, -0.9968751072883606, -0.9583897590637207, -0.919904351234436, -0.8814190030097961, -0.8429336547851562, -0.8044482469558716, -0.7659628987312317, -0.7274775505065918, -0.6889921426773071, -0.6505067944526672, -0.6120213866233826, -0.5735360383987427, -0.535050630569458, -0.4965652823448181, -0.4580799341201782, -0.41959455609321594, -0.38110917806625366, -0.3426238000392914, -0.3041384220123291, -0.2656530737876892, -0.22716769576072693, -0.18868231773376465, -0.15019695460796356, -0.11171159148216248, -0.07322633266448975, -0.03474096208810806, 0.0037444084882736206, 0.042229779064655304, 0.08071514964103699, 0.11920052766799927, 0.15768589079380035, 0.19617125391960144, 0.23465663194656372, 0.273142009973526, 0.3116273880004883, 0.3501127362251282, 0.38859811425209045, 0.42708349227905273, 0.4655688405036926, 0.5040541887283325, 0.5425395965576172, 0.5810249447822571, 0.6195103526115417, 0.6579957008361816, 0.6964811086654663, 0.7349664568901062, 0.7734518051147461, 0.8119372129440308, 0.8504225611686707, 0.8889079093933105, 0.9273933172225952, 0.9658786654472351, 1.004364013671875, 1.0428494215011597, 1.0813348293304443, 1.1198201179504395, 1.1583055257797241]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 6.0, 10.0, 5.0, 8.0, 19.0, 9.0, 17.0, 28.0, 32.0, 37.0, 44.0, 43.0, 67.0, 67.0, 56.0, 56.0, 63.0, 69.0, 62.0, 45.0, 58.0, 39.0, 39.0, 31.0, 20.0, 9.0, 19.0, 19.0, 8.0, 9.0, 9.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.9158645868301392, -0.8896703720092773, -0.8634761571884155, -0.8372819423675537, -0.8110877275466919, -0.7848935127258301, -0.7586992383003235, -0.7325050234794617, -0.7063108086585999, -0.680116593837738, -0.6539223790168762, -0.6277281641960144, -0.6015338897705078, -0.575339674949646, -0.5491454601287842, -0.5229512453079224, -0.49675703048706055, -0.47056281566619873, -0.4443686008453369, -0.4181743562221527, -0.3919801414012909, -0.3657859265804291, -0.3395916819572449, -0.31339746713638306, -0.28720325231552124, -0.2610090374946594, -0.2348148077726364, -0.2086205780506134, -0.1824263632297516, -0.15623214840888977, -0.13003791868686676, -0.10384368896484375, -0.07764947414398193, -0.05145525187253952, -0.025261029601097107, 0.0009331926703453064, 0.02712741494178772, 0.053321629762649536, 0.07951585948467255, 0.10571008920669556, 0.13190430402755737, 0.1580985188484192, 0.1842927485704422, 0.2104869782924652, 0.23668119311332703, 0.26287540793418884, 0.28906965255737305, 0.31526386737823486, 0.3414580821990967, 0.3676522970199585, 0.3938465118408203, 0.4200407564640045, 0.44623497128486633, 0.47242918610572815, 0.49862343072891235, 0.5248176455497742, 0.551011860370636, 0.5772060751914978, 0.6034002900123596, 0.6295945048332214, 0.655788779258728, 0.6819829940795898, 0.7081772089004517, 0.7343714237213135, 0.7605656385421753]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 11.0, 9.0, 14.0, 17.0, 25.0, 25.0, 48.0, 71.0, 105.0, 158.0, 245.0, 367.0, 578.0, 1086.0, 2016.0, 4324.0, 10959.0, 40761.0, 422892.0, 500046.0, 43922.0, 11549.0, 4357.0, 2091.0, 1102.0, 659.0, 378.0, 236.0, 164.0, 90.0, 71.0, 50.0, 27.0, 30.0, 17.0, 17.0, 12.0, 10.0, 3.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.75732421875, -0.7343902587890625, -0.711456298828125, -0.6885223388671875, -0.66558837890625, -0.6426544189453125, -0.619720458984375, -0.5967864990234375, -0.5738525390625, -0.5509185791015625, -0.527984619140625, -0.5050506591796875, -0.48211669921875, -0.4591827392578125, -0.436248779296875, -0.4133148193359375, -0.390380859375, -0.3674468994140625, -0.344512939453125, -0.3215789794921875, -0.29864501953125, -0.2757110595703125, -0.252777099609375, -0.2298431396484375, -0.2069091796875, -0.1839752197265625, -0.161041259765625, -0.1381072998046875, -0.11517333984375, -0.0922393798828125, -0.069305419921875, -0.0463714599609375, -0.0234375, -0.0005035400390625, 0.022430419921875, 0.0453643798828125, 0.06829833984375, 0.0912322998046875, 0.114166259765625, 0.1371002197265625, 0.1600341796875, 0.1829681396484375, 0.205902099609375, 0.2288360595703125, 0.25177001953125, 0.2747039794921875, 0.297637939453125, 0.3205718994140625, 0.343505859375, 0.3664398193359375, 0.389373779296875, 0.4123077392578125, 0.43524169921875, 0.4581756591796875, 0.481109619140625, 0.5040435791015625, 0.5269775390625, 0.5499114990234375, 0.572845458984375, 0.5957794189453125, 0.61871337890625, 0.6416473388671875, 0.664581298828125, 0.6875152587890625, 0.71044921875]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 7.0, 3.0, 3.0, 10.0, 8.0, 13.0, 12.0, 19.0, 23.0, 26.0, 38.0, 44.0, 38.0, 55.0, 55.0, 56.0, 45.0, 73.0, 81.0, 60.0, 55.0, 49.0, 48.0, 34.0, 31.0, 26.0, 17.0, 20.0, 8.0, 9.0, 12.0, 9.0, 5.0, 6.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-1.6640625, -1.61419677734375, -1.5643310546875, -1.51446533203125, -1.464599609375, -1.41473388671875, -1.3648681640625, -1.31500244140625, -1.26513671875, -1.21527099609375, -1.1654052734375, -1.11553955078125, -1.065673828125, -1.01580810546875, -0.9659423828125, -0.91607666015625, -0.8662109375, -0.81634521484375, -0.7664794921875, -0.71661376953125, -0.666748046875, -0.61688232421875, -0.5670166015625, -0.51715087890625, -0.46728515625, -0.41741943359375, -0.3675537109375, -0.31768798828125, -0.267822265625, -0.21795654296875, -0.1680908203125, -0.11822509765625, -0.068359375, -0.01849365234375, 0.0313720703125, 0.08123779296875, 0.131103515625, 0.18096923828125, 0.2308349609375, 0.28070068359375, 0.33056640625, 0.38043212890625, 0.4302978515625, 0.48016357421875, 0.530029296875, 0.57989501953125, 0.6297607421875, 0.67962646484375, 0.7294921875, 0.77935791015625, 0.8292236328125, 0.87908935546875, 0.928955078125, 0.97882080078125, 1.0286865234375, 1.07855224609375, 1.12841796875, 1.17828369140625, 1.2281494140625, 1.27801513671875, 1.327880859375, 1.37774658203125, 1.4276123046875, 1.47747802734375, 1.52734375]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 6.0, 4.0, 10.0, 11.0, 13.0, 11.0, 16.0, 19.0, 14.0, 21.0, 16.0, 29.0, 45.0, 54.0, 73.0, 175.0, 335.0, 1132.0, 8879.0, 956885.0, 76253.0, 3299.0, 582.0, 237.0, 111.0, 74.0, 34.0, 38.0, 34.0, 25.0, 22.0, 19.0, 10.0, 20.0, 10.0, 7.0, 11.0, 5.0, 5.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.275390625, -2.20147705078125, -2.1275634765625, -2.05364990234375, -1.979736328125, -1.90582275390625, -1.8319091796875, -1.75799560546875, -1.68408203125, -1.61016845703125, -1.5362548828125, -1.46234130859375, -1.388427734375, -1.31451416015625, -1.2406005859375, -1.16668701171875, -1.0927734375, -1.01885986328125, -0.9449462890625, -0.87103271484375, -0.797119140625, -0.72320556640625, -0.6492919921875, -0.57537841796875, -0.50146484375, -0.42755126953125, -0.3536376953125, -0.27972412109375, -0.205810546875, -0.13189697265625, -0.0579833984375, 0.01593017578125, 0.08984375, 0.16375732421875, 0.2376708984375, 0.31158447265625, 0.385498046875, 0.45941162109375, 0.5333251953125, 0.60723876953125, 0.68115234375, 0.75506591796875, 0.8289794921875, 0.90289306640625, 0.976806640625, 1.05072021484375, 1.1246337890625, 1.19854736328125, 1.2724609375, 1.34637451171875, 1.4202880859375, 1.49420166015625, 1.568115234375, 1.64202880859375, 1.7159423828125, 1.78985595703125, 1.86376953125, 1.93768310546875, 2.0115966796875, 2.08551025390625, 2.159423828125, 2.23333740234375, 2.3072509765625, 2.38116455078125, 2.455078125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 2.0, 10.0, 11.0, 8.0, 16.0, 10.0, 9.0, 20.0, 24.0, 24.0, 28.0, 28.0, 31.0, 38.0, 31.0, 36.0, 42.0, 39.0, 35.0, 54.0, 56.0, 45.0, 45.0, 41.0, 38.0, 27.0, 42.0, 29.0, 30.0, 26.0, 23.0, 11.0, 17.0, 15.0, 13.0, 13.0, 9.0, 6.0, 4.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.4541015625, -1.4105987548828125, -1.367095947265625, -1.3235931396484375, -1.28009033203125, -1.2365875244140625, -1.193084716796875, -1.1495819091796875, -1.1060791015625, -1.0625762939453125, -1.019073486328125, -0.9755706787109375, -0.93206787109375, -0.8885650634765625, -0.845062255859375, -0.8015594482421875, -0.758056640625, -0.7145538330078125, -0.671051025390625, -0.6275482177734375, -0.58404541015625, -0.5405426025390625, -0.497039794921875, -0.4535369873046875, -0.4100341796875, -0.3665313720703125, -0.323028564453125, -0.2795257568359375, -0.23602294921875, -0.1925201416015625, -0.149017333984375, -0.1055145263671875, -0.06201171875, -0.0185089111328125, 0.024993896484375, 0.0684967041015625, 0.11199951171875, 0.1555023193359375, 0.199005126953125, 0.2425079345703125, 0.2860107421875, 0.3295135498046875, 0.373016357421875, 0.4165191650390625, 0.46002197265625, 0.5035247802734375, 0.547027587890625, 0.5905303955078125, 0.634033203125, 0.6775360107421875, 0.721038818359375, 0.7645416259765625, 0.80804443359375, 0.8515472412109375, 0.895050048828125, 0.9385528564453125, 0.9820556640625, 1.0255584716796875, 1.069061279296875, 1.1125640869140625, 1.15606689453125, 1.1995697021484375, 1.243072509765625, 1.2865753173828125, 1.330078125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 2.0, 4.0, 5.0, 5.0, 11.0, 10.0, 20.0, 24.0, 46.0, 76.0, 172.0, 364.0, 948.0, 2925.0, 12579.0, 139968.0, 849730.0, 33564.0, 5507.0, 1490.0, 537.0, 253.0, 111.0, 61.0, 39.0, 25.0, 20.0, 16.0, 9.0, 10.0, 4.0, 9.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3818359375, -0.3703498840332031, -0.35886383056640625, -0.3473777770996094, -0.3358917236328125, -0.3244056701660156, -0.31291961669921875, -0.3014335632324219, -0.289947509765625, -0.2784614562988281, -0.26697540283203125, -0.2554893493652344, -0.2440032958984375, -0.23251724243164062, -0.22103118896484375, -0.20954513549804688, -0.19805908203125, -0.18657302856445312, -0.17508697509765625, -0.16360092163085938, -0.1521148681640625, -0.14062881469726562, -0.12914276123046875, -0.11765670776367188, -0.106170654296875, -0.09468460083007812, -0.08319854736328125, -0.07171249389648438, -0.0602264404296875, -0.048740386962890625, -0.03725433349609375, -0.025768280029296875, -0.0142822265625, -0.002796173095703125, 0.00868988037109375, 0.020175933837890625, 0.0316619873046875, 0.043148040771484375, 0.05463409423828125, 0.06612014770507812, 0.077606201171875, 0.08909225463867188, 0.10057830810546875, 0.11206436157226562, 0.1235504150390625, 0.13503646850585938, 0.14652252197265625, 0.15800857543945312, 0.16949462890625, 0.18098068237304688, 0.19246673583984375, 0.20395278930664062, 0.2154388427734375, 0.22692489624023438, 0.23841094970703125, 0.24989700317382812, 0.261383056640625, 0.2728691101074219, 0.28435516357421875, 0.2958412170410156, 0.3073272705078125, 0.3188133239746094, 0.33029937744140625, 0.3417854309082031, 0.353271484375]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 1.0, 6.0, 8.0, 11.0, 18.0, 34.0, 43.0, 91.0, 256.0, 301.0, 91.0, 54.0, 28.0, 13.0, 12.0, 12.0, 8.0, 3.0, 2.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.240606307983398e-05, -6.0395337641239166e-05, -5.838461220264435e-05, -5.637388676404953e-05, -5.436316132545471e-05, -5.2352435886859894e-05, -5.0341710448265076e-05, -4.833098500967026e-05, -4.632025957107544e-05, -4.430953413248062e-05, -4.22988086938858e-05, -4.0288083255290985e-05, -3.827735781669617e-05, -3.626663237810135e-05, -3.425590693950653e-05, -3.224518150091171e-05, -3.0234456062316895e-05, -2.8223730623722076e-05, -2.6213005185127258e-05, -2.420227974653244e-05, -2.2191554307937622e-05, -2.0180828869342804e-05, -1.8170103430747986e-05, -1.6159377992153168e-05, -1.414865255355835e-05, -1.2137927114963531e-05, -1.0127201676368713e-05, -8.116476237773895e-06, -6.105750799179077e-06, -4.095025360584259e-06, -2.084299921989441e-06, -7.35744833946228e-08, 1.9371509552001953e-06, 3.9478763937950134e-06, 5.9586018323898315e-06, 7.96932727098465e-06, 9.980052709579468e-06, 1.1990778148174286e-05, 1.4001503586769104e-05, 1.6012229025363922e-05, 1.802295446395874e-05, 2.003367990255356e-05, 2.2044405341148376e-05, 2.4055130779743195e-05, 2.6065856218338013e-05, 2.807658165693283e-05, 3.008730709552765e-05, 3.209803253412247e-05, 3.4108757972717285e-05, 3.61194834113121e-05, 3.813020884990692e-05, 4.014093428850174e-05, 4.215165972709656e-05, 4.4162385165691376e-05, 4.6173110604286194e-05, 4.818383604288101e-05, 5.019456148147583e-05, 5.220528692007065e-05, 5.4216012358665466e-05, 5.6226737797260284e-05, 5.82374632358551e-05, 6.024818867444992e-05, 6.225891411304474e-05, 6.426963955163956e-05, 6.628036499023438e-05]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 10.0, 7.0, 9.0, 20.0, 22.0, 36.0, 53.0, 60.0, 148.0, 271.0, 562.0, 1355.0, 5568.0, 44041.0, 915266.0, 71124.0, 6955.0, 1655.0, 626.0, 314.0, 177.0, 104.0, 59.0, 37.0, 19.0, 16.0, 11.0, 2.0, 9.0, 7.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.36767578125, -0.35384368896484375, -0.3400115966796875, -0.32617950439453125, -0.312347412109375, -0.29851531982421875, -0.2846832275390625, -0.27085113525390625, -0.25701904296875, -0.24318695068359375, -0.2293548583984375, -0.21552276611328125, -0.201690673828125, -0.18785858154296875, -0.1740264892578125, -0.16019439697265625, -0.1463623046875, -0.13253021240234375, -0.1186981201171875, -0.10486602783203125, -0.091033935546875, -0.07720184326171875, -0.0633697509765625, -0.04953765869140625, -0.03570556640625, -0.02187347412109375, -0.0080413818359375, 0.00579071044921875, 0.019622802734375, 0.03345489501953125, 0.0472869873046875, 0.06111907958984375, 0.074951171875, 0.08878326416015625, 0.1026153564453125, 0.11644744873046875, 0.130279541015625, 0.14411163330078125, 0.1579437255859375, 0.17177581787109375, 0.18560791015625, 0.19944000244140625, 0.2132720947265625, 0.22710418701171875, 0.240936279296875, 0.25476837158203125, 0.2686004638671875, 0.28243255615234375, 0.2962646484375, 0.31009674072265625, 0.3239288330078125, 0.33776092529296875, 0.351593017578125, 0.36542510986328125, 0.3792572021484375, 0.39308929443359375, 0.40692138671875, 0.42075347900390625, 0.4345855712890625, 0.44841766357421875, 0.462249755859375, 0.47608184814453125, 0.4899139404296875, 0.5037460327148438, 0.517578125]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 2.0, 1.0, 6.0, 12.0, 13.0, 20.0, 48.0, 77.0, 178.0, 373.0, 141.0, 59.0, 35.0, 22.0, 12.0, 7.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2626953125, -0.2556629180908203, -0.24863052368164062, -0.24159812927246094, -0.23456573486328125, -0.22753334045410156, -0.22050094604492188, -0.2134685516357422, -0.2064361572265625, -0.1994037628173828, -0.19237136840820312, -0.18533897399902344, -0.17830657958984375, -0.17127418518066406, -0.16424179077148438, -0.1572093963623047, -0.150177001953125, -0.1431446075439453, -0.13611221313476562, -0.12907981872558594, -0.12204742431640625, -0.11501502990722656, -0.10798263549804688, -0.10095024108886719, -0.0939178466796875, -0.08688545227050781, -0.07985305786132812, -0.07282066345214844, -0.06578826904296875, -0.05875587463378906, -0.051723480224609375, -0.04469108581542969, -0.03765869140625, -0.030626296997070312, -0.023593902587890625, -0.016561508178710938, -0.00952911376953125, -0.0024967193603515625, 0.004535675048828125, 0.011568069458007812, 0.0186004638671875, 0.025632858276367188, 0.032665252685546875, 0.03969764709472656, 0.04673004150390625, 0.05376243591308594, 0.060794830322265625, 0.06782722473144531, 0.074859619140625, 0.08189201354980469, 0.08892440795898438, 0.09595680236816406, 0.10298919677734375, 0.11002159118652344, 0.11705398559570312, 0.12408638000488281, 0.1311187744140625, 0.1381511688232422, 0.14518356323242188, 0.15221595764160156, 0.15924835205078125, 0.16628074645996094, 0.17331314086914062, 0.1803455352783203, 0.1873779296875]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 12.0, 18.0, 39.0, 100.0, 234.0, 312.0, 151.0, 64.0, 35.0, 17.0, 16.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0284457206726074, -2.8633882999420166, -2.698330879211426, -2.533273696899414, -2.3682162761688232, -2.2031588554382324, -2.0381014347076416, -1.8730441331863403, -1.7079867124557495, -1.5429292917251587, -1.3778719902038574, -1.2128145694732666, -1.0477571487426758, -0.8826998472213745, -0.7176424264907837, -0.5525851249694824, -0.3875277042388916, -0.22247032821178436, -0.057412952184677124, 0.10764443874359131, 0.27270179986953735, 0.4377591609954834, 0.6028165817260742, 0.7678738832473755, 0.9329313039779663, 1.0979887247085571, 1.2630460262298584, 1.4281034469604492, 1.59316086769104, 1.7582181692123413, 1.9232755899429321, 2.0883328914642334, 2.253390312194824, 2.418447732925415, 2.583505153656006, 2.7485623359680176, 2.9136197566986084, 3.078677177429199, 3.24373459815979, 3.408792018890381, 3.5738492012023926, 3.7389066219329834, 3.903964042663574, 4.069021224975586, 4.234078884124756, 4.399136066436768, 4.5641937255859375, 4.729250907897949, 4.894308090209961, 5.059365272521973, 5.224422931671143, 5.389480113983154, 5.554537773132324, 5.719594955444336, 5.884652137756348, 6.049709796905518, 6.2147674560546875, 6.379824638366699, 6.544882297515869, 6.709939479827881, 6.874997138977051, 7.0400543212890625, 7.205111503601074, 7.370169162750244, 7.535226345062256]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 6.0, 5.0, 8.0, 11.0, 8.0, 14.0, 12.0, 13.0, 22.0, 20.0, 17.0, 26.0, 26.0, 28.0, 26.0, 32.0, 28.0, 29.0, 28.0, 51.0, 34.0, 33.0, 33.0, 45.0, 38.0, 40.0, 31.0, 26.0, 43.0, 31.0, 32.0, 29.0, 27.0, 14.0, 23.0, 12.0, 10.0, 14.0, 15.0, 11.0, 12.0, 10.0, 6.0, 10.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-1.9444060325622559, -1.8847922086715698, -1.8251783847808838, -1.7655645608901978, -1.7059507369995117, -1.6463369131088257, -1.5867230892181396, -1.5271092653274536, -1.4674954414367676, -1.4078816175460815, -1.3482677936553955, -1.2886539697647095, -1.2290401458740234, -1.1694263219833374, -1.1098124980926514, -1.0501986742019653, -0.9905848503112793, -0.9309710264205933, -0.8713572025299072, -0.8117433786392212, -0.7521295547485352, -0.6925157308578491, -0.6329019069671631, -0.573288083076477, -0.513674259185791, -0.454060435295105, -0.39444661140441895, -0.3348327875137329, -0.2752189636230469, -0.21560513973236084, -0.1559913158416748, -0.09637749195098877, -0.036763668060302734, 0.0228501558303833, 0.08246397972106934, 0.14207780361175537, 0.2016916275024414, 0.26130545139312744, 0.3209192752838135, 0.3805330991744995, 0.44014692306518555, 0.4997607469558716, 0.5593745708465576, 0.6189883947372437, 0.6786022186279297, 0.7382160425186157, 0.7978298664093018, 0.8574436902999878, 0.9170575141906738, 0.9766713380813599, 1.036285161972046, 1.095898985862732, 1.155512809753418, 1.215126633644104, 1.27474045753479, 1.334354281425476, 1.393968105316162, 1.4535819292068481, 1.5131957530975342, 1.5728095769882202, 1.6324234008789062, 1.6920372247695923, 1.7516510486602783, 1.8112648725509644, 1.8708786964416504]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 6.0, 2.0, 9.0, 7.0, 16.0, 18.0, 38.0, 35.0, 62.0, 96.0, 151.0, 259.0, 437.0, 757.0, 1415.0, 2520.0, 5225.0, 17767.0, 150203.0, 3615512.0, 364729.0, 21289.0, 7154.0, 2983.0, 1485.0, 818.0, 485.0, 290.0, 170.0, 108.0, 77.0, 47.0, 42.0, 21.0, 17.0, 7.0, 6.0, 6.0, 5.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9072265625, -1.846893310546875, -1.78656005859375, -1.726226806640625, -1.6658935546875, -1.605560302734375, -1.54522705078125, -1.484893798828125, -1.424560546875, -1.364227294921875, -1.30389404296875, -1.243560791015625, -1.1832275390625, -1.122894287109375, -1.06256103515625, -1.002227783203125, -0.94189453125, -0.881561279296875, -0.82122802734375, -0.760894775390625, -0.7005615234375, -0.640228271484375, -0.57989501953125, -0.519561767578125, -0.459228515625, -0.398895263671875, -0.33856201171875, -0.278228759765625, -0.2178955078125, -0.157562255859375, -0.09722900390625, -0.036895751953125, 0.0234375, 0.083770751953125, 0.14410400390625, 0.204437255859375, 0.2647705078125, 0.325103759765625, 0.38543701171875, 0.445770263671875, 0.506103515625, 0.566436767578125, 0.62677001953125, 0.687103271484375, 0.7474365234375, 0.807769775390625, 0.86810302734375, 0.928436279296875, 0.98876953125, 1.049102783203125, 1.10943603515625, 1.169769287109375, 1.2301025390625, 1.290435791015625, 1.35076904296875, 1.411102294921875, 1.471435546875, 1.531768798828125, 1.59210205078125, 1.652435302734375, 1.7127685546875, 1.773101806640625, 1.83343505859375, 1.893768310546875, 1.9541015625]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 7.0, 2.0, 6.0, 8.0, 10.0, 20.0, 19.0, 21.0, 34.0, 47.0, 47.0, 66.0, 60.0, 76.0, 76.0, 77.0, 69.0, 68.0, 65.0, 55.0, 47.0, 29.0, 22.0, 28.0, 17.0, 9.0, 6.0, 8.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.208984375, -1.1755828857421875, -1.142181396484375, -1.1087799072265625, -1.07537841796875, -1.0419769287109375, -1.008575439453125, -0.9751739501953125, -0.9417724609375, -0.9083709716796875, -0.874969482421875, -0.8415679931640625, -0.80816650390625, -0.7747650146484375, -0.741363525390625, -0.7079620361328125, -0.674560546875, -0.6411590576171875, -0.607757568359375, -0.5743560791015625, -0.54095458984375, -0.5075531005859375, -0.474151611328125, -0.4407501220703125, -0.4073486328125, -0.3739471435546875, -0.340545654296875, -0.3071441650390625, -0.27374267578125, -0.2403411865234375, -0.206939697265625, -0.1735382080078125, -0.14013671875, -0.1067352294921875, -0.073333740234375, -0.0399322509765625, -0.00653076171875, 0.0268707275390625, 0.060272216796875, 0.0936737060546875, 0.1270751953125, 0.1604766845703125, 0.193878173828125, 0.2272796630859375, 0.26068115234375, 0.2940826416015625, 0.327484130859375, 0.3608856201171875, 0.394287109375, 0.4276885986328125, 0.461090087890625, 0.4944915771484375, 0.52789306640625, 0.5612945556640625, 0.594696044921875, 0.6280975341796875, 0.6614990234375, 0.6949005126953125, 0.728302001953125, 0.7617034912109375, 0.79510498046875, 0.8285064697265625, 0.861907958984375, 0.8953094482421875, 0.9287109375]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 6.0, 4.0, 4.0, 23.0, 18.0, 23.0, 33.0, 39.0, 69.0, 105.0, 195.0, 360.0, 838.0, 2448.0, 8412.0, 45247.0, 3793443.0, 314737.0, 20619.0, 4856.0, 1591.0, 549.0, 247.0, 133.0, 79.0, 61.0, 43.0, 28.0, 20.0, 14.0, 5.0, 7.0, 5.0, 6.0, 3.0, 2.0, 4.0, 3.0, 3.0, 1.0, 0.0, 3.0], "bins": [-3.47265625, -3.38311767578125, -3.2935791015625, -3.20404052734375, -3.114501953125, -3.02496337890625, -2.9354248046875, -2.84588623046875, -2.75634765625, -2.66680908203125, -2.5772705078125, -2.48773193359375, -2.398193359375, -2.30865478515625, -2.2191162109375, -2.12957763671875, -2.0400390625, -1.95050048828125, -1.8609619140625, -1.77142333984375, -1.681884765625, -1.59234619140625, -1.5028076171875, -1.41326904296875, -1.32373046875, -1.23419189453125, -1.1446533203125, -1.05511474609375, -0.965576171875, -0.87603759765625, -0.7864990234375, -0.69696044921875, -0.607421875, -0.51788330078125, -0.4283447265625, -0.33880615234375, -0.249267578125, -0.15972900390625, -0.0701904296875, 0.01934814453125, 0.10888671875, 0.19842529296875, 0.2879638671875, 0.37750244140625, 0.467041015625, 0.55657958984375, 0.6461181640625, 0.73565673828125, 0.8251953125, 0.91473388671875, 1.0042724609375, 1.09381103515625, 1.183349609375, 1.27288818359375, 1.3624267578125, 1.45196533203125, 1.54150390625, 1.63104248046875, 1.7205810546875, 1.81011962890625, 1.899658203125, 1.98919677734375, 2.0787353515625, 2.16827392578125, 2.2578125]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 7.0, 3.0, 6.0, 15.0, 27.0, 16.0, 29.0, 52.0, 81.0, 245.0, 743.0, 1649.0, 747.0, 249.0, 74.0, 32.0, 31.0, 13.0, 10.0, 10.0, 7.0, 6.0, 3.0, 3.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.486572265625, -0.4628105163574219, -0.43904876708984375, -0.4152870178222656, -0.3915252685546875, -0.3677635192871094, -0.34400177001953125, -0.3202400207519531, -0.296478271484375, -0.2727165222167969, -0.24895477294921875, -0.22519302368164062, -0.2014312744140625, -0.17766952514648438, -0.15390777587890625, -0.13014602661132812, -0.10638427734375, -0.08262252807617188, -0.05886077880859375, -0.035099029541015625, -0.0113372802734375, 0.012424468994140625, 0.03618621826171875, 0.059947967529296875, 0.083709716796875, 0.10747146606445312, 0.13123321533203125, 0.15499496459960938, 0.1787567138671875, 0.20251846313476562, 0.22628021240234375, 0.2500419616699219, 0.2738037109375, 0.2975654602050781, 0.32132720947265625, 0.3450889587402344, 0.3688507080078125, 0.3926124572753906, 0.41637420654296875, 0.4401359558105469, 0.463897705078125, 0.4876594543457031, 0.5114212036132812, 0.5351829528808594, 0.5589447021484375, 0.5827064514160156, 0.6064682006835938, 0.6302299499511719, 0.65399169921875, 0.6777534484863281, 0.7015151977539062, 0.7252769470214844, 0.7490386962890625, 0.7728004455566406, 0.7965621948242188, 0.8203239440917969, 0.844085693359375, 0.8678474426269531, 0.8916091918945312, 0.9153709411621094, 0.9391326904296875, 0.9628944396972656, 0.9866561889648438, 1.0104179382324219, 1.0341796875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 1.0, 7.0, 6.0, 12.0, 15.0, 27.0, 33.0, 53.0, 78.0, 115.0, 139.0, 139.0, 124.0, 81.0, 59.0, 41.0, 22.0, 18.0, 12.0, 8.0, 2.0, 1.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.62961483001709, -2.5625107288360596, -2.4954066276550293, -2.428302526473999, -2.3611984252929688, -2.2940940856933594, -2.226990222930908, -2.159885883331299, -2.0927817821502686, -2.0256776809692383, -1.958573579788208, -1.8914694786071777, -1.824365258216858, -1.7572611570358276, -1.6901570558547974, -1.623052954673767, -1.5559488534927368, -1.4888447523117065, -1.4217406511306763, -1.3546364307403564, -1.2875323295593262, -1.220428228378296, -1.1533241271972656, -1.0862200260162354, -1.019115924835205, -0.9520118236541748, -0.8849076628684998, -0.8178035616874695, -0.7506994009017944, -0.6835952997207642, -0.6164911985397339, -0.5493870973587036, -0.48228275775909424, -0.4151786267757416, -0.3480744957923889, -0.28097039461135864, -0.21386626362800598, -0.14676213264465332, -0.07965803146362305, -0.012553900480270386, 0.054550230503082275, 0.12165435403585434, 0.1887584775686264, 0.25586259365081787, 0.32296672463417053, 0.3900708556175232, 0.45717495679855347, 0.5242791175842285, 0.5913832187652588, 0.6584873199462891, 0.7255914807319641, 0.7926955819129944, 0.8597997426986694, 0.9269038438796997, 0.99400794506073, 1.0611120462417603, 1.12821626663208, 1.1953203678131104, 1.2624244689941406, 1.329528570175171, 1.3966327905654907, 1.463736891746521, 1.5308409929275513, 1.5979450941085815, 1.6650491952896118]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 4.0, 3.0, 5.0, 5.0, 6.0, 7.0, 8.0, 11.0, 10.0, 24.0, 25.0, 27.0, 40.0, 31.0, 39.0, 53.0, 40.0, 43.0, 43.0, 45.0, 57.0, 49.0, 41.0, 46.0, 60.0, 36.0, 31.0, 34.0, 21.0, 28.0, 29.0, 26.0, 8.0, 12.0, 11.0, 10.0, 12.0, 7.0, 5.0, 7.0, 0.0, 7.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9882547855377197, -0.9553248286247253, -0.922394871711731, -0.8894649147987366, -0.8565349578857422, -0.823604941368103, -0.7906749844551086, -0.7577450275421143, -0.7248150706291199, -0.6918851137161255, -0.6589551568031311, -0.6260251998901367, -0.5930951833724976, -0.560165286064148, -0.5272352695465088, -0.4943053126335144, -0.46137535572052, -0.42844539880752563, -0.39551544189453125, -0.3625854551792145, -0.3296554982662201, -0.2967255413532257, -0.26379555463790894, -0.23086559772491455, -0.19793564081192017, -0.16500568389892578, -0.1320757120847702, -0.09914574772119522, -0.06621578335762024, -0.033285826444625854, -0.0003558546304702759, 0.0325741171836853, 0.06550419330596924, 0.09843415766954422, 0.1313641220331192, 0.16429409384727478, 0.19722405076026917, 0.23015400767326355, 0.2630839943885803, 0.2960139513015747, 0.3289439082145691, 0.3618738651275635, 0.39480382204055786, 0.42773380875587463, 0.460663765668869, 0.4935937225818634, 0.5265237092971802, 0.5594536662101746, 0.592383623123169, 0.6253135800361633, 0.6582435369491577, 0.6911734938621521, 0.7241034507751465, 0.7570334672927856, 0.78996342420578, 0.8228933811187744, 0.8558233380317688, 0.8887532949447632, 0.9216832518577576, 0.954613208770752, 0.9875432252883911, 1.0204731225967407, 1.0534031391143799, 1.0863330364227295, 1.1192630529403687]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 12.0, 8.0, 12.0, 21.0, 35.0, 45.0, 53.0, 102.0, 161.0, 223.0, 372.0, 706.0, 1299.0, 2778.0, 6736.0, 23649.0, 217912.0, 719673.0, 55169.0, 11492.0, 4061.0, 1772.0, 922.0, 491.0, 298.0, 182.0, 103.0, 92.0, 61.0, 38.0, 26.0, 15.0, 9.0, 9.0, 6.0, 5.0, 2.0, 3.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.626953125, -0.6062164306640625, -0.585479736328125, -0.5647430419921875, -0.54400634765625, -0.5232696533203125, -0.502532958984375, -0.4817962646484375, -0.4610595703125, -0.4403228759765625, -0.419586181640625, -0.3988494873046875, -0.37811279296875, -0.3573760986328125, -0.336639404296875, -0.3159027099609375, -0.295166015625, -0.2744293212890625, -0.253692626953125, -0.2329559326171875, -0.21221923828125, -0.1914825439453125, -0.170745849609375, -0.1500091552734375, -0.1292724609375, -0.1085357666015625, -0.087799072265625, -0.0670623779296875, -0.04632568359375, -0.0255889892578125, -0.004852294921875, 0.0158843994140625, 0.03662109375, 0.0573577880859375, 0.078094482421875, 0.0988311767578125, 0.11956787109375, 0.1403045654296875, 0.161041259765625, 0.1817779541015625, 0.2025146484375, 0.2232513427734375, 0.243988037109375, 0.2647247314453125, 0.28546142578125, 0.3061981201171875, 0.326934814453125, 0.3476715087890625, 0.368408203125, 0.3891448974609375, 0.409881591796875, 0.4306182861328125, 0.45135498046875, 0.4720916748046875, 0.492828369140625, 0.5135650634765625, 0.5343017578125, 0.5550384521484375, 0.575775146484375, 0.5965118408203125, 0.61724853515625, 0.6379852294921875, 0.658721923828125, 0.6794586181640625, 0.7001953125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 4.0, 5.0, 1.0, 5.0, 11.0, 16.0, 14.0, 24.0, 16.0, 28.0, 39.0, 39.0, 60.0, 57.0, 62.0, 56.0, 68.0, 68.0, 64.0, 63.0, 52.0, 47.0, 39.0, 32.0, 30.0, 29.0, 17.0, 11.0, 11.0, 14.0, 8.0, 7.0, 4.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7861328125, -0.7613601684570312, -0.7365875244140625, -0.7118148803710938, -0.687042236328125, -0.6622695922851562, -0.6374969482421875, -0.6127243041992188, -0.58795166015625, -0.5631790161132812, -0.5384063720703125, -0.5136337280273438, -0.488861083984375, -0.46408843994140625, -0.4393157958984375, -0.41454315185546875, -0.3897705078125, -0.36499786376953125, -0.3402252197265625, -0.31545257568359375, -0.290679931640625, -0.26590728759765625, -0.2411346435546875, -0.21636199951171875, -0.19158935546875, -0.16681671142578125, -0.1420440673828125, -0.11727142333984375, -0.092498779296875, -0.06772613525390625, -0.0429534912109375, -0.01818084716796875, 0.006591796875, 0.03136444091796875, 0.0561370849609375, 0.08090972900390625, 0.105682373046875, 0.13045501708984375, 0.1552276611328125, 0.18000030517578125, 0.20477294921875, 0.22954559326171875, 0.2543182373046875, 0.27909088134765625, 0.303863525390625, 0.32863616943359375, 0.3534088134765625, 0.37818145751953125, 0.4029541015625, 0.42772674560546875, 0.4524993896484375, 0.47727203369140625, 0.502044677734375, 0.5268173217773438, 0.5515899658203125, 0.5763626098632812, 0.60113525390625, 0.6259078979492188, 0.6506805419921875, 0.6754531860351562, 0.700225830078125, 0.7249984741210938, 0.7497711181640625, 0.7745437622070312, 0.79931640625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 6.0, 5.0, 10.0, 20.0, 34.0, 58.0, 116.0, 201.0, 431.0, 926.0, 2478.0, 8355.0, 43527.0, 558814.0, 389976.0, 32953.0, 6829.0, 2185.0, 887.0, 347.0, 173.0, 85.0, 44.0, 30.0, 17.0, 11.0, 12.0, 7.0, 5.0, 2.0, 2.0, 0.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.461181640625, -0.4471778869628906, -0.43317413330078125, -0.4191703796386719, -0.4051666259765625, -0.3911628723144531, -0.37715911865234375, -0.3631553649902344, -0.349151611328125, -0.3351478576660156, -0.32114410400390625, -0.3071403503417969, -0.2931365966796875, -0.2791328430175781, -0.26512908935546875, -0.2511253356933594, -0.23712158203125, -0.22311782836914062, -0.20911407470703125, -0.19511032104492188, -0.1811065673828125, -0.16710281372070312, -0.15309906005859375, -0.13909530639648438, -0.125091552734375, -0.11108779907226562, -0.09708404541015625, -0.08308029174804688, -0.0690765380859375, -0.055072784423828125, -0.04106903076171875, -0.027065277099609375, -0.0130615234375, 0.000942230224609375, 0.01494598388671875, 0.028949737548828125, 0.0429534912109375, 0.056957244873046875, 0.07096099853515625, 0.08496475219726562, 0.098968505859375, 0.11297225952148438, 0.12697601318359375, 0.14097976684570312, 0.1549835205078125, 0.16898727416992188, 0.18299102783203125, 0.19699478149414062, 0.21099853515625, 0.22500228881835938, 0.23900604248046875, 0.2530097961425781, 0.2670135498046875, 0.2810173034667969, 0.29502105712890625, 0.3090248107910156, 0.323028564453125, 0.3370323181152344, 0.35103607177734375, 0.3650398254394531, 0.3790435791015625, 0.3930473327636719, 0.40705108642578125, 0.4210548400878906, 0.43505859375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 7.0, 1.0, 3.0, 8.0, 5.0, 7.0, 9.0, 15.0, 13.0, 16.0, 15.0, 25.0, 20.0, 31.0, 32.0, 26.0, 42.0, 45.0, 36.0, 51.0, 48.0, 53.0, 52.0, 75.0, 41.0, 39.0, 37.0, 35.0, 30.0, 31.0, 25.0, 18.0, 21.0, 20.0, 11.0, 13.0, 7.0, 7.0, 11.0, 8.0, 10.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.3486328125, -1.3122634887695312, -1.2758941650390625, -1.2395248413085938, -1.203155517578125, -1.1667861938476562, -1.1304168701171875, -1.0940475463867188, -1.05767822265625, -1.0213088989257812, -0.9849395751953125, -0.9485702514648438, -0.912200927734375, -0.8758316040039062, -0.8394622802734375, -0.8030929565429688, -0.7667236328125, -0.7303543090820312, -0.6939849853515625, -0.6576156616210938, -0.621246337890625, -0.5848770141601562, -0.5485076904296875, -0.5121383666992188, -0.47576904296875, -0.43939971923828125, -0.4030303955078125, -0.36666107177734375, -0.330291748046875, -0.29392242431640625, -0.2575531005859375, -0.22118377685546875, -0.184814453125, -0.14844512939453125, -0.1120758056640625, -0.07570648193359375, -0.039337158203125, -0.00296783447265625, 0.0334014892578125, 0.06977081298828125, 0.10614013671875, 0.14250946044921875, 0.1788787841796875, 0.21524810791015625, 0.251617431640625, 0.28798675537109375, 0.3243560791015625, 0.36072540283203125, 0.3970947265625, 0.43346405029296875, 0.4698333740234375, 0.5062026977539062, 0.542572021484375, 0.5789413452148438, 0.6153106689453125, 0.6516799926757812, 0.68804931640625, 0.7244186401367188, 0.7607879638671875, 0.7971572875976562, 0.833526611328125, 0.8698959350585938, 0.9062652587890625, 0.9426345825195312, 0.97900390625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 7.0, 5.0, 9.0, 7.0, 15.0, 14.0, 29.0, 42.0, 74.0, 83.0, 140.0, 226.0, 352.0, 640.0, 1293.0, 2747.0, 6982.0, 21630.0, 99719.0, 662744.0, 199559.0, 34613.0, 10045.0, 3909.0, 1664.0, 831.0, 480.0, 235.0, 168.0, 96.0, 62.0, 40.0, 29.0, 21.0, 11.0, 14.0, 8.0, 4.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10595703125, -0.10261154174804688, -0.09926605224609375, -0.09592056274414062, -0.0925750732421875, -0.08922958374023438, -0.08588409423828125, -0.08253860473632812, -0.079193115234375, -0.07584762573242188, -0.07250213623046875, -0.06915664672851562, -0.0658111572265625, -0.062465667724609375, -0.05912017822265625, -0.055774688720703125, -0.05242919921875, -0.049083709716796875, -0.04573822021484375, -0.042392730712890625, -0.0390472412109375, -0.035701751708984375, -0.03235626220703125, -0.029010772705078125, -0.025665283203125, -0.022319793701171875, -0.01897430419921875, -0.015628814697265625, -0.0122833251953125, -0.008937835693359375, -0.00559234619140625, -0.002246856689453125, 0.0010986328125, 0.004444122314453125, 0.00778961181640625, 0.011135101318359375, 0.0144805908203125, 0.017826080322265625, 0.02117156982421875, 0.024517059326171875, 0.027862548828125, 0.031208038330078125, 0.03455352783203125, 0.037899017333984375, 0.0412445068359375, 0.044589996337890625, 0.04793548583984375, 0.051280975341796875, 0.05462646484375, 0.057971954345703125, 0.06131744384765625, 0.06466293334960938, 0.0680084228515625, 0.07135391235351562, 0.07469940185546875, 0.07804489135742188, 0.081390380859375, 0.08473587036132812, 0.08808135986328125, 0.09142684936523438, 0.0947723388671875, 0.09811782836914062, 0.10146331787109375, 0.10480880737304688, 0.108154296875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 4.0, 9.0, 10.0, 11.0, 17.0, 25.0, 40.0, 54.0, 85.0, 113.0, 192.0, 154.0, 81.0, 49.0, 39.0, 27.0, 32.0, 9.0, 11.0, 9.0, 13.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.539987564086914e-05, -7.350090891122818e-05, -7.160194218158722e-05, -6.970297545194626e-05, -6.78040087223053e-05, -6.590504199266434e-05, -6.400607526302338e-05, -6.210710853338242e-05, -6.0208141803741455e-05, -5.8309175074100494e-05, -5.6410208344459534e-05, -5.451124161481857e-05, -5.261227488517761e-05, -5.071330815553665e-05, -4.881434142589569e-05, -4.691537469625473e-05, -4.501640796661377e-05, -4.311744123697281e-05, -4.121847450733185e-05, -3.931950777769089e-05, -3.742054104804993e-05, -3.5521574318408966e-05, -3.3622607588768005e-05, -3.1723640859127045e-05, -2.9824674129486084e-05, -2.7925707399845123e-05, -2.6026740670204163e-05, -2.4127773940563202e-05, -2.222880721092224e-05, -2.032984048128128e-05, -1.843087375164032e-05, -1.653190702199936e-05, -1.4632940292358398e-05, -1.2733973562717438e-05, -1.0835006833076477e-05, -8.936040103435516e-06, -7.037073373794556e-06, -5.138106644153595e-06, -3.2391399145126343e-06, -1.3401731848716736e-06, 5.587935447692871e-07, 2.457760274410248e-06, 4.3567270040512085e-06, 6.255693733692169e-06, 8.15466046333313e-06, 1.005362719297409e-05, 1.1952593922615051e-05, 1.3851560652256012e-05, 1.5750527381896973e-05, 1.7649494111537933e-05, 1.9548460841178894e-05, 2.1447427570819855e-05, 2.3346394300460815e-05, 2.5245361030101776e-05, 2.7144327759742737e-05, 2.9043294489383698e-05, 3.094226121902466e-05, 3.284122794866562e-05, 3.474019467830658e-05, 3.663916140794754e-05, 3.85381281375885e-05, 4.043709486722946e-05, 4.233606159687042e-05, 4.423502832651138e-05, 4.6133995056152344e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 5.0, 2.0, 11.0, 11.0, 14.0, 14.0, 28.0, 36.0, 59.0, 96.0, 171.0, 209.0, 344.0, 593.0, 978.0, 1552.0, 2726.0, 5051.0, 9586.0, 19531.0, 43465.0, 113458.0, 389513.0, 298276.0, 90794.0, 36319.0, 16905.0, 8282.0, 4415.0, 2454.0, 1446.0, 805.0, 533.0, 272.0, 204.0, 144.0, 80.0, 45.0, 47.0, 28.0, 17.0, 14.0, 8.0, 5.0, 4.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.06494140625, -0.06276893615722656, -0.060596466064453125, -0.05842399597167969, -0.05625152587890625, -0.05407905578613281, -0.051906585693359375, -0.04973411560058594, -0.0475616455078125, -0.04538917541503906, -0.043216705322265625, -0.04104423522949219, -0.03887176513671875, -0.03669929504394531, -0.034526824951171875, -0.03235435485839844, -0.030181884765625, -0.028009414672851562, -0.025836944580078125, -0.023664474487304688, -0.02149200439453125, -0.019319534301757812, -0.017147064208984375, -0.014974594116210938, -0.0128021240234375, -0.010629653930664062, -0.008457183837890625, -0.0062847137451171875, -0.00411224365234375, -0.0019397735595703125, 0.000232696533203125, 0.0024051666259765625, 0.00457763671875, 0.0067501068115234375, 0.008922576904296875, 0.011095046997070312, 0.01326751708984375, 0.015439987182617188, 0.017612457275390625, 0.019784927368164062, 0.0219573974609375, 0.024129867553710938, 0.026302337646484375, 0.028474807739257812, 0.03064727783203125, 0.03281974792480469, 0.034992218017578125, 0.03716468811035156, 0.039337158203125, 0.04150962829589844, 0.043682098388671875, 0.04585456848144531, 0.04802703857421875, 0.05019950866699219, 0.052371978759765625, 0.05454444885253906, 0.0567169189453125, 0.05888938903808594, 0.061061859130859375, 0.06323432922363281, 0.06540679931640625, 0.06757926940917969, 0.06975173950195312, 0.07192420959472656, 0.0740966796875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 7.0, 2.0, 10.0, 6.0, 8.0, 10.0, 15.0, 18.0, 23.0, 24.0, 23.0, 29.0, 39.0, 59.0, 64.0, 62.0, 89.0, 83.0, 83.0, 59.0, 51.0, 41.0, 38.0, 37.0, 19.0, 17.0, 16.0, 16.0, 13.0, 7.0, 7.0, 10.0, 4.0, 3.0, 5.0, 1.0, 2.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0210113525390625, -0.02039480209350586, -0.01977825164794922, -0.019161701202392578, -0.018545150756835938, -0.017928600311279297, -0.017312049865722656, -0.016695499420166016, -0.016078948974609375, -0.015462398529052734, -0.014845848083496094, -0.014229297637939453, -0.013612747192382812, -0.012996196746826172, -0.012379646301269531, -0.01176309585571289, -0.01114654541015625, -0.01052999496459961, -0.009913444519042969, -0.009296894073486328, -0.008680343627929688, -0.008063793182373047, -0.007447242736816406, -0.006830692291259766, -0.006214141845703125, -0.005597591400146484, -0.004981040954589844, -0.004364490509033203, -0.0037479400634765625, -0.003131389617919922, -0.0025148391723632812, -0.0018982887268066406, -0.00128173828125, -0.0006651878356933594, -4.863739013671875e-05, 0.0005679130554199219, 0.0011844635009765625, 0.0018010139465332031, 0.0024175643920898438, 0.0030341148376464844, 0.003650665283203125, 0.004267215728759766, 0.004883766174316406, 0.005500316619873047, 0.0061168670654296875, 0.006733417510986328, 0.007349967956542969, 0.00796651840209961, 0.00858306884765625, 0.00919961929321289, 0.009816169738769531, 0.010432720184326172, 0.011049270629882812, 0.011665821075439453, 0.012282371520996094, 0.012898921966552734, 0.013515472412109375, 0.014132022857666016, 0.014748573303222656, 0.015365123748779297, 0.015981674194335938, 0.016598224639892578, 0.01721477508544922, 0.01783132553100586, 0.0184478759765625]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 9.0, 7.0, 8.0, 6.0, 16.0, 34.0, 35.0, 58.0, 68.0, 110.0, 137.0, 140.0, 116.0, 69.0, 60.0, 46.0, 27.0, 18.0, 10.0, 7.0, 7.0, 2.0, 3.0, 5.0, 7.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.1575431823730469, -1.1226516962051392, -1.087760090827942, -1.0528686046600342, -1.0179771184921265, -0.9830855131149292, -0.9481940269470215, -0.913302481174469, -0.8784109354019165, -0.843519389629364, -0.8086279034614563, -0.7737363576889038, -0.7388448119163513, -0.7039532661437988, -0.6690617799758911, -0.6341702342033386, -0.5992787480354309, -0.5643872022628784, -0.5294957160949707, -0.4946041703224182, -0.4597126245498657, -0.4248211085796356, -0.3899295926094055, -0.355038046836853, -0.3201465308666229, -0.2852550148963928, -0.25036346912384033, -0.21547195315361023, -0.18058042228221893, -0.14568889141082764, -0.11079737544059753, -0.07590584456920624, -0.04101431369781494, -0.0061227865517139435, 0.028768740594387054, 0.06366026401519775, 0.09855179488658905, 0.13344332575798035, 0.16833484172821045, 0.20322637259960175, 0.23811790347099304, 0.27300941944122314, 0.30790096521377563, 0.34279248118400574, 0.37768399715423584, 0.41257554292678833, 0.44746705889701843, 0.48235857486724854, 0.517250120639801, 0.5521416664123535, 0.5870331525802612, 0.6219246983528137, 0.6568162441253662, 0.6917077302932739, 0.7265992760658264, 0.7614908218383789, 0.7963823080062866, 0.8312738537788391, 0.8661653399467468, 0.9010568857192993, 0.9359484314918518, 0.9708399772644043, 1.005731463432312, 1.0406229496002197, 1.075514554977417]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 6.0, 7.0, 6.0, 7.0, 12.0, 15.0, 13.0, 35.0, 38.0, 45.0, 46.0, 63.0, 68.0, 56.0, 71.0, 74.0, 61.0, 77.0, 56.0, 50.0, 37.0, 36.0, 36.0, 22.0, 13.0, 18.0, 12.0, 8.0, 9.0, 5.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9620012044906616, -0.9360266327857971, -0.9100520610809326, -0.8840775489807129, -0.8581029772758484, -0.8321284055709839, -0.8061538934707642, -0.7801793217658997, -0.7542047500610352, -0.7282301783561707, -0.7022556066513062, -0.6762810945510864, -0.6503065228462219, -0.6243319511413574, -0.5983574390411377, -0.5723828673362732, -0.5464082956314087, -0.5204337239265442, -0.4944591820240021, -0.46848464012145996, -0.44251006841659546, -0.41653549671173096, -0.39056095480918884, -0.36458641290664673, -0.3386118412017822, -0.3126372694969177, -0.2866627275943756, -0.2606881856918335, -0.234713613986969, -0.20873905718326569, -0.18276450037956238, -0.15678994357585907, -0.13081538677215576, -0.10484082996845245, -0.07886627316474915, -0.05289171636104584, -0.02691715955734253, -0.0009426027536392212, 0.025031954050064087, 0.051006510853767395, 0.0769810676574707, 0.10295562446117401, 0.12893018126487732, 0.15490473806858063, 0.18087929487228394, 0.20685385167598724, 0.23282840847969055, 0.25880295038223267, 0.28477752208709717, 0.31075209379196167, 0.3367266356945038, 0.3627011775970459, 0.3886757493019104, 0.4146503210067749, 0.440624862909317, 0.46659940481185913, 0.49257397651672363, 0.5185485482215881, 0.5445231199264526, 0.5704976320266724, 0.5964722037315369, 0.6224467754364014, 0.6484212875366211, 0.6743958592414856, 0.7003704309463501]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 6.0, 8.0, 4.0, 16.0, 27.0, 22.0, 43.0, 73.0, 118.0, 198.0, 325.0, 635.0, 1197.0, 2264.0, 5187.0, 14524.0, 94261.0, 842424.0, 65874.0, 12410.0, 4610.0, 2062.0, 989.0, 517.0, 292.0, 191.0, 99.0, 64.0, 34.0, 23.0, 19.0, 20.0, 4.0, 8.0, 4.0, 0.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2939453125, -1.2387237548828125, -1.183502197265625, -1.1282806396484375, -1.07305908203125, -1.0178375244140625, -0.962615966796875, -0.9073944091796875, -0.8521728515625, -0.7969512939453125, -0.741729736328125, -0.6865081787109375, -0.63128662109375, -0.5760650634765625, -0.520843505859375, -0.4656219482421875, -0.410400390625, -0.3551788330078125, -0.299957275390625, -0.2447357177734375, -0.18951416015625, -0.1342926025390625, -0.079071044921875, -0.0238494873046875, 0.0313720703125, 0.0865936279296875, 0.141815185546875, 0.1970367431640625, 0.25225830078125, 0.3074798583984375, 0.362701416015625, 0.4179229736328125, 0.47314453125, 0.5283660888671875, 0.583587646484375, 0.6388092041015625, 0.69403076171875, 0.7492523193359375, 0.804473876953125, 0.8596954345703125, 0.9149169921875, 0.9701385498046875, 1.025360107421875, 1.0805816650390625, 1.13580322265625, 1.1910247802734375, 1.246246337890625, 1.3014678955078125, 1.356689453125, 1.4119110107421875, 1.467132568359375, 1.5223541259765625, 1.57757568359375, 1.6327972412109375, 1.688018798828125, 1.7432403564453125, 1.7984619140625, 1.8536834716796875, 1.908905029296875, 1.9641265869140625, 2.01934814453125, 2.0745697021484375, 2.129791259765625, 2.1850128173828125, 2.240234375]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 7.0, 3.0, 6.0, 4.0, 6.0, 10.0, 15.0, 18.0, 16.0, 32.0, 55.0, 51.0, 67.0, 60.0, 87.0, 69.0, 74.0, 66.0, 75.0, 54.0, 52.0, 41.0, 36.0, 25.0, 22.0, 13.0, 13.0, 11.0, 5.0, 9.0, 7.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.095703125, -2.0403900146484375, -1.985076904296875, -1.9297637939453125, -1.87445068359375, -1.8191375732421875, -1.763824462890625, -1.7085113525390625, -1.6531982421875, -1.5978851318359375, -1.542572021484375, -1.4872589111328125, -1.43194580078125, -1.3766326904296875, -1.321319580078125, -1.2660064697265625, -1.210693359375, -1.1553802490234375, -1.100067138671875, -1.0447540283203125, -0.98944091796875, -0.9341278076171875, -0.878814697265625, -0.8235015869140625, -0.7681884765625, -0.7128753662109375, -0.657562255859375, -0.6022491455078125, -0.54693603515625, -0.4916229248046875, -0.436309814453125, -0.3809967041015625, -0.32568359375, -0.2703704833984375, -0.215057373046875, -0.1597442626953125, -0.10443115234375, -0.0491180419921875, 0.006195068359375, 0.0615081787109375, 0.1168212890625, 0.1721343994140625, 0.227447509765625, 0.2827606201171875, 0.33807373046875, 0.3933868408203125, 0.448699951171875, 0.5040130615234375, 0.559326171875, 0.6146392822265625, 0.669952392578125, 0.7252655029296875, 0.78057861328125, 0.8358917236328125, 0.891204833984375, 0.9465179443359375, 1.0018310546875, 1.0571441650390625, 1.112457275390625, 1.1677703857421875, 1.22308349609375, 1.2783966064453125, 1.333709716796875, 1.3890228271484375, 1.4443359375]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 2.0, 2.0, 1.0, 4.0, 3.0, 3.0, 16.0, 2.0, 13.0, 22.0, 13.0, 28.0, 35.0, 46.0, 94.0, 134.0, 176.0, 377.0, 642.0, 1132.0, 2330.0, 4767.0, 12747.0, 53016.0, 710364.0, 221088.0, 25985.0, 8110.0, 3493.0, 1759.0, 899.0, 505.0, 279.0, 159.0, 83.0, 79.0, 49.0, 40.0, 21.0, 13.0, 6.0, 7.0, 5.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1240234375, -1.0835723876953125, -1.043121337890625, -1.0026702880859375, -0.96221923828125, -0.9217681884765625, -0.881317138671875, -0.8408660888671875, -0.8004150390625, -0.7599639892578125, -0.719512939453125, -0.6790618896484375, -0.63861083984375, -0.5981597900390625, -0.557708740234375, -0.5172576904296875, -0.476806640625, -0.4363555908203125, -0.395904541015625, -0.3554534912109375, -0.31500244140625, -0.2745513916015625, -0.234100341796875, -0.1936492919921875, -0.1531982421875, -0.1127471923828125, -0.072296142578125, -0.0318450927734375, 0.00860595703125, 0.0490570068359375, 0.089508056640625, 0.1299591064453125, 0.17041015625, 0.2108612060546875, 0.251312255859375, 0.2917633056640625, 0.33221435546875, 0.3726654052734375, 0.413116455078125, 0.4535675048828125, 0.4940185546875, 0.5344696044921875, 0.574920654296875, 0.6153717041015625, 0.65582275390625, 0.6962738037109375, 0.736724853515625, 0.7771759033203125, 0.817626953125, 0.8580780029296875, 0.898529052734375, 0.9389801025390625, 0.97943115234375, 1.0198822021484375, 1.060333251953125, 1.1007843017578125, 1.1412353515625, 1.1816864013671875, 1.222137451171875, 1.2625885009765625, 1.30303955078125, 1.3434906005859375, 1.383941650390625, 1.4243927001953125, 1.46484375]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 5.0, 9.0, 10.0, 12.0, 9.0, 15.0, 18.0, 24.0, 32.0, 37.0, 37.0, 46.0, 49.0, 40.0, 48.0, 48.0, 53.0, 41.0, 54.0, 56.0, 52.0, 37.0, 39.0, 36.0, 24.0, 24.0, 23.0, 21.0, 18.0, 15.0, 14.0, 7.0, 15.0, 11.0, 2.0, 5.0, 3.0, 2.0, 4.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4306640625, -1.3872222900390625, -1.343780517578125, -1.3003387451171875, -1.25689697265625, -1.2134552001953125, -1.170013427734375, -1.1265716552734375, -1.0831298828125, -1.0396881103515625, -0.996246337890625, -0.9528045654296875, -0.90936279296875, -0.8659210205078125, -0.822479248046875, -0.7790374755859375, -0.735595703125, -0.6921539306640625, -0.648712158203125, -0.6052703857421875, -0.56182861328125, -0.5183868408203125, -0.474945068359375, -0.4315032958984375, -0.3880615234375, -0.3446197509765625, -0.301177978515625, -0.2577362060546875, -0.21429443359375, -0.1708526611328125, -0.127410888671875, -0.0839691162109375, -0.04052734375, 0.0029144287109375, 0.046356201171875, 0.0897979736328125, 0.13323974609375, 0.1766815185546875, 0.220123291015625, 0.2635650634765625, 0.3070068359375, 0.3504486083984375, 0.393890380859375, 0.4373321533203125, 0.48077392578125, 0.5242156982421875, 0.567657470703125, 0.6110992431640625, 0.654541015625, 0.6979827880859375, 0.741424560546875, 0.7848663330078125, 0.82830810546875, 0.8717498779296875, 0.915191650390625, 0.9586334228515625, 1.0020751953125, 1.0455169677734375, 1.088958740234375, 1.1324005126953125, 1.17584228515625, 1.2192840576171875, 1.262725830078125, 1.3061676025390625, 1.349609375]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 5.0, 9.0, 9.0, 19.0, 23.0, 32.0, 55.0, 76.0, 124.0, 200.0, 254.0, 452.0, 817.0, 1416.0, 2925.0, 7840.0, 33002.0, 701655.0, 264636.0, 23239.0, 6206.0, 2541.0, 1105.0, 679.0, 444.0, 286.0, 186.0, 123.0, 57.0, 44.0, 22.0, 16.0, 15.0, 14.0, 8.0, 8.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.448486328125, -0.4356346130371094, -0.42278289794921875, -0.4099311828613281, -0.3970794677734375, -0.3842277526855469, -0.37137603759765625, -0.3585243225097656, -0.345672607421875, -0.3328208923339844, -0.31996917724609375, -0.3071174621582031, -0.2942657470703125, -0.2814140319824219, -0.26856231689453125, -0.2557106018066406, -0.24285888671875, -0.23000717163085938, -0.21715545654296875, -0.20430374145507812, -0.1914520263671875, -0.17860031127929688, -0.16574859619140625, -0.15289688110351562, -0.140045166015625, -0.12719345092773438, -0.11434173583984375, -0.10149002075195312, -0.0886383056640625, -0.07578659057617188, -0.06293487548828125, -0.050083160400390625, -0.0372314453125, -0.024379730224609375, -0.01152801513671875, 0.001323699951171875, 0.0141754150390625, 0.027027130126953125, 0.03987884521484375, 0.052730560302734375, 0.065582275390625, 0.07843399047851562, 0.09128570556640625, 0.10413742065429688, 0.1169891357421875, 0.12984085083007812, 0.14269256591796875, 0.15554428100585938, 0.16839599609375, 0.18124771118164062, 0.19409942626953125, 0.20695114135742188, 0.2198028564453125, 0.23265457153320312, 0.24550628662109375, 0.2583580017089844, 0.271209716796875, 0.2840614318847656, 0.29691314697265625, 0.3097648620605469, 0.3226165771484375, 0.3354682922363281, 0.34832000732421875, 0.3611717224121094, 0.3740234375]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 8.0, 11.0, 18.0, 24.0, 82.0, 198.0, 423.0, 127.0, 55.0, 25.0, 11.0, 6.0, 5.0, 2.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.896257400512695e-05, -6.571691483259201e-05, -6.247125566005707e-05, -5.9225596487522125e-05, -5.597993731498718e-05, -5.273427814245224e-05, -4.94886189699173e-05, -4.6242959797382355e-05, -4.299730062484741e-05, -3.975164145231247e-05, -3.650598227977753e-05, -3.3260323107242584e-05, -3.001466393470764e-05, -2.67690047621727e-05, -2.3523345589637756e-05, -2.0277686417102814e-05, -1.703202724456787e-05, -1.3786368072032928e-05, -1.0540708899497986e-05, -7.295049726963043e-06, -4.049390554428101e-06, -8.03731381893158e-07, 2.4419277906417847e-06, 5.687586963176727e-06, 8.93324613571167e-06, 1.2178905308246613e-05, 1.5424564480781555e-05, 1.8670223653316498e-05, 2.191588282585144e-05, 2.5161541998386383e-05, 2.8407201170921326e-05, 3.165286034345627e-05, 3.489851951599121e-05, 3.8144178688526154e-05, 4.1389837861061096e-05, 4.463549703359604e-05, 4.788115620613098e-05, 5.1126815378665924e-05, 5.437247455120087e-05, 5.761813372373581e-05, 6.086379289627075e-05, 6.41094520688057e-05, 6.735511124134064e-05, 7.060077041387558e-05, 7.384642958641052e-05, 7.709208875894547e-05, 8.033774793148041e-05, 8.358340710401535e-05, 8.682906627655029e-05, 9.007472544908524e-05, 9.332038462162018e-05, 9.656604379415512e-05, 9.981170296669006e-05, 0.000103057362139225, 0.00010630302131175995, 0.00010954868048429489, 0.00011279433965682983, 0.00011603999882936478, 0.00011928565800189972, 0.00012253131717443466, 0.0001257769763469696, 0.00012902263551950455, 0.0001322682946920395, 0.00013551395386457443, 0.00013875961303710938]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 5.0, 6.0, 12.0, 6.0, 5.0, 34.0, 27.0, 37.0, 73.0, 93.0, 134.0, 193.0, 263.0, 402.0, 621.0, 1145.0, 2020.0, 3806.0, 8860.0, 30562.0, 311077.0, 627417.0, 41242.0, 10510.0, 4344.0, 2306.0, 1257.0, 701.0, 428.0, 298.0, 217.0, 148.0, 100.0, 68.0, 50.0, 30.0, 16.0, 14.0, 13.0, 6.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.385498046875, -0.37384796142578125, -0.3621978759765625, -0.35054779052734375, -0.338897705078125, -0.32724761962890625, -0.3155975341796875, -0.30394744873046875, -0.29229736328125, -0.28064727783203125, -0.2689971923828125, -0.25734710693359375, -0.245697021484375, -0.23404693603515625, -0.2223968505859375, -0.21074676513671875, -0.1990966796875, -0.18744659423828125, -0.1757965087890625, -0.16414642333984375, -0.152496337890625, -0.14084625244140625, -0.1291961669921875, -0.11754608154296875, -0.10589599609375, -0.09424591064453125, -0.0825958251953125, -0.07094573974609375, -0.059295654296875, -0.04764556884765625, -0.0359954833984375, -0.02434539794921875, -0.0126953125, -0.00104522705078125, 0.0106048583984375, 0.02225494384765625, 0.033905029296875, 0.04555511474609375, 0.0572052001953125, 0.06885528564453125, 0.08050537109375, 0.09215545654296875, 0.1038055419921875, 0.11545562744140625, 0.127105712890625, 0.13875579833984375, 0.1504058837890625, 0.16205596923828125, 0.1737060546875, 0.18535614013671875, 0.1970062255859375, 0.20865631103515625, 0.220306396484375, 0.23195648193359375, 0.2436065673828125, 0.25525665283203125, 0.26690673828125, 0.27855682373046875, 0.2902069091796875, 0.30185699462890625, 0.313507080078125, 0.32515716552734375, 0.3368072509765625, 0.34845733642578125, 0.360107421875]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 7.0, 10.0, 5.0, 20.0, 12.0, 12.0, 20.0, 22.0, 28.0, 47.0, 77.0, 79.0, 108.0, 158.0, 91.0, 65.0, 55.0, 40.0, 35.0, 22.0, 8.0, 15.0, 14.0, 10.0, 9.0, 10.0, 5.0, 1.0, 2.0, 1.0, 5.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.06842041015625, -0.06546783447265625, -0.0625152587890625, -0.05956268310546875, -0.056610107421875, -0.05365753173828125, -0.0507049560546875, -0.04775238037109375, -0.0447998046875, -0.04184722900390625, -0.0388946533203125, -0.03594207763671875, -0.032989501953125, -0.03003692626953125, -0.0270843505859375, -0.02413177490234375, -0.02117919921875, -0.01822662353515625, -0.0152740478515625, -0.01232147216796875, -0.009368896484375, -0.00641632080078125, -0.0034637451171875, -0.00051116943359375, 0.00244140625, 0.00539398193359375, 0.0083465576171875, 0.01129913330078125, 0.014251708984375, 0.01720428466796875, 0.0201568603515625, 0.02310943603515625, 0.02606201171875, 0.02901458740234375, 0.0319671630859375, 0.03491973876953125, 0.037872314453125, 0.04082489013671875, 0.0437774658203125, 0.04673004150390625, 0.0496826171875, 0.05263519287109375, 0.0555877685546875, 0.05854034423828125, 0.061492919921875, 0.06444549560546875, 0.0673980712890625, 0.07035064697265625, 0.07330322265625, 0.07625579833984375, 0.0792083740234375, 0.08216094970703125, 0.085113525390625, 0.08806610107421875, 0.0910186767578125, 0.09397125244140625, 0.096923828125, 0.09987640380859375, 0.1028289794921875, 0.10578155517578125, 0.108734130859375, 0.11168670654296875, 0.1146392822265625, 0.11759185791015625, 0.12054443359375]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 6.0, 8.0, 17.0, 34.0, 20.0, 45.0, 50.0, 79.0, 104.0, 100.0, 137.0, 103.0, 97.0, 53.0, 41.0, 31.0, 16.0, 16.0, 12.0, 7.0, 5.0, 9.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-2.9285340309143066, -2.860914945602417, -2.7932960987091064, -2.725677013397217, -2.658057928085327, -2.5904388427734375, -2.522819995880127, -2.4552009105682373, -2.3875818252563477, -2.319962739944458, -2.2523438930511475, -2.184724807739258, -2.117105722427368, -2.0494866371154785, -1.981867790222168, -1.9142487049102783, -1.8466298580169678, -1.7790108919143677, -1.711391806602478, -1.643772840499878, -1.5761537551879883, -1.5085347890853882, -1.440915822982788, -1.3732967376708984, -1.3056777715682983, -1.2380588054656982, -1.1704397201538086, -1.1028207540512085, -1.0352017879486084, -0.9675827026367188, -0.8999637365341187, -0.8323447108268738, -0.7647258043289185, -0.6971067786216736, -0.6294877529144287, -0.5618687868118286, -0.49424976110458374, -0.42663073539733887, -0.3590117394924164, -0.2913927435874939, -0.22377371788024902, -0.15615470707416534, -0.08853569626808167, -0.020916685461997986, 0.04670232534408569, 0.11432135105133057, 0.18194034695625305, 0.24955934286117554, 0.3171783685684204, 0.3847973942756653, 0.45241639018058777, 0.5200353860855103, 0.5876544117927551, 0.6552734375, 0.7228924036026001, 0.790511429309845, 0.8581304550170898, 0.9257494807243347, 0.9933685064315796, 1.0609874725341797, 1.1286065578460693, 1.1962255239486694, 1.2638444900512695, 1.3314635753631592, 1.3990825414657593]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 5.0, 4.0, 2.0, 5.0, 6.0, 9.0, 11.0, 16.0, 16.0, 11.0, 28.0, 22.0, 30.0, 19.0, 29.0, 25.0, 31.0, 26.0, 42.0, 38.0, 34.0, 38.0, 48.0, 38.0, 27.0, 38.0, 38.0, 40.0, 40.0, 36.0, 33.0, 31.0, 28.0, 20.0, 20.0, 20.0, 10.0, 16.0, 17.0, 17.0, 12.0, 8.0, 6.0, 8.0, 1.0, 4.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.734708309173584, -1.677946925163269, -1.621185541152954, -1.5644241571426392, -1.5076627731323242, -1.4509012699127197, -1.3941398859024048, -1.3373785018920898, -1.280617117881775, -1.22385573387146, -1.167094349861145, -1.11033296585083, -1.0535714626312256, -0.9968101382255554, -0.9400486946105957, -0.8832873106002808, -0.8265259265899658, -0.7697645425796509, -0.7130031585693359, -0.6562417149543762, -0.5994803309440613, -0.5427189469337463, -0.485957533121109, -0.4291961193084717, -0.37243473529815674, -0.3156733512878418, -0.25891193747520447, -0.20215053856372833, -0.1453891396522522, -0.08862775564193726, -0.03186634182929993, 0.024895071983337402, 0.0816565752029419, 0.13841797411441803, 0.19517937302589417, 0.2519407868385315, 0.30870217084884644, 0.3654635548591614, 0.4222249686717987, 0.47898638248443604, 0.535747766494751, 0.5925091505050659, 0.6492705345153809, 0.7060319781303406, 0.7627933621406555, 0.8195547461509705, 0.8763161897659302, 0.9330775737762451, 0.9898389577865601, 1.046600341796875, 1.10336172580719, 1.1601231098175049, 1.2168846130371094, 1.2736458778381348, 1.3304073810577393, 1.3871687650680542, 1.4439301490783691, 1.500691533088684, 1.557452917098999, 1.614214301109314, 1.670975685119629, 1.7277371883392334, 1.7844985723495483, 1.8412599563598633, 1.8980213403701782]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 3.0, 6.0, 6.0, 12.0, 9.0, 20.0, 25.0, 28.0, 40.0, 50.0, 70.0, 98.0, 146.0, 225.0, 361.0, 536.0, 870.0, 1553.0, 3030.0, 6471.0, 18384.0, 84824.0, 2029415.0, 1929681.0, 86393.0, 18296.0, 6571.0, 3007.0, 1627.0, 911.0, 541.0, 354.0, 232.0, 148.0, 79.0, 65.0, 66.0, 25.0, 28.0, 23.0, 15.0, 7.0, 11.0, 6.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0], "bins": [-1.7275390625, -1.6781768798828125, -1.628814697265625, -1.5794525146484375, -1.53009033203125, -1.4807281494140625, -1.431365966796875, -1.3820037841796875, -1.3326416015625, -1.2832794189453125, -1.233917236328125, -1.1845550537109375, -1.13519287109375, -1.0858306884765625, -1.036468505859375, -0.9871063232421875, -0.937744140625, -0.8883819580078125, -0.839019775390625, -0.7896575927734375, -0.74029541015625, -0.6909332275390625, -0.641571044921875, -0.5922088623046875, -0.5428466796875, -0.4934844970703125, -0.444122314453125, -0.3947601318359375, -0.34539794921875, -0.2960357666015625, -0.246673583984375, -0.1973114013671875, -0.14794921875, -0.0985870361328125, -0.049224853515625, 0.0001373291015625, 0.04949951171875, 0.0988616943359375, 0.148223876953125, 0.1975860595703125, 0.2469482421875, 0.2963104248046875, 0.345672607421875, 0.3950347900390625, 0.44439697265625, 0.4937591552734375, 0.543121337890625, 0.5924835205078125, 0.641845703125, 0.6912078857421875, 0.740570068359375, 0.7899322509765625, 0.83929443359375, 0.8886566162109375, 0.938018798828125, 0.9873809814453125, 1.0367431640625, 1.0861053466796875, 1.135467529296875, 1.1848297119140625, 1.23419189453125, 1.2835540771484375, 1.332916259765625, 1.3822784423828125, 1.431640625]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 9.0, 8.0, 10.0, 13.0, 20.0, 18.0, 23.0, 44.0, 42.0, 48.0, 53.0, 55.0, 84.0, 66.0, 70.0, 60.0, 75.0, 75.0, 40.0, 42.0, 29.0, 28.0, 28.0, 17.0, 7.0, 13.0, 7.0, 6.0, 9.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.80517578125, -0.778228759765625, -0.75128173828125, -0.724334716796875, -0.6973876953125, -0.670440673828125, -0.64349365234375, -0.616546630859375, -0.589599609375, -0.562652587890625, -0.53570556640625, -0.508758544921875, -0.4818115234375, -0.454864501953125, -0.42791748046875, -0.400970458984375, -0.3740234375, -0.347076416015625, -0.32012939453125, -0.293182373046875, -0.2662353515625, -0.239288330078125, -0.21234130859375, -0.185394287109375, -0.158447265625, -0.131500244140625, -0.10455322265625, -0.077606201171875, -0.0506591796875, -0.023712158203125, 0.00323486328125, 0.030181884765625, 0.05712890625, 0.084075927734375, 0.11102294921875, 0.137969970703125, 0.1649169921875, 0.191864013671875, 0.21881103515625, 0.245758056640625, 0.272705078125, 0.299652099609375, 0.32659912109375, 0.353546142578125, 0.3804931640625, 0.407440185546875, 0.43438720703125, 0.461334228515625, 0.48828125, 0.515228271484375, 0.54217529296875, 0.569122314453125, 0.5960693359375, 0.623016357421875, 0.64996337890625, 0.676910400390625, 0.703857421875, 0.730804443359375, 0.75775146484375, 0.784698486328125, 0.8116455078125, 0.838592529296875, 0.86553955078125, 0.892486572265625, 0.91943359375]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 2.0, 7.0, 4.0, 7.0, 7.0, 15.0, 18.0, 27.0, 46.0, 64.0, 168.0, 381.0, 1023.0, 3139.0, 11415.0, 60130.0, 3343917.0, 725429.0, 36759.0, 7995.0, 2309.0, 770.0, 308.0, 135.0, 70.0, 45.0, 25.0, 20.0, 10.0, 6.0, 9.0, 12.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.642578125, -2.556976318359375, -2.47137451171875, -2.385772705078125, -2.3001708984375, -2.214569091796875, -2.12896728515625, -2.043365478515625, -1.957763671875, -1.872161865234375, -1.78656005859375, -1.700958251953125, -1.6153564453125, -1.529754638671875, -1.44415283203125, -1.358551025390625, -1.27294921875, -1.187347412109375, -1.10174560546875, -1.016143798828125, -0.9305419921875, -0.844940185546875, -0.75933837890625, -0.673736572265625, -0.588134765625, -0.502532958984375, -0.41693115234375, -0.331329345703125, -0.2457275390625, -0.160125732421875, -0.07452392578125, 0.011077880859375, 0.0966796875, 0.182281494140625, 0.26788330078125, 0.353485107421875, 0.4390869140625, 0.524688720703125, 0.61029052734375, 0.695892333984375, 0.781494140625, 0.867095947265625, 0.95269775390625, 1.038299560546875, 1.1239013671875, 1.209503173828125, 1.29510498046875, 1.380706787109375, 1.46630859375, 1.551910400390625, 1.63751220703125, 1.723114013671875, 1.8087158203125, 1.894317626953125, 1.97991943359375, 2.065521240234375, 2.151123046875, 2.236724853515625, 2.32232666015625, 2.407928466796875, 2.4935302734375, 2.579132080078125, 2.66473388671875, 2.750335693359375, 2.8359375]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 9.0, 8.0, 8.0, 13.0, 18.0, 16.0, 14.0, 23.0, 41.0, 68.0, 65.0, 126.0, 241.0, 559.0, 1055.0, 848.0, 408.0, 203.0, 100.0, 51.0, 51.0, 40.0, 22.0, 17.0, 15.0, 12.0, 12.0, 5.0, 4.0, 6.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.61669921875, -0.5979537963867188, -0.5792083740234375, -0.5604629516601562, -0.541717529296875, -0.5229721069335938, -0.5042266845703125, -0.48548126220703125, -0.46673583984375, -0.44799041748046875, -0.4292449951171875, -0.41049957275390625, -0.391754150390625, -0.37300872802734375, -0.3542633056640625, -0.33551788330078125, -0.3167724609375, -0.29802703857421875, -0.2792816162109375, -0.26053619384765625, -0.241790771484375, -0.22304534912109375, -0.2042999267578125, -0.18555450439453125, -0.16680908203125, -0.14806365966796875, -0.1293182373046875, -0.11057281494140625, -0.091827392578125, -0.07308197021484375, -0.0543365478515625, -0.03559112548828125, -0.016845703125, 0.00189971923828125, 0.0206451416015625, 0.03939056396484375, 0.058135986328125, 0.07688140869140625, 0.0956268310546875, 0.11437225341796875, 0.13311767578125, 0.15186309814453125, 0.1706085205078125, 0.18935394287109375, 0.208099365234375, 0.22684478759765625, 0.2455902099609375, 0.26433563232421875, 0.2830810546875, 0.30182647705078125, 0.3205718994140625, 0.33931732177734375, 0.358062744140625, 0.37680816650390625, 0.3955535888671875, 0.41429901123046875, 0.43304443359375, 0.45178985595703125, 0.4705352783203125, 0.48928070068359375, 0.508026123046875, 0.5267715454101562, 0.5455169677734375, 0.5642623901367188, 0.5830078125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 7.0, 9.0, 8.0, 5.0, 6.0, 13.0, 12.0, 22.0, 27.0, 32.0, 53.0, 55.0, 76.0, 75.0, 86.0, 83.0, 82.0, 73.0, 65.0, 55.0, 31.0, 24.0, 33.0, 11.0, 16.0, 10.0, 7.0, 5.0, 7.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.1894127130508423, -1.1456818580627441, -1.1019511222839355, -1.058220386505127, -1.0144895315170288, -0.9707587361335754, -0.9270279407501221, -0.8832971453666687, -0.8395663499832153, -0.795835554599762, -0.7521047592163086, -0.7083739638328552, -0.6646431684494019, -0.6209123730659485, -0.5771815776824951, -0.5334507822990417, -0.4897199869155884, -0.445989191532135, -0.40225839614868164, -0.35852760076522827, -0.3147968053817749, -0.27106600999832153, -0.22733521461486816, -0.1836044192314148, -0.13987362384796143, -0.09614282846450806, -0.05241203308105469, -0.008681237697601318, 0.03504955768585205, 0.07878035306930542, 0.12251114845275879, 0.16624194383621216, 0.20997262001037598, 0.25370341539382935, 0.2974342107772827, 0.3411650061607361, 0.38489580154418945, 0.4286265969276428, 0.4723573923110962, 0.5160881876945496, 0.5598189830780029, 0.6035497784614563, 0.6472805738449097, 0.691011369228363, 0.7347421646118164, 0.7784729599952698, 0.8222037553787231, 0.8659345507621765, 0.9096653461456299, 0.9533961415290833, 0.9971269369125366, 1.0408577919006348, 1.0845885276794434, 1.128319263458252, 1.17205011844635, 1.2157809734344482, 1.2595117092132568, 1.3032424449920654, 1.3469732999801636, 1.3907041549682617, 1.4344348907470703, 1.478165626525879, 1.521896481513977, 1.5656273365020752, 1.6093580722808838]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 2.0, 4.0, 5.0, 6.0, 5.0, 11.0, 7.0, 6.0, 12.0, 16.0, 18.0, 26.0, 24.0, 25.0, 32.0, 36.0, 39.0, 35.0, 36.0, 44.0, 41.0, 49.0, 37.0, 46.0, 42.0, 40.0, 45.0, 38.0, 37.0, 39.0, 19.0, 26.0, 33.0, 28.0, 17.0, 15.0, 14.0, 14.0, 13.0, 9.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.0004099607467651, -0.9704493880271912, -0.9404888153076172, -0.910528302192688, -0.880567729473114, -0.85060715675354, -0.8206465840339661, -0.7906860113143921, -0.7607254981994629, -0.7307649254798889, -0.7008043527603149, -0.6708438396453857, -0.6408832669258118, -0.6109226942062378, -0.5809621214866638, -0.5510015487670898, -0.5210410356521606, -0.49108046293258667, -0.4611199200153351, -0.4311593472957611, -0.4011988043785095, -0.37123823165893555, -0.3412776589393616, -0.31131711602211, -0.2813565135002136, -0.25139594078063965, -0.22143539786338806, -0.1914748251438141, -0.1615142822265625, -0.13155370950698853, -0.10159315168857574, -0.07163259387016296, -0.04167205095291138, -0.011711491271853447, 0.018249068409204483, 0.04820962995290756, 0.07817018777132034, 0.10813075304031372, 0.1380913108587265, 0.16805186867713928, 0.19801242649555206, 0.22797298431396484, 0.2579335570335388, 0.2878940999507904, 0.3178546726703644, 0.34781521558761597, 0.37777578830718994, 0.4077363610267639, 0.4376969039440155, 0.4676574766635895, 0.49761801958084106, 0.527578592300415, 0.557539165019989, 0.587499737739563, 0.6174602508544922, 0.6474208235740662, 0.6773813962936401, 0.7073419690132141, 0.7373025417327881, 0.7672630548477173, 0.7972236275672913, 0.8271842002868652, 0.8571447730064392, 0.8871053457260132, 0.9170658588409424]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 5.0, 9.0, 14.0, 18.0, 38.0, 34.0, 59.0, 118.0, 188.0, 292.0, 630.0, 1175.0, 2387.0, 5285.0, 12928.0, 48206.0, 615524.0, 311472.0, 31541.0, 10100.0, 4330.0, 1987.0, 975.0, 524.0, 240.0, 197.0, 96.0, 71.0, 46.0, 22.0, 16.0, 12.0, 7.0, 9.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.68359375, -0.6660079956054688, -0.6484222412109375, -0.6308364868164062, -0.613250732421875, -0.5956649780273438, -0.5780792236328125, -0.5604934692382812, -0.54290771484375, -0.5253219604492188, -0.5077362060546875, -0.49015045166015625, -0.472564697265625, -0.45497894287109375, -0.4373931884765625, -0.41980743408203125, -0.4022216796875, -0.38463592529296875, -0.3670501708984375, -0.34946441650390625, -0.331878662109375, -0.31429290771484375, -0.2967071533203125, -0.27912139892578125, -0.26153564453125, -0.24394989013671875, -0.2263641357421875, -0.20877838134765625, -0.191192626953125, -0.17360687255859375, -0.1560211181640625, -0.13843536376953125, -0.120849609375, -0.10326385498046875, -0.0856781005859375, -0.06809234619140625, -0.050506591796875, -0.03292083740234375, -0.0153350830078125, 0.00225067138671875, 0.01983642578125, 0.03742218017578125, 0.0550079345703125, 0.07259368896484375, 0.090179443359375, 0.10776519775390625, 0.1253509521484375, 0.14293670654296875, 0.1605224609375, 0.17810821533203125, 0.1956939697265625, 0.21327972412109375, 0.230865478515625, 0.24845123291015625, 0.2660369873046875, 0.28362274169921875, 0.30120849609375, 0.31879425048828125, 0.3363800048828125, 0.35396575927734375, 0.371551513671875, 0.38913726806640625, 0.4067230224609375, 0.42430877685546875, 0.44189453125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 9.0, 6.0, 10.0, 5.0, 11.0, 15.0, 15.0, 34.0, 21.0, 40.0, 30.0, 37.0, 46.0, 50.0, 36.0, 57.0, 49.0, 40.0, 53.0, 48.0, 50.0, 53.0, 38.0, 36.0, 37.0, 28.0, 36.0, 22.0, 19.0, 18.0, 17.0, 12.0, 4.0, 10.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.84765625, -0.825592041015625, -0.80352783203125, -0.781463623046875, -0.7593994140625, -0.737335205078125, -0.71527099609375, -0.693206787109375, -0.671142578125, -0.649078369140625, -0.62701416015625, -0.604949951171875, -0.5828857421875, -0.560821533203125, -0.53875732421875, -0.516693115234375, -0.49462890625, -0.472564697265625, -0.45050048828125, -0.428436279296875, -0.4063720703125, -0.384307861328125, -0.36224365234375, -0.340179443359375, -0.318115234375, -0.296051025390625, -0.27398681640625, -0.251922607421875, -0.2298583984375, -0.207794189453125, -0.18572998046875, -0.163665771484375, -0.1416015625, -0.119537353515625, -0.09747314453125, -0.075408935546875, -0.0533447265625, -0.031280517578125, -0.00921630859375, 0.012847900390625, 0.034912109375, 0.056976318359375, 0.07904052734375, 0.101104736328125, 0.1231689453125, 0.145233154296875, 0.16729736328125, 0.189361572265625, 0.21142578125, 0.233489990234375, 0.25555419921875, 0.277618408203125, 0.2996826171875, 0.321746826171875, 0.34381103515625, 0.365875244140625, 0.387939453125, 0.410003662109375, 0.43206787109375, 0.454132080078125, 0.4761962890625, 0.498260498046875, 0.52032470703125, 0.542388916015625, 0.564453125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 2.0, 3.0, 6.0, 7.0, 22.0, 22.0, 46.0, 53.0, 114.0, 252.0, 520.0, 1207.0, 3482.0, 12540.0, 84895.0, 772555.0, 147641.0, 18077.0, 4414.0, 1412.0, 630.0, 290.0, 149.0, 66.0, 49.0, 37.0, 26.0, 8.0, 8.0, 4.0, 5.0, 4.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.4892578125, -0.47377777099609375, -0.4582977294921875, -0.44281768798828125, -0.427337646484375, -0.41185760498046875, -0.3963775634765625, -0.38089752197265625, -0.36541748046875, -0.34993743896484375, -0.3344573974609375, -0.31897735595703125, -0.303497314453125, -0.28801727294921875, -0.2725372314453125, -0.25705718994140625, -0.2415771484375, -0.22609710693359375, -0.2106170654296875, -0.19513702392578125, -0.179656982421875, -0.16417694091796875, -0.1486968994140625, -0.13321685791015625, -0.11773681640625, -0.10225677490234375, -0.0867767333984375, -0.07129669189453125, -0.055816650390625, -0.04033660888671875, -0.0248565673828125, -0.00937652587890625, 0.006103515625, 0.02158355712890625, 0.0370635986328125, 0.05254364013671875, 0.068023681640625, 0.08350372314453125, 0.0989837646484375, 0.11446380615234375, 0.12994384765625, 0.14542388916015625, 0.1609039306640625, 0.17638397216796875, 0.191864013671875, 0.20734405517578125, 0.2228240966796875, 0.23830413818359375, 0.2537841796875, 0.26926422119140625, 0.2847442626953125, 0.30022430419921875, 0.315704345703125, 0.33118438720703125, 0.3466644287109375, 0.36214447021484375, 0.37762451171875, 0.39310455322265625, 0.4085845947265625, 0.42406463623046875, 0.439544677734375, 0.45502471923828125, 0.4705047607421875, 0.48598480224609375, 0.50146484375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 8.0, 6.0, 6.0, 9.0, 5.0, 15.0, 7.0, 21.0, 23.0, 31.0, 37.0, 37.0, 40.0, 44.0, 47.0, 43.0, 55.0, 56.0, 59.0, 61.0, 55.0, 43.0, 37.0, 45.0, 37.0, 36.0, 29.0, 23.0, 16.0, 19.0, 11.0, 12.0, 10.0, 3.0, 3.0, 7.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6982421875, -1.643096923828125, -1.58795166015625, -1.532806396484375, -1.4776611328125, -1.422515869140625, -1.36737060546875, -1.312225341796875, -1.257080078125, -1.201934814453125, -1.14678955078125, -1.091644287109375, -1.0364990234375, -0.981353759765625, -0.92620849609375, -0.871063232421875, -0.81591796875, -0.760772705078125, -0.70562744140625, -0.650482177734375, -0.5953369140625, -0.540191650390625, -0.48504638671875, -0.429901123046875, -0.374755859375, -0.319610595703125, -0.26446533203125, -0.209320068359375, -0.1541748046875, -0.099029541015625, -0.04388427734375, 0.011260986328125, 0.06640625, 0.121551513671875, 0.17669677734375, 0.231842041015625, 0.2869873046875, 0.342132568359375, 0.39727783203125, 0.452423095703125, 0.507568359375, 0.562713623046875, 0.61785888671875, 0.673004150390625, 0.7281494140625, 0.783294677734375, 0.83843994140625, 0.893585205078125, 0.94873046875, 1.003875732421875, 1.05902099609375, 1.114166259765625, 1.1693115234375, 1.224456787109375, 1.27960205078125, 1.334747314453125, 1.389892578125, 1.445037841796875, 1.50018310546875, 1.555328369140625, 1.6104736328125, 1.665618896484375, 1.72076416015625, 1.775909423828125, 1.8310546875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 6.0, 6.0, 7.0, 5.0, 19.0, 18.0, 28.0, 39.0, 54.0, 95.0, 140.0, 238.0, 440.0, 926.0, 1989.0, 5927.0, 28599.0, 635084.0, 346664.0, 19947.0, 4819.0, 1690.0, 751.0, 378.0, 233.0, 158.0, 85.0, 49.0, 44.0, 37.0, 20.0, 13.0, 14.0, 9.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.25830078125, -0.2506828308105469, -0.24306488037109375, -0.23544692993164062, -0.2278289794921875, -0.22021102905273438, -0.21259307861328125, -0.20497512817382812, -0.197357177734375, -0.18973922729492188, -0.18212127685546875, -0.17450332641601562, -0.1668853759765625, -0.15926742553710938, -0.15164947509765625, -0.14403152465820312, -0.13641357421875, -0.12879562377929688, -0.12117767333984375, -0.11355972290039062, -0.1059417724609375, -0.09832382202148438, -0.09070587158203125, -0.08308792114257812, -0.075469970703125, -0.06785202026367188, -0.06023406982421875, -0.052616119384765625, -0.0449981689453125, -0.037380218505859375, -0.02976226806640625, -0.022144317626953125, -0.0145263671875, -0.006908416748046875, 0.00070953369140625, 0.008327484130859375, 0.0159454345703125, 0.023563385009765625, 0.03118133544921875, 0.038799285888671875, 0.046417236328125, 0.054035186767578125, 0.06165313720703125, 0.06927108764648438, 0.0768890380859375, 0.08450698852539062, 0.09212493896484375, 0.09974288940429688, 0.10736083984375, 0.11497879028320312, 0.12259674072265625, 0.13021469116210938, 0.1378326416015625, 0.14545059204101562, 0.15306854248046875, 0.16068649291992188, 0.168304443359375, 0.17592239379882812, 0.18354034423828125, 0.19115829467773438, 0.1987762451171875, 0.20639419555664062, 0.21401214599609375, 0.22163009643554688, 0.229248046875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 9.0, 14.0, 9.0, 22.0, 26.0, 44.0, 68.0, 94.0, 127.0, 185.0, 162.0, 78.0, 60.0, 38.0, 16.0, 13.0, 10.0, 7.0, 3.0, 2.0, 3.0, 2.0, 2.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.814168930053711e-05, -7.53011554479599e-05, -7.246062159538269e-05, -6.962008774280548e-05, -6.677955389022827e-05, -6.393902003765106e-05, -6.109848618507385e-05, -5.825795233249664e-05, -5.5417418479919434e-05, -5.2576884627342224e-05, -4.9736350774765015e-05, -4.6895816922187805e-05, -4.4055283069610596e-05, -4.1214749217033386e-05, -3.837421536445618e-05, -3.553368151187897e-05, -3.269314765930176e-05, -2.985261380672455e-05, -2.701207995414734e-05, -2.417154610157013e-05, -2.133101224899292e-05, -1.849047839641571e-05, -1.56499445438385e-05, -1.2809410691261292e-05, -9.968876838684082e-06, -7.1283429861068726e-06, -4.287809133529663e-06, -1.4472752809524536e-06, 1.3932585716247559e-06, 4.233792424201965e-06, 7.074326276779175e-06, 9.914860129356384e-06, 1.2755393981933594e-05, 1.5595927834510803e-05, 1.8436461687088013e-05, 2.1276995539665222e-05, 2.411752939224243e-05, 2.695806324481964e-05, 2.979859709739685e-05, 3.263913094997406e-05, 3.547966480255127e-05, 3.832019865512848e-05, 4.116073250770569e-05, 4.40012663602829e-05, 4.684180021286011e-05, 4.968233406543732e-05, 5.2522867918014526e-05, 5.5363401770591736e-05, 5.8203935623168945e-05, 6.104446947574615e-05, 6.388500332832336e-05, 6.672553718090057e-05, 6.956607103347778e-05, 7.240660488605499e-05, 7.52471387386322e-05, 7.808767259120941e-05, 8.092820644378662e-05, 8.376874029636383e-05, 8.660927414894104e-05, 8.944980800151825e-05, 9.229034185409546e-05, 9.513087570667267e-05, 9.797140955924988e-05, 0.00010081194341182709, 0.0001036524772644043]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 3.0, 5.0, 9.0, 4.0, 18.0, 22.0, 25.0, 30.0, 45.0, 65.0, 91.0, 106.0, 173.0, 222.0, 288.0, 460.0, 601.0, 946.0, 1491.0, 2508.0, 4821.0, 10367.0, 27506.0, 89970.0, 385482.0, 383153.0, 90109.0, 27786.0, 10464.0, 4547.0, 2537.0, 1430.0, 995.0, 626.0, 445.0, 294.0, 241.0, 162.0, 129.0, 95.0, 63.0, 53.0, 58.0, 29.0, 27.0, 14.0, 15.0, 8.0, 10.0, 5.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.1241455078125, -0.12026596069335938, -0.11638641357421875, -0.11250686645507812, -0.1086273193359375, -0.10474777221679688, -0.10086822509765625, -0.09698867797851562, -0.093109130859375, -0.08922958374023438, -0.08535003662109375, -0.08147048950195312, -0.0775909423828125, -0.07371139526367188, -0.06983184814453125, -0.06595230102539062, -0.06207275390625, -0.058193206787109375, -0.05431365966796875, -0.050434112548828125, -0.0465545654296875, -0.042675018310546875, -0.03879547119140625, -0.034915924072265625, -0.031036376953125, -0.027156829833984375, -0.02327728271484375, -0.019397735595703125, -0.0155181884765625, -0.011638641357421875, -0.00775909423828125, -0.003879547119140625, 0.0, 0.003879547119140625, 0.00775909423828125, 0.011638641357421875, 0.0155181884765625, 0.019397735595703125, 0.02327728271484375, 0.027156829833984375, 0.031036376953125, 0.034915924072265625, 0.03879547119140625, 0.042675018310546875, 0.0465545654296875, 0.050434112548828125, 0.05431365966796875, 0.058193206787109375, 0.06207275390625, 0.06595230102539062, 0.06983184814453125, 0.07371139526367188, 0.0775909423828125, 0.08147048950195312, 0.08535003662109375, 0.08922958374023438, 0.093109130859375, 0.09698867797851562, 0.10086822509765625, 0.10474777221679688, 0.1086273193359375, 0.11250686645507812, 0.11638641357421875, 0.12026596069335938, 0.1241455078125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 4.0, 9.0, 4.0, 12.0, 10.0, 30.0, 40.0, 52.0, 62.0, 111.0, 115.0, 126.0, 110.0, 83.0, 66.0, 53.0, 34.0, 25.0, 14.0, 10.0, 9.0, 3.0, 4.0, 3.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.048858642578125, -0.047251224517822266, -0.04564380645751953, -0.0440363883972168, -0.04242897033691406, -0.04082155227661133, -0.039214134216308594, -0.03760671615600586, -0.035999298095703125, -0.03439188003540039, -0.032784461975097656, -0.031177043914794922, -0.029569625854492188, -0.027962207794189453, -0.02635478973388672, -0.024747371673583984, -0.02313995361328125, -0.021532535552978516, -0.01992511749267578, -0.018317699432373047, -0.016710281372070312, -0.015102863311767578, -0.013495445251464844, -0.01188802719116211, -0.010280609130859375, -0.00867319107055664, -0.007065773010253906, -0.005458354949951172, -0.0038509368896484375, -0.002243518829345703, -0.0006361007690429688, 0.0009713172912597656, 0.0025787353515625, 0.004186153411865234, 0.005793571472167969, 0.007400989532470703, 0.009008407592773438, 0.010615825653076172, 0.012223243713378906, 0.01383066177368164, 0.015438079833984375, 0.01704549789428711, 0.018652915954589844, 0.020260334014892578, 0.021867752075195312, 0.023475170135498047, 0.02508258819580078, 0.026690006256103516, 0.02829742431640625, 0.029904842376708984, 0.03151226043701172, 0.03311967849731445, 0.03472709655761719, 0.03633451461791992, 0.037941932678222656, 0.03954935073852539, 0.041156768798828125, 0.04276418685913086, 0.044371604919433594, 0.04597902297973633, 0.04758644104003906, 0.0491938591003418, 0.05080127716064453, 0.052408695220947266, 0.05401611328125]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 2.0, 3.0, 5.0, 5.0, 7.0, 9.0, 8.0, 18.0, 16.0, 26.0, 25.0, 56.0, 46.0, 62.0, 72.0, 72.0, 80.0, 73.0, 74.0, 66.0, 59.0, 51.0, 40.0, 28.0, 17.0, 13.0, 18.0, 12.0, 11.0, 2.0, 4.0, 3.0, 7.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.7586199641227722, -0.7334376573562622, -0.7082552909851074, -0.6830729842185974, -0.6578906178474426, -0.6327083110809326, -0.6075259447097778, -0.5823436379432678, -0.5571613311767578, -0.5319790244102478, -0.506796658039093, -0.481614351272583, -0.4564320147037506, -0.4312496781349182, -0.4060673415660858, -0.3808850049972534, -0.355702668428421, -0.3305203318595886, -0.3053379952907562, -0.28015565872192383, -0.2549733519554138, -0.22979101538658142, -0.20460867881774902, -0.17942635715007782, -0.15424402058124542, -0.12906168401241302, -0.10387936234474182, -0.07869702577590942, -0.05351469665765762, -0.028332367539405823, -0.0031500309705734253, 0.02203229069709778, 0.047214627265930176, 0.07239695638418198, 0.09757928550243378, 0.12276162207126617, 0.14794394373893738, 0.17312628030776978, 0.19830861687660217, 0.22349093854427338, 0.24867327511310577, 0.273855596780777, 0.2990379333496094, 0.3242202699184418, 0.34940260648727417, 0.3745849132537842, 0.39976727962493896, 0.424949586391449, 0.45013192296028137, 0.47531425952911377, 0.5004965662956238, 0.5256789326667786, 0.5508612394332886, 0.5760436058044434, 0.6012259125709534, 0.6264082193374634, 0.6515905857086182, 0.6767728924751282, 0.701955258846283, 0.727137565612793, 0.7523199319839478, 0.7775022387504578, 0.8026845455169678, 0.8278669118881226, 0.8530492186546326]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 5.0, 3.0, 5.0, 6.0, 8.0, 10.0, 12.0, 14.0, 16.0, 21.0, 31.0, 26.0, 23.0, 28.0, 37.0, 44.0, 42.0, 41.0, 37.0, 55.0, 44.0, 43.0, 54.0, 47.0, 40.0, 32.0, 38.0, 34.0, 38.0, 24.0, 38.0, 24.0, 20.0, 19.0, 8.0, 14.0, 9.0, 6.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.7005771994590759, -0.6812631487846375, -0.6619490385055542, -0.6426349878311157, -0.6233208775520325, -0.604006826877594, -0.5846927165985107, -0.5653786659240723, -0.5460646152496338, -0.5267505645751953, -0.5074364542961121, -0.4881224036216736, -0.4688083231449127, -0.44949424266815186, -0.430180162191391, -0.4108660817146301, -0.39155200123786926, -0.3722379207611084, -0.35292384028434753, -0.33360975980758667, -0.3142957091331482, -0.29498162865638733, -0.27566754817962646, -0.256353497505188, -0.23703940212726593, -0.21772532165050507, -0.1984112560749054, -0.17909717559814453, -0.15978309512138367, -0.140469029545784, -0.12115494906902313, -0.10184088349342346, -0.0825268030166626, -0.06321272999048233, -0.043898653239011765, -0.0245845764875412, -0.005270503461360931, 0.014043569564819336, 0.0333576500415802, 0.05267171561717987, 0.07198579609394073, 0.091299869120121, 0.11061394214630127, 0.12992802262306213, 0.149242103099823, 0.16855616867542267, 0.18787024915218353, 0.2071843147277832, 0.22649839520454407, 0.24581247568130493, 0.2651265561580658, 0.28444063663482666, 0.30375468730926514, 0.323068767786026, 0.34238284826278687, 0.36169689893722534, 0.3810110092163086, 0.40032508969306946, 0.4196391701698303, 0.4389532208442688, 0.45826730132102966, 0.4775813817977905, 0.4968954622745514, 0.5162095427513123, 0.5355235934257507]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 6.0, 2.0, 3.0, 8.0, 6.0, 21.0, 19.0, 20.0, 31.0, 35.0, 44.0, 87.0, 109.0, 165.0, 264.0, 480.0, 756.0, 1327.0, 2248.0, 4301.0, 8302.0, 18792.0, 54336.0, 236580.0, 524740.0, 132702.0, 35209.0, 13510.0, 6345.0, 3337.0, 1881.0, 1130.0, 654.0, 379.0, 226.0, 155.0, 105.0, 72.0, 36.0, 33.0, 30.0, 23.0, 15.0, 7.0, 6.0, 5.0, 6.0, 1.0, 2.0, 4.0, 1.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.95263671875, -0.9222183227539062, -0.8917999267578125, -0.8613815307617188, -0.830963134765625, -0.8005447387695312, -0.7701263427734375, -0.7397079467773438, -0.70928955078125, -0.6788711547851562, -0.6484527587890625, -0.6180343627929688, -0.587615966796875, -0.5571975708007812, -0.5267791748046875, -0.49636077880859375, -0.4659423828125, -0.43552398681640625, -0.4051055908203125, -0.37468719482421875, -0.344268798828125, -0.31385040283203125, -0.2834320068359375, -0.25301361083984375, -0.22259521484375, -0.19217681884765625, -0.1617584228515625, -0.13134002685546875, -0.100921630859375, -0.07050323486328125, -0.0400848388671875, -0.00966644287109375, 0.020751953125, 0.05117034912109375, 0.0815887451171875, 0.11200714111328125, 0.142425537109375, 0.17284393310546875, 0.2032623291015625, 0.23368072509765625, 0.26409912109375, 0.29451751708984375, 0.3249359130859375, 0.35535430908203125, 0.385772705078125, 0.41619110107421875, 0.4466094970703125, 0.47702789306640625, 0.5074462890625, 0.5378646850585938, 0.5682830810546875, 0.5987014770507812, 0.629119873046875, 0.6595382690429688, 0.6899566650390625, 0.7203750610351562, 0.75079345703125, 0.7812118530273438, 0.8116302490234375, 0.8420486450195312, 0.872467041015625, 0.9028854370117188, 0.9333038330078125, 0.9637222290039062, 0.994140625]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 2.0, 4.0, 3.0, 8.0, 4.0, 6.0, 9.0, 15.0, 14.0, 15.0, 22.0, 19.0, 18.0, 28.0, 38.0, 29.0, 40.0, 44.0, 28.0, 48.0, 53.0, 44.0, 62.0, 53.0, 47.0, 41.0, 34.0, 34.0, 41.0, 26.0, 29.0, 28.0, 22.0, 16.0, 17.0, 13.0, 11.0, 6.0, 10.0, 4.0, 7.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.0615234375, -1.028961181640625, -0.99639892578125, -0.963836669921875, -0.9312744140625, -0.898712158203125, -0.86614990234375, -0.833587646484375, -0.801025390625, -0.768463134765625, -0.73590087890625, -0.703338623046875, -0.6707763671875, -0.638214111328125, -0.60565185546875, -0.573089599609375, -0.54052734375, -0.507965087890625, -0.47540283203125, -0.442840576171875, -0.4102783203125, -0.377716064453125, -0.34515380859375, -0.312591552734375, -0.280029296875, -0.247467041015625, -0.21490478515625, -0.182342529296875, -0.1497802734375, -0.117218017578125, -0.08465576171875, -0.052093505859375, -0.01953125, 0.013031005859375, 0.04559326171875, 0.078155517578125, 0.1107177734375, 0.143280029296875, 0.17584228515625, 0.208404541015625, 0.240966796875, 0.273529052734375, 0.30609130859375, 0.338653564453125, 0.3712158203125, 0.403778076171875, 0.43634033203125, 0.468902587890625, 0.50146484375, 0.534027099609375, 0.56658935546875, 0.599151611328125, 0.6317138671875, 0.664276123046875, 0.69683837890625, 0.729400634765625, 0.761962890625, 0.794525146484375, 0.82708740234375, 0.859649658203125, 0.8922119140625, 0.924774169921875, 0.95733642578125, 0.989898681640625, 1.0224609375]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 5.0, 8.0, 8.0, 13.0, 17.0, 17.0, 26.0, 35.0, 47.0, 68.0, 94.0, 112.0, 166.0, 259.0, 403.0, 691.0, 1244.0, 2454.0, 5443.0, 14264.0, 43643.0, 188959.0, 586459.0, 145739.0, 36216.0, 12094.0, 4857.0, 2183.0, 1147.0, 630.0, 391.0, 259.0, 178.0, 125.0, 77.0, 58.0, 39.0, 46.0, 20.0, 17.0, 11.0, 8.0, 9.0, 8.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3193359375, -1.275970458984375, -1.23260498046875, -1.189239501953125, -1.1458740234375, -1.102508544921875, -1.05914306640625, -1.015777587890625, -0.972412109375, -0.929046630859375, -0.88568115234375, -0.842315673828125, -0.7989501953125, -0.755584716796875, -0.71221923828125, -0.668853759765625, -0.62548828125, -0.582122802734375, -0.53875732421875, -0.495391845703125, -0.4520263671875, -0.408660888671875, -0.36529541015625, -0.321929931640625, -0.278564453125, -0.235198974609375, -0.19183349609375, -0.148468017578125, -0.1051025390625, -0.061737060546875, -0.01837158203125, 0.024993896484375, 0.068359375, 0.111724853515625, 0.15509033203125, 0.198455810546875, 0.2418212890625, 0.285186767578125, 0.32855224609375, 0.371917724609375, 0.415283203125, 0.458648681640625, 0.50201416015625, 0.545379638671875, 0.5887451171875, 0.632110595703125, 0.67547607421875, 0.718841552734375, 0.76220703125, 0.805572509765625, 0.84893798828125, 0.892303466796875, 0.9356689453125, 0.979034423828125, 1.02239990234375, 1.065765380859375, 1.109130859375, 1.152496337890625, 1.19586181640625, 1.239227294921875, 1.2825927734375, 1.325958251953125, 1.36932373046875, 1.412689208984375, 1.4560546875]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 0.0, 5.0, 4.0, 9.0, 6.0, 14.0, 8.0, 14.0, 15.0, 12.0, 17.0, 25.0, 31.0, 37.0, 22.0, 35.0, 42.0, 45.0, 44.0, 48.0, 40.0, 42.0, 31.0, 46.0, 44.0, 48.0, 38.0, 35.0, 38.0, 37.0, 37.0, 25.0, 15.0, 19.0, 12.0, 10.0, 8.0, 13.0, 11.0, 2.0, 6.0, 6.0, 2.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.171875, -1.13525390625, -1.0986328125, -1.06201171875, -1.025390625, -0.98876953125, -0.9521484375, -0.91552734375, -0.87890625, -0.84228515625, -0.8056640625, -0.76904296875, -0.732421875, -0.69580078125, -0.6591796875, -0.62255859375, -0.5859375, -0.54931640625, -0.5126953125, -0.47607421875, -0.439453125, -0.40283203125, -0.3662109375, -0.32958984375, -0.29296875, -0.25634765625, -0.2197265625, -0.18310546875, -0.146484375, -0.10986328125, -0.0732421875, -0.03662109375, 0.0, 0.03662109375, 0.0732421875, 0.10986328125, 0.146484375, 0.18310546875, 0.2197265625, 0.25634765625, 0.29296875, 0.32958984375, 0.3662109375, 0.40283203125, 0.439453125, 0.47607421875, 0.5126953125, 0.54931640625, 0.5859375, 0.62255859375, 0.6591796875, 0.69580078125, 0.732421875, 0.76904296875, 0.8056640625, 0.84228515625, 0.87890625, 0.91552734375, 0.9521484375, 0.98876953125, 1.025390625, 1.06201171875, 1.0986328125, 1.13525390625, 1.171875]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 7.0, 10.0, 15.0, 18.0, 25.0, 38.0, 40.0, 81.0, 83.0, 138.0, 167.0, 303.0, 472.0, 809.0, 1425.0, 2705.0, 5335.0, 11501.0, 28575.0, 89616.0, 555786.0, 255008.0, 57938.0, 20360.0, 8752.0, 4214.0, 2117.0, 1179.0, 686.0, 356.0, 238.0, 180.0, 120.0, 78.0, 47.0, 42.0, 21.0, 22.0, 14.0, 10.0, 10.0, 8.0, 5.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.18408203125, -0.17811012268066406, -0.17213821411132812, -0.1661663055419922, -0.16019439697265625, -0.1542224884033203, -0.14825057983398438, -0.14227867126464844, -0.1363067626953125, -0.13033485412597656, -0.12436294555664062, -0.11839103698730469, -0.11241912841796875, -0.10644721984863281, -0.10047531127929688, -0.09450340270996094, -0.088531494140625, -0.08255958557128906, -0.07658767700195312, -0.07061576843261719, -0.06464385986328125, -0.05867195129394531, -0.052700042724609375, -0.04672813415527344, -0.0407562255859375, -0.03478431701660156, -0.028812408447265625, -0.022840499877929688, -0.01686859130859375, -0.010896682739257812, -0.004924774169921875, 0.0010471343994140625, 0.00701904296875, 0.012990951538085938, 0.018962860107421875, 0.024934768676757812, 0.03090667724609375, 0.03687858581542969, 0.042850494384765625, 0.04882240295410156, 0.0547943115234375, 0.06076622009277344, 0.06673812866210938, 0.07271003723144531, 0.07868194580078125, 0.08465385437011719, 0.09062576293945312, 0.09659767150878906, 0.102569580078125, 0.10854148864746094, 0.11451339721679688, 0.12048530578613281, 0.12645721435546875, 0.1324291229248047, 0.13840103149414062, 0.14437294006347656, 0.1503448486328125, 0.15631675720214844, 0.16228866577148438, 0.1682605743408203, 0.17423248291015625, 0.1802043914794922, 0.18617630004882812, 0.19214820861816406, 0.1981201171875]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 8.0, 11.0, 27.0, 19.0, 28.0, 47.0, 63.0, 86.0, 239.0, 175.0, 79.0, 56.0, 49.0, 30.0, 18.0, 14.0, 15.0, 6.0, 4.0, 7.0, 3.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-5.1856040954589844e-05, -5.0487928092479706e-05, -4.911981523036957e-05, -4.775170236825943e-05, -4.638358950614929e-05, -4.5015476644039154e-05, -4.3647363781929016e-05, -4.227925091981888e-05, -4.091113805770874e-05, -3.95430251955986e-05, -3.8174912333488464e-05, -3.6806799471378326e-05, -3.543868660926819e-05, -3.407057374715805e-05, -3.270246088504791e-05, -3.1334348022937775e-05, -2.9966235160827637e-05, -2.85981222987175e-05, -2.723000943660736e-05, -2.5861896574497223e-05, -2.4493783712387085e-05, -2.3125670850276947e-05, -2.175755798816681e-05, -2.038944512605667e-05, -1.9021332263946533e-05, -1.7653219401836395e-05, -1.6285106539726257e-05, -1.491699367761612e-05, -1.3548880815505981e-05, -1.2180767953395844e-05, -1.0812655091285706e-05, -9.444542229175568e-06, -8.07642936706543e-06, -6.708316504955292e-06, -5.340203642845154e-06, -3.972090780735016e-06, -2.603977918624878e-06, -1.23586505651474e-06, 1.3224780559539795e-07, 1.5003606677055359e-06, 2.868473529815674e-06, 4.236586391925812e-06, 5.60469925403595e-06, 6.972812116146088e-06, 8.340924978256226e-06, 9.709037840366364e-06, 1.1077150702476501e-05, 1.244526356458664e-05, 1.3813376426696777e-05, 1.5181489288806915e-05, 1.6549602150917053e-05, 1.791771501302719e-05, 1.928582787513733e-05, 2.0653940737247467e-05, 2.2022053599357605e-05, 2.3390166461467743e-05, 2.475827932357788e-05, 2.612639218568802e-05, 2.7494505047798157e-05, 2.8862617909908295e-05, 3.0230730772018433e-05, 3.159884363412857e-05, 3.296695649623871e-05, 3.4335069358348846e-05, 3.5703182220458984e-05]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 8.0, 5.0, 15.0, 17.0, 24.0, 25.0, 36.0, 64.0, 88.0, 115.0, 161.0, 243.0, 370.0, 565.0, 909.0, 1498.0, 2737.0, 5152.0, 10620.0, 25096.0, 80468.0, 614696.0, 224532.0, 46868.0, 17058.0, 7766.0, 3769.0, 2189.0, 1227.0, 708.0, 451.0, 330.0, 209.0, 154.0, 120.0, 68.0, 50.0, 41.0, 28.0, 22.0, 10.0, 11.0, 7.0, 6.0, 5.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.260498046875, -0.2523040771484375, -0.244110107421875, -0.2359161376953125, -0.22772216796875, -0.2195281982421875, -0.211334228515625, -0.2031402587890625, -0.1949462890625, -0.1867523193359375, -0.178558349609375, -0.1703643798828125, -0.16217041015625, -0.1539764404296875, -0.145782470703125, -0.1375885009765625, -0.12939453125, -0.1212005615234375, -0.113006591796875, -0.1048126220703125, -0.09661865234375, -0.0884246826171875, -0.080230712890625, -0.0720367431640625, -0.0638427734375, -0.0556488037109375, -0.047454833984375, -0.0392608642578125, -0.03106689453125, -0.0228729248046875, -0.014678955078125, -0.0064849853515625, 0.001708984375, 0.0099029541015625, 0.018096923828125, 0.0262908935546875, 0.03448486328125, 0.0426788330078125, 0.050872802734375, 0.0590667724609375, 0.0672607421875, 0.0754547119140625, 0.083648681640625, 0.0918426513671875, 0.10003662109375, 0.1082305908203125, 0.116424560546875, 0.1246185302734375, 0.1328125, 0.1410064697265625, 0.149200439453125, 0.1573944091796875, 0.16558837890625, 0.1737823486328125, 0.181976318359375, 0.1901702880859375, 0.1983642578125, 0.2065582275390625, 0.214752197265625, 0.2229461669921875, 0.23114013671875, 0.2393341064453125, 0.247528076171875, 0.2557220458984375, 0.263916015625]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 10.0, 7.0, 7.0, 8.0, 5.0, 17.0, 8.0, 11.0, 23.0, 31.0, 30.0, 50.0, 67.0, 90.0, 163.0, 118.0, 98.0, 45.0, 42.0, 36.0, 18.0, 21.0, 14.0, 12.0, 10.0, 8.0, 13.0, 8.0, 2.0, 8.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.12017822265625, -0.1166372299194336, -0.11309623718261719, -0.10955524444580078, -0.10601425170898438, -0.10247325897216797, -0.09893226623535156, -0.09539127349853516, -0.09185028076171875, -0.08830928802490234, -0.08476829528808594, -0.08122730255126953, -0.07768630981445312, -0.07414531707763672, -0.07060432434082031, -0.0670633316040039, -0.0635223388671875, -0.059981346130371094, -0.05644035339355469, -0.05289936065673828, -0.049358367919921875, -0.04581737518310547, -0.04227638244628906, -0.038735389709472656, -0.03519439697265625, -0.031653404235839844, -0.028112411499023438, -0.02457141876220703, -0.021030426025390625, -0.01748943328857422, -0.013948440551757812, -0.010407447814941406, -0.006866455078125, -0.0033254623413085938, 0.0002155303955078125, 0.0037565231323242188, 0.007297515869140625, 0.010838508605957031, 0.014379501342773438, 0.017920494079589844, 0.02146148681640625, 0.025002479553222656, 0.028543472290039062, 0.03208446502685547, 0.035625457763671875, 0.03916645050048828, 0.04270744323730469, 0.046248435974121094, 0.0497894287109375, 0.053330421447753906, 0.05687141418457031, 0.06041240692138672, 0.06395339965820312, 0.06749439239501953, 0.07103538513183594, 0.07457637786865234, 0.07811737060546875, 0.08165836334228516, 0.08519935607910156, 0.08874034881591797, 0.09228134155273438, 0.09582233428955078, 0.09936332702636719, 0.1029043197631836, 0.1064453125]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 5.0, 6.0, 14.0, 22.0, 28.0, 39.0, 76.0, 111.0, 117.0, 132.0, 148.0, 110.0, 67.0, 38.0, 29.0, 19.0, 11.0, 15.0, 4.0, 7.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0309042930603027, -1.945160984992981, -1.8594176769256592, -1.7736742496490479, -1.687930941581726, -1.6021876335144043, -1.516444206237793, -1.4307008981704712, -1.3449575901031494, -1.2592142820358276, -1.1734709739685059, -1.0877275466918945, -1.0019842386245728, -0.916240930557251, -0.8304975628852844, -0.7447541952133179, -0.6590108871459961, -0.5732675790786743, -0.48752421140670776, -0.4017808735370636, -0.31603753566741943, -0.23029419779777527, -0.1445508599281311, -0.05880749225616455, 0.026935815811157227, 0.11267915368080139, 0.19842249155044556, 0.2841658294200897, 0.3699091672897339, 0.45565250515937805, 0.5413958430290222, 0.6271392107009888, 0.7128827571868896, 0.7986260652542114, 0.884369432926178, 0.9701128005981445, 1.0558561086654663, 1.141599416732788, 1.2273428440093994, 1.3130861520767212, 1.398829460144043, 1.4845727682113647, 1.5703160762786865, 1.6560595035552979, 1.7418028116226196, 1.8275461196899414, 1.9132895469665527, 1.9990328550338745, 2.0847761631011963, 2.1705195903778076, 2.25626277923584, 2.342006206512451, 2.4277496337890625, 2.5134928226470947, 2.599236249923706, 2.6849794387817383, 2.7707228660583496, 2.856466293334961, 2.942209482192993, 3.0279529094696045, 3.1136960983276367, 3.199439525604248, 3.2851829528808594, 3.3709263801574707, 3.456669569015503]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 7.0, 10.0, 5.0, 8.0, 6.0, 11.0, 17.0, 19.0, 15.0, 12.0, 16.0, 34.0, 26.0, 22.0, 26.0, 28.0, 36.0, 39.0, 40.0, 60.0, 44.0, 32.0, 45.0, 36.0, 39.0, 40.0, 28.0, 38.0, 33.0, 29.0, 31.0, 16.0, 20.0, 28.0, 16.0, 12.0, 16.0, 13.0, 10.0, 4.0, 5.0, 2.0, 6.0, 4.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.8244893550872803, -1.7670289278030396, -1.7095686197280884, -1.6521081924438477, -1.5946478843688965, -1.5371874570846558, -1.479727029800415, -1.4222667217254639, -1.3648064136505127, -1.307345986366272, -1.2498856782913208, -1.19242525100708, -1.134964942932129, -1.0775045156478882, -1.0200440883636475, -0.9625837802886963, -0.9051233530044556, -0.8476629853248596, -0.7902026176452637, -0.732742190361023, -0.6752818822860718, -0.617821455001831, -0.5603610873222351, -0.5029007196426392, -0.4454403519630432, -0.38797998428344727, -0.3305196166038513, -0.273059219121933, -0.21559885144233704, -0.1581384837627411, -0.10067808628082275, -0.04321771860122681, 0.01424252986907959, 0.07170290499925613, 0.12916328012943268, 0.18662366271018982, 0.24408403038978577, 0.3015443980693817, 0.35900479555130005, 0.416465163230896, 0.47392553091049194, 0.5313858985900879, 0.5888462662696838, 0.6463066339492798, 0.7037670612335205, 0.7612273693084717, 0.8186877965927124, 0.8761481642723083, 0.9336085319519043, 0.9910688996315002, 1.0485292673110962, 1.105989694595337, 1.163450002670288, 1.2209104299545288, 1.2783708572387695, 1.3358311653137207, 1.3932914733886719, 1.4507519006729126, 1.5082122087478638, 1.5656726360321045, 1.6231329441070557, 1.6805933713912964, 1.738053798675537, 1.7955141067504883, 1.852974534034729]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 6.0, 6.0, 3.0, 11.0, 12.0, 5.0, 19.0, 24.0, 29.0, 33.0, 38.0, 41.0, 48.0, 79.0, 77.0, 126.0, 148.0, 158.0, 225.0, 313.0, 474.0, 1032.0, 3191.0, 1040823.0, 1503.0, 585.0, 363.0, 257.0, 198.0, 154.0, 147.0, 80.0, 92.0, 62.0, 46.0, 37.0, 40.0, 23.0, 19.0, 20.0, 15.0, 9.0, 5.0, 2.0, 5.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-2.803248643875122, -2.71335506439209, -2.6234614849090576, -2.5335679054260254, -2.443674325942993, -2.353780746459961, -2.2638869285583496, -2.1739933490753174, -2.084099769592285, -1.994206190109253, -1.9043126106262207, -1.8144190311431885, -1.7245253324508667, -1.6346317529678345, -1.5447381734848022, -1.4548444747924805, -1.3649510145187378, -1.2750574350357056, -1.1851638555526733, -1.0952701568603516, -1.0053765773773193, -0.9154829978942871, -0.8255894184112549, -0.7356957793235779, -0.6458021998405457, -0.5559086203575134, -0.4660149812698364, -0.3761214017868042, -0.2862277925014496, -0.19633418321609497, -0.10644060373306274, -0.016546964645385742, 0.07334661483764648, 0.1632402241230011, 0.2531338334083557, 0.34302741289138794, 0.43292102217674255, 0.5228146314620972, 0.6127082109451294, 0.7026018500328064, 0.7924954295158386, 0.8823890089988708, 0.9722826480865479, 1.06217622756958, 1.1520698070526123, 1.2419633865356445, 1.3318569660186768, 1.4217506647109985, 1.5116442441940308, 1.601537823677063, 1.6914314031600952, 1.781325101852417, 1.8712186813354492, 1.9611122608184814, 2.0510058403015137, 2.140899419784546, 2.230792999267578, 2.3206865787506104, 2.4105801582336426, 2.500473737716675, 2.590367317199707, 2.6802611351013184, 2.7701544761657715, 2.860048294067383, 2.949941873550415]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 7.0, 5.0, 8.0, 12.0, 20.0, 36.0, 34.0, 52.0, 72.0, 104.0, 141.0, 189.0, 317.0, 541.0, 1109.0, 3470.0, 51455272.0, 5843.0, 1321.0, 668.0, 330.0, 216.0, 145.0, 102.0, 78.0, 74.0, 44.0, 40.0, 26.0, 14.0, 8.0, 13.0, 2.0, 7.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.327807426452637, -11.8970308303833, -11.466254234313965, -11.035478591918945, -10.60470199584961, -10.173925399780273, -9.743148803710938, -9.312372207641602, -8.881596565246582, -8.450819969177246, -8.02004337310791, -7.589267253875732, -7.158491134643555, -6.727714538574219, -6.296937942504883, -5.866161823272705, -5.435385227203369, -5.004608631134033, -4.5738325119018555, -4.1430559158325195, -3.712279796600342, -3.281503200531006, -2.850726842880249, -2.419950485229492, -1.9891741275787354, -1.5583977699279785, -1.1276214122772217, -0.6968449354171753, -0.26606857776641846, 0.16470789909362793, 0.5954842567443848, 1.0262606143951416, 1.4570369720458984, 1.8878133296966553, 2.318589687347412, 2.749366283416748, 3.180142402648926, 3.6109189987182617, 4.041695594787598, 4.472471714019775, 4.903247833251953, 5.334024429321289, 5.764800548553467, 6.195577144622803, 6.6263532638549805, 7.057129859924316, 7.487906455993652, 7.91868257522583, 8.349458694458008, 8.780235290527344, 9.21101188659668, 9.6417875289917, 10.072564125061035, 10.503340721130371, 10.934117317199707, 11.364892959594727, 11.795670509338379, 12.226447105407715, 12.65722370147705, 13.08799934387207, 13.518775939941406, 13.949552536010742, 14.380329132080078, 14.811105728149414, 15.241881370544434]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 7.0, 2.0, 12.0, 14.0, 21.0, 26.0, 45.0, 64.0, 85.0, 149.0, 228.0, 342.0, 473.0, 762.0, 1194.0, 1898.0, 2865.0, 4780.0, 7847.0, 13950.0, 24462.0, 46299.0, 87612.0, 169525.0, 320098.0, 567118.0, 3707758.0, 608206.0, 339730.0, 181425.0, 93769.0, 49019.0, 25884.0, 14412.0, 8160.0, 4854.0, 2985.0, 1858.0, 1228.0, 783.0, 496.0, 347.0, 241.0, 145.0, 88.0, 69.0, 43.0, 23.0, 15.0, 10.0, 6.0, 5.0, 4.0, 6.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.78759765625, -0.76263427734375, -0.7376708984375, -0.71270751953125, -0.687744140625, -0.66278076171875, -0.6378173828125, -0.61285400390625, -0.587890625, -0.56292724609375, -0.5379638671875, -0.51300048828125, -0.488037109375, -0.46307373046875, -0.4381103515625, -0.41314697265625, -0.38818359375, -0.36322021484375, -0.3382568359375, -0.31329345703125, -0.288330078125, -0.26336669921875, -0.2384033203125, -0.21343994140625, -0.1884765625, -0.16351318359375, -0.1385498046875, -0.11358642578125, -0.088623046875, -0.06365966796875, -0.0386962890625, -0.01373291015625, 0.01123046875, 0.03619384765625, 0.0611572265625, 0.08612060546875, 0.111083984375, 0.13604736328125, 0.1610107421875, 0.18597412109375, 0.2109375, 0.23590087890625, 0.2608642578125, 0.28582763671875, 0.310791015625, 0.33575439453125, 0.3607177734375, 0.38568115234375, 0.41064453125, 0.43560791015625, 0.4605712890625, 0.48553466796875, 0.510498046875, 0.53546142578125, 0.5604248046875, 0.58538818359375, 0.6103515625, 0.63531494140625, 0.6602783203125, 0.68524169921875, 0.710205078125, 0.73516845703125, 0.7601318359375, 0.78509521484375, 0.81005859375]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 6.0, 7.0, 6.0, 7.0, 9.0, 20.0, 14.0, 22.0, 21.0, 29.0, 31.0, 34.0, 34.0, 42.0, 46.0, 43.0, 49.0, 90.0, 969.0, 108.0, 54.0, 57.0, 42.0, 41.0, 44.0, 31.0, 22.0, 32.0, 20.0, 24.0, 15.0, 11.0, 6.0, 16.0, 5.0, 7.0, 2.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.390625, -9.110595703125, -8.83056640625, -8.550537109375, -8.2705078125, -7.990478515625, -7.71044921875, -7.430419921875, -7.150390625, -6.870361328125, -6.59033203125, -6.310302734375, -6.0302734375, -5.750244140625, -5.47021484375, -5.190185546875, -4.91015625, -4.630126953125, -4.35009765625, -4.070068359375, -3.7900390625, -3.510009765625, -3.22998046875, -2.949951171875, -2.669921875, -2.389892578125, -2.10986328125, -1.829833984375, -1.5498046875, -1.269775390625, -0.98974609375, -0.709716796875, -0.4296875, -0.149658203125, 0.13037109375, 0.410400390625, 0.6904296875, 0.970458984375, 1.25048828125, 1.530517578125, 1.810546875, 2.090576171875, 2.37060546875, 2.650634765625, 2.9306640625, 3.210693359375, 3.49072265625, 3.770751953125, 4.05078125, 4.330810546875, 4.61083984375, 4.890869140625, 5.1708984375, 5.450927734375, 5.73095703125, 6.010986328125, 6.291015625, 6.571044921875, 6.85107421875, 7.131103515625, 7.4111328125, 7.691162109375, 7.97119140625, 8.251220703125, 8.53125]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 6.0, 5.0, 6.0, 14.0, 21.0, 34.0, 44.0, 69.0, 118.0, 137.0, 203.0, 321.0, 456.0, 732.0, 1045.0, 1656.0, 2637.0, 4053.0, 6611.0, 10897.0, 17666.0, 30548.0, 51360.0, 89208.0, 149477.0, 243964.0, 362976.0, 608303.0, 3491047.0, 429515.0, 306232.0, 195766.0, 117228.0, 68352.0, 39872.0, 23387.0, 14168.0, 8637.0, 5303.0, 3302.0, 2136.0, 1305.0, 871.0, 578.0, 347.0, 268.0, 170.0, 125.0, 85.0, 61.0, 38.0, 26.0, 20.0, 12.0, 13.0, 7.0, 7.0, 1.0, 0.0, 2.0], "bins": [-0.4912109375, -0.4759864807128906, -0.46076202392578125, -0.4455375671386719, -0.4303131103515625, -0.4150886535644531, -0.39986419677734375, -0.3846397399902344, -0.369415283203125, -0.3541908264160156, -0.33896636962890625, -0.3237419128417969, -0.3085174560546875, -0.2932929992675781, -0.27806854248046875, -0.2628440856933594, -0.24761962890625, -0.23239517211914062, -0.21717071533203125, -0.20194625854492188, -0.1867218017578125, -0.17149734497070312, -0.15627288818359375, -0.14104843139648438, -0.125823974609375, -0.11059951782226562, -0.09537506103515625, -0.08015060424804688, -0.0649261474609375, -0.049701690673828125, -0.03447723388671875, -0.019252777099609375, -0.0040283203125, 0.011196136474609375, 0.02642059326171875, 0.041645050048828125, 0.0568695068359375, 0.07209396362304688, 0.08731842041015625, 0.10254287719726562, 0.117767333984375, 0.13299179077148438, 0.14821624755859375, 0.16344070434570312, 0.1786651611328125, 0.19388961791992188, 0.20911407470703125, 0.22433853149414062, 0.23956298828125, 0.2547874450683594, 0.27001190185546875, 0.2852363586425781, 0.3004608154296875, 0.3156852722167969, 0.33090972900390625, 0.3461341857910156, 0.361358642578125, 0.3765830993652344, 0.39180755615234375, 0.4070320129394531, 0.4222564697265625, 0.4374809265136719, 0.45270538330078125, 0.4679298400878906, 0.483154296875]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 9.0, 9.0, 12.0, 10.0, 14.0, 18.0, 25.0, 15.0, 22.0, 24.0, 33.0, 37.0, 35.0, 41.0, 36.0, 35.0, 37.0, 38.0, 422.0, 684.0, 46.0, 44.0, 38.0, 44.0, 27.0, 32.0, 31.0, 31.0, 25.0, 25.0, 30.0, 13.0, 14.0, 18.0, 9.0, 9.0, 6.0, 5.0, 6.0, 3.0, 5.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.1640625, -6.94091796875, -6.7177734375, -6.49462890625, -6.271484375, -6.04833984375, -5.8251953125, -5.60205078125, -5.37890625, -5.15576171875, -4.9326171875, -4.70947265625, -4.486328125, -4.26318359375, -4.0400390625, -3.81689453125, -3.59375, -3.37060546875, -3.1474609375, -2.92431640625, -2.701171875, -2.47802734375, -2.2548828125, -2.03173828125, -1.80859375, -1.58544921875, -1.3623046875, -1.13916015625, -0.916015625, -0.69287109375, -0.4697265625, -0.24658203125, -0.0234375, 0.19970703125, 0.4228515625, 0.64599609375, 0.869140625, 1.09228515625, 1.3154296875, 1.53857421875, 1.76171875, 1.98486328125, 2.2080078125, 2.43115234375, 2.654296875, 2.87744140625, 3.1005859375, 3.32373046875, 3.546875, 3.77001953125, 3.9931640625, 4.21630859375, 4.439453125, 4.66259765625, 4.8857421875, 5.10888671875, 5.33203125, 5.55517578125, 5.7783203125, 6.00146484375, 6.224609375, 6.44775390625, 6.6708984375, 6.89404296875, 7.1171875]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 2.0, 6.0, 15.0, 14.0, 22.0, 33.0, 42.0, 65.0, 114.0, 155.0, 223.0, 292.0, 459.0, 693.0, 1046.0, 1751.0, 2905.0, 4997.0, 8948.0, 16815.0, 33974.0, 69716.0, 159678.0, 5644188.0, 188231.0, 77260.0, 37278.0, 18605.0, 9896.0, 5532.0, 3168.0, 1852.0, 1161.0, 733.0, 493.0, 328.0, 193.0, 170.0, 109.0, 75.0, 51.0, 42.0, 42.0, 15.0, 22.0, 11.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0], "bins": [-1.63671875, -1.584869384765625, -1.53302001953125, -1.481170654296875, -1.4293212890625, -1.377471923828125, -1.32562255859375, -1.273773193359375, -1.221923828125, -1.170074462890625, -1.11822509765625, -1.066375732421875, -1.0145263671875, -0.962677001953125, -0.91082763671875, -0.858978271484375, -0.80712890625, -0.755279541015625, -0.70343017578125, -0.651580810546875, -0.5997314453125, -0.547882080078125, -0.49603271484375, -0.444183349609375, -0.392333984375, -0.340484619140625, -0.28863525390625, -0.236785888671875, -0.1849365234375, -0.133087158203125, -0.08123779296875, -0.029388427734375, 0.0224609375, 0.074310302734375, 0.12615966796875, 0.178009033203125, 0.2298583984375, 0.281707763671875, 0.33355712890625, 0.385406494140625, 0.437255859375, 0.489105224609375, 0.54095458984375, 0.592803955078125, 0.6446533203125, 0.696502685546875, 0.74835205078125, 0.800201416015625, 0.85205078125, 0.903900146484375, 0.95574951171875, 1.007598876953125, 1.0594482421875, 1.111297607421875, 1.16314697265625, 1.214996337890625, 1.266845703125, 1.318695068359375, 1.37054443359375, 1.422393798828125, 1.4742431640625, 1.526092529296875, 1.57794189453125, 1.629791259765625, 1.681640625]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 1.0, 8.0, 6.0, 12.0, 8.0, 17.0, 12.0, 12.0, 14.0, 28.0, 19.0, 37.0, 29.0, 29.0, 38.0, 44.0, 43.0, 43.0, 27.0, 60.0, 1028.0, 78.0, 42.0, 40.0, 49.0, 41.0, 42.0, 37.0, 24.0, 26.0, 24.0, 13.0, 17.0, 14.0, 9.0, 12.0, 15.0, 14.0, 0.0, 5.0, 4.0, 3.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.80078125, -7.52801513671875, -7.2552490234375, -6.98248291015625, -6.709716796875, -6.43695068359375, -6.1641845703125, -5.89141845703125, -5.61865234375, -5.34588623046875, -5.0731201171875, -4.80035400390625, -4.527587890625, -4.25482177734375, -3.9820556640625, -3.70928955078125, -3.4365234375, -3.16375732421875, -2.8909912109375, -2.61822509765625, -2.345458984375, -2.07269287109375, -1.7999267578125, -1.52716064453125, -1.25439453125, -0.98162841796875, -0.7088623046875, -0.43609619140625, -0.163330078125, 0.10943603515625, 0.3822021484375, 0.65496826171875, 0.927734375, 1.20050048828125, 1.4732666015625, 1.74603271484375, 2.018798828125, 2.29156494140625, 2.5643310546875, 2.83709716796875, 3.10986328125, 3.38262939453125, 3.6553955078125, 3.92816162109375, 4.200927734375, 4.47369384765625, 4.7464599609375, 5.01922607421875, 5.2919921875, 5.56475830078125, 5.8375244140625, 6.11029052734375, 6.383056640625, 6.65582275390625, 6.9285888671875, 7.20135498046875, 7.47412109375, 7.74688720703125, 8.0196533203125, 8.29241943359375, 8.565185546875, 8.83795166015625, 9.1107177734375, 9.38348388671875, 9.65625]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 2.0, 3.0, 8.0, 11.0, 19.0, 49.0, 100.0, 280.0, 302.0, 132.0, 49.0, 22.0, 11.0, 11.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-26.92098045349121, -25.890653610229492, -24.860328674316406, -23.830001831054688, -22.79967498779297, -21.76934814453125, -20.73902130126953, -19.708696365356445, -18.678369522094727, -17.648042678833008, -16.617717742919922, -15.587390899658203, -14.557064056396484, -13.526737213134766, -12.496411323547363, -11.466085433959961, -10.435758590698242, -9.405431747436523, -8.375105857849121, -7.3447794914245605, -6.314453125, -5.2841267585754395, -4.253800392150879, -3.2234740257263184, -2.193147659301758, -1.1628212928771973, -0.13249492645263672, 0.8978314399719238, 1.9281578063964844, 2.958484172821045, 3.9888105392456055, 5.019136905670166, 6.049465179443359, 7.07979154586792, 8.11011791229248, 9.140443801879883, 10.170770645141602, 11.20109748840332, 12.231423377990723, 13.261749267578125, 14.292076110839844, 15.322402954101562, 16.35272979736328, 17.383054733276367, 18.413381576538086, 19.443708419799805, 20.47403335571289, 21.50436019897461, 22.534687042236328, 23.565013885498047, 24.595340728759766, 25.62566566467285, 26.65599250793457, 27.68631935119629, 28.716644287109375, 29.746971130371094, 30.777297973632812, 31.80762481689453, 32.83795166015625, 33.86827850341797, 34.89860534667969, 35.92892837524414, 36.95925521850586, 37.98958206176758, 39.0199089050293]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 7.0, 9.0, 6.0, 5.0, 8.0, 11.0, 15.0, 25.0, 28.0, 36.0, 41.0, 54.0, 77.0, 95.0, 102.0, 111.0, 94.0, 63.0, 51.0, 29.0, 25.0, 19.0, 23.0, 16.0, 10.0, 10.0, 7.0, 9.0, 3.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-37.89131164550781, -36.70288848876953, -35.514469146728516, -34.326045989990234, -33.13762664794922, -31.949203491210938, -30.760780334472656, -29.572359085083008, -28.38393783569336, -27.19551658630371, -26.007095336914062, -24.81867218017578, -23.630250930786133, -22.441829681396484, -21.253406524658203, -20.064985275268555, -18.876564025878906, -17.688142776489258, -16.49972152709961, -15.311298370361328, -14.12287712097168, -12.934455871582031, -11.746033668518066, -10.557611465454102, -9.369190216064453, -8.180768966674805, -6.99234676361084, -5.803925037384033, -4.615503311157227, -3.42708158493042, -2.2386598587036133, -1.0502376556396484, 0.13818359375, 1.3266053199768066, 2.5150270462036133, 3.70344877243042, 4.891870498657227, 6.080292224884033, 7.26871395111084, 8.457136154174805, 9.645557403564453, 10.833978652954102, 12.022400856018066, 13.210823059082031, 14.39924430847168, 15.587665557861328, 16.77608871459961, 17.964509963989258, 19.152931213378906, 20.341352462768555, 21.529773712158203, 22.718196868896484, 23.906618118286133, 25.09503936767578, 26.283462524414062, 27.47188377380371, 28.66030502319336, 29.848726272583008, 31.037147521972656, 32.22557067871094, 33.41399383544922, 34.602413177490234, 35.790836334228516, 36.97925567626953, 38.16767883300781]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 6.0, 4.0, 3.0, 2.0, 7.0, 9.0, 6.0, 7.0, 12.0, 17.0, 30.0, 45.0, 47.0, 92.0, 141.0, 225.0, 363.0, 612.0, 983.0, 1657.0, 3410.0, 7133.0, 22565.0, 639471.0, 3477702.0, 24569.0, 7503.0, 3331.0, 1713.0, 1010.0, 578.0, 343.0, 216.0, 146.0, 97.0, 59.0, 45.0, 40.0, 27.0, 15.0, 16.0, 12.0, 2.0, 5.0, 5.0, 3.0, 3.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.143798828125, -0.13866806030273438, -0.13353729248046875, -0.12840652465820312, -0.1232757568359375, -0.11814498901367188, -0.11301422119140625, -0.10788345336914062, -0.102752685546875, -0.09762191772460938, -0.09249114990234375, -0.08736038208007812, -0.0822296142578125, -0.07709884643554688, -0.07196807861328125, -0.06683731079101562, -0.06170654296875, -0.056575775146484375, -0.05144500732421875, -0.046314239501953125, -0.0411834716796875, -0.036052703857421875, -0.03092193603515625, -0.025791168212890625, -0.020660400390625, -0.015529632568359375, -0.01039886474609375, -0.005268096923828125, -0.0001373291015625, 0.004993438720703125, 0.01012420654296875, 0.015254974365234375, 0.0203857421875, 0.025516510009765625, 0.03064727783203125, 0.035778045654296875, 0.0409088134765625, 0.046039581298828125, 0.05117034912109375, 0.056301116943359375, 0.061431884765625, 0.06656265258789062, 0.07169342041015625, 0.07682418823242188, 0.0819549560546875, 0.08708572387695312, 0.09221649169921875, 0.09734725952148438, 0.10247802734375, 0.10760879516601562, 0.11273956298828125, 0.11787033081054688, 0.1230010986328125, 0.12813186645507812, 0.13326263427734375, 0.13839340209960938, 0.143524169921875, 0.14865493774414062, 0.15378570556640625, 0.15891647338867188, 0.1640472412109375, 0.16917800903320312, 0.17430877685546875, 0.17943954467773438, 0.1845703125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 2.0, 2.0, 3.0, 5.0, 5.0, 4.0, 5.0, 5.0, 3.0, 11.0, 3.0, 13.0, 11.0, 14.0, 20.0, 43.0, 555.0, 142.0, 43.0, 13.0, 6.0, 12.0, 10.0, 13.0, 8.0, 8.0, 7.0, 7.0, 5.0, 2.0, 1.0, 4.0, 5.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06463623046875, -0.06247138977050781, -0.060306549072265625, -0.05814170837402344, -0.05597686767578125, -0.05381202697753906, -0.051647186279296875, -0.04948234558105469, -0.0473175048828125, -0.04515266418457031, -0.042987823486328125, -0.04082298278808594, -0.03865814208984375, -0.03649330139160156, -0.034328460693359375, -0.03216361999511719, -0.029998779296875, -0.027833938598632812, -0.025669097900390625, -0.023504257202148438, -0.02133941650390625, -0.019174575805664062, -0.017009735107421875, -0.014844894409179688, -0.0126800537109375, -0.010515213012695312, -0.008350372314453125, -0.0061855316162109375, -0.00402069091796875, -0.0018558502197265625, 0.000308990478515625, 0.0024738311767578125, 0.004638671875, 0.0068035125732421875, 0.008968353271484375, 0.011133193969726562, 0.01329803466796875, 0.015462875366210938, 0.017627716064453125, 0.019792556762695312, 0.0219573974609375, 0.024122238159179688, 0.026287078857421875, 0.028451919555664062, 0.03061676025390625, 0.03278160095214844, 0.034946441650390625, 0.03711128234863281, 0.039276123046875, 0.04144096374511719, 0.043605804443359375, 0.04577064514160156, 0.04793548583984375, 0.05010032653808594, 0.052265167236328125, 0.05443000793457031, 0.0565948486328125, 0.05875968933105469, 0.060924530029296875, 0.06308937072753906, 0.06525421142578125, 0.06741905212402344, 0.06958389282226562, 0.07174873352050781, 0.07391357421875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 3.0, 5.0, 8.0, 7.0, 7.0, 12.0, 19.0, 37.0, 61.0, 162.0, 385.0, 898.0, 2628.0, 10303.0, 76534.0, 3835437.0, 243155.0, 18806.0, 4011.0, 1144.0, 384.0, 117.0, 54.0, 44.0, 14.0, 14.0, 6.0, 5.0, 5.0, 4.0, 1.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.256103515625, -0.2487201690673828, -0.24133682250976562, -0.23395347595214844, -0.22657012939453125, -0.21918678283691406, -0.21180343627929688, -0.2044200897216797, -0.1970367431640625, -0.1896533966064453, -0.18227005004882812, -0.17488670349121094, -0.16750335693359375, -0.16012001037597656, -0.15273666381835938, -0.1453533172607422, -0.137969970703125, -0.1305866241455078, -0.12320327758789062, -0.11581993103027344, -0.10843658447265625, -0.10105323791503906, -0.09366989135742188, -0.08628654479980469, -0.0789031982421875, -0.07151985168457031, -0.06413650512695312, -0.05675315856933594, -0.04936981201171875, -0.04198646545410156, -0.034603118896484375, -0.027219772338867188, -0.01983642578125, -0.012453079223632812, -0.005069732666015625, 0.0023136138916015625, 0.00969696044921875, 0.017080307006835938, 0.024463653564453125, 0.03184700012207031, 0.0392303466796875, 0.04661369323730469, 0.053997039794921875, 0.06138038635253906, 0.06876373291015625, 0.07614707946777344, 0.08353042602539062, 0.09091377258300781, 0.098297119140625, 0.10568046569824219, 0.11306381225585938, 0.12044715881347656, 0.12783050537109375, 0.13521385192871094, 0.14259719848632812, 0.1499805450439453, 0.1573638916015625, 0.1647472381591797, 0.17213058471679688, 0.17951393127441406, 0.18689727783203125, 0.19428062438964844, 0.20166397094726562, 0.2090473175048828, 0.2164306640625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 2.0, 2.0, 11.0, 13.0, 15.0, 16.0, 17.0, 31.0, 37.0, 64.0, 95.0, 190.0, 497.0, 1629.0, 848.0, 237.0, 131.0, 66.0, 42.0, 26.0, 25.0, 18.0, 14.0, 14.0, 5.0, 6.0, 3.0, 6.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08892822265625, -0.0864400863647461, -0.08395195007324219, -0.08146381378173828, -0.07897567749023438, -0.07648754119873047, -0.07399940490722656, -0.07151126861572266, -0.06902313232421875, -0.06653499603271484, -0.06404685974121094, -0.06155872344970703, -0.059070587158203125, -0.05658245086669922, -0.05409431457519531, -0.051606178283691406, -0.0491180419921875, -0.046629905700683594, -0.04414176940917969, -0.04165363311767578, -0.039165496826171875, -0.03667736053466797, -0.03418922424316406, -0.031701087951660156, -0.02921295166015625, -0.026724815368652344, -0.024236679077148438, -0.02174854278564453, -0.019260406494140625, -0.01677227020263672, -0.014284133911132812, -0.011795997619628906, -0.009307861328125, -0.006819725036621094, -0.0043315887451171875, -0.0018434524536132812, 0.000644683837890625, 0.0031328201293945312, 0.0056209564208984375, 0.008109092712402344, 0.01059722900390625, 0.013085365295410156, 0.015573501586914062, 0.01806163787841797, 0.020549774169921875, 0.02303791046142578, 0.025526046752929688, 0.028014183044433594, 0.0305023193359375, 0.032990455627441406, 0.03547859191894531, 0.03796672821044922, 0.040454864501953125, 0.04294300079345703, 0.04543113708496094, 0.047919273376464844, 0.05040740966796875, 0.052895545959472656, 0.05538368225097656, 0.05787181854248047, 0.060359954833984375, 0.06284809112548828, 0.06533622741699219, 0.0678243637084961, 0.0703125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 7.0, 1.0, 9.0, 45.0, 321.0, 552.0, 60.0, 10.0, 4.0, 1.0, 1.0], "bins": [-2.028738260269165, -1.9939026832580566, -1.9590669870376587, -1.9242314100265503, -1.8893957138061523, -1.854560136795044, -1.819724440574646, -1.7848888635635376, -1.7500531673431396, -1.7152175903320312, -1.6803818941116333, -1.645546317100525, -1.610710620880127, -1.5758750438690186, -1.5410393476486206, -1.5062037706375122, -1.4713681936264038, -1.4365326166152954, -1.4016969203948975, -1.366861343383789, -1.3320256471633911, -1.2971900701522827, -1.2623543739318848, -1.2275187969207764, -1.192683219909668, -1.1578476428985596, -1.1230119466781616, -1.0881763696670532, -1.0533406734466553, -1.0185050964355469, -0.9836694598197937, -0.9488338232040405, -0.9139982461929321, -0.879162609577179, -0.8443269729614258, -0.8094913363456726, -0.7746556997299194, -0.739820122718811, -0.7049844861030579, -0.6701488494873047, -0.6353132128715515, -0.6004775762557983, -0.5656419396400452, -0.530806303024292, -0.4959706962108612, -0.46113505959510803, -0.42629945278167725, -0.3914638161659241, -0.3566281795501709, -0.3217925429344177, -0.28695690631866455, -0.25212129950523376, -0.2172856628894806, -0.18245002627372742, -0.14761440455913544, -0.11277878284454346, -0.07794314622879028, -0.043107517063617706, -0.00827188789844513, 0.026563741266727448, 0.061399370431900024, 0.0962350070476532, 0.13107062876224518, 0.16590625047683716, 0.20074188709259033]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 4.0, 5.0, 8.0, 6.0, 11.0, 17.0, 16.0, 26.0, 26.0, 26.0, 45.0, 45.0, 48.0, 42.0, 51.0, 70.0, 57.0, 59.0, 61.0, 59.0, 54.0, 42.0, 36.0, 40.0, 29.0, 30.0, 25.0, 10.0, 14.0, 15.0, 8.0, 4.0, 6.0, 2.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2548907995223999, -0.2457183450460434, -0.2365458905696869, -0.22737343609333038, -0.21820098161697388, -0.20902852714061737, -0.19985607266426086, -0.19068363308906555, -0.18151116371154785, -0.17233870923519135, -0.16316625475883484, -0.15399380028247833, -0.14482134580612183, -0.13564889132976532, -0.1264764368534088, -0.1173039898276329, -0.108131542801857, -0.09895908832550049, -0.08978663384914398, -0.08061417937278748, -0.07144172489643097, -0.06226927414536476, -0.05309682339429855, -0.04392436891794205, -0.03475191444158554, -0.025579459965229034, -0.016407007351517677, -0.00723455473780632, 0.0019378997385501862, 0.011110354214906693, 0.0202828049659729, 0.029455259442329407, 0.03862771391868591, 0.04780016839504242, 0.056972622871398926, 0.06614507734775543, 0.07531753182411194, 0.08448998630046844, 0.09366243332624435, 0.10283488780260086, 0.11200734227895737, 0.12117979675531387, 0.13035224378108978, 0.1395246982574463, 0.1486971527338028, 0.1578696072101593, 0.1670420616865158, 0.17621451616287231, 0.18538697063922882, 0.19455942511558533, 0.20373187959194183, 0.21290433406829834, 0.22207678854465485, 0.23124924302101135, 0.24042168259620667, 0.24959415197372437, 0.2587665915489197, 0.267939031124115, 0.2771115005016327, 0.286283940076828, 0.2954564094543457, 0.304628849029541, 0.3138013184070587, 0.32297375798225403, 0.33214622735977173]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 4.0, 2.0, 8.0, 14.0, 22.0, 20.0, 24.0, 31.0, 71.0, 85.0, 132.0, 152.0, 246.0, 378.0, 480.0, 699.0, 1135.0, 1628.0, 2450.0, 3811.0, 6190.0, 10296.0, 19216.0, 44230.0, 804667.0, 90915.0, 26485.0, 13639.0, 7797.0, 4742.0, 2901.0, 1959.0, 1311.0, 845.0, 605.0, 397.0, 284.0, 201.0, 143.0, 91.0, 70.0, 51.0, 51.0, 19.0, 18.0, 12.0, 10.0, 8.0, 9.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.2327880859375, -0.2254505157470703, -0.21811294555664062, -0.21077537536621094, -0.20343780517578125, -0.19610023498535156, -0.18876266479492188, -0.1814250946044922, -0.1740875244140625, -0.1667499542236328, -0.15941238403320312, -0.15207481384277344, -0.14473724365234375, -0.13739967346191406, -0.13006210327148438, -0.12272453308105469, -0.115386962890625, -0.10804939270019531, -0.10071182250976562, -0.09337425231933594, -0.08603668212890625, -0.07869911193847656, -0.07136154174804688, -0.06402397155761719, -0.0566864013671875, -0.04934883117675781, -0.042011260986328125, -0.03467369079589844, -0.02733612060546875, -0.019998550415039062, -0.012660980224609375, -0.0053234100341796875, 0.00201416015625, 0.009351730346679688, 0.016689300537109375, 0.024026870727539062, 0.03136444091796875, 0.03870201110839844, 0.046039581298828125, 0.05337715148925781, 0.0607147216796875, 0.06805229187011719, 0.07538986206054688, 0.08272743225097656, 0.09006500244140625, 0.09740257263183594, 0.10474014282226562, 0.11207771301269531, 0.119415283203125, 0.1267528533935547, 0.13409042358398438, 0.14142799377441406, 0.14876556396484375, 0.15610313415527344, 0.16344070434570312, 0.1707782745361328, 0.1781158447265625, 0.1854534149169922, 0.19279098510742188, 0.20012855529785156, 0.20746612548828125, 0.21480369567871094, 0.22214126586914062, 0.2294788360595703, 0.23681640625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 1.0, 3.0, 8.0, 4.0, 4.0, 7.0, 2.0, 5.0, 12.0, 11.0, 14.0, 14.0, 23.0, 53.0, 437.0, 243.0, 40.0, 19.0, 8.0, 11.0, 14.0, 9.0, 10.0, 5.0, 6.0, 7.0, 6.0, 4.0, 4.0, 4.0, 0.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06396484375, -0.06182289123535156, -0.059680938720703125, -0.05753898620605469, -0.05539703369140625, -0.05325508117675781, -0.051113128662109375, -0.04897117614746094, -0.0468292236328125, -0.04468727111816406, -0.042545318603515625, -0.04040336608886719, -0.03826141357421875, -0.03611946105957031, -0.033977508544921875, -0.03183555603027344, -0.029693603515625, -0.027551651000976562, -0.025409698486328125, -0.023267745971679688, -0.02112579345703125, -0.018983840942382812, -0.016841888427734375, -0.014699935913085938, -0.0125579833984375, -0.010416030883789062, -0.008274078369140625, -0.0061321258544921875, -0.00399017333984375, -0.0018482208251953125, 0.000293731689453125, 0.0024356842041015625, 0.00457763671875, 0.0067195892333984375, 0.008861541748046875, 0.011003494262695312, 0.01314544677734375, 0.015287399291992188, 0.017429351806640625, 0.019571304321289062, 0.0217132568359375, 0.023855209350585938, 0.025997161865234375, 0.028139114379882812, 0.03028106689453125, 0.03242301940917969, 0.034564971923828125, 0.03670692443847656, 0.038848876953125, 0.04099082946777344, 0.043132781982421875, 0.04527473449707031, 0.04741668701171875, 0.04955863952636719, 0.051700592041015625, 0.05384254455566406, 0.0559844970703125, 0.05812644958496094, 0.060268402099609375, 0.06241035461425781, 0.06455230712890625, 0.06669425964355469, 0.06883621215820312, 0.07097816467285156, 0.0731201171875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 10.0, 8.0, 16.0, 15.0, 21.0, 20.0, 36.0, 45.0, 70.0, 61.0, 95.0, 132.0, 206.0, 371.0, 728.0, 1555.0, 3538.0, 8115.0, 23018.0, 79520.0, 406666.0, 407787.0, 78802.0, 23000.0, 8146.0, 3308.0, 1481.0, 715.0, 353.0, 203.0, 139.0, 83.0, 63.0, 51.0, 42.0, 42.0, 19.0, 26.0, 15.0, 9.0, 8.0, 10.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.160888671875, -0.15586090087890625, -0.1508331298828125, -0.14580535888671875, -0.140777587890625, -0.13574981689453125, -0.1307220458984375, -0.12569427490234375, -0.12066650390625, -0.11563873291015625, -0.1106109619140625, -0.10558319091796875, -0.100555419921875, -0.09552764892578125, -0.0904998779296875, -0.08547210693359375, -0.0804443359375, -0.07541656494140625, -0.0703887939453125, -0.06536102294921875, -0.060333251953125, -0.05530548095703125, -0.0502777099609375, -0.04524993896484375, -0.04022216796875, -0.03519439697265625, -0.0301666259765625, -0.02513885498046875, -0.020111083984375, -0.01508331298828125, -0.0100555419921875, -0.00502777099609375, 0.0, 0.00502777099609375, 0.0100555419921875, 0.01508331298828125, 0.020111083984375, 0.02513885498046875, 0.0301666259765625, 0.03519439697265625, 0.04022216796875, 0.04524993896484375, 0.0502777099609375, 0.05530548095703125, 0.060333251953125, 0.06536102294921875, 0.0703887939453125, 0.07541656494140625, 0.0804443359375, 0.08547210693359375, 0.0904998779296875, 0.09552764892578125, 0.100555419921875, 0.10558319091796875, 0.1106109619140625, 0.11563873291015625, 0.12066650390625, 0.12569427490234375, 0.1307220458984375, 0.13574981689453125, 0.140777587890625, 0.14580535888671875, 0.1508331298828125, 0.15586090087890625, 0.160888671875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 2.0, 3.0, 7.0, 7.0, 7.0, 10.0, 17.0, 15.0, 10.0, 7.0, 26.0, 31.0, 35.0, 21.0, 45.0, 46.0, 42.0, 38.0, 47.0, 46.0, 42.0, 50.0, 47.0, 47.0, 57.0, 39.0, 31.0, 41.0, 20.0, 26.0, 31.0, 18.0, 12.0, 17.0, 20.0, 11.0, 6.0, 6.0, 4.0, 6.0, 5.0, 4.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2490234375, -0.24152374267578125, -0.2340240478515625, -0.22652435302734375, -0.219024658203125, -0.21152496337890625, -0.2040252685546875, -0.19652557373046875, -0.18902587890625, -0.18152618408203125, -0.1740264892578125, -0.16652679443359375, -0.159027099609375, -0.15152740478515625, -0.1440277099609375, -0.13652801513671875, -0.1290283203125, -0.12152862548828125, -0.1140289306640625, -0.10652923583984375, -0.099029541015625, -0.09152984619140625, -0.0840301513671875, -0.07653045654296875, -0.06903076171875, -0.06153106689453125, -0.0540313720703125, -0.04653167724609375, -0.039031982421875, -0.03153228759765625, -0.0240325927734375, -0.01653289794921875, -0.009033203125, -0.00153350830078125, 0.0059661865234375, 0.01346588134765625, 0.020965576171875, 0.02846527099609375, 0.0359649658203125, 0.04346466064453125, 0.05096435546875, 0.05846405029296875, 0.0659637451171875, 0.07346343994140625, 0.080963134765625, 0.08846282958984375, 0.0959625244140625, 0.10346221923828125, 0.1109619140625, 0.11846160888671875, 0.1259613037109375, 0.13346099853515625, 0.140960693359375, 0.14846038818359375, 0.1559600830078125, 0.16345977783203125, 0.17095947265625, 0.17845916748046875, 0.1859588623046875, 0.19345855712890625, 0.200958251953125, 0.20845794677734375, 0.2159576416015625, 0.22345733642578125, 0.23095703125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 2.0, 2.0, 3.0, 9.0, 12.0, 21.0, 22.0, 39.0, 63.0, 113.0, 167.0, 318.0, 604.0, 1379.0, 3385.0, 10342.0, 47908.0, 487145.0, 437328.0, 44059.0, 9766.0, 3245.0, 1310.0, 565.0, 299.0, 178.0, 93.0, 70.0, 34.0, 17.0, 13.0, 9.0, 11.0, 7.0, 6.0, 8.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.086669921875, -0.08395957946777344, -0.08124923706054688, -0.07853889465332031, -0.07582855224609375, -0.07311820983886719, -0.07040786743164062, -0.06769752502441406, -0.0649871826171875, -0.06227684020996094, -0.059566497802734375, -0.05685615539550781, -0.05414581298828125, -0.05143547058105469, -0.048725128173828125, -0.04601478576660156, -0.043304443359375, -0.04059410095214844, -0.037883758544921875, -0.03517341613769531, -0.03246307373046875, -0.029752731323242188, -0.027042388916015625, -0.024332046508789062, -0.0216217041015625, -0.018911361694335938, -0.016201019287109375, -0.013490676879882812, -0.01078033447265625, -0.008069992065429688, -0.005359649658203125, -0.0026493072509765625, 6.103515625e-05, 0.0027713775634765625, 0.005481719970703125, 0.008192062377929688, 0.01090240478515625, 0.013612747192382812, 0.016323089599609375, 0.019033432006835938, 0.0217437744140625, 0.024454116821289062, 0.027164459228515625, 0.029874801635742188, 0.03258514404296875, 0.03529548645019531, 0.038005828857421875, 0.04071617126464844, 0.043426513671875, 0.04613685607910156, 0.048847198486328125, 0.05155754089355469, 0.05426788330078125, 0.05697822570800781, 0.059688568115234375, 0.06239891052246094, 0.0651092529296875, 0.06781959533691406, 0.07052993774414062, 0.07324028015136719, 0.07595062255859375, 0.07866096496582031, 0.08137130737304688, 0.08408164978027344, 0.0867919921875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 4.0, 5.0, 6.0, 6.0, 7.0, 11.0, 6.0, 15.0, 11.0, 14.0, 16.0, 22.0, 29.0, 35.0, 38.0, 65.0, 58.0, 63.0, 63.0, 71.0, 64.0, 57.0, 57.0, 44.0, 28.0, 41.0, 31.0, 30.0, 14.0, 18.0, 13.0, 16.0, 10.0, 6.0, 9.0, 6.0, 6.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.430511474609375e-05, -1.3804063200950623e-05, -1.3303011655807495e-05, -1.2801960110664368e-05, -1.230090856552124e-05, -1.1799857020378113e-05, -1.1298805475234985e-05, -1.0797753930091858e-05, -1.029670238494873e-05, -9.795650839805603e-06, -9.294599294662476e-06, -8.793547749519348e-06, -8.29249620437622e-06, -7.791444659233093e-06, -7.290393114089966e-06, -6.789341568946838e-06, -6.288290023803711e-06, -5.7872384786605835e-06, -5.286186933517456e-06, -4.785135388374329e-06, -4.284083843231201e-06, -3.7830322980880737e-06, -3.2819807529449463e-06, -2.780929207801819e-06, -2.2798776626586914e-06, -1.778826117515564e-06, -1.2777745723724365e-06, -7.767230272293091e-07, -2.7567148208618164e-07, 2.253800630569458e-07, 7.264316082000732e-07, 1.2274831533432007e-06, 1.7285346984863281e-06, 2.2295862436294556e-06, 2.730637788772583e-06, 3.2316893339157104e-06, 3.732740879058838e-06, 4.233792424201965e-06, 4.734843969345093e-06, 5.23589551448822e-06, 5.736947059631348e-06, 6.237998604774475e-06, 6.7390501499176025e-06, 7.24010169506073e-06, 7.741153240203857e-06, 8.242204785346985e-06, 8.743256330490112e-06, 9.24430787563324e-06, 9.745359420776367e-06, 1.0246410965919495e-05, 1.0747462511062622e-05, 1.124851405620575e-05, 1.1749565601348877e-05, 1.2250617146492004e-05, 1.2751668691635132e-05, 1.325272023677826e-05, 1.3753771781921387e-05, 1.4254823327064514e-05, 1.4755874872207642e-05, 1.5256926417350769e-05, 1.5757977962493896e-05, 1.6259029507637024e-05, 1.676008105278015e-05, 1.726113259792328e-05, 1.7762184143066406e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 5.0, 8.0, 9.0, 13.0, 17.0, 20.0, 59.0, 90.0, 138.0, 240.0, 602.0, 1592.0, 4777.0, 21573.0, 178881.0, 719144.0, 101171.0, 14390.0, 3657.0, 1199.0, 471.0, 224.0, 115.0, 66.0, 40.0, 16.0, 12.0, 14.0, 6.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09033203125, -0.08754253387451172, -0.08475303649902344, -0.08196353912353516, -0.07917404174804688, -0.0763845443725586, -0.07359504699707031, -0.07080554962158203, -0.06801605224609375, -0.06522655487060547, -0.06243705749511719, -0.059647560119628906, -0.056858062744140625, -0.054068565368652344, -0.05127906799316406, -0.04848957061767578, -0.0457000732421875, -0.04291057586669922, -0.04012107849121094, -0.037331581115722656, -0.034542083740234375, -0.031752586364746094, -0.028963088989257812, -0.02617359161376953, -0.02338409423828125, -0.02059459686279297, -0.017805099487304688, -0.015015602111816406, -0.012226104736328125, -0.009436607360839844, -0.0066471099853515625, -0.0038576126098632812, -0.001068115234375, 0.0017213821411132812, 0.0045108795166015625, 0.007300376892089844, 0.010089874267578125, 0.012879371643066406, 0.015668869018554688, 0.01845836639404297, 0.02124786376953125, 0.02403736114501953, 0.026826858520507812, 0.029616355895996094, 0.032405853271484375, 0.035195350646972656, 0.03798484802246094, 0.04077434539794922, 0.0435638427734375, 0.04635334014892578, 0.04914283752441406, 0.051932334899902344, 0.054721832275390625, 0.057511329650878906, 0.06030082702636719, 0.06309032440185547, 0.06587982177734375, 0.06866931915283203, 0.07145881652832031, 0.0742483139038086, 0.07703781127929688, 0.07982730865478516, 0.08261680603027344, 0.08540630340576172, 0.08819580078125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 3.0, 6.0, 6.0, 7.0, 14.0, 25.0, 24.0, 28.0, 31.0, 37.0, 56.0, 64.0, 73.0, 70.0, 80.0, 90.0, 87.0, 66.0, 52.0, 40.0, 39.0, 32.0, 24.0, 10.0, 10.0, 8.0, 4.0, 7.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06884765625, -0.06633663177490234, -0.06382560729980469, -0.06131458282470703, -0.058803558349609375, -0.05629253387451172, -0.05378150939941406, -0.051270484924316406, -0.04875946044921875, -0.046248435974121094, -0.04373741149902344, -0.04122638702392578, -0.038715362548828125, -0.03620433807373047, -0.03369331359863281, -0.031182289123535156, -0.0286712646484375, -0.026160240173339844, -0.023649215698242188, -0.02113819122314453, -0.018627166748046875, -0.01611614227294922, -0.013605117797851562, -0.011094093322753906, -0.00858306884765625, -0.006072044372558594, -0.0035610198974609375, -0.0010499954223632812, 0.001461029052734375, 0.003972053527832031, 0.0064830780029296875, 0.008994102478027344, 0.011505126953125, 0.014016151428222656, 0.016527175903320312, 0.01903820037841797, 0.021549224853515625, 0.02406024932861328, 0.026571273803710938, 0.029082298278808594, 0.03159332275390625, 0.034104347229003906, 0.03661537170410156, 0.03912639617919922, 0.041637420654296875, 0.04414844512939453, 0.04665946960449219, 0.049170494079589844, 0.0516815185546875, 0.054192543029785156, 0.05670356750488281, 0.05921459197998047, 0.061725616455078125, 0.06423664093017578, 0.06674766540527344, 0.0692586898803711, 0.07176971435546875, 0.0742807388305664, 0.07679176330566406, 0.07930278778076172, 0.08181381225585938, 0.08432483673095703, 0.08683586120605469, 0.08934688568115234, 0.09185791015625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [3.0, 4.0, 15.0, 35.0, 177.0, 576.0, 146.0, 40.0, 11.0, 2.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6978521943092346, -0.5693410038948059, -0.4408298134803772, -0.3123186230659485, -0.18380743265151978, -0.055296242237091064, 0.07321494817733765, 0.20172613859176636, 0.33023732900619507, 0.4587485194206238, 0.5872597098350525, 0.7157709002494812, 0.8442820906639099, 0.9727932810783386, 1.101304531097412, 1.2298157215118408, 1.3583269119262695, 1.4868381023406982, 1.615349292755127, 1.7438604831695557, 1.8723716735839844, 2.000882863998413, 2.129394054412842, 2.2579052448272705, 2.386416435241699, 2.514927625656128, 2.6434388160705566, 2.7719500064849854, 2.900461196899414, 3.0289723873138428, 3.1574835777282715, 3.2859947681427, 3.414505958557129, 3.5430171489715576, 3.6715283393859863, 3.800039529800415, 3.9285507202148438, 4.057062149047852, 4.185573101043701, 4.314084053039551, 4.442595481872559, 4.571106910705566, 4.699617862701416, 4.828128814697266, 4.956640243530273, 5.085151672363281, 5.213662624359131, 5.3421735763549805, 5.470685005187988, 5.599196434020996, 5.727707386016846, 5.856218338012695, 5.984729766845703, 6.113241195678711, 6.2417521476745605, 6.37026309967041, 6.498774528503418, 6.627285957336426, 6.755796909332275, 6.884307861328125, 7.012819290161133, 7.141330718994141, 7.26984167098999, 7.39835262298584, 7.526864051818848]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 6.0, 2.0, 5.0, 7.0, 2.0, 5.0, 3.0, 7.0, 9.0, 13.0, 20.0, 34.0, 51.0, 79.0, 108.0, 133.0, 140.0, 118.0, 83.0, 58.0, 39.0, 12.0, 16.0, 13.0, 6.0, 4.0, 7.0, 2.0, 8.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.230095386505127, -4.105755805969238, -3.9814162254333496, -3.857076644897461, -3.7327370643615723, -3.6083974838256836, -3.484057903289795, -3.3597183227539062, -3.2353787422180176, -3.111039161682129, -2.9866995811462402, -2.8623600006103516, -2.738020420074463, -2.613680839538574, -2.4893412590026855, -2.365001678466797, -2.240662097930908, -2.1163225173950195, -1.9919829368591309, -1.8676433563232422, -1.7433037757873535, -1.6189641952514648, -1.4946246147155762, -1.3702850341796875, -1.245945692062378, -1.1216061115264893, -0.9972665309906006, -0.8729269504547119, -0.7485873699188232, -0.6242478489875793, -0.4999082684516907, -0.375568687915802, -0.25122904777526855, -0.12688946723937988, -0.002549901604652405, 0.12178966403007507, 0.24612924456596375, 0.37046879529953003, 0.4948083758354187, 0.6191479563713074, 0.743487536907196, 0.8678271174430847, 0.9921666979789734, 1.1165062189102173, 1.240845799446106, 1.3651853799819946, 1.4895249605178833, 1.613864541053772, 1.7382041215896606, 1.8625437021255493, 1.986883282661438, 2.111222743988037, 2.235562324523926, 2.3599019050598145, 2.484241485595703, 2.608581066131592, 2.7329206466674805, 2.857260227203369, 2.981599807739258, 3.1059393882751465, 3.230278968811035, 3.354618549346924, 3.4789581298828125, 3.603297710418701, 3.72763729095459]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 4.0, 5.0, 6.0, 3.0, 7.0, 10.0, 14.0, 20.0, 24.0, 43.0, 60.0, 74.0, 98.0, 136.0, 218.0, 298.0, 432.0, 654.0, 968.0, 1613.0, 2574.0, 4730.0, 10664.0, 32215.0, 807588.0, 3277268.0, 32567.0, 10307.0, 4837.0, 2609.0, 1473.0, 936.0, 576.0, 404.0, 269.0, 174.0, 114.0, 81.0, 60.0, 42.0, 38.0, 28.0, 7.0, 12.0, 6.0, 8.0, 4.0, 5.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.431640625, -0.41815948486328125, -0.4046783447265625, -0.39119720458984375, -0.377716064453125, -0.36423492431640625, -0.3507537841796875, -0.33727264404296875, -0.32379150390625, -0.31031036376953125, -0.2968292236328125, -0.28334808349609375, -0.269866943359375, -0.25638580322265625, -0.2429046630859375, -0.22942352294921875, -0.2159423828125, -0.20246124267578125, -0.1889801025390625, -0.17549896240234375, -0.162017822265625, -0.14853668212890625, -0.1350555419921875, -0.12157440185546875, -0.10809326171875, -0.09461212158203125, -0.0811309814453125, -0.06764984130859375, -0.054168701171875, -0.04068756103515625, -0.0272064208984375, -0.01372528076171875, -0.000244140625, 0.01323699951171875, 0.0267181396484375, 0.04019927978515625, 0.053680419921875, 0.06716156005859375, 0.0806427001953125, 0.09412384033203125, 0.10760498046875, 0.12108612060546875, 0.1345672607421875, 0.14804840087890625, 0.161529541015625, 0.17501068115234375, 0.1884918212890625, 0.20197296142578125, 0.2154541015625, 0.22893524169921875, 0.2424163818359375, 0.25589752197265625, 0.269378662109375, 0.28285980224609375, 0.2963409423828125, 0.30982208251953125, 0.32330322265625, 0.33678436279296875, 0.3502655029296875, 0.36374664306640625, 0.377227783203125, 0.39070892333984375, 0.4041900634765625, 0.41767120361328125, 0.43115234375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 4.0, 4.0, 4.0, 6.0, 3.0, 8.0, 6.0, 8.0, 16.0, 20.0, 19.0, 39.0, 123.0, 374.0, 197.0, 60.0, 19.0, 13.0, 16.0, 9.0, 8.0, 12.0, 6.0, 3.0, 7.0, 2.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0684814453125, -0.06637763977050781, -0.06427383422851562, -0.06217002868652344, -0.06006622314453125, -0.05796241760253906, -0.055858612060546875, -0.05375480651855469, -0.0516510009765625, -0.04954719543457031, -0.047443389892578125, -0.04533958435058594, -0.04323577880859375, -0.04113197326660156, -0.039028167724609375, -0.03692436218261719, -0.034820556640625, -0.03271675109863281, -0.030612945556640625, -0.028509140014648438, -0.02640533447265625, -0.024301528930664062, -0.022197723388671875, -0.020093917846679688, -0.0179901123046875, -0.015886306762695312, -0.013782501220703125, -0.011678695678710938, -0.00957489013671875, -0.0074710845947265625, -0.005367279052734375, -0.0032634735107421875, -0.00115966796875, 0.0009441375732421875, 0.003047943115234375, 0.0051517486572265625, 0.00725555419921875, 0.009359359741210938, 0.011463165283203125, 0.013566970825195312, 0.0156707763671875, 0.017774581909179688, 0.019878387451171875, 0.021982192993164062, 0.02408599853515625, 0.026189804077148438, 0.028293609619140625, 0.030397415161132812, 0.032501220703125, 0.03460502624511719, 0.036708831787109375, 0.03881263732910156, 0.04091644287109375, 0.04302024841308594, 0.045124053955078125, 0.04722785949707031, 0.0493316650390625, 0.05143547058105469, 0.053539276123046875, 0.05564308166503906, 0.05774688720703125, 0.05985069274902344, 0.061954498291015625, 0.06405830383300781, 0.066162109375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 3.0, 8.0, 8.0, 8.0, 21.0, 21.0, 42.0, 82.0, 141.0, 343.0, 895.0, 3087.0, 15300.0, 168753.0, 3893035.0, 96939.0, 11388.0, 2675.0, 832.0, 351.0, 153.0, 74.0, 32.0, 25.0, 22.0, 12.0, 9.0, 3.0, 5.0, 1.0, 2.0, 3.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.380859375, -0.36525726318359375, -0.3496551513671875, -0.33405303955078125, -0.318450927734375, -0.30284881591796875, -0.2872467041015625, -0.27164459228515625, -0.25604248046875, -0.24044036865234375, -0.2248382568359375, -0.20923614501953125, -0.193634033203125, -0.17803192138671875, -0.1624298095703125, -0.14682769775390625, -0.1312255859375, -0.11562347412109375, -0.1000213623046875, -0.08441925048828125, -0.068817138671875, -0.05321502685546875, -0.0376129150390625, -0.02201080322265625, -0.00640869140625, 0.00919342041015625, 0.0247955322265625, 0.04039764404296875, 0.055999755859375, 0.07160186767578125, 0.0872039794921875, 0.10280609130859375, 0.118408203125, 0.13401031494140625, 0.1496124267578125, 0.16521453857421875, 0.180816650390625, 0.19641876220703125, 0.2120208740234375, 0.22762298583984375, 0.24322509765625, 0.25882720947265625, 0.2744293212890625, 0.29003143310546875, 0.305633544921875, 0.32123565673828125, 0.3368377685546875, 0.35243988037109375, 0.3680419921875, 0.38364410400390625, 0.3992462158203125, 0.41484832763671875, 0.430450439453125, 0.44605255126953125, 0.4616546630859375, 0.47725677490234375, 0.49285888671875, 0.5084609985351562, 0.5240631103515625, 0.5396652221679688, 0.555267333984375, 0.5708694458007812, 0.5864715576171875, 0.6020736694335938, 0.61767578125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 9.0, 3.0, 4.0, 4.0, 7.0, 7.0, 10.0, 17.0, 11.0, 23.0, 30.0, 43.0, 69.0, 93.0, 196.0, 368.0, 2101.0, 524.0, 192.0, 102.0, 72.0, 50.0, 30.0, 27.0, 18.0, 17.0, 13.0, 7.0, 8.0, 4.0, 3.0, 5.0, 4.0, 0.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.050872802734375, -0.04871988296508789, -0.04656696319580078, -0.04441404342651367, -0.04226112365722656, -0.04010820388793945, -0.037955284118652344, -0.035802364349365234, -0.033649444580078125, -0.031496524810791016, -0.029343605041503906, -0.027190685272216797, -0.025037765502929688, -0.022884845733642578, -0.02073192596435547, -0.01857900619506836, -0.01642608642578125, -0.01427316665649414, -0.012120246887207031, -0.009967327117919922, -0.007814407348632812, -0.005661487579345703, -0.0035085678100585938, -0.0013556480407714844, 0.000797271728515625, 0.0029501914978027344, 0.005103111267089844, 0.007256031036376953, 0.009408950805664062, 0.011561870574951172, 0.013714790344238281, 0.01586771011352539, 0.0180206298828125, 0.02017354965209961, 0.02232646942138672, 0.024479389190673828, 0.026632308959960938, 0.028785228729248047, 0.030938148498535156, 0.033091068267822266, 0.035243988037109375, 0.037396907806396484, 0.039549827575683594, 0.0417027473449707, 0.04385566711425781, 0.04600858688354492, 0.04816150665283203, 0.05031442642211914, 0.05246734619140625, 0.05462026596069336, 0.05677318572998047, 0.05892610549926758, 0.06107902526855469, 0.0632319450378418, 0.0653848648071289, 0.06753778457641602, 0.06969070434570312, 0.07184362411499023, 0.07399654388427734, 0.07614946365356445, 0.07830238342285156, 0.08045530319213867, 0.08260822296142578, 0.08476114273071289, 0.0869140625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 30.0, 603.0, 342.0, 17.0, 8.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39007556438446045, -0.3403872549533844, -0.29069894552230835, -0.2410106658935547, -0.19132235646247864, -0.1416340470314026, -0.09194576740264893, -0.042257457971572876, 0.007430851459503174, 0.05711915343999863, 0.10680745542049408, 0.15649574995040894, 0.20618405938148499, 0.25587236881256104, 0.3055606484413147, 0.35524895787239075, 0.4049372673034668, 0.45462557673454285, 0.5043138861656189, 0.5540021657943726, 0.603690505027771, 0.6533787846565247, 0.7030670642852783, 0.7527554035186768, 0.8024436831474304, 0.8521319627761841, 0.9018203020095825, 0.9515085816383362, 1.0011968612670898, 1.0508852005004883, 1.1005735397338867, 1.1502617597579956, 1.1999499797821045, 1.249638319015503, 1.2993265390396118, 1.3490148782730103, 1.3987032175064087, 1.4483914375305176, 1.498079776763916, 1.5477681159973145, 1.597456455230713, 1.6471447944641113, 1.6968330144882202, 1.7465213537216187, 1.796209692955017, 1.845897912979126, 1.8955862522125244, 1.9452745914459229, 1.9949628114700317, 2.0446510314941406, 2.094339370727539, 2.1440277099609375, 2.193716049194336, 2.2434043884277344, 2.293092727661133, 2.342780828475952, 2.3924691677093506, 2.442157506942749, 2.4918458461761475, 2.541533946990967, 2.5912222862243652, 2.6409106254577637, 2.690598964691162, 2.7402873039245605, 2.789975643157959]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 6.0, 2.0, 10.0, 7.0, 13.0, 14.0, 30.0, 34.0, 28.0, 34.0, 50.0, 57.0, 66.0, 74.0, 75.0, 74.0, 61.0, 78.0, 56.0, 40.0, 48.0, 36.0, 21.0, 23.0, 19.0, 12.0, 9.0, 7.0, 3.0, 6.0, 6.0, 4.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37470340728759766, -0.3640134930610657, -0.3533235788345337, -0.3426336646080017, -0.3319437801837921, -0.32125386595726013, -0.31056395173072815, -0.29987403750419617, -0.2891841530799866, -0.2784942388534546, -0.2678043246269226, -0.2571144104003906, -0.24642452597618103, -0.23573461174964905, -0.22504469752311707, -0.21435478329658508, -0.2036648690700531, -0.19297495484352112, -0.18228505551815033, -0.17159514129161835, -0.16090524196624756, -0.15021532773971558, -0.1395254135131836, -0.1288354992866516, -0.11814559996128082, -0.10745569318532944, -0.09676578640937805, -0.08607587218284607, -0.07538596540689468, -0.0646960586309433, -0.054006144404411316, -0.04331623762845993, -0.032626330852508545, -0.02193642221391201, -0.011246513575315475, -0.0005566030740737915, 0.010133303701877594, 0.02082321047782898, 0.03151312470436096, 0.04220303148031235, 0.05289293825626373, 0.06358284503221512, 0.0742727518081665, 0.08496266603469849, 0.09565257281064987, 0.10634247958660126, 0.11703239381313324, 0.12772229313850403, 0.138412207365036, 0.149102121591568, 0.15979202091693878, 0.17048193514347076, 0.18117183446884155, 0.19186174869537354, 0.20255166292190552, 0.2132415771484375, 0.2239314764738083, 0.23462139070034027, 0.24531129002571106, 0.25600120425224304, 0.266691118478775, 0.2773810029029846, 0.2880709171295166, 0.2987608313560486, 0.30945074558258057]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 6.0, 7.0, 9.0, 16.0, 24.0, 25.0, 47.0, 65.0, 85.0, 149.0, 251.0, 384.0, 681.0, 1264.0, 2439.0, 5247.0, 13232.0, 45199.0, 799595.0, 140698.0, 23171.0, 8301.0, 3567.0, 1829.0, 913.0, 494.0, 285.0, 207.0, 117.0, 76.0, 56.0, 38.0, 16.0, 23.0, 11.0, 8.0, 6.0, 5.0, 1.0, 7.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.392578125, -0.3802146911621094, -0.36785125732421875, -0.3554878234863281, -0.3431243896484375, -0.3307609558105469, -0.31839752197265625, -0.3060340881347656, -0.293670654296875, -0.2813072204589844, -0.26894378662109375, -0.2565803527832031, -0.2442169189453125, -0.23185348510742188, -0.21949005126953125, -0.20712661743164062, -0.19476318359375, -0.18239974975585938, -0.17003631591796875, -0.15767288208007812, -0.1453094482421875, -0.13294601440429688, -0.12058258056640625, -0.10821914672851562, -0.095855712890625, -0.08349227905273438, -0.07112884521484375, -0.058765411376953125, -0.0464019775390625, -0.034038543701171875, -0.02167510986328125, -0.009311676025390625, 0.0030517578125, 0.015415191650390625, 0.02777862548828125, 0.040142059326171875, 0.0525054931640625, 0.06486892700195312, 0.07723236083984375, 0.08959579467773438, 0.101959228515625, 0.11432266235351562, 0.12668609619140625, 0.13904953002929688, 0.1514129638671875, 0.16377639770507812, 0.17613983154296875, 0.18850326538085938, 0.20086669921875, 0.21323013305664062, 0.22559356689453125, 0.23795700073242188, 0.2503204345703125, 0.2626838684082031, 0.27504730224609375, 0.2874107360839844, 0.299774169921875, 0.3121376037597656, 0.32450103759765625, 0.3368644714355469, 0.3492279052734375, 0.3615913391113281, 0.37395477294921875, 0.3863182067871094, 0.398681640625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 7.0, 6.0, 7.0, 3.0, 9.0, 10.0, 12.0, 12.0, 23.0, 41.0, 110.0, 268.0, 245.0, 98.0, 51.0, 19.0, 15.0, 11.0, 13.0, 11.0, 7.0, 4.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06549072265625, -0.06343650817871094, -0.061382293701171875, -0.05932807922363281, -0.05727386474609375, -0.05521965026855469, -0.053165435791015625, -0.05111122131347656, -0.0490570068359375, -0.04700279235839844, -0.044948577880859375, -0.04289436340332031, -0.04084014892578125, -0.03878593444824219, -0.036731719970703125, -0.03467750549316406, -0.032623291015625, -0.030569076538085938, -0.028514862060546875, -0.026460647583007812, -0.02440643310546875, -0.022352218627929688, -0.020298004150390625, -0.018243789672851562, -0.0161895751953125, -0.014135360717773438, -0.012081146240234375, -0.010026931762695312, -0.00797271728515625, -0.0059185028076171875, -0.003864288330078125, -0.0018100738525390625, 0.000244140625, 0.0022983551025390625, 0.004352569580078125, 0.0064067840576171875, 0.00846099853515625, 0.010515213012695312, 0.012569427490234375, 0.014623641967773438, 0.0166778564453125, 0.018732070922851562, 0.020786285400390625, 0.022840499877929688, 0.02489471435546875, 0.026948928833007812, 0.029003143310546875, 0.031057357788085938, 0.033111572265625, 0.03516578674316406, 0.037220001220703125, 0.03927421569824219, 0.04132843017578125, 0.04338264465332031, 0.045436859130859375, 0.04749107360839844, 0.0495452880859375, 0.05159950256347656, 0.053653717041015625, 0.05570793151855469, 0.05776214599609375, 0.05981636047363281, 0.061870574951171875, 0.06392478942871094, 0.06597900390625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 2.0, 4.0, 6.0, 8.0, 7.0, 13.0, 17.0, 14.0, 32.0, 31.0, 49.0, 73.0, 141.0, 217.0, 500.0, 1278.0, 3590.0, 12762.0, 65192.0, 573668.0, 336304.0, 41212.0, 8938.0, 2550.0, 954.0, 436.0, 223.0, 87.0, 54.0, 57.0, 34.0, 25.0, 15.0, 20.0, 12.0, 6.0, 6.0, 8.0, 7.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.2415771484375, -0.23399734497070312, -0.22641754150390625, -0.21883773803710938, -0.2112579345703125, -0.20367813110351562, -0.19609832763671875, -0.18851852416992188, -0.180938720703125, -0.17335891723632812, -0.16577911376953125, -0.15819931030273438, -0.1506195068359375, -0.14303970336914062, -0.13545989990234375, -0.12788009643554688, -0.12030029296875, -0.11272048950195312, -0.10514068603515625, -0.09756088256835938, -0.0899810791015625, -0.08240127563476562, -0.07482147216796875, -0.06724166870117188, -0.059661865234375, -0.052082061767578125, -0.04450225830078125, -0.036922454833984375, -0.0293426513671875, -0.021762847900390625, -0.01418304443359375, -0.006603240966796875, 0.0009765625, 0.008556365966796875, 0.01613616943359375, 0.023715972900390625, 0.0312957763671875, 0.038875579833984375, 0.04645538330078125, 0.054035186767578125, 0.061614990234375, 0.06919479370117188, 0.07677459716796875, 0.08435440063476562, 0.0919342041015625, 0.09951400756835938, 0.10709381103515625, 0.11467361450195312, 0.12225341796875, 0.12983322143554688, 0.13741302490234375, 0.14499282836914062, 0.1525726318359375, 0.16015243530273438, 0.16773223876953125, 0.17531204223632812, 0.182891845703125, 0.19047164916992188, 0.19805145263671875, 0.20563125610351562, 0.2132110595703125, 0.22079086303710938, 0.22837066650390625, 0.23595046997070312, 0.2435302734375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 5.0, 4.0, 10.0, 13.0, 13.0, 13.0, 14.0, 22.0, 21.0, 19.0, 30.0, 31.0, 35.0, 31.0, 37.0, 50.0, 54.0, 60.0, 50.0, 51.0, 50.0, 56.0, 38.0, 41.0, 29.0, 41.0, 22.0, 16.0, 28.0, 25.0, 21.0, 9.0, 18.0, 12.0, 9.0, 7.0, 7.0, 7.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.15234375, -0.14720726013183594, -0.14207077026367188, -0.1369342803955078, -0.13179779052734375, -0.1266613006591797, -0.12152481079101562, -0.11638832092285156, -0.1112518310546875, -0.10611534118652344, -0.10097885131835938, -0.09584236145019531, -0.09070587158203125, -0.08556938171386719, -0.08043289184570312, -0.07529640197753906, -0.070159912109375, -0.06502342224121094, -0.059886932373046875, -0.05475044250488281, -0.04961395263671875, -0.04447746276855469, -0.039340972900390625, -0.03420448303222656, -0.0290679931640625, -0.023931503295898438, -0.018795013427734375, -0.013658523559570312, -0.00852203369140625, -0.0033855438232421875, 0.001750946044921875, 0.0068874359130859375, 0.01202392578125, 0.017160415649414062, 0.022296905517578125, 0.027433395385742188, 0.03256988525390625, 0.03770637512207031, 0.042842864990234375, 0.04797935485839844, 0.0531158447265625, 0.05825233459472656, 0.06338882446289062, 0.06852531433105469, 0.07366180419921875, 0.07879829406738281, 0.08393478393554688, 0.08907127380371094, 0.094207763671875, 0.09934425354003906, 0.10448074340820312, 0.10961723327636719, 0.11475372314453125, 0.11989021301269531, 0.12502670288085938, 0.13016319274902344, 0.1352996826171875, 0.14043617248535156, 0.14557266235351562, 0.1507091522216797, 0.15584564208984375, 0.1609821319580078, 0.16611862182617188, 0.17125511169433594, 0.1763916015625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 4.0, 6.0, 12.0, 14.0, 9.0, 27.0, 64.0, 90.0, 133.0, 276.0, 630.0, 1937.0, 10080.0, 291906.0, 721612.0, 17500.0, 2706.0, 840.0, 325.0, 172.0, 89.0, 47.0, 28.0, 18.0, 13.0, 7.0, 6.0, 2.0, 4.0, 1.0, 3.0, 2.0, 1.0], "bins": [-0.52294921875, -0.5113582611083984, -0.4997673034667969, -0.4881763458251953, -0.47658538818359375, -0.4649944305419922, -0.4534034729003906, -0.44181251525878906, -0.4302215576171875, -0.41863059997558594, -0.4070396423339844, -0.3954486846923828, -0.38385772705078125, -0.3722667694091797, -0.3606758117675781, -0.34908485412597656, -0.337493896484375, -0.32590293884277344, -0.3143119812011719, -0.3027210235595703, -0.29113006591796875, -0.2795391082763672, -0.2679481506347656, -0.25635719299316406, -0.2447662353515625, -0.23317527770996094, -0.22158432006835938, -0.2099933624267578, -0.19840240478515625, -0.1868114471435547, -0.17522048950195312, -0.16362953186035156, -0.15203857421875, -0.14044761657714844, -0.12885665893554688, -0.11726570129394531, -0.10567474365234375, -0.09408378601074219, -0.08249282836914062, -0.07090187072753906, -0.0593109130859375, -0.04771995544433594, -0.036128997802734375, -0.024538040161132812, -0.01294708251953125, -0.0013561248779296875, 0.010234832763671875, 0.021825790405273438, 0.033416748046875, 0.04500770568847656, 0.056598663330078125, 0.06818962097167969, 0.07978057861328125, 0.09137153625488281, 0.10296249389648438, 0.11455345153808594, 0.1261444091796875, 0.13773536682128906, 0.14932632446289062, 0.1609172821044922, 0.17250823974609375, 0.1840991973876953, 0.19569015502929688, 0.20728111267089844, 0.2188720703125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 5.0, 8.0, 11.0, 9.0, 5.0, 11.0, 20.0, 27.0, 47.0, 46.0, 53.0, 77.0, 96.0, 84.0, 100.0, 95.0, 66.0, 64.0, 42.0, 42.0, 30.0, 11.0, 14.0, 6.0, 15.0, 6.0, 3.0, 1.0, 5.0, 7.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.546476364135742e-05, -3.448314964771271e-05, -3.350153565406799e-05, -3.251992166042328e-05, -3.1538307666778564e-05, -3.055669367313385e-05, -2.9575079679489136e-05, -2.859346568584442e-05, -2.7611851692199707e-05, -2.6630237698554993e-05, -2.564862370491028e-05, -2.4667009711265564e-05, -2.368539571762085e-05, -2.2703781723976135e-05, -2.172216773033142e-05, -2.0740553736686707e-05, -1.9758939743041992e-05, -1.8777325749397278e-05, -1.7795711755752563e-05, -1.681409776210785e-05, -1.5832483768463135e-05, -1.485086977481842e-05, -1.3869255781173706e-05, -1.2887641787528992e-05, -1.1906027793884277e-05, -1.0924413800239563e-05, -9.942799806594849e-06, -8.961185812950134e-06, -7.97957181930542e-06, -6.9979578256607056e-06, -6.016343832015991e-06, -5.034729838371277e-06, -4.0531158447265625e-06, -3.071501851081848e-06, -2.089887857437134e-06, -1.1082738637924194e-06, -1.2665987014770508e-07, 8.549541234970093e-07, 1.8365681171417236e-06, 2.818182110786438e-06, 3.7997961044311523e-06, 4.781410098075867e-06, 5.763024091720581e-06, 6.744638085365295e-06, 7.72625207901001e-06, 8.707866072654724e-06, 9.689480066299438e-06, 1.0671094059944153e-05, 1.1652708053588867e-05, 1.2634322047233582e-05, 1.3615936040878296e-05, 1.459755003452301e-05, 1.5579164028167725e-05, 1.656077802181244e-05, 1.7542392015457153e-05, 1.8524006009101868e-05, 1.9505620002746582e-05, 2.0487233996391296e-05, 2.146884799003601e-05, 2.2450461983680725e-05, 2.343207597732544e-05, 2.4413689970970154e-05, 2.5395303964614868e-05, 2.6376917958259583e-05, 2.7358531951904297e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 14.0, 13.0, 16.0, 32.0, 50.0, 97.0, 211.0, 401.0, 990.0, 3615.0, 21476.0, 489862.0, 504561.0, 21887.0, 3615.0, 985.0, 329.0, 167.0, 77.0, 58.0, 41.0, 15.0, 7.0, 5.0, 6.0, 3.0, 6.0, 2.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.355224609375, -0.3465614318847656, -0.33789825439453125, -0.3292350769042969, -0.3205718994140625, -0.3119087219238281, -0.30324554443359375, -0.2945823669433594, -0.285919189453125, -0.2772560119628906, -0.26859283447265625, -0.2599296569824219, -0.2512664794921875, -0.24260330200195312, -0.23394012451171875, -0.22527694702148438, -0.21661376953125, -0.20795059204101562, -0.19928741455078125, -0.19062423706054688, -0.1819610595703125, -0.17329788208007812, -0.16463470458984375, -0.15597152709960938, -0.147308349609375, -0.13864517211914062, -0.12998199462890625, -0.12131881713867188, -0.1126556396484375, -0.10399246215820312, -0.09532928466796875, -0.08666610717773438, -0.0780029296875, -0.06933975219726562, -0.06067657470703125, -0.052013397216796875, -0.0433502197265625, -0.034687042236328125, -0.02602386474609375, -0.017360687255859375, -0.008697509765625, -3.4332275390625e-05, 0.00862884521484375, 0.017292022705078125, 0.0259552001953125, 0.034618377685546875, 0.04328155517578125, 0.051944732666015625, 0.06060791015625, 0.06927108764648438, 0.07793426513671875, 0.08659744262695312, 0.0952606201171875, 0.10392379760742188, 0.11258697509765625, 0.12125015258789062, 0.129913330078125, 0.13857650756835938, 0.14723968505859375, 0.15590286254882812, 0.1645660400390625, 0.17322921752929688, 0.18189239501953125, 0.19055557250976562, 0.19921875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 0.0, 4.0, 5.0, 6.0, 3.0, 14.0, 18.0, 40.0, 36.0, 44.0, 89.0, 136.0, 168.0, 161.0, 102.0, 62.0, 35.0, 15.0, 22.0, 14.0, 12.0, 10.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2457275390625, -0.2398223876953125, -0.233917236328125, -0.2280120849609375, -0.22210693359375, -0.2162017822265625, -0.210296630859375, -0.2043914794921875, -0.198486328125, -0.1925811767578125, -0.186676025390625, -0.1807708740234375, -0.17486572265625, -0.1689605712890625, -0.163055419921875, -0.1571502685546875, -0.1512451171875, -0.1453399658203125, -0.139434814453125, -0.1335296630859375, -0.12762451171875, -0.1217193603515625, -0.115814208984375, -0.1099090576171875, -0.10400390625, -0.0980987548828125, -0.092193603515625, -0.0862884521484375, -0.08038330078125, -0.0744781494140625, -0.068572998046875, -0.0626678466796875, -0.0567626953125, -0.0508575439453125, -0.044952392578125, -0.0390472412109375, -0.03314208984375, -0.0272369384765625, -0.021331787109375, -0.0154266357421875, -0.009521484375, -0.0036163330078125, 0.002288818359375, 0.0081939697265625, 0.01409912109375, 0.0200042724609375, 0.025909423828125, 0.0318145751953125, 0.0377197265625, 0.0436248779296875, 0.049530029296875, 0.0554351806640625, 0.06134033203125, 0.0672454833984375, 0.073150634765625, 0.0790557861328125, 0.0849609375, 0.0908660888671875, 0.096771240234375, 0.1026763916015625, 0.10858154296875, 0.1144866943359375, 0.120391845703125, 0.1262969970703125, 0.1322021484375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 8.0, 12.0, 91.0, 746.0, 134.0, 17.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4037139415740967, -2.2271244525909424, -2.050535202026367, -1.873945713043213, -1.6973564624786377, -1.5207669734954834, -1.3441776037216187, -1.167588233947754, -0.9909988641738892, -0.8144094944000244, -0.6378201246261597, -0.46123069524765015, -0.2846413254737854, -0.10805195569992065, 0.06853747367858887, 0.2451268434524536, 0.42171621322631836, 0.5983055830001831, 0.7748949527740479, 0.9514843821525574, 1.1280736923217773, 1.3046631813049316, 1.4812525510787964, 1.6578419208526611, 1.8344312906265259, 2.0110206604003906, 2.187610149383545, 2.36419939994812, 2.5407888889312744, 2.7173781394958496, 2.893967628479004, 3.070557117462158, 3.2471461296081543, 3.4237356185913086, 3.600324869155884, 3.776914358139038, 3.9535036087036133, 4.130093097686768, 4.306682586669922, 4.483271598815918, 4.659861087799072, 4.836450576782227, 5.013040065765381, 5.189629077911377, 5.366218566894531, 5.5428080558776855, 5.71939754486084, 5.895986557006836, 6.072576522827148, 6.249166011810303, 6.425755500793457, 6.602344512939453, 6.778934001922607, 6.955523490905762, 7.132112979888916, 7.30870246887207, 7.485291481018066, 7.661880970001221, 7.838470458984375, 8.015059471130371, 8.191649436950684, 8.36823844909668, 8.544827461242676, 8.721417427062988, 8.898006439208984]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 7.0, 4.0, 3.0, 8.0, 11.0, 16.0, 19.0, 21.0, 25.0, 34.0, 74.0, 62.0, 83.0, 97.0, 102.0, 69.0, 86.0, 73.0, 57.0, 34.0, 31.0, 26.0, 18.0, 15.0, 6.0, 4.0, 3.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.964937448501587, -1.9055211544036865, -1.8461049795150757, -1.7866886854171753, -1.7272725105285645, -1.667856216430664, -1.6084399223327637, -1.5490236282348633, -1.4896074533462524, -1.430191159248352, -1.3707749843597412, -1.3113586902618408, -1.2519423961639404, -1.1925262212753296, -1.1331099271774292, -1.0736937522888184, -1.014277458190918, -0.9548612236976624, -0.8954449892044067, -0.8360286951065063, -0.7766124606132507, -0.7171962261199951, -0.6577799320220947, -0.5983636975288391, -0.5389474630355835, -0.4795312285423279, -0.4201149642467499, -0.3606986999511719, -0.30128246545791626, -0.24186623096466064, -0.18244996666908264, -0.12303370237350464, -0.06361734867095947, -0.004201099276542664, 0.055215150117874146, 0.11463139951229095, 0.17404764890670776, 0.23346388339996338, 0.2928801476955414, 0.3522964119911194, 0.411712646484375, 0.4711288809776306, 0.5305451154708862, 0.5899614095687866, 0.6493776440620422, 0.7087938785552979, 0.7682101726531982, 0.8276264071464539, 0.8870426416397095, 0.9464588761329651, 1.0058751106262207, 1.065291404724121, 1.1247076988220215, 1.1841238737106323, 1.2435401678085327, 1.3029563426971436, 1.362372636795044, 1.4217889308929443, 1.4812051057815552, 1.5406213998794556, 1.6000375747680664, 1.6594538688659668, 1.7188701629638672, 1.7782864570617676, 1.8377026319503784]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 1.0, 6.0, 6.0, 2.0, 3.0, 3.0, 13.0, 10.0, 15.0, 14.0, 22.0, 24.0, 29.0, 41.0, 69.0, 72.0, 89.0, 139.0, 188.0, 222.0, 370.0, 515.0, 814.0, 1201.0, 1973.0, 3632.0, 8720.0, 36898.0, 3933959.0, 175413.0, 17911.0, 5356.0, 2506.0, 1422.0, 880.0, 569.0, 404.0, 261.0, 174.0, 112.0, 69.0, 42.0, 32.0, 24.0, 14.0, 8.0, 9.0, 7.0, 5.0, 7.0, 1.0, 6.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.6591796875, -0.6384353637695312, -0.6176910400390625, -0.5969467163085938, -0.576202392578125, -0.5554580688476562, -0.5347137451171875, -0.5139694213867188, -0.49322509765625, -0.47248077392578125, -0.4517364501953125, -0.43099212646484375, -0.410247802734375, -0.38950347900390625, -0.3687591552734375, -0.34801483154296875, -0.3272705078125, -0.30652618408203125, -0.2857818603515625, -0.26503753662109375, -0.244293212890625, -0.22354888916015625, -0.2028045654296875, -0.18206024169921875, -0.16131591796875, -0.14057159423828125, -0.1198272705078125, -0.09908294677734375, -0.078338623046875, -0.05759429931640625, -0.0368499755859375, -0.01610565185546875, 0.004638671875, 0.02538299560546875, 0.0461273193359375, 0.06687164306640625, 0.087615966796875, 0.10836029052734375, 0.1291046142578125, 0.14984893798828125, 0.17059326171875, 0.19133758544921875, 0.2120819091796875, 0.23282623291015625, 0.253570556640625, 0.27431488037109375, 0.2950592041015625, 0.31580352783203125, 0.3365478515625, 0.35729217529296875, 0.3780364990234375, 0.39878082275390625, 0.419525146484375, 0.44026947021484375, 0.4610137939453125, 0.48175811767578125, 0.50250244140625, 0.5232467651367188, 0.5439910888671875, 0.5647354125976562, 0.585479736328125, 0.6062240600585938, 0.6269683837890625, 0.6477127075195312, 0.66845703125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 8.0, 10.0, 6.0, 12.0, 7.0, 15.0, 26.0, 65.0, 121.0, 238.0, 220.0, 122.0, 57.0, 22.0, 8.0, 12.0, 10.0, 10.0, 8.0, 6.0, 2.0, 2.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0694580078125, -0.0672750473022461, -0.06509208679199219, -0.06290912628173828, -0.060726165771484375, -0.05854320526123047, -0.05636024475097656, -0.054177284240722656, -0.05199432373046875, -0.049811363220214844, -0.04762840270996094, -0.04544544219970703, -0.043262481689453125, -0.04107952117919922, -0.03889656066894531, -0.036713600158691406, -0.0345306396484375, -0.032347679138183594, -0.030164718627929688, -0.02798175811767578, -0.025798797607421875, -0.02361583709716797, -0.021432876586914062, -0.019249916076660156, -0.01706695556640625, -0.014883995056152344, -0.012701034545898438, -0.010518074035644531, -0.008335113525390625, -0.006152153015136719, -0.0039691925048828125, -0.0017862319946289062, 0.000396728515625, 0.0025796890258789062, 0.0047626495361328125, 0.006945610046386719, 0.009128570556640625, 0.011311531066894531, 0.013494491577148438, 0.015677452087402344, 0.01786041259765625, 0.020043373107910156, 0.022226333618164062, 0.02440929412841797, 0.026592254638671875, 0.02877521514892578, 0.030958175659179688, 0.033141136169433594, 0.0353240966796875, 0.037507057189941406, 0.03969001770019531, 0.04187297821044922, 0.044055938720703125, 0.04623889923095703, 0.04842185974121094, 0.050604820251464844, 0.05278778076171875, 0.054970741271972656, 0.05715370178222656, 0.05933666229248047, 0.061519622802734375, 0.06370258331298828, 0.06588554382324219, 0.0680685043334961, 0.07025146484375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 5.0, 2.0, 5.0, 8.0, 8.0, 7.0, 7.0, 12.0, 15.0, 27.0, 47.0, 66.0, 139.0, 328.0, 1158.0, 4772.0, 29905.0, 3692246.0, 443837.0, 17197.0, 3117.0, 854.0, 256.0, 92.0, 47.0, 38.0, 15.0, 13.0, 15.0, 11.0, 9.0, 8.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.71435546875, -0.6919403076171875, -0.669525146484375, -0.6471099853515625, -0.62469482421875, -0.6022796630859375, -0.579864501953125, -0.5574493408203125, -0.5350341796875, -0.5126190185546875, -0.490203857421875, -0.4677886962890625, -0.44537353515625, -0.4229583740234375, -0.400543212890625, -0.3781280517578125, -0.355712890625, -0.3332977294921875, -0.310882568359375, -0.2884674072265625, -0.26605224609375, -0.2436370849609375, -0.221221923828125, -0.1988067626953125, -0.1763916015625, -0.1539764404296875, -0.131561279296875, -0.1091461181640625, -0.08673095703125, -0.0643157958984375, -0.041900634765625, -0.0194854736328125, 0.0029296875, 0.0253448486328125, 0.047760009765625, 0.0701751708984375, 0.09259033203125, 0.1150054931640625, 0.137420654296875, 0.1598358154296875, 0.1822509765625, 0.2046661376953125, 0.227081298828125, 0.2494964599609375, 0.27191162109375, 0.2943267822265625, 0.316741943359375, 0.3391571044921875, 0.361572265625, 0.3839874267578125, 0.406402587890625, 0.4288177490234375, 0.45123291015625, 0.4736480712890625, 0.496063232421875, 0.5184783935546875, 0.5408935546875, 0.5633087158203125, 0.585723876953125, 0.6081390380859375, 0.63055419921875, 0.6529693603515625, 0.675384521484375, 0.6977996826171875, 0.72021484375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 6.0, 5.0, 6.0, 11.0, 8.0, 8.0, 16.0, 37.0, 68.0, 114.0, 218.0, 710.0, 2140.0, 334.0, 159.0, 84.0, 40.0, 27.0, 21.0, 17.0, 5.0, 9.0, 6.0, 2.0, 2.0, 5.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08087158203125, -0.07810592651367188, -0.07534027099609375, -0.07257461547851562, -0.0698089599609375, -0.06704330444335938, -0.06427764892578125, -0.061511993408203125, -0.058746337890625, -0.055980682373046875, -0.05321502685546875, -0.050449371337890625, -0.0476837158203125, -0.044918060302734375, -0.04215240478515625, -0.039386749267578125, -0.03662109375, -0.033855438232421875, -0.03108978271484375, -0.028324127197265625, -0.0255584716796875, -0.022792816162109375, -0.02002716064453125, -0.017261505126953125, -0.014495849609375, -0.011730194091796875, -0.00896453857421875, -0.006198883056640625, -0.0034332275390625, -0.000667572021484375, 0.00209808349609375, 0.004863739013671875, 0.00762939453125, 0.010395050048828125, 0.01316070556640625, 0.015926361083984375, 0.0186920166015625, 0.021457672119140625, 0.02422332763671875, 0.026988983154296875, 0.029754638671875, 0.032520294189453125, 0.03528594970703125, 0.038051605224609375, 0.0408172607421875, 0.043582916259765625, 0.04634857177734375, 0.049114227294921875, 0.0518798828125, 0.054645538330078125, 0.05741119384765625, 0.060176849365234375, 0.0629425048828125, 0.06570816040039062, 0.06847381591796875, 0.07123947143554688, 0.074005126953125, 0.07677078247070312, 0.07953643798828125, 0.08230209350585938, 0.0850677490234375, 0.08783340454101562, 0.09059906005859375, 0.09336471557617188, 0.09613037109375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 1.0, 3.0, 8.0, 14.0, 39.0, 84.0, 236.0, 267.0, 204.0, 89.0, 35.0, 13.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25120946764945984, -0.23506291210651398, -0.21891635656356812, -0.20276981592178345, -0.1866232454776764, -0.17047670483589172, -0.15433014929294586, -0.13818359375, -0.12203703820705414, -0.10589048266410828, -0.08974392712116241, -0.07359737902879715, -0.05745082348585129, -0.041304267942905426, -0.02515771985054016, -0.0090111643075943, 0.0071353912353515625, 0.023281944915652275, 0.03942849859595299, 0.05557505041360855, 0.07172160595655441, 0.08786816149950027, 0.10401470959186554, 0.1201612651348114, 0.13630782067775726, 0.15245437622070312, 0.168600931763649, 0.18474748730659485, 0.20089402794837952, 0.21704059839248657, 0.23318713903427124, 0.2493336945772171, 0.26548027992248535, 0.28162682056427, 0.2977733910083771, 0.31391993165016174, 0.3300665020942688, 0.34621304273605347, 0.36235958337783813, 0.3785061538219452, 0.39465272426605225, 0.4107992649078369, 0.42694583535194397, 0.44309237599372864, 0.4592389464378357, 0.47538548707962036, 0.49153202772140503, 0.5076786279678345, 0.5238251686096191, 0.5399717092514038, 0.5561182498931885, 0.5722648501396179, 0.5884113907814026, 0.6045579314231873, 0.6207044720649719, 0.6368510723114014, 0.6529975533485413, 0.6691440939903259, 0.6852906346321106, 0.70143723487854, 0.7175837755203247, 0.7337303161621094, 0.749876856803894, 0.7660233974456787, 0.7821699976921082]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 6.0, 11.0, 13.0, 11.0, 21.0, 24.0, 27.0, 41.0, 50.0, 44.0, 79.0, 77.0, 78.0, 74.0, 64.0, 73.0, 66.0, 54.0, 50.0, 35.0, 29.0, 23.0, 8.0, 6.0, 9.0, 13.0, 2.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.3986917734146118, -0.3883019685745239, -0.37791216373443604, -0.36752235889434814, -0.35713255405426025, -0.34674274921417236, -0.3363529443740845, -0.3259631097316742, -0.3155733048915863, -0.3051835000514984, -0.2947936952114105, -0.28440389037132263, -0.27401408553123474, -0.26362425088882446, -0.2532344460487366, -0.24284464120864868, -0.23245485126972198, -0.2220650464296341, -0.2116752415895462, -0.20128542184829712, -0.19089561700820923, -0.18050581216812134, -0.17011600732803345, -0.15972620248794556, -0.14933639764785767, -0.13894659280776978, -0.12855678796768188, -0.1181669756770134, -0.10777716338634491, -0.09738735854625702, -0.08699755370616913, -0.07660774141550064, -0.06621792912483215, -0.055828120559453964, -0.045438311994075775, -0.035048507153987885, -0.024658698588609695, -0.014268890023231506, -0.0038790851831436157, 0.006510727107524872, 0.016900531947612762, 0.02729034051299095, 0.03768014907836914, 0.04806995391845703, 0.05845976248383522, 0.06884957104921341, 0.0792393758893013, 0.08962918817996979, 0.10001899302005768, 0.11040879786014557, 0.12079861015081406, 0.13118842244148254, 0.14157822728157043, 0.15196803212165833, 0.16235783696174622, 0.1727476418018341, 0.183137446641922, 0.1935272514820099, 0.20391705632209778, 0.21430686116218567, 0.22469668090343475, 0.23508648574352264, 0.24547629058361053, 0.2558661103248596, 0.2662559151649475]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 10.0, 9.0, 15.0, 13.0, 21.0, 38.0, 44.0, 76.0, 109.0, 142.0, 272.0, 503.0, 801.0, 1654.0, 3404.0, 9290.0, 32667.0, 444039.0, 504265.0, 34259.0, 9567.0, 3617.0, 1622.0, 818.0, 495.0, 276.0, 176.0, 107.0, 66.0, 41.0, 42.0, 26.0, 19.0, 15.0, 13.0, 11.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.4345703125, -0.41959381103515625, -0.4046173095703125, -0.38964080810546875, -0.374664306640625, -0.35968780517578125, -0.3447113037109375, -0.32973480224609375, -0.31475830078125, -0.29978179931640625, -0.2848052978515625, -0.26982879638671875, -0.254852294921875, -0.23987579345703125, -0.2248992919921875, -0.20992279052734375, -0.1949462890625, -0.17996978759765625, -0.1649932861328125, -0.15001678466796875, -0.135040283203125, -0.12006378173828125, -0.1050872802734375, -0.09011077880859375, -0.07513427734375, -0.06015777587890625, -0.0451812744140625, -0.03020477294921875, -0.015228271484375, -0.00025177001953125, 0.0147247314453125, 0.02970123291015625, 0.044677734375, 0.05965423583984375, 0.0746307373046875, 0.08960723876953125, 0.104583740234375, 0.11956024169921875, 0.1345367431640625, 0.14951324462890625, 0.16448974609375, 0.17946624755859375, 0.1944427490234375, 0.20941925048828125, 0.224395751953125, 0.23937225341796875, 0.2543487548828125, 0.26932525634765625, 0.2843017578125, 0.29927825927734375, 0.3142547607421875, 0.32923126220703125, 0.344207763671875, 0.35918426513671875, 0.3741607666015625, 0.38913726806640625, 0.40411376953125, 0.41909027099609375, 0.4340667724609375, 0.44904327392578125, 0.464019775390625, 0.47899627685546875, 0.4939727783203125, 0.5089492797851562, 0.52392578125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 9.0, 6.0, 8.0, 15.0, 12.0, 22.0, 55.0, 108.0, 187.0, 218.0, 162.0, 71.0, 43.0, 14.0, 20.0, 13.0, 11.0, 7.0, 5.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07061767578125, -0.06855344772338867, -0.06648921966552734, -0.06442499160766602, -0.06236076354980469, -0.06029653549194336, -0.05823230743408203, -0.0561680793762207, -0.054103851318359375, -0.05203962326049805, -0.04997539520263672, -0.04791116714477539, -0.04584693908691406, -0.043782711029052734, -0.041718482971191406, -0.03965425491333008, -0.03759002685546875, -0.03552579879760742, -0.033461570739746094, -0.031397342681884766, -0.029333114624023438, -0.02726888656616211, -0.02520465850830078, -0.023140430450439453, -0.021076202392578125, -0.019011974334716797, -0.01694774627685547, -0.01488351821899414, -0.012819290161132812, -0.010755062103271484, -0.008690834045410156, -0.006626605987548828, -0.0045623779296875, -0.002498149871826172, -0.00043392181396484375, 0.0016303062438964844, 0.0036945343017578125, 0.005758762359619141, 0.007822990417480469, 0.009887218475341797, 0.011951446533203125, 0.014015674591064453, 0.01607990264892578, 0.01814413070678711, 0.020208358764648438, 0.022272586822509766, 0.024336814880371094, 0.026401042938232422, 0.02846527099609375, 0.030529499053955078, 0.032593727111816406, 0.034657955169677734, 0.03672218322753906, 0.03878641128540039, 0.04085063934326172, 0.04291486740112305, 0.044979095458984375, 0.0470433235168457, 0.04910755157470703, 0.05117177963256836, 0.05323600769042969, 0.055300235748291016, 0.057364463806152344, 0.05942869186401367, 0.061492919921875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 5.0, 1.0, 4.0, 6.0, 5.0, 9.0, 13.0, 10.0, 21.0, 19.0, 35.0, 48.0, 72.0, 110.0, 175.0, 299.0, 597.0, 1414.0, 5209.0, 34093.0, 492698.0, 473079.0, 32940.0, 4905.0, 1372.0, 607.0, 296.0, 162.0, 95.0, 71.0, 47.0, 30.0, 21.0, 20.0, 17.0, 10.0, 7.0, 10.0, 7.0, 3.0, 9.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.51806640625, -0.5032615661621094, -0.48845672607421875, -0.4736518859863281, -0.4588470458984375, -0.4440422058105469, -0.42923736572265625, -0.4144325256347656, -0.399627685546875, -0.3848228454589844, -0.37001800537109375, -0.3552131652832031, -0.3404083251953125, -0.3256034851074219, -0.31079864501953125, -0.2959938049316406, -0.28118896484375, -0.2663841247558594, -0.25157928466796875, -0.23677444458007812, -0.2219696044921875, -0.20716476440429688, -0.19235992431640625, -0.17755508422851562, -0.162750244140625, -0.14794540405273438, -0.13314056396484375, -0.11833572387695312, -0.1035308837890625, -0.08872604370117188, -0.07392120361328125, -0.059116363525390625, -0.0443115234375, -0.029506683349609375, -0.01470184326171875, 0.000102996826171875, 0.0149078369140625, 0.029712677001953125, 0.04451751708984375, 0.059322357177734375, 0.074127197265625, 0.08893203735351562, 0.10373687744140625, 0.11854171752929688, 0.1333465576171875, 0.14815139770507812, 0.16295623779296875, 0.17776107788085938, 0.19256591796875, 0.20737075805664062, 0.22217559814453125, 0.23698043823242188, 0.2517852783203125, 0.2665901184082031, 0.28139495849609375, 0.2961997985839844, 0.311004638671875, 0.3258094787597656, 0.34061431884765625, 0.3554191589355469, 0.3702239990234375, 0.3850288391113281, 0.39983367919921875, 0.4146385192871094, 0.429443359375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 0.0, 5.0, 4.0, 6.0, 7.0, 6.0, 9.0, 16.0, 13.0, 13.0, 30.0, 26.0, 20.0, 30.0, 38.0, 36.0, 29.0, 36.0, 47.0, 50.0, 54.0, 50.0, 35.0, 42.0, 56.0, 40.0, 34.0, 32.0, 42.0, 25.0, 28.0, 21.0, 16.0, 16.0, 19.0, 10.0, 17.0, 6.0, 5.0, 10.0, 6.0, 7.0, 5.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0], "bins": [-0.193603515625, -0.18836593627929688, -0.18312835693359375, -0.17789077758789062, -0.1726531982421875, -0.16741561889648438, -0.16217803955078125, -0.15694046020507812, -0.151702880859375, -0.14646530151367188, -0.14122772216796875, -0.13599014282226562, -0.1307525634765625, -0.12551498413085938, -0.12027740478515625, -0.11503982543945312, -0.10980224609375, -0.10456466674804688, -0.09932708740234375, -0.09408950805664062, -0.0888519287109375, -0.08361434936523438, -0.07837677001953125, -0.07313919067382812, -0.067901611328125, -0.06266403198242188, -0.05742645263671875, -0.052188873291015625, -0.0469512939453125, -0.041713714599609375, -0.03647613525390625, -0.031238555908203125, -0.0260009765625, -0.020763397216796875, -0.01552581787109375, -0.010288238525390625, -0.0050506591796875, 0.000186920166015625, 0.00542449951171875, 0.010662078857421875, 0.015899658203125, 0.021137237548828125, 0.02637481689453125, 0.031612396240234375, 0.0368499755859375, 0.042087554931640625, 0.04732513427734375, 0.052562713623046875, 0.05780029296875, 0.06303787231445312, 0.06827545166015625, 0.07351303100585938, 0.0787506103515625, 0.08398818969726562, 0.08922576904296875, 0.09446334838867188, 0.099700927734375, 0.10493850708007812, 0.11017608642578125, 0.11541366577148438, 0.1206512451171875, 0.12588882446289062, 0.13112640380859375, 0.13636398315429688, 0.1416015625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 4.0, 3.0, 8.0, 7.0, 11.0, 25.0, 31.0, 48.0, 79.0, 141.0, 222.0, 464.0, 984.0, 2176.0, 5498.0, 16982.0, 64715.0, 321303.0, 490534.0, 106177.0, 25782.0, 7963.0, 2917.0, 1247.0, 571.0, 260.0, 148.0, 82.0, 52.0, 45.0, 30.0, 13.0, 9.0, 11.0, 4.0, 9.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.143798828125, -0.1393280029296875, -0.134857177734375, -0.1303863525390625, -0.12591552734375, -0.1214447021484375, -0.116973876953125, -0.1125030517578125, -0.1080322265625, -0.1035614013671875, -0.099090576171875, -0.0946197509765625, -0.09014892578125, -0.0856781005859375, -0.081207275390625, -0.0767364501953125, -0.072265625, -0.0677947998046875, -0.063323974609375, -0.0588531494140625, -0.05438232421875, -0.0499114990234375, -0.045440673828125, -0.0409698486328125, -0.0364990234375, -0.0320281982421875, -0.027557373046875, -0.0230865478515625, -0.01861572265625, -0.0141448974609375, -0.009674072265625, -0.0052032470703125, -0.000732421875, 0.0037384033203125, 0.008209228515625, 0.0126800537109375, 0.01715087890625, 0.0216217041015625, 0.026092529296875, 0.0305633544921875, 0.0350341796875, 0.0395050048828125, 0.043975830078125, 0.0484466552734375, 0.05291748046875, 0.0573883056640625, 0.061859130859375, 0.0663299560546875, 0.07080078125, 0.0752716064453125, 0.079742431640625, 0.0842132568359375, 0.08868408203125, 0.0931549072265625, 0.097625732421875, 0.1020965576171875, 0.1065673828125, 0.1110382080078125, 0.115509033203125, 0.1199798583984375, 0.12445068359375, 0.1289215087890625, 0.133392333984375, 0.1378631591796875, 0.142333984375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 5.0, 5.0, 7.0, 11.0, 13.0, 4.0, 18.0, 15.0, 11.0, 23.0, 21.0, 24.0, 28.0, 46.0, 51.0, 53.0, 44.0, 49.0, 61.0, 45.0, 49.0, 62.0, 54.0, 39.0, 28.0, 44.0, 37.0, 30.0, 29.0, 22.0, 20.0, 13.0, 9.0, 9.0, 7.0, 6.0, 5.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.24249267578125e-05, -3.15103679895401e-05, -3.05958092212677e-05, -2.96812504529953e-05, -2.87666916847229e-05, -2.78521329164505e-05, -2.69375741481781e-05, -2.60230153799057e-05, -2.51084566116333e-05, -2.41938978433609e-05, -2.32793390750885e-05, -2.23647803068161e-05, -2.14502215385437e-05, -2.05356627702713e-05, -1.96211040019989e-05, -1.87065452337265e-05, -1.77919864654541e-05, -1.68774276971817e-05, -1.5962868928909302e-05, -1.5048310160636902e-05, -1.4133751392364502e-05, -1.3219192624092102e-05, -1.2304633855819702e-05, -1.1390075087547302e-05, -1.0475516319274902e-05, -9.560957551002502e-06, -8.646398782730103e-06, -7.731840014457703e-06, -6.817281246185303e-06, -5.902722477912903e-06, -4.988163709640503e-06, -4.073604941368103e-06, -3.159046173095703e-06, -2.2444874048233032e-06, -1.3299286365509033e-06, -4.153698682785034e-07, 4.991888999938965e-07, 1.4137476682662964e-06, 2.3283064365386963e-06, 3.242865204811096e-06, 4.157423973083496e-06, 5.071982741355896e-06, 5.986541509628296e-06, 6.901100277900696e-06, 7.815659046173096e-06, 8.730217814445496e-06, 9.644776582717896e-06, 1.0559335350990295e-05, 1.1473894119262695e-05, 1.2388452887535095e-05, 1.3303011655807495e-05, 1.4217570424079895e-05, 1.5132129192352295e-05, 1.6046687960624695e-05, 1.6961246728897095e-05, 1.7875805497169495e-05, 1.8790364265441895e-05, 1.9704923033714294e-05, 2.0619481801986694e-05, 2.1534040570259094e-05, 2.2448599338531494e-05, 2.3363158106803894e-05, 2.4277716875076294e-05, 2.5192275643348694e-05, 2.6106834411621094e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 3.0, 6.0, 5.0, 6.0, 5.0, 12.0, 18.0, 12.0, 31.0, 43.0, 67.0, 97.0, 201.0, 401.0, 990.0, 3451.0, 20010.0, 250674.0, 702202.0, 60061.0, 7279.0, 1725.0, 604.0, 253.0, 149.0, 79.0, 48.0, 42.0, 14.0, 12.0, 13.0, 12.0, 5.0, 11.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23291015625, -0.22545433044433594, -0.21799850463867188, -0.2105426788330078, -0.20308685302734375, -0.1956310272216797, -0.18817520141601562, -0.18071937561035156, -0.1732635498046875, -0.16580772399902344, -0.15835189819335938, -0.1508960723876953, -0.14344024658203125, -0.1359844207763672, -0.12852859497070312, -0.12107276916503906, -0.113616943359375, -0.10616111755371094, -0.09870529174804688, -0.09124946594238281, -0.08379364013671875, -0.07633781433105469, -0.06888198852539062, -0.06142616271972656, -0.0539703369140625, -0.04651451110839844, -0.039058685302734375, -0.03160285949707031, -0.02414703369140625, -0.016691207885742188, -0.009235382080078125, -0.0017795562744140625, 0.00567626953125, 0.013132095336914062, 0.020587921142578125, 0.028043746948242188, 0.03549957275390625, 0.04295539855957031, 0.050411224365234375, 0.05786705017089844, 0.0653228759765625, 0.07277870178222656, 0.08023452758789062, 0.08769035339355469, 0.09514617919921875, 0.10260200500488281, 0.11005783081054688, 0.11751365661621094, 0.124969482421875, 0.13242530822753906, 0.13988113403320312, 0.1473369598388672, 0.15479278564453125, 0.1622486114501953, 0.16970443725585938, 0.17716026306152344, 0.1846160888671875, 0.19207191467285156, 0.19952774047851562, 0.2069835662841797, 0.21443939208984375, 0.2218952178955078, 0.22935104370117188, 0.23680686950683594, 0.2442626953125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 1.0, 1.0, 3.0, 8.0, 7.0, 4.0, 11.0, 12.0, 9.0, 11.0, 11.0, 15.0, 28.0, 29.0, 37.0, 42.0, 45.0, 52.0, 67.0, 67.0, 81.0, 84.0, 65.0, 52.0, 53.0, 37.0, 30.0, 28.0, 21.0, 18.0, 17.0, 12.0, 8.0, 9.0, 7.0, 7.0, 4.0, 1.0, 3.0, 4.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.07537841796875, -0.07311534881591797, -0.07085227966308594, -0.0685892105102539, -0.06632614135742188, -0.06406307220458984, -0.06180000305175781, -0.05953693389892578, -0.05727386474609375, -0.05501079559326172, -0.05274772644042969, -0.050484657287597656, -0.048221588134765625, -0.045958518981933594, -0.04369544982910156, -0.04143238067626953, -0.0391693115234375, -0.03690624237060547, -0.03464317321777344, -0.032380104064941406, -0.030117034912109375, -0.027853965759277344, -0.025590896606445312, -0.02332782745361328, -0.02106475830078125, -0.01880168914794922, -0.016538619995117188, -0.014275550842285156, -0.012012481689453125, -0.009749412536621094, -0.0074863433837890625, -0.005223274230957031, -0.002960205078125, -0.0006971359252929688, 0.0015659332275390625, 0.0038290023803710938, 0.006092071533203125, 0.008355140686035156, 0.010618209838867188, 0.012881278991699219, 0.01514434814453125, 0.01740741729736328, 0.019670486450195312, 0.021933555603027344, 0.024196624755859375, 0.026459693908691406, 0.028722763061523438, 0.03098583221435547, 0.0332489013671875, 0.03551197052001953, 0.03777503967285156, 0.040038108825683594, 0.042301177978515625, 0.044564247131347656, 0.04682731628417969, 0.04909038543701172, 0.05135345458984375, 0.05361652374267578, 0.05587959289550781, 0.058142662048339844, 0.060405731201171875, 0.0626688003540039, 0.06493186950683594, 0.06719493865966797, 0.0694580078125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 4.0, 23.0, 119.0, 474.0, 302.0, 56.0, 21.0, 7.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.012691020965576, -1.855126142501831, -1.697561264038086, -1.5399965047836304, -1.3824316263198853, -1.2248667478561401, -1.0673019886016846, -0.9097371101379395, -0.7521722316741943, -0.5946073532104492, -0.4370425343513489, -0.27947768568992615, -0.12191283702850342, 0.0356520414352417, 0.19321686029434204, 0.3507816791534424, 0.5083465576171875, 0.6659114360809326, 0.823476254940033, 0.9810410737991333, 1.1386059522628784, 1.2961708307266235, 1.453735589981079, 1.6113004684448242, 1.7688653469085693, 1.9264302253723145, 2.0839951038360596, 2.2415599822998047, 2.3991246223449707, 2.556689739227295, 2.714254379272461, 2.871819257736206, 3.029383659362793, 3.186948537826538, 3.344513416290283, 3.5020782947540283, 3.6596431732177734, 3.8172078132629395, 3.9747726917266846, 4.13233757019043, 4.289902687072754, 4.44746732711792, 4.605032444000244, 4.76259708404541, 4.920162200927734, 5.0777268409729, 5.235291957855225, 5.392856597900391, 5.550421237945557, 5.707985877990723, 5.865550994873047, 6.023115634918213, 6.180680751800537, 6.338245391845703, 6.495810508728027, 6.653375148773193, 6.810939788818359, 6.968504428863525, 7.12606954574585, 7.283634185791016, 7.44119930267334, 7.598763942718506, 7.75632905960083, 7.913893699645996, 8.07145881652832]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 4.0, 3.0, 5.0, 8.0, 11.0, 10.0, 20.0, 25.0, 24.0, 32.0, 40.0, 44.0, 38.0, 61.0, 67.0, 57.0, 66.0, 72.0, 51.0, 80.0, 42.0, 35.0, 40.0, 42.0, 33.0, 22.0, 17.0, 11.0, 12.0, 9.0, 7.0, 9.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.9406133890151978, -1.8857911825180054, -1.8309688568115234, -1.776146650314331, -1.7213244438171387, -1.6665022373199463, -1.611680030822754, -1.556857705116272, -1.5020354986190796, -1.4472132921218872, -1.3923909664154053, -1.337568759918213, -1.2827465534210205, -1.2279243469238281, -1.1731021404266357, -1.1182798147201538, -1.0634576082229614, -1.008635401725769, -0.9538131356239319, -0.8989908695220947, -0.8441686630249023, -0.78934645652771, -0.7345241904258728, -0.6797019243240356, -0.6248797178268433, -0.5700575113296509, -0.5152352452278137, -0.46041300892829895, -0.4055907726287842, -0.3507685363292694, -0.29594630002975464, -0.24112406373023987, -0.18630194664001465, -0.13147971034049988, -0.07665747404098511, -0.021835237741470337, 0.032986998558044434, 0.0878092348575592, 0.14263147115707397, 0.19745370745658875, 0.2522759437561035, 0.3070981800556183, 0.36192041635513306, 0.4167426526546478, 0.4715648889541626, 0.526387095451355, 0.5812093615531921, 0.6360316276550293, 0.6908538341522217, 0.7456760406494141, 0.8004983067512512, 0.8553205728530884, 0.9101427793502808, 0.9649649858474731, 1.019787311553955, 1.0746095180511475, 1.1294317245483398, 1.1842539310455322, 1.2390761375427246, 1.2938984632492065, 1.348720669746399, 1.4035428762435913, 1.4583652019500732, 1.5131874084472656, 1.568009614944458]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 5.0, 2.0, 11.0, 15.0, 23.0, 38.0, 86.0, 164.0, 377.0, 1260.0, 9295.0, 4110605.0, 69112.0, 2482.0, 483.0, 155.0, 87.0, 26.0, 20.0, 12.0, 9.0, 5.0, 9.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5185546875, -1.467529296875, -1.41650390625, -1.365478515625, -1.314453125, -1.263427734375, -1.21240234375, -1.161376953125, -1.1103515625, -1.059326171875, -1.00830078125, -0.957275390625, -0.90625, -0.855224609375, -0.80419921875, -0.753173828125, -0.7021484375, -0.651123046875, -0.60009765625, -0.549072265625, -0.498046875, -0.447021484375, -0.39599609375, -0.344970703125, -0.2939453125, -0.242919921875, -0.19189453125, -0.140869140625, -0.08984375, -0.038818359375, 0.01220703125, 0.063232421875, 0.1142578125, 0.165283203125, 0.21630859375, 0.267333984375, 0.318359375, 0.369384765625, 0.42041015625, 0.471435546875, 0.5224609375, 0.573486328125, 0.62451171875, 0.675537109375, 0.7265625, 0.777587890625, 0.82861328125, 0.879638671875, 0.9306640625, 0.981689453125, 1.03271484375, 1.083740234375, 1.134765625, 1.185791015625, 1.23681640625, 1.287841796875, 1.3388671875, 1.389892578125, 1.44091796875, 1.491943359375, 1.54296875, 1.593994140625, 1.64501953125, 1.696044921875, 1.7470703125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 1.0, 5.0, 2.0, 8.0, 10.0, 9.0, 17.0, 42.0, 42.0, 83.0, 132.0, 182.0, 155.0, 121.0, 61.0, 47.0, 29.0, 19.0, 10.0, 6.0, 9.0, 2.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.068603515625, -0.06628894805908203, -0.06397438049316406, -0.061659812927246094, -0.059345245361328125, -0.057030677795410156, -0.05471611022949219, -0.05240154266357422, -0.05008697509765625, -0.04777240753173828, -0.04545783996582031, -0.043143272399902344, -0.040828704833984375, -0.038514137268066406, -0.03619956970214844, -0.03388500213623047, -0.0315704345703125, -0.02925586700439453, -0.026941299438476562, -0.024626731872558594, -0.022312164306640625, -0.019997596740722656, -0.017683029174804688, -0.015368461608886719, -0.01305389404296875, -0.010739326477050781, -0.008424758911132812, -0.006110191345214844, -0.003795623779296875, -0.0014810562133789062, 0.0008335113525390625, 0.0031480789184570312, 0.005462646484375, 0.007777214050292969, 0.010091781616210938, 0.012406349182128906, 0.014720916748046875, 0.017035484313964844, 0.019350051879882812, 0.02166461944580078, 0.02397918701171875, 0.02629375457763672, 0.028608322143554688, 0.030922889709472656, 0.033237457275390625, 0.035552024841308594, 0.03786659240722656, 0.04018115997314453, 0.0424957275390625, 0.04481029510498047, 0.04712486267089844, 0.049439430236816406, 0.051753997802734375, 0.054068565368652344, 0.05638313293457031, 0.05869770050048828, 0.06101226806640625, 0.06332683563232422, 0.06564140319824219, 0.06795597076416016, 0.07027053833007812, 0.0725851058959961, 0.07489967346191406, 0.07721424102783203, 0.07952880859375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 10.0, 8.0, 9.0, 30.0, 43.0, 85.0, 162.0, 320.0, 780.0, 2637.0, 11211.0, 80389.0, 3740875.0, 323037.0, 26662.0, 5431.0, 1479.0, 529.0, 239.0, 119.0, 68.0, 49.0, 29.0, 23.0, 17.0, 12.0, 10.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.447998046875, -0.4329261779785156, -0.41785430908203125, -0.4027824401855469, -0.3877105712890625, -0.3726387023925781, -0.35756683349609375, -0.3424949645996094, -0.327423095703125, -0.3123512268066406, -0.29727935791015625, -0.2822074890136719, -0.2671356201171875, -0.2520637512207031, -0.23699188232421875, -0.22192001342773438, -0.20684814453125, -0.19177627563476562, -0.17670440673828125, -0.16163253784179688, -0.1465606689453125, -0.13148880004882812, -0.11641693115234375, -0.10134506225585938, -0.086273193359375, -0.07120132446289062, -0.05612945556640625, -0.041057586669921875, -0.0259857177734375, -0.010913848876953125, 0.00415802001953125, 0.019229888916015625, 0.0343017578125, 0.049373626708984375, 0.06444549560546875, 0.07951736450195312, 0.0945892333984375, 0.10966110229492188, 0.12473297119140625, 0.13980484008789062, 0.154876708984375, 0.16994857788085938, 0.18502044677734375, 0.20009231567382812, 0.2151641845703125, 0.23023605346679688, 0.24530792236328125, 0.2603797912597656, 0.27545166015625, 0.2905235290527344, 0.30559539794921875, 0.3206672668457031, 0.3357391357421875, 0.3508110046386719, 0.36588287353515625, 0.3809547424316406, 0.396026611328125, 0.4110984802246094, 0.42617034912109375, 0.4412422180175781, 0.4563140869140625, 0.4713859558105469, 0.48645782470703125, 0.5015296936035156, 0.5166015625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 4.0, 6.0, 10.0, 6.0, 14.0, 16.0, 22.0, 31.0, 42.0, 76.0, 84.0, 156.0, 327.0, 1228.0, 1235.0, 294.0, 156.0, 89.0, 65.0, 48.0, 28.0, 25.0, 20.0, 19.0, 15.0, 12.0, 8.0, 6.0, 10.0, 5.0, 4.0, 6.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.07440185546875, -0.07221412658691406, -0.07002639770507812, -0.06783866882324219, -0.06565093994140625, -0.06346321105957031, -0.061275482177734375, -0.05908775329589844, -0.0569000244140625, -0.05471229553222656, -0.052524566650390625, -0.05033683776855469, -0.04814910888671875, -0.04596138000488281, -0.043773651123046875, -0.04158592224121094, -0.039398193359375, -0.03721046447753906, -0.035022735595703125, -0.03283500671386719, -0.03064727783203125, -0.028459548950195312, -0.026271820068359375, -0.024084091186523438, -0.0218963623046875, -0.019708633422851562, -0.017520904541015625, -0.015333175659179688, -0.01314544677734375, -0.010957717895507812, -0.008769989013671875, -0.0065822601318359375, -0.00439453125, -0.0022068023681640625, -1.9073486328125e-05, 0.0021686553955078125, 0.00435638427734375, 0.0065441131591796875, 0.008731842041015625, 0.010919570922851562, 0.0131072998046875, 0.015295028686523438, 0.017482757568359375, 0.019670486450195312, 0.02185821533203125, 0.024045944213867188, 0.026233673095703125, 0.028421401977539062, 0.030609130859375, 0.03279685974121094, 0.034984588623046875, 0.03717231750488281, 0.03936004638671875, 0.04154777526855469, 0.043735504150390625, 0.04592323303222656, 0.0481109619140625, 0.05029869079589844, 0.052486419677734375, 0.05467414855957031, 0.05686187744140625, 0.05904960632324219, 0.061237335205078125, 0.06342506408691406, 0.06561279296875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 5.0, 13.0, 68.0, 322.0, 442.0, 134.0, 23.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2751205265522003, -0.23692554235458374, -0.19873055815696716, -0.1605355590581894, -0.12234057486057281, -0.08414559066295624, -0.04595059156417847, -0.00775560736656189, 0.030439376831054688, 0.06863436102867126, 0.10682935267686844, 0.1450243443250656, 0.1832193285226822, 0.22141431272029877, 0.25960931181907654, 0.2978042960166931, 0.3359992802143097, 0.37419426441192627, 0.41238924860954285, 0.4505842328071594, 0.4887792468070984, 0.5269742012023926, 0.5651692152023315, 0.6033642292022705, 0.6415591835975647, 0.6797541975975037, 0.7179491519927979, 0.7561441659927368, 0.794339120388031, 0.83253413438797, 0.8707290887832642, 0.9089241027832031, 0.9471191167831421, 0.985314130783081, 1.02350914478302, 1.0617040395736694, 1.0998990535736084, 1.1380940675735474, 1.1762890815734863, 1.2144839763641357, 1.2526789903640747, 1.2908740043640137, 1.3290690183639526, 1.367263913154602, 1.405458927154541, 1.44365394115448, 1.481848955154419, 1.5200438499450684, 1.5582389831542969, 1.5964339971542358, 1.6346290111541748, 1.6728239059448242, 1.7110189199447632, 1.7492139339447021, 1.7874089479446411, 1.82560396194458, 1.8637988567352295, 1.9019938707351685, 1.9401888847351074, 1.9783837795257568, 2.0165789127349854, 2.0547738075256348, 2.092968702316284, 2.1311638355255127, 2.169358730316162]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 3.0, 1.0, 4.0, 6.0, 13.0, 10.0, 6.0, 17.0, 18.0, 16.0, 19.0, 26.0, 28.0, 26.0, 28.0, 38.0, 32.0, 39.0, 43.0, 42.0, 49.0, 47.0, 43.0, 34.0, 50.0, 39.0, 28.0, 39.0, 29.0, 21.0, 26.0, 30.0, 28.0, 21.0, 23.0, 12.0, 9.0, 16.0, 10.0, 14.0, 8.0, 6.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.21693402528762817, -0.20960736274719238, -0.2022807002067566, -0.1949540376663208, -0.187627375125885, -0.18030071258544922, -0.17297405004501343, -0.16564738750457764, -0.15832072496414185, -0.15099406242370605, -0.14366739988327026, -0.13634073734283447, -0.12901407480239868, -0.12168741226196289, -0.1143607497215271, -0.10703408718109131, -0.09970742464065552, -0.09238076210021973, -0.08505409955978394, -0.07772743701934814, -0.07040077447891235, -0.06307411193847656, -0.05574744939804077, -0.04842078685760498, -0.04109412431716919, -0.0337674617767334, -0.026440799236297607, -0.019114136695861816, -0.011787474155426025, -0.004460811614990234, 0.0028658509254455566, 0.010192513465881348, 0.01751917600631714, 0.02484583854675293, 0.03217250108718872, 0.03949916362762451, 0.0468258261680603, 0.054152488708496094, 0.061479151248931885, 0.06880581378936768, 0.07613247632980347, 0.08345913887023926, 0.09078580141067505, 0.09811246395111084, 0.10543912649154663, 0.11276578903198242, 0.12009245157241821, 0.127419114112854, 0.1347457766532898, 0.14207243919372559, 0.14939910173416138, 0.15672576427459717, 0.16405242681503296, 0.17137908935546875, 0.17870575189590454, 0.18603241443634033, 0.19335907697677612, 0.20068573951721191, 0.2080124020576477, 0.2153390645980835, 0.2226657271385193, 0.22999238967895508, 0.23731905221939087, 0.24464571475982666, 0.25197237730026245]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 4.0, 6.0, 3.0, 9.0, 9.0, 6.0, 17.0, 17.0, 25.0, 32.0, 57.0, 61.0, 111.0, 150.0, 213.0, 356.0, 571.0, 1154.0, 2165.0, 4723.0, 13110.0, 52276.0, 385229.0, 495137.0, 66677.0, 15653.0, 5542.0, 2386.0, 1141.0, 640.0, 383.0, 215.0, 154.0, 97.0, 66.0, 44.0, 32.0, 25.0, 15.0, 12.0, 6.0, 5.0, 12.0, 5.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.339111328125, -0.3285369873046875, -0.317962646484375, -0.3073883056640625, -0.29681396484375, -0.2862396240234375, -0.275665283203125, -0.2650909423828125, -0.2545166015625, -0.2439422607421875, -0.233367919921875, -0.2227935791015625, -0.21221923828125, -0.2016448974609375, -0.191070556640625, -0.1804962158203125, -0.169921875, -0.1593475341796875, -0.148773193359375, -0.1381988525390625, -0.12762451171875, -0.1170501708984375, -0.106475830078125, -0.0959014892578125, -0.0853271484375, -0.0747528076171875, -0.064178466796875, -0.0536041259765625, -0.04302978515625, -0.0324554443359375, -0.021881103515625, -0.0113067626953125, -0.000732421875, 0.0098419189453125, 0.020416259765625, 0.0309906005859375, 0.04156494140625, 0.0521392822265625, 0.062713623046875, 0.0732879638671875, 0.0838623046875, 0.0944366455078125, 0.105010986328125, 0.1155853271484375, 0.12615966796875, 0.1367340087890625, 0.147308349609375, 0.1578826904296875, 0.16845703125, 0.1790313720703125, 0.189605712890625, 0.2001800537109375, 0.21075439453125, 0.2213287353515625, 0.231903076171875, 0.2424774169921875, 0.2530517578125, 0.2636260986328125, 0.274200439453125, 0.2847747802734375, 0.29534912109375, 0.3059234619140625, 0.316497802734375, 0.3270721435546875, 0.337646484375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 4.0, 1.0, 5.0, 3.0, 7.0, 6.0, 9.0, 22.0, 29.0, 51.0, 81.0, 131.0, 140.0, 147.0, 122.0, 75.0, 71.0, 36.0, 23.0, 18.0, 7.0, 6.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07244873046875, -0.07018089294433594, -0.06791305541992188, -0.06564521789550781, -0.06337738037109375, -0.06110954284667969, -0.058841705322265625, -0.05657386779785156, -0.0543060302734375, -0.05203819274902344, -0.049770355224609375, -0.04750251770019531, -0.04523468017578125, -0.04296684265136719, -0.040699005126953125, -0.03843116760253906, -0.036163330078125, -0.03389549255371094, -0.031627655029296875, -0.029359817504882812, -0.02709197998046875, -0.024824142456054688, -0.022556304931640625, -0.020288467407226562, -0.0180206298828125, -0.015752792358398438, -0.013484954833984375, -0.011217117309570312, -0.00894927978515625, -0.0066814422607421875, -0.004413604736328125, -0.0021457672119140625, 0.0001220703125, 0.0023899078369140625, 0.004657745361328125, 0.0069255828857421875, 0.00919342041015625, 0.011461257934570312, 0.013729095458984375, 0.015996932983398438, 0.0182647705078125, 0.020532608032226562, 0.022800445556640625, 0.025068283081054688, 0.02733612060546875, 0.029603958129882812, 0.031871795654296875, 0.03413963317871094, 0.036407470703125, 0.03867530822753906, 0.040943145751953125, 0.04321098327636719, 0.04547882080078125, 0.04774665832519531, 0.050014495849609375, 0.05228233337402344, 0.0545501708984375, 0.05681800842285156, 0.059085845947265625, 0.06135368347167969, 0.06362152099609375, 0.06588935852050781, 0.06815719604492188, 0.07042503356933594, 0.07269287109375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 2.0, 5.0, 2.0, 2.0, 8.0, 4.0, 8.0, 7.0, 7.0, 14.0, 15.0, 26.0, 24.0, 37.0, 51.0, 90.0, 122.0, 218.0, 337.0, 650.0, 1420.0, 4443.0, 21404.0, 171660.0, 708476.0, 117052.0, 16297.0, 3491.0, 1174.0, 589.0, 302.0, 214.0, 119.0, 90.0, 47.0, 40.0, 26.0, 19.0, 10.0, 12.0, 12.0, 4.0, 5.0, 8.0, 8.0, 4.0, 1.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.3681640625, -0.354736328125, -0.34130859375, -0.327880859375, -0.314453125, -0.301025390625, -0.28759765625, -0.274169921875, -0.2607421875, -0.247314453125, -0.23388671875, -0.220458984375, -0.20703125, -0.193603515625, -0.18017578125, -0.166748046875, -0.1533203125, -0.139892578125, -0.12646484375, -0.113037109375, -0.099609375, -0.086181640625, -0.07275390625, -0.059326171875, -0.0458984375, -0.032470703125, -0.01904296875, -0.005615234375, 0.0078125, 0.021240234375, 0.03466796875, 0.048095703125, 0.0615234375, 0.074951171875, 0.08837890625, 0.101806640625, 0.115234375, 0.128662109375, 0.14208984375, 0.155517578125, 0.1689453125, 0.182373046875, 0.19580078125, 0.209228515625, 0.22265625, 0.236083984375, 0.24951171875, 0.262939453125, 0.2763671875, 0.289794921875, 0.30322265625, 0.316650390625, 0.330078125, 0.343505859375, 0.35693359375, 0.370361328125, 0.3837890625, 0.397216796875, 0.41064453125, 0.424072265625, 0.4375, 0.450927734375, 0.46435546875, 0.477783203125, 0.4912109375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 11.0, 13.0, 6.0, 6.0, 9.0, 16.0, 15.0, 19.0, 26.0, 34.0, 31.0, 34.0, 36.0, 39.0, 44.0, 44.0, 51.0, 59.0, 61.0, 47.0, 52.0, 57.0, 45.0, 36.0, 26.0, 38.0, 20.0, 21.0, 16.0, 12.0, 20.0, 13.0, 8.0, 10.0, 7.0, 9.0, 5.0, 4.0, 4.0, 3.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2279052734375, -0.22083282470703125, -0.2137603759765625, -0.20668792724609375, -0.199615478515625, -0.19254302978515625, -0.1854705810546875, -0.17839813232421875, -0.17132568359375, -0.16425323486328125, -0.1571807861328125, -0.15010833740234375, -0.143035888671875, -0.13596343994140625, -0.1288909912109375, -0.12181854248046875, -0.11474609375, -0.10767364501953125, -0.1006011962890625, -0.09352874755859375, -0.086456298828125, -0.07938385009765625, -0.0723114013671875, -0.06523895263671875, -0.05816650390625, -0.05109405517578125, -0.0440216064453125, -0.03694915771484375, -0.029876708984375, -0.02280426025390625, -0.0157318115234375, -0.00865936279296875, -0.0015869140625, 0.00548553466796875, 0.0125579833984375, 0.01963043212890625, 0.026702880859375, 0.03377532958984375, 0.0408477783203125, 0.04792022705078125, 0.05499267578125, 0.06206512451171875, 0.0691375732421875, 0.07621002197265625, 0.083282470703125, 0.09035491943359375, 0.0974273681640625, 0.10449981689453125, 0.111572265625, 0.11864471435546875, 0.1257171630859375, 0.13278961181640625, 0.139862060546875, 0.14693450927734375, 0.1540069580078125, 0.16107940673828125, 0.16815185546875, 0.17522430419921875, 0.1822967529296875, 0.18936920166015625, 0.196441650390625, 0.20351409912109375, 0.2105865478515625, 0.21765899658203125, 0.2247314453125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 7.0, 5.0, 11.0, 17.0, 20.0, 27.0, 47.0, 55.0, 92.0, 133.0, 265.0, 435.0, 791.0, 1402.0, 2868.0, 6339.0, 14871.0, 44134.0, 197044.0, 583623.0, 138573.0, 34778.0, 12472.0, 5219.0, 2467.0, 1274.0, 635.0, 376.0, 205.0, 133.0, 80.0, 58.0, 33.0, 21.0, 15.0, 10.0, 7.0, 1.0, 8.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1424560546875, -0.13743972778320312, -0.13242340087890625, -0.12740707397460938, -0.1223907470703125, -0.11737442016601562, -0.11235809326171875, -0.10734176635742188, -0.102325439453125, -0.09730911254882812, -0.09229278564453125, -0.08727645874023438, -0.0822601318359375, -0.07724380493164062, -0.07222747802734375, -0.06721115112304688, -0.06219482421875, -0.057178497314453125, -0.05216217041015625, -0.047145843505859375, -0.0421295166015625, -0.037113189697265625, -0.03209686279296875, -0.027080535888671875, -0.022064208984375, -0.017047882080078125, -0.01203155517578125, -0.007015228271484375, -0.0019989013671875, 0.003017425537109375, 0.00803375244140625, 0.013050079345703125, 0.01806640625, 0.023082733154296875, 0.02809906005859375, 0.033115386962890625, 0.0381317138671875, 0.043148040771484375, 0.04816436767578125, 0.053180694580078125, 0.058197021484375, 0.06321334838867188, 0.06822967529296875, 0.07324600219726562, 0.0782623291015625, 0.08327865600585938, 0.08829498291015625, 0.09331130981445312, 0.09832763671875, 0.10334396362304688, 0.10836029052734375, 0.11337661743164062, 0.1183929443359375, 0.12340927124023438, 0.12842559814453125, 0.13344192504882812, 0.138458251953125, 0.14347457885742188, 0.14849090576171875, 0.15350723266601562, 0.1585235595703125, 0.16353988647460938, 0.16855621337890625, 0.17357254028320312, 0.1785888671875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 3.0, 6.0, 8.0, 13.0, 21.0, 30.0, 45.0, 43.0, 47.0, 66.0, 75.0, 90.0, 93.0, 105.0, 87.0, 73.0, 60.0, 37.0, 27.0, 21.0, 14.0, 8.0, 9.0, 8.0, 0.0, 2.0, 3.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.297494888305664e-05, -4.1513703763484955e-05, -4.005245864391327e-05, -3.859121352434158e-05, -3.71299684047699e-05, -3.566872328519821e-05, -3.4207478165626526e-05, -3.274623304605484e-05, -3.1284987926483154e-05, -2.982374280691147e-05, -2.8362497687339783e-05, -2.6901252567768097e-05, -2.544000744819641e-05, -2.3978762328624725e-05, -2.251751720905304e-05, -2.1056272089481354e-05, -1.9595026969909668e-05, -1.8133781850337982e-05, -1.6672536730766296e-05, -1.521129161119461e-05, -1.3750046491622925e-05, -1.2288801372051239e-05, -1.0827556252479553e-05, -9.366311132907867e-06, -7.905066013336182e-06, -6.443820893764496e-06, -4.98257577419281e-06, -3.5213306546211243e-06, -2.0600855350494385e-06, -5.988404154777527e-07, 8.624047040939331e-07, 2.323649823665619e-06, 3.7848949432373047e-06, 5.2461400628089905e-06, 6.707385182380676e-06, 8.168630301952362e-06, 9.629875421524048e-06, 1.1091120541095734e-05, 1.255236566066742e-05, 1.4013610780239105e-05, 1.547485589981079e-05, 1.6936101019382477e-05, 1.8397346138954163e-05, 1.985859125852585e-05, 2.1319836378097534e-05, 2.278108149766922e-05, 2.4242326617240906e-05, 2.570357173681259e-05, 2.7164816856384277e-05, 2.8626061975955963e-05, 3.008730709552765e-05, 3.1548552215099335e-05, 3.300979733467102e-05, 3.4471042454242706e-05, 3.593228757381439e-05, 3.739353269338608e-05, 3.8854777812957764e-05, 4.031602293252945e-05, 4.1777268052101135e-05, 4.323851317167282e-05, 4.469975829124451e-05, 4.616100341081619e-05, 4.762224853038788e-05, 4.9083493649959564e-05, 5.054473876953125e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 3.0, 7.0, 8.0, 10.0, 14.0, 21.0, 24.0, 49.0, 85.0, 162.0, 376.0, 1036.0, 3798.0, 28192.0, 801304.0, 198810.0, 11333.0, 2145.0, 641.0, 261.0, 108.0, 66.0, 31.0, 21.0, 12.0, 13.0, 7.0, 4.0, 2.0, 7.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4443359375, -0.43119049072265625, -0.4180450439453125, -0.40489959716796875, -0.391754150390625, -0.37860870361328125, -0.3654632568359375, -0.35231781005859375, -0.33917236328125, -0.32602691650390625, -0.3128814697265625, -0.29973602294921875, -0.286590576171875, -0.27344512939453125, -0.2602996826171875, -0.24715423583984375, -0.2340087890625, -0.22086334228515625, -0.2077178955078125, -0.19457244873046875, -0.181427001953125, -0.16828155517578125, -0.1551361083984375, -0.14199066162109375, -0.12884521484375, -0.11569976806640625, -0.1025543212890625, -0.08940887451171875, -0.076263427734375, -0.06311798095703125, -0.0499725341796875, -0.03682708740234375, -0.023681640625, -0.01053619384765625, 0.0026092529296875, 0.01575469970703125, 0.028900146484375, 0.04204559326171875, 0.0551910400390625, 0.06833648681640625, 0.08148193359375, 0.09462738037109375, 0.1077728271484375, 0.12091827392578125, 0.134063720703125, 0.14720916748046875, 0.1603546142578125, 0.17350006103515625, 0.1866455078125, 0.19979095458984375, 0.2129364013671875, 0.22608184814453125, 0.239227294921875, 0.25237274169921875, 0.2655181884765625, 0.27866363525390625, 0.29180908203125, 0.30495452880859375, 0.3180999755859375, 0.33124542236328125, 0.344390869140625, 0.35753631591796875, 0.3706817626953125, 0.38382720947265625, 0.39697265625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 4.0, 3.0, 7.0, 7.0, 11.0, 9.0, 9.0, 12.0, 15.0, 29.0, 32.0, 51.0, 71.0, 77.0, 111.0, 151.0, 128.0, 79.0, 57.0, 31.0, 27.0, 18.0, 21.0, 11.0, 6.0, 6.0, 6.0, 3.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1651611328125, -0.16032028198242188, -0.15547943115234375, -0.15063858032226562, -0.1457977294921875, -0.14095687866210938, -0.13611602783203125, -0.13127517700195312, -0.126434326171875, -0.12159347534179688, -0.11675262451171875, -0.11191177368164062, -0.1070709228515625, -0.10223007202148438, -0.09738922119140625, -0.09254837036132812, -0.08770751953125, -0.08286666870117188, -0.07802581787109375, -0.07318496704101562, -0.0683441162109375, -0.06350326538085938, -0.05866241455078125, -0.053821563720703125, -0.048980712890625, -0.044139862060546875, -0.03929901123046875, -0.034458160400390625, -0.0296173095703125, -0.024776458740234375, -0.01993560791015625, -0.015094757080078125, -0.01025390625, -0.005413055419921875, -0.00057220458984375, 0.004268646240234375, 0.0091094970703125, 0.013950347900390625, 0.01879119873046875, 0.023632049560546875, 0.028472900390625, 0.033313751220703125, 0.03815460205078125, 0.042995452880859375, 0.0478363037109375, 0.052677154541015625, 0.05751800537109375, 0.062358856201171875, 0.06719970703125, 0.07204055786132812, 0.07688140869140625, 0.08172225952148438, 0.0865631103515625, 0.09140396118164062, 0.09624481201171875, 0.10108566284179688, 0.105926513671875, 0.11076736450195312, 0.11560821533203125, 0.12044906616210938, 0.1252899169921875, 0.13013076782226562, 0.13497161865234375, 0.13981246948242188, 0.1446533203125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 14.0, 86.0, 442.0, 394.0, 58.0, 13.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3341137170791626, -1.1095914840698242, -0.8850691914558411, -0.6605468988418579, -0.43602466583251953, -0.21150243282318115, 0.013019919395446777, 0.23754215240478516, 0.46206438541412354, 0.6865866184234619, 0.9111089110374451, 1.1356312036514282, 1.3601534366607666, 1.584675669670105, 1.809198021888733, 2.0337202548980713, 2.258242607116699, 2.482764959335327, 2.707287073135376, 2.931809425354004, 3.1563315391540527, 3.3808538913726807, 3.6053762435913086, 3.8298983573913574, 4.054420471191406, 4.278942584991455, 4.503465175628662, 4.727987289428711, 4.95250940322876, 5.177031517028809, 5.401554107666016, 5.6260762214660645, 5.850598335266113, 6.075120449066162, 6.299643039703369, 6.524165153503418, 6.748687267303467, 6.973209381103516, 7.197731971740723, 7.4222540855407715, 7.64677619934082, 7.871298313140869, 8.095820426940918, 8.320343017578125, 8.544865608215332, 8.769387245178223, 8.99390983581543, 9.218432426452637, 9.442955017089844, 9.66747760772705, 9.891999244689941, 10.116521835327148, 10.341044425964355, 10.565566062927246, 10.790088653564453, 11.01461124420166, 11.23913288116455, 11.463655471801758, 11.688177108764648, 11.912699699401855, 12.137222290039062, 12.361743927001953, 12.58626651763916, 12.810789108276367, 13.035310745239258]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 5.0, 9.0, 3.0, 7.0, 8.0, 9.0, 17.0, 20.0, 15.0, 16.0, 31.0, 27.0, 28.0, 34.0, 35.0, 29.0, 43.0, 31.0, 39.0, 42.0, 59.0, 40.0, 50.0, 44.0, 29.0, 45.0, 35.0, 38.0, 26.0, 36.0, 23.0, 18.0, 19.0, 15.0, 18.0, 15.0, 10.0, 9.0, 8.0, 6.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2969822883605957, -1.2545192241668701, -1.2120561599731445, -1.1695929765701294, -1.1271299123764038, -1.0846668481826782, -1.042203664779663, -0.9997406005859375, -0.9572775363922119, -0.9148144721984863, -0.872351348400116, -0.8298882246017456, -0.78742516040802, -0.7449620962142944, -0.7024989724159241, -0.6600358486175537, -0.6175727844238281, -0.5751097202301025, -0.5326465964317322, -0.4901835024356842, -0.44772040843963623, -0.40525731444358826, -0.3627942204475403, -0.3203311264514923, -0.27786803245544434, -0.23540493845939636, -0.1929418444633484, -0.15047875046730042, -0.10801565647125244, -0.06555256247520447, -0.023089468479156494, 0.01937362551689148, 0.061836838722229004, 0.10429993271827698, 0.14676302671432495, 0.18922612071037292, 0.2316892147064209, 0.27415230870246887, 0.31661540269851685, 0.3590784966945648, 0.4015415906906128, 0.44400468468666077, 0.48646777868270874, 0.5289309024810791, 0.5713939666748047, 0.6138570308685303, 0.6563201546669006, 0.698783278465271, 0.7412463426589966, 0.7837094068527222, 0.8261725306510925, 0.8686356544494629, 0.9110987186431885, 0.9535617828369141, 0.9960249066352844, 1.0384880304336548, 1.0809510946273804, 1.123414158821106, 1.165877342224121, 1.2083404064178467, 1.2508034706115723, 1.2932665348052979, 1.3357295989990234, 1.3781927824020386, 1.4206558465957642]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 6.0, 6.0, 3.0, 8.0, 12.0, 13.0, 20.0, 33.0, 50.0, 61.0, 122.0, 242.0, 437.0, 953.0, 2437.0, 8017.0, 58453.0, 3979016.0, 127187.0, 12173.0, 2938.0, 1036.0, 509.0, 212.0, 137.0, 81.0, 47.0, 23.0, 16.0, 12.0, 4.0, 4.0, 1.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5166015625, -0.49973297119140625, -0.4828643798828125, -0.46599578857421875, -0.449127197265625, -0.43225860595703125, -0.4153900146484375, -0.39852142333984375, -0.38165283203125, -0.36478424072265625, -0.3479156494140625, -0.33104705810546875, -0.314178466796875, -0.29730987548828125, -0.2804412841796875, -0.26357269287109375, -0.2467041015625, -0.22983551025390625, -0.2129669189453125, -0.19609832763671875, -0.179229736328125, -0.16236114501953125, -0.1454925537109375, -0.12862396240234375, -0.11175537109375, -0.09488677978515625, -0.0780181884765625, -0.06114959716796875, -0.044281005859375, -0.02741241455078125, -0.0105438232421875, 0.00632476806640625, 0.023193359375, 0.04006195068359375, 0.0569305419921875, 0.07379913330078125, 0.090667724609375, 0.10753631591796875, 0.1244049072265625, 0.14127349853515625, 0.15814208984375, 0.17501068115234375, 0.1918792724609375, 0.20874786376953125, 0.225616455078125, 0.24248504638671875, 0.2593536376953125, 0.27622222900390625, 0.2930908203125, 0.30995941162109375, 0.3268280029296875, 0.34369659423828125, 0.360565185546875, 0.37743377685546875, 0.3943023681640625, 0.41117095947265625, 0.42803955078125, 0.44490814208984375, 0.4617767333984375, 0.47864532470703125, 0.495513916015625, 0.5123825073242188, 0.5292510986328125, 0.5461196899414062, 0.56298828125]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 5.0, 4.0, 10.0, 6.0, 15.0, 22.0, 24.0, 52.0, 76.0, 93.0, 118.0, 109.0, 94.0, 96.0, 74.0, 69.0, 42.0, 39.0, 11.0, 11.0, 12.0, 10.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07122802734375, -0.06891059875488281, -0.06659317016601562, -0.06427574157714844, -0.06195831298828125, -0.05964088439941406, -0.057323455810546875, -0.05500602722167969, -0.0526885986328125, -0.05037117004394531, -0.048053741455078125, -0.04573631286621094, -0.04341888427734375, -0.04110145568847656, -0.038784027099609375, -0.03646659851074219, -0.034149169921875, -0.03183174133300781, -0.029514312744140625, -0.027196884155273438, -0.02487945556640625, -0.022562026977539062, -0.020244598388671875, -0.017927169799804688, -0.0156097412109375, -0.013292312622070312, -0.010974884033203125, -0.008657455444335938, -0.00634002685546875, -0.0040225982666015625, -0.001705169677734375, 0.0006122589111328125, 0.0029296875, 0.0052471160888671875, 0.007564544677734375, 0.009881973266601562, 0.01219940185546875, 0.014516830444335938, 0.016834259033203125, 0.019151687622070312, 0.0214691162109375, 0.023786544799804688, 0.026103973388671875, 0.028421401977539062, 0.03073883056640625, 0.03305625915527344, 0.035373687744140625, 0.03769111633300781, 0.040008544921875, 0.04232597351074219, 0.044643402099609375, 0.04696083068847656, 0.04927825927734375, 0.05159568786621094, 0.053913116455078125, 0.05623054504394531, 0.0585479736328125, 0.06086540222167969, 0.06318283081054688, 0.06550025939941406, 0.06781768798828125, 0.07013511657714844, 0.07245254516601562, 0.07476997375488281, 0.07708740234375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 6.0, 4.0, 4.0, 7.0, 6.0, 6.0, 13.0, 26.0, 42.0, 75.0, 154.0, 294.0, 583.0, 1470.0, 3704.0, 11461.0, 49159.0, 605717.0, 3405345.0, 90489.0, 16936.0, 5258.0, 1930.0, 814.0, 377.0, 192.0, 89.0, 30.0, 22.0, 20.0, 8.0, 9.0, 12.0, 8.0, 5.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.329833984375, -0.3195762634277344, -0.30931854248046875, -0.2990608215332031, -0.2888031005859375, -0.2785453796386719, -0.26828765869140625, -0.2580299377441406, -0.247772216796875, -0.23751449584960938, -0.22725677490234375, -0.21699905395507812, -0.2067413330078125, -0.19648361206054688, -0.18622589111328125, -0.17596817016601562, -0.16571044921875, -0.15545272827148438, -0.14519500732421875, -0.13493728637695312, -0.1246795654296875, -0.11442184448242188, -0.10416412353515625, -0.09390640258789062, -0.083648681640625, -0.07339096069335938, -0.06313323974609375, -0.052875518798828125, -0.0426177978515625, -0.032360076904296875, -0.02210235595703125, -0.011844635009765625, -0.0015869140625, 0.008670806884765625, 0.01892852783203125, 0.029186248779296875, 0.0394439697265625, 0.049701690673828125, 0.05995941162109375, 0.07021713256835938, 0.080474853515625, 0.09073257446289062, 0.10099029541015625, 0.11124801635742188, 0.1215057373046875, 0.13176345825195312, 0.14202117919921875, 0.15227890014648438, 0.16253662109375, 0.17279434204101562, 0.18305206298828125, 0.19330978393554688, 0.2035675048828125, 0.21382522583007812, 0.22408294677734375, 0.23434066772460938, 0.244598388671875, 0.2548561096191406, 0.26511383056640625, 0.2753715515136719, 0.2856292724609375, 0.2958869934082031, 0.30614471435546875, 0.3164024353027344, 0.32666015625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 7.0, 7.0, 4.0, 7.0, 4.0, 7.0, 16.0, 20.0, 30.0, 30.0, 47.0, 91.0, 158.0, 325.0, 1703.0, 913.0, 289.0, 117.0, 95.0, 61.0, 37.0, 28.0, 21.0, 12.0, 7.0, 11.0, 7.0, 4.0, 3.0, 4.0, 3.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.067138671875, -0.06473255157470703, -0.06232643127441406, -0.059920310974121094, -0.057514190673828125, -0.055108070373535156, -0.05270195007324219, -0.05029582977294922, -0.04788970947265625, -0.04548358917236328, -0.04307746887207031, -0.040671348571777344, -0.038265228271484375, -0.035859107971191406, -0.03345298767089844, -0.03104686737060547, -0.0286407470703125, -0.02623462677001953, -0.023828506469726562, -0.021422386169433594, -0.019016265869140625, -0.016610145568847656, -0.014204025268554688, -0.011797904968261719, -0.00939178466796875, -0.006985664367675781, -0.0045795440673828125, -0.0021734237670898438, 0.000232696533203125, 0.0026388168334960938, 0.0050449371337890625, 0.007451057434082031, 0.009857177734375, 0.012263298034667969, 0.014669418334960938, 0.017075538635253906, 0.019481658935546875, 0.021887779235839844, 0.024293899536132812, 0.02670001983642578, 0.02910614013671875, 0.03151226043701172, 0.03391838073730469, 0.036324501037597656, 0.038730621337890625, 0.041136741638183594, 0.04354286193847656, 0.04594898223876953, 0.0483551025390625, 0.05076122283935547, 0.05316734313964844, 0.055573463439941406, 0.057979583740234375, 0.060385704040527344, 0.06279182434082031, 0.06519794464111328, 0.06760406494140625, 0.07001018524169922, 0.07241630554199219, 0.07482242584228516, 0.07722854614257812, 0.0796346664428711, 0.08204078674316406, 0.08444690704345703, 0.08685302734375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 8.0, 19.0, 154.0, 569.0, 229.0, 32.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7553646564483643, -2.6998515129089355, -2.644338369369507, -2.588825225830078, -2.5333120822906494, -2.4777989387512207, -2.422285795211792, -2.3667726516723633, -2.3112595081329346, -2.255746364593506, -2.200233221054077, -2.1447200775146484, -2.0892069339752197, -2.033693790435791, -1.9781806468963623, -1.9226675033569336, -1.8671542406082153, -1.8116410970687866, -1.756127953529358, -1.7006148099899292, -1.6451016664505005, -1.5895885229110718, -1.5340752601623535, -1.4785621166229248, -1.423048973083496, -1.3675358295440674, -1.3120226860046387, -1.25650954246521, -1.2009963989257812, -1.1454832553863525, -1.0899701118469238, -1.0344569683074951, -0.9789438247680664, -0.9234306812286377, -0.867917537689209, -0.8124043941497803, -0.7568912506103516, -0.7013781070709229, -0.6458649039268494, -0.5903517603874207, -0.5348386168479919, -0.47932547330856323, -0.4238123297691345, -0.3682991564273834, -0.3127860128879547, -0.257272869348526, -0.2017596960067749, -0.1462465524673462, -0.09073340892791748, -0.03522025793790817, 0.020292893052101135, 0.07580605149269104, 0.13131919503211975, 0.18683233857154846, 0.24234551191329956, 0.29785865545272827, 0.353371798992157, 0.4088849425315857, 0.4643980860710144, 0.5199112892150879, 0.5754244327545166, 0.6309375762939453, 0.686450719833374, 0.7419638633728027, 0.7974770069122314]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 7.0, 7.0, 6.0, 9.0, 8.0, 14.0, 16.0, 21.0, 32.0, 28.0, 15.0, 34.0, 36.0, 48.0, 39.0, 24.0, 42.0, 32.0, 58.0, 42.0, 34.0, 51.0, 45.0, 45.0, 39.0, 31.0, 29.0, 29.0, 27.0, 23.0, 18.0, 18.0, 14.0, 16.0, 12.0, 9.0, 11.0, 8.0, 9.0, 4.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.2598996162414551, -0.2520107626914978, -0.24412190914154053, -0.23623305559158325, -0.22834420204162598, -0.2204553484916687, -0.21256649494171143, -0.20467764139175415, -0.19678878784179688, -0.1888999342918396, -0.18101108074188232, -0.17312222719192505, -0.16523337364196777, -0.1573445200920105, -0.14945566654205322, -0.14156681299209595, -0.13367794454097748, -0.1257890909910202, -0.11790023744106293, -0.11001138389110565, -0.10212253034114838, -0.0942336767911911, -0.08634481579065323, -0.07845596224069595, -0.07056710869073868, -0.0626782551407814, -0.05478940159082413, -0.04690054431557655, -0.03901169076561928, -0.031122837215662003, -0.02323397994041443, -0.015345126390457153, -0.007456272840499878, 0.0004325816407799721, 0.008321436122059822, 0.016210291534662247, 0.024099145084619522, 0.0319879986345768, 0.03987685590982437, 0.04776570945978165, 0.05565456300973892, 0.0635434165596962, 0.07143227010965347, 0.07932113111019135, 0.08720998466014862, 0.0950988382101059, 0.10298769176006317, 0.11087654531002045, 0.11876539885997772, 0.126654252409935, 0.13454310595989227, 0.14243195950984955, 0.15032081305980682, 0.1582096666097641, 0.16609853506088257, 0.17398738861083984, 0.18187624216079712, 0.1897650957107544, 0.19765394926071167, 0.20554280281066895, 0.21343165636062622, 0.2213205099105835, 0.22920936346054077, 0.23709821701049805, 0.24498707056045532]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 11.0, 8.0, 9.0, 17.0, 22.0, 32.0, 31.0, 56.0, 74.0, 106.0, 129.0, 182.0, 225.0, 324.0, 579.0, 869.0, 1458.0, 2628.0, 5153.0, 11095.0, 25648.0, 66025.0, 193083.0, 409245.0, 208730.0, 71008.0, 27548.0, 11653.0, 5515.0, 2819.0, 1518.0, 897.0, 575.0, 365.0, 256.0, 171.0, 130.0, 106.0, 62.0, 45.0, 38.0, 28.0, 29.0, 17.0, 13.0, 10.0, 4.0, 3.0, 7.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.189453125, -0.18396759033203125, -0.1784820556640625, -0.17299652099609375, -0.167510986328125, -0.16202545166015625, -0.1565399169921875, -0.15105438232421875, -0.14556884765625, -0.14008331298828125, -0.1345977783203125, -0.12911224365234375, -0.123626708984375, -0.11814117431640625, -0.1126556396484375, -0.10717010498046875, -0.1016845703125, -0.09619903564453125, -0.0907135009765625, -0.08522796630859375, -0.079742431640625, -0.07425689697265625, -0.0687713623046875, -0.06328582763671875, -0.05780029296875, -0.05231475830078125, -0.0468292236328125, -0.04134368896484375, -0.035858154296875, -0.03037261962890625, -0.0248870849609375, -0.01940155029296875, -0.013916015625, -0.00843048095703125, -0.0029449462890625, 0.00254058837890625, 0.008026123046875, 0.01351165771484375, 0.0189971923828125, 0.02448272705078125, 0.02996826171875, 0.03545379638671875, 0.0409393310546875, 0.04642486572265625, 0.051910400390625, 0.05739593505859375, 0.0628814697265625, 0.06836700439453125, 0.0738525390625, 0.07933807373046875, 0.0848236083984375, 0.09030914306640625, 0.095794677734375, 0.10128021240234375, 0.1067657470703125, 0.11225128173828125, 0.11773681640625, 0.12322235107421875, 0.1287078857421875, 0.13419342041015625, 0.139678955078125, 0.14516448974609375, 0.1506500244140625, 0.15613555908203125, 0.16162109375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 9.0, 16.0, 21.0, 19.0, 39.0, 59.0, 65.0, 76.0, 103.0, 102.0, 103.0, 86.0, 89.0, 59.0, 57.0, 29.0, 12.0, 13.0, 14.0, 6.0, 8.0, 6.0, 1.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07379150390625, -0.07160377502441406, -0.06941604614257812, -0.06722831726074219, -0.06504058837890625, -0.06285285949707031, -0.060665130615234375, -0.05847740173339844, -0.0562896728515625, -0.05410194396972656, -0.051914215087890625, -0.04972648620605469, -0.04753875732421875, -0.04535102844238281, -0.043163299560546875, -0.04097557067871094, -0.038787841796875, -0.03660011291503906, -0.034412384033203125, -0.03222465515136719, -0.03003692626953125, -0.027849197387695312, -0.025661468505859375, -0.023473739624023438, -0.0212860107421875, -0.019098281860351562, -0.016910552978515625, -0.014722824096679688, -0.01253509521484375, -0.010347366333007812, -0.008159637451171875, -0.0059719085693359375, -0.0037841796875, -0.0015964508056640625, 0.000591278076171875, 0.0027790069580078125, 0.00496673583984375, 0.0071544647216796875, 0.009342193603515625, 0.011529922485351562, 0.0137176513671875, 0.015905380249023438, 0.018093109130859375, 0.020280838012695312, 0.02246856689453125, 0.024656295776367188, 0.026844024658203125, 0.029031753540039062, 0.031219482421875, 0.03340721130371094, 0.035594940185546875, 0.03778266906738281, 0.03997039794921875, 0.04215812683105469, 0.044345855712890625, 0.04653358459472656, 0.0487213134765625, 0.05090904235839844, 0.053096771240234375, 0.05528450012207031, 0.05747222900390625, 0.05965995788574219, 0.061847686767578125, 0.06403541564941406, 0.06622314453125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 9.0, 12.0, 18.0, 28.0, 30.0, 61.0, 84.0, 122.0, 228.0, 410.0, 805.0, 2125.0, 8448.0, 64309.0, 685742.0, 257273.0, 22138.0, 4105.0, 1251.0, 585.0, 313.0, 169.0, 96.0, 62.0, 39.0, 33.0, 18.0, 14.0, 10.0, 6.0, 0.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.356689453125, -0.3442878723144531, -0.33188629150390625, -0.3194847106933594, -0.3070831298828125, -0.2946815490722656, -0.28227996826171875, -0.2698783874511719, -0.257476806640625, -0.24507522583007812, -0.23267364501953125, -0.22027206420898438, -0.2078704833984375, -0.19546890258789062, -0.18306732177734375, -0.17066574096679688, -0.15826416015625, -0.14586257934570312, -0.13346099853515625, -0.12105941772460938, -0.1086578369140625, -0.09625625610351562, -0.08385467529296875, -0.07145309448242188, -0.059051513671875, -0.046649932861328125, -0.03424835205078125, -0.021846771240234375, -0.0094451904296875, 0.002956390380859375, 0.01535797119140625, 0.027759552001953125, 0.0401611328125, 0.052562713623046875, 0.06496429443359375, 0.07736587524414062, 0.0897674560546875, 0.10216903686523438, 0.11457061767578125, 0.12697219848632812, 0.139373779296875, 0.15177536010742188, 0.16417694091796875, 0.17657852172851562, 0.1889801025390625, 0.20138168334960938, 0.21378326416015625, 0.22618484497070312, 0.23858642578125, 0.2509880065917969, 0.26338958740234375, 0.2757911682128906, 0.2881927490234375, 0.3005943298339844, 0.31299591064453125, 0.3253974914550781, 0.337799072265625, 0.3502006530761719, 0.36260223388671875, 0.3750038146972656, 0.3874053955078125, 0.3998069763183594, 0.41220855712890625, 0.4246101379394531, 0.43701171875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 6.0, 8.0, 10.0, 7.0, 10.0, 23.0, 28.0, 41.0, 50.0, 38.0, 53.0, 55.0, 60.0, 72.0, 76.0, 77.0, 64.0, 75.0, 48.0, 43.0, 30.0, 32.0, 33.0, 15.0, 8.0, 13.0, 10.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2469482421875, -0.2376537322998047, -0.22835922241210938, -0.21906471252441406, -0.20977020263671875, -0.20047569274902344, -0.19118118286132812, -0.1818866729736328, -0.1725921630859375, -0.1632976531982422, -0.15400314331054688, -0.14470863342285156, -0.13541412353515625, -0.12611961364746094, -0.11682510375976562, -0.10753059387207031, -0.098236083984375, -0.08894157409667969, -0.07964706420898438, -0.07035255432128906, -0.06105804443359375, -0.05176353454589844, -0.042469024658203125, -0.03317451477050781, -0.0238800048828125, -0.014585494995117188, -0.005290985107421875, 0.0040035247802734375, 0.01329803466796875, 0.022592544555664062, 0.031887054443359375, 0.04118156433105469, 0.05047607421875, 0.05977058410644531, 0.06906509399414062, 0.07835960388183594, 0.08765411376953125, 0.09694862365722656, 0.10624313354492188, 0.11553764343261719, 0.1248321533203125, 0.1341266632080078, 0.14342117309570312, 0.15271568298339844, 0.16201019287109375, 0.17130470275878906, 0.18059921264648438, 0.1898937225341797, 0.199188232421875, 0.2084827423095703, 0.21777725219726562, 0.22707176208496094, 0.23636627197265625, 0.24566078186035156, 0.2549552917480469, 0.2642498016357422, 0.2735443115234375, 0.2828388214111328, 0.2921333312988281, 0.30142784118652344, 0.31072235107421875, 0.32001686096191406, 0.3293113708496094, 0.3386058807373047, 0.347900390625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 6.0, 8.0, 6.0, 17.0, 10.0, 23.0, 23.0, 36.0, 57.0, 76.0, 97.0, 189.0, 300.0, 536.0, 1075.0, 1975.0, 4657.0, 12494.0, 47591.0, 345682.0, 537505.0, 68983.0, 16321.0, 5626.0, 2496.0, 1201.0, 627.0, 335.0, 198.0, 117.0, 96.0, 67.0, 37.0, 21.0, 17.0, 16.0, 10.0, 9.0, 4.0, 12.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.1746826171875, -0.17009925842285156, -0.16551589965820312, -0.1609325408935547, -0.15634918212890625, -0.1517658233642578, -0.14718246459960938, -0.14259910583496094, -0.1380157470703125, -0.13343238830566406, -0.12884902954101562, -0.12426567077636719, -0.11968231201171875, -0.11509895324707031, -0.11051559448242188, -0.10593223571777344, -0.101348876953125, -0.09676551818847656, -0.09218215942382812, -0.08759880065917969, -0.08301544189453125, -0.07843208312988281, -0.07384872436523438, -0.06926536560058594, -0.0646820068359375, -0.06009864807128906, -0.055515289306640625, -0.05093193054199219, -0.04634857177734375, -0.04176521301269531, -0.037181854248046875, -0.03259849548339844, -0.02801513671875, -0.023431777954101562, -0.018848419189453125, -0.014265060424804688, -0.00968170166015625, -0.0050983428955078125, -0.000514984130859375, 0.0040683746337890625, 0.0086517333984375, 0.013235092163085938, 0.017818450927734375, 0.022401809692382812, 0.02698516845703125, 0.03156852722167969, 0.036151885986328125, 0.04073524475097656, 0.045318603515625, 0.04990196228027344, 0.054485321044921875, 0.05906867980957031, 0.06365203857421875, 0.06823539733886719, 0.07281875610351562, 0.07740211486816406, 0.0819854736328125, 0.08656883239746094, 0.09115219116210938, 0.09573554992675781, 0.10031890869140625, 0.10490226745605469, 0.10948562622070312, 0.11406898498535156, 0.11865234375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 7.0, 7.0, 5.0, 11.0, 13.0, 14.0, 13.0, 29.0, 33.0, 44.0, 55.0, 71.0, 82.0, 84.0, 82.0, 93.0, 66.0, 74.0, 50.0, 42.0, 31.0, 13.0, 26.0, 17.0, 10.0, 8.0, 10.0, 3.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.9114227294921875e-05, -4.783552139997482e-05, -4.655681550502777e-05, -4.527810961008072e-05, -4.399940371513367e-05, -4.2720697820186615e-05, -4.144199192523956e-05, -4.016328603029251e-05, -3.888458013534546e-05, -3.760587424039841e-05, -3.6327168345451355e-05, -3.50484624505043e-05, -3.376975655555725e-05, -3.24910506606102e-05, -3.121234476566315e-05, -2.9933638870716095e-05, -2.8654932975769043e-05, -2.737622708082199e-05, -2.609752118587494e-05, -2.4818815290927887e-05, -2.3540109395980835e-05, -2.2261403501033783e-05, -2.098269760608673e-05, -1.970399171113968e-05, -1.8425285816192627e-05, -1.7146579921245575e-05, -1.5867874026298523e-05, -1.4589168131351471e-05, -1.3310462236404419e-05, -1.2031756341457367e-05, -1.0753050446510315e-05, -9.474344551563263e-06, -8.195638656616211e-06, -6.916932761669159e-06, -5.638226866722107e-06, -4.359520971775055e-06, -3.080815076828003e-06, -1.802109181880951e-06, -5.234032869338989e-07, 7.553026080131531e-07, 2.034008502960205e-06, 3.312714397907257e-06, 4.591420292854309e-06, 5.870126187801361e-06, 7.148832082748413e-06, 8.427537977695465e-06, 9.706243872642517e-06, 1.0984949767589569e-05, 1.2263655662536621e-05, 1.3542361557483673e-05, 1.4821067452430725e-05, 1.6099773347377777e-05, 1.737847924232483e-05, 1.865718513727188e-05, 1.9935891032218933e-05, 2.1214596927165985e-05, 2.2493302822113037e-05, 2.377200871706009e-05, 2.505071461200714e-05, 2.6329420506954193e-05, 2.7608126401901245e-05, 2.8886832296848297e-05, 3.016553819179535e-05, 3.14442440867424e-05, 3.272294998168945e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 7.0, 9.0, 14.0, 13.0, 21.0, 27.0, 74.0, 108.0, 172.0, 354.0, 691.0, 1867.0, 6039.0, 29380.0, 381784.0, 577290.0, 39444.0, 7369.0, 2154.0, 862.0, 381.0, 206.0, 98.0, 72.0, 38.0, 28.0, 13.0, 8.0, 10.0, 5.0, 3.0, 4.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.217529296875, -0.21114540100097656, -0.20476150512695312, -0.1983776092529297, -0.19199371337890625, -0.1856098175048828, -0.17922592163085938, -0.17284202575683594, -0.1664581298828125, -0.16007423400878906, -0.15369033813476562, -0.1473064422607422, -0.14092254638671875, -0.1345386505126953, -0.12815475463867188, -0.12177085876464844, -0.115386962890625, -0.10900306701660156, -0.10261917114257812, -0.09623527526855469, -0.08985137939453125, -0.08346748352050781, -0.07708358764648438, -0.07069969177246094, -0.0643157958984375, -0.05793190002441406, -0.051548004150390625, -0.04516410827636719, -0.03878021240234375, -0.03239631652832031, -0.026012420654296875, -0.019628524780273438, -0.01324462890625, -0.0068607330322265625, -0.000476837158203125, 0.0059070587158203125, 0.01229095458984375, 0.018674850463867188, 0.025058746337890625, 0.03144264221191406, 0.0378265380859375, 0.04421043395996094, 0.050594329833984375, 0.05697822570800781, 0.06336212158203125, 0.06974601745605469, 0.07612991333007812, 0.08251380920410156, 0.088897705078125, 0.09528160095214844, 0.10166549682617188, 0.10804939270019531, 0.11443328857421875, 0.12081718444824219, 0.12720108032226562, 0.13358497619628906, 0.1399688720703125, 0.14635276794433594, 0.15273666381835938, 0.1591205596923828, 0.16550445556640625, 0.1718883514404297, 0.17827224731445312, 0.18465614318847656, 0.1910400390625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 7.0, 4.0, 4.0, 2.0, 4.0, 3.0, 11.0, 6.0, 6.0, 6.0, 16.0, 14.0, 26.0, 26.0, 26.0, 45.0, 80.0, 80.0, 105.0, 95.0, 110.0, 78.0, 59.0, 41.0, 40.0, 18.0, 27.0, 16.0, 8.0, 6.0, 10.0, 5.0, 2.0, 4.0, 3.0, 3.0, 3.0, 0.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0831298828125, -0.08046150207519531, -0.07779312133789062, -0.07512474060058594, -0.07245635986328125, -0.06978797912597656, -0.06711959838867188, -0.06445121765136719, -0.0617828369140625, -0.05911445617675781, -0.056446075439453125, -0.05377769470214844, -0.05110931396484375, -0.04844093322753906, -0.045772552490234375, -0.04310417175292969, -0.040435791015625, -0.03776741027832031, -0.035099029541015625, -0.03243064880371094, -0.02976226806640625, -0.027093887329101562, -0.024425506591796875, -0.021757125854492188, -0.0190887451171875, -0.016420364379882812, -0.013751983642578125, -0.011083602905273438, -0.00841522216796875, -0.0057468414306640625, -0.003078460693359375, -0.0004100799560546875, 0.00225830078125, 0.0049266815185546875, 0.007595062255859375, 0.010263442993164062, 0.01293182373046875, 0.015600204467773438, 0.018268585205078125, 0.020936965942382812, 0.0236053466796875, 0.026273727416992188, 0.028942108154296875, 0.03161048889160156, 0.03427886962890625, 0.03694725036621094, 0.039615631103515625, 0.04228401184082031, 0.044952392578125, 0.04762077331542969, 0.050289154052734375, 0.05295753479003906, 0.05562591552734375, 0.05829429626464844, 0.060962677001953125, 0.06363105773925781, 0.0662994384765625, 0.06896781921386719, 0.07163619995117188, 0.07430458068847656, 0.07697296142578125, 0.07964134216308594, 0.08230972290039062, 0.08497810363769531, 0.087646484375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 8.0, 3.0, 10.0, 19.0, 25.0, 53.0, 89.0, 139.0, 149.0, 151.0, 129.0, 86.0, 63.0, 31.0, 21.0, 7.0, 9.0, 4.0, 2.0, 4.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.450547218322754, -1.4065881967544556, -1.3626291751861572, -1.3186701536178589, -1.2747111320495605, -1.2307521104812622, -1.1867930889129639, -1.1428340673446655, -1.0988750457763672, -1.0549160242080688, -1.0109570026397705, -0.9669979810714722, -0.9230389595031738, -0.8790799379348755, -0.8351209163665771, -0.7911618947982788, -0.7472028136253357, -0.7032437920570374, -0.659284770488739, -0.6153257489204407, -0.5713667273521423, -0.527407705783844, -0.48344865441322327, -0.4394896328449249, -0.3955306112766266, -0.35157158970832825, -0.3076125681400299, -0.2636535167694092, -0.21969451010227203, -0.1757354885339737, -0.13177645206451416, -0.08781743049621582, -0.04385840892791748, 0.00010061636567115784, 0.044059641659259796, 0.08801867067813873, 0.13197769224643707, 0.1759367138147354, 0.21989575028419495, 0.2638547718524933, 0.3078137934207916, 0.35177281498908997, 0.3957318365573883, 0.43969088792800903, 0.4836499094963074, 0.5276089310646057, 0.571567952632904, 0.6155269742012024, 0.6594859957695007, 0.7034450173377991, 0.7474040389060974, 0.7913630604743958, 0.8353220820426941, 0.8792811036109924, 0.9232401847839355, 0.9671992063522339, 1.0111582279205322, 1.0551172494888306, 1.099076271057129, 1.1430352926254272, 1.1869943141937256, 1.230953335762024, 1.2749123573303223, 1.3188713788986206, 1.362830400466919]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 4.0, 6.0, 10.0, 14.0, 12.0, 14.0, 16.0, 22.0, 20.0, 21.0, 26.0, 29.0, 39.0, 32.0, 31.0, 39.0, 33.0, 40.0, 32.0, 44.0, 50.0, 38.0, 43.0, 41.0, 38.0, 42.0, 31.0, 33.0, 36.0, 18.0, 12.0, 20.0, 22.0, 13.0, 15.0, 12.0, 9.0, 14.0, 5.0, 6.0, 5.0, 3.0, 5.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0191164016723633, -0.9862051010131836, -0.9532938599586487, -0.9203826189041138, -0.8874713182449341, -0.8545600175857544, -0.8216487765312195, -0.7887375354766846, -0.7558262348175049, -0.7229149341583252, -0.6900036931037903, -0.6570924520492554, -0.6241811513900757, -0.591269850730896, -0.5583586096763611, -0.5254473686218262, -0.4925360679626465, -0.4596247971057892, -0.4267135262489319, -0.3938022553920746, -0.3608909845352173, -0.32797971367836, -0.2950684428215027, -0.2621571719646454, -0.22924590110778809, -0.1963346302509308, -0.1634233593940735, -0.1305120885372162, -0.09760081768035889, -0.06468954682350159, -0.03177827596664429, 0.0011329948902130127, 0.03404414653778076, 0.06695541739463806, 0.09986668825149536, 0.13277795910835266, 0.16568922996520996, 0.19860050082206726, 0.23151177167892456, 0.26442304253578186, 0.29733431339263916, 0.33024558424949646, 0.36315685510635376, 0.39606812596321106, 0.42897939682006836, 0.46189066767692566, 0.49480193853378296, 0.5277131795883179, 0.5606244802474976, 0.5935357809066772, 0.6264470219612122, 0.6593582630157471, 0.6922695636749268, 0.7251808643341064, 0.7580921053886414, 0.7910033464431763, 0.823914647102356, 0.8568259477615356, 0.8897371888160706, 0.9226484298706055, 0.9555597305297852, 0.9884710311889648, 1.0213823318481445, 1.0542935132980347, 1.0872048139572144]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 7.0, 2.0, 14.0, 7.0, 12.0, 19.0, 26.0, 47.0, 67.0, 153.0, 239.0, 531.0, 1253.0, 3712.0, 18489.0, 440281.0, 3693445.0, 28827.0, 4653.0, 1349.0, 563.0, 260.0, 135.0, 61.0, 50.0, 28.0, 20.0, 12.0, 9.0, 4.0, 7.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.494873046875, -0.4799232482910156, -0.46497344970703125, -0.4500236511230469, -0.4350738525390625, -0.4201240539550781, -0.40517425537109375, -0.3902244567871094, -0.375274658203125, -0.3603248596191406, -0.34537506103515625, -0.3304252624511719, -0.3154754638671875, -0.3005256652832031, -0.28557586669921875, -0.2706260681152344, -0.25567626953125, -0.24072647094726562, -0.22577667236328125, -0.21082687377929688, -0.1958770751953125, -0.18092727661132812, -0.16597747802734375, -0.15102767944335938, -0.136077880859375, -0.12112808227539062, -0.10617828369140625, -0.09122848510742188, -0.0762786865234375, -0.061328887939453125, -0.04637908935546875, -0.031429290771484375, -0.0164794921875, -0.001529693603515625, 0.01342010498046875, 0.028369903564453125, 0.0433197021484375, 0.058269500732421875, 0.07321929931640625, 0.08816909790039062, 0.103118896484375, 0.11806869506835938, 0.13301849365234375, 0.14796829223632812, 0.1629180908203125, 0.17786788940429688, 0.19281768798828125, 0.20776748657226562, 0.22271728515625, 0.23766708374023438, 0.25261688232421875, 0.2675666809082031, 0.2825164794921875, 0.2974662780761719, 0.31241607666015625, 0.3273658752441406, 0.342315673828125, 0.3572654724121094, 0.37221527099609375, 0.3871650695800781, 0.4021148681640625, 0.4170646667480469, 0.43201446533203125, 0.4469642639160156, 0.4619140625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 10.0, 11.0, 11.0, 12.0, 27.0, 37.0, 55.0, 52.0, 71.0, 80.0, 78.0, 86.0, 96.0, 76.0, 81.0, 57.0, 50.0, 37.0, 21.0, 16.0, 11.0, 4.0, 9.0, 9.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0693359375, -0.0672616958618164, -0.06518745422363281, -0.06311321258544922, -0.061038970947265625, -0.05896472930908203, -0.05689048767089844, -0.054816246032714844, -0.05274200439453125, -0.050667762756347656, -0.04859352111816406, -0.04651927947998047, -0.044445037841796875, -0.04237079620361328, -0.04029655456542969, -0.038222312927246094, -0.0361480712890625, -0.034073829650878906, -0.03199958801269531, -0.02992534637451172, -0.027851104736328125, -0.02577686309814453, -0.023702621459960938, -0.021628379821777344, -0.01955413818359375, -0.017479896545410156, -0.015405654907226562, -0.013331413269042969, -0.011257171630859375, -0.009182929992675781, -0.0071086883544921875, -0.005034446716308594, -0.002960205078125, -0.0008859634399414062, 0.0011882781982421875, 0.0032625198364257812, 0.005336761474609375, 0.007411003112792969, 0.009485244750976562, 0.011559486389160156, 0.01363372802734375, 0.015707969665527344, 0.017782211303710938, 0.01985645294189453, 0.021930694580078125, 0.02400493621826172, 0.026079177856445312, 0.028153419494628906, 0.0302276611328125, 0.032301902770996094, 0.03437614440917969, 0.03645038604736328, 0.038524627685546875, 0.04059886932373047, 0.04267311096191406, 0.044747352600097656, 0.04682159423828125, 0.048895835876464844, 0.05097007751464844, 0.05304431915283203, 0.055118560791015625, 0.05719280242919922, 0.05926704406738281, 0.061341285705566406, 0.06341552734375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 7.0, 8.0, 11.0, 16.0, 40.0, 64.0, 153.0, 397.0, 1304.0, 5820.0, 45254.0, 3848256.0, 275038.0, 14260.0, 2510.0, 686.0, 240.0, 97.0, 58.0, 28.0, 14.0, 7.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.409912109375, -0.3933601379394531, -0.37680816650390625, -0.3602561950683594, -0.3437042236328125, -0.3271522521972656, -0.31060028076171875, -0.2940483093261719, -0.277496337890625, -0.2609443664550781, -0.24439239501953125, -0.22784042358398438, -0.2112884521484375, -0.19473648071289062, -0.17818450927734375, -0.16163253784179688, -0.14508056640625, -0.12852859497070312, -0.11197662353515625, -0.09542465209960938, -0.0788726806640625, -0.062320709228515625, -0.04576873779296875, -0.029216766357421875, -0.012664794921875, 0.003887176513671875, 0.02043914794921875, 0.036991119384765625, 0.0535430908203125, 0.07009506225585938, 0.08664703369140625, 0.10319900512695312, 0.1197509765625, 0.13630294799804688, 0.15285491943359375, 0.16940689086914062, 0.1859588623046875, 0.20251083374023438, 0.21906280517578125, 0.23561477661132812, 0.252166748046875, 0.2687187194824219, 0.28527069091796875, 0.3018226623535156, 0.3183746337890625, 0.3349266052246094, 0.35147857666015625, 0.3680305480957031, 0.38458251953125, 0.4011344909667969, 0.41768646240234375, 0.4342384338378906, 0.4507904052734375, 0.4673423767089844, 0.48389434814453125, 0.5004463195800781, 0.516998291015625, 0.5335502624511719, 0.5501022338867188, 0.5666542053222656, 0.5832061767578125, 0.5997581481933594, 0.6163101196289062, 0.6328620910644531, 0.6494140625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 5.0, 8.0, 10.0, 14.0, 8.0, 21.0, 30.0, 32.0, 66.0, 124.0, 187.0, 609.0, 2155.0, 382.0, 169.0, 88.0, 59.0, 39.0, 18.0, 17.0, 7.0, 3.0, 4.0, 6.0, 4.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.078857421875, -0.0759744644165039, -0.07309150695800781, -0.07020854949951172, -0.06732559204101562, -0.06444263458251953, -0.06155967712402344, -0.058676719665527344, -0.05579376220703125, -0.052910804748535156, -0.05002784729003906, -0.04714488983154297, -0.044261932373046875, -0.04137897491455078, -0.03849601745605469, -0.035613059997558594, -0.0327301025390625, -0.029847145080566406, -0.026964187622070312, -0.02408123016357422, -0.021198272705078125, -0.01831531524658203, -0.015432357788085938, -0.012549400329589844, -0.00966644287109375, -0.006783485412597656, -0.0039005279541015625, -0.0010175704956054688, 0.001865386962890625, 0.004748344421386719, 0.0076313018798828125, 0.010514259338378906, 0.013397216796875, 0.016280174255371094, 0.019163131713867188, 0.02204608917236328, 0.024929046630859375, 0.02781200408935547, 0.030694961547851562, 0.033577919006347656, 0.03646087646484375, 0.039343833923339844, 0.04222679138183594, 0.04510974884033203, 0.047992706298828125, 0.05087566375732422, 0.05375862121582031, 0.056641578674316406, 0.0595245361328125, 0.062407493591308594, 0.06529045104980469, 0.06817340850830078, 0.07105636596679688, 0.07393932342529297, 0.07682228088378906, 0.07970523834228516, 0.08258819580078125, 0.08547115325927734, 0.08835411071777344, 0.09123706817626953, 0.09412002563476562, 0.09700298309326172, 0.09988594055175781, 0.1027688980102539, 0.10565185546875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 6.0, 46.0, 115.0, 291.0, 356.0, 141.0, 35.0, 12.0, 6.0, 0.0, 1.0, 2.0], "bins": [-1.8550047874450684, -1.8219696283340454, -1.788934588432312, -1.755899429321289, -1.7228642702102661, -1.6898291110992432, -1.6567940711975098, -1.6237589120864868, -1.5907237529754639, -1.557688593864441, -1.5246535539627075, -1.4916183948516846, -1.4585832357406616, -1.4255480766296387, -1.3925130367279053, -1.3594778776168823, -1.3264427185058594, -1.2934075593948364, -1.260372519493103, -1.22733736038208, -1.1943022012710571, -1.1612670421600342, -1.1282320022583008, -1.0951968431472778, -1.0621618032455444, -1.0291266441345215, -0.9960915446281433, -0.9630564451217651, -0.9300212860107422, -0.896986186504364, -0.8639510869979858, -0.8309159278869629, -0.7978808283805847, -0.7648457288742065, -0.7318105697631836, -0.6987754702568054, -0.6657403111457825, -0.6327052116394043, -0.5996700525283813, -0.5666349530220032, -0.533599853515625, -0.5005647540092468, -0.4675295948982239, -0.4344944953918457, -0.40145933628082275, -0.3684242367744446, -0.335389107465744, -0.30235397815704346, -0.2693188190460205, -0.23628368973731995, -0.20324856042861938, -0.17021344602108002, -0.13717831671237946, -0.1041431874036789, -0.07110807299613953, -0.038072943687438965, -0.005037814378738403, 0.02799731120467186, 0.06103243678808212, 0.09406755864620209, 0.12710268795490265, 0.1601378172636032, 0.19317293167114258, 0.22620806097984314, 0.2592431902885437]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 6.0, 9.0, 10.0, 8.0, 25.0, 13.0, 16.0, 19.0, 29.0, 20.0, 27.0, 46.0, 33.0, 35.0, 51.0, 46.0, 46.0, 52.0, 52.0, 57.0, 50.0, 44.0, 45.0, 31.0, 37.0, 33.0, 29.0, 20.0, 19.0, 16.0, 14.0, 11.0, 10.0, 10.0, 5.0, 3.0, 3.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2625809907913208, -0.25440624356269836, -0.24623146653175354, -0.2380567193031311, -0.22988195717334747, -0.22170719504356384, -0.2135324329137802, -0.20535767078399658, -0.19718292355537415, -0.18900816142559052, -0.18083339929580688, -0.17265865206718445, -0.16448388993740082, -0.1563091278076172, -0.14813436567783356, -0.13995960354804993, -0.1317848414182663, -0.12361007928848267, -0.11543532460927963, -0.107260562479496, -0.09908580780029297, -0.09091104567050934, -0.08273628354072571, -0.07456152141094208, -0.06638676673173904, -0.05821200832724571, -0.05003724992275238, -0.04186248779296875, -0.03368772938847542, -0.025512970983982086, -0.017338208854198456, -0.009163450449705124, -0.000988692045211792, 0.0071860672906041145, 0.015360826626420021, 0.023535586893558502, 0.031710345298051834, 0.039885103702545166, 0.048059865832328796, 0.05623462423682213, 0.06440938264131546, 0.07258414477109909, 0.08075889945030212, 0.08893366158008575, 0.09710842370986938, 0.10528317838907242, 0.11345794051885605, 0.12163269519805908, 0.1298074573278427, 0.13798221945762634, 0.14615698158740997, 0.1543317437171936, 0.16250649094581604, 0.17068125307559967, 0.1788560152053833, 0.18703077733516693, 0.19520553946495056, 0.2033803015947342, 0.21155506372451782, 0.21972981095314026, 0.2279045730829239, 0.23607933521270752, 0.24425409734249115, 0.2524288594722748, 0.2606036067008972]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 4.0, 12.0, 12.0, 11.0, 31.0, 37.0, 67.0, 126.0, 191.0, 358.0, 620.0, 1297.0, 3346.0, 9480.0, 33091.0, 156531.0, 555692.0, 223254.0, 45103.0, 12038.0, 3908.0, 1608.0, 755.0, 384.0, 229.0, 145.0, 87.0, 46.0, 30.0, 26.0, 13.0, 14.0, 2.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27197265625, -0.26387977600097656, -0.2557868957519531, -0.2476940155029297, -0.23960113525390625, -0.2315082550048828, -0.22341537475585938, -0.21532249450683594, -0.2072296142578125, -0.19913673400878906, -0.19104385375976562, -0.1829509735107422, -0.17485809326171875, -0.1667652130126953, -0.15867233276367188, -0.15057945251464844, -0.142486572265625, -0.13439369201660156, -0.12630081176757812, -0.11820793151855469, -0.11011505126953125, -0.10202217102050781, -0.09392929077148438, -0.08583641052246094, -0.0777435302734375, -0.06965065002441406, -0.061557769775390625, -0.05346488952636719, -0.04537200927734375, -0.03727912902832031, -0.029186248779296875, -0.021093368530273438, -0.01300048828125, -0.0049076080322265625, 0.003185272216796875, 0.011278152465820312, 0.01937103271484375, 0.027463912963867188, 0.035556793212890625, 0.04364967346191406, 0.0517425537109375, 0.05983543395996094, 0.06792831420898438, 0.07602119445800781, 0.08411407470703125, 0.09220695495605469, 0.10029983520507812, 0.10839271545410156, 0.116485595703125, 0.12457847595214844, 0.13267135620117188, 0.1407642364501953, 0.14885711669921875, 0.1569499969482422, 0.16504287719726562, 0.17313575744628906, 0.1812286376953125, 0.18932151794433594, 0.19741439819335938, 0.2055072784423828, 0.21360015869140625, 0.2216930389404297, 0.22978591918945312, 0.23787879943847656, 0.2459716796875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 4.0, 5.0, 9.0, 17.0, 14.0, 22.0, 32.0, 48.0, 56.0, 58.0, 68.0, 77.0, 67.0, 80.0, 95.0, 67.0, 73.0, 63.0, 37.0, 42.0, 23.0, 9.0, 9.0, 10.0, 8.0, 7.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.07159423828125, -0.06954240798950195, -0.0674905776977539, -0.06543874740600586, -0.06338691711425781, -0.061335086822509766, -0.05928325653076172, -0.05723142623901367, -0.055179595947265625, -0.05312776565551758, -0.05107593536376953, -0.049024105072021484, -0.04697227478027344, -0.04492044448852539, -0.042868614196777344, -0.0408167839050293, -0.03876495361328125, -0.0367131233215332, -0.034661293029785156, -0.03260946273803711, -0.030557632446289062, -0.028505802154541016, -0.02645397186279297, -0.024402141571044922, -0.022350311279296875, -0.020298480987548828, -0.01824665069580078, -0.016194820404052734, -0.014142990112304688, -0.01209115982055664, -0.010039329528808594, -0.007987499237060547, -0.0059356689453125, -0.003883838653564453, -0.0018320083618164062, 0.00021982192993164062, 0.0022716522216796875, 0.004323482513427734, 0.006375312805175781, 0.008427143096923828, 0.010478973388671875, 0.012530803680419922, 0.014582633972167969, 0.016634464263916016, 0.018686294555664062, 0.02073812484741211, 0.022789955139160156, 0.024841785430908203, 0.02689361572265625, 0.028945446014404297, 0.030997276306152344, 0.03304910659790039, 0.03510093688964844, 0.037152767181396484, 0.03920459747314453, 0.04125642776489258, 0.043308258056640625, 0.04536008834838867, 0.04741191864013672, 0.049463748931884766, 0.05151557922363281, 0.05356740951538086, 0.055619239807128906, 0.05767107009887695, 0.059722900390625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 4.0, 2.0, 0.0, 3.0, 5.0, 7.0, 6.0, 13.0, 16.0, 18.0, 29.0, 55.0, 52.0, 99.0, 155.0, 259.0, 563.0, 1263.0, 3984.0, 21539.0, 239689.0, 691469.0, 76038.0, 9291.0, 2200.0, 842.0, 395.0, 194.0, 124.0, 71.0, 50.0, 35.0, 26.0, 14.0, 17.0, 12.0, 8.0, 4.0, 3.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.305908203125, -0.2946929931640625, -0.283477783203125, -0.2722625732421875, -0.26104736328125, -0.2498321533203125, -0.238616943359375, -0.2274017333984375, -0.2161865234375, -0.2049713134765625, -0.193756103515625, -0.1825408935546875, -0.17132568359375, -0.1601104736328125, -0.148895263671875, -0.1376800537109375, -0.12646484375, -0.1152496337890625, -0.104034423828125, -0.0928192138671875, -0.08160400390625, -0.0703887939453125, -0.059173583984375, -0.0479583740234375, -0.0367431640625, -0.0255279541015625, -0.014312744140625, -0.0030975341796875, 0.00811767578125, 0.0193328857421875, 0.030548095703125, 0.0417633056640625, 0.052978515625, 0.0641937255859375, 0.075408935546875, 0.0866241455078125, 0.09783935546875, 0.1090545654296875, 0.120269775390625, 0.1314849853515625, 0.1427001953125, 0.1539154052734375, 0.165130615234375, 0.1763458251953125, 0.18756103515625, 0.1987762451171875, 0.209991455078125, 0.2212066650390625, 0.232421875, 0.2436370849609375, 0.254852294921875, 0.2660675048828125, 0.27728271484375, 0.2884979248046875, 0.299713134765625, 0.3109283447265625, 0.3221435546875, 0.3333587646484375, 0.344573974609375, 0.3557891845703125, 0.36700439453125, 0.3782196044921875, 0.389434814453125, 0.4006500244140625, 0.411865234375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 6.0, 1.0, 0.0, 4.0, 4.0, 9.0, 9.0, 11.0, 7.0, 15.0, 21.0, 17.0, 25.0, 30.0, 37.0, 30.0, 45.0, 48.0, 48.0, 51.0, 45.0, 51.0, 49.0, 42.0, 44.0, 53.0, 42.0, 45.0, 36.0, 38.0, 19.0, 23.0, 18.0, 24.0, 18.0, 15.0, 4.0, 9.0, 6.0, 3.0, 4.0, 5.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18701171875, -0.18027687072753906, -0.17354202270507812, -0.1668071746826172, -0.16007232666015625, -0.1533374786376953, -0.14660263061523438, -0.13986778259277344, -0.1331329345703125, -0.12639808654785156, -0.11966323852539062, -0.11292839050292969, -0.10619354248046875, -0.09945869445800781, -0.09272384643554688, -0.08598899841308594, -0.079254150390625, -0.07251930236816406, -0.06578445434570312, -0.05904960632324219, -0.05231475830078125, -0.04557991027832031, -0.038845062255859375, -0.03211021423339844, -0.0253753662109375, -0.018640518188476562, -0.011905670166015625, -0.0051708221435546875, 0.00156402587890625, 0.008298873901367188, 0.015033721923828125, 0.021768569946289062, 0.02850341796875, 0.03523826599121094, 0.041973114013671875, 0.04870796203613281, 0.05544281005859375, 0.06217765808105469, 0.06891250610351562, 0.07564735412597656, 0.0823822021484375, 0.08911705017089844, 0.09585189819335938, 0.10258674621582031, 0.10932159423828125, 0.11605644226074219, 0.12279129028320312, 0.12952613830566406, 0.136260986328125, 0.14299583435058594, 0.14973068237304688, 0.1564655303955078, 0.16320037841796875, 0.1699352264404297, 0.17667007446289062, 0.18340492248535156, 0.1901397705078125, 0.19687461853027344, 0.20360946655273438, 0.2103443145751953, 0.21707916259765625, 0.2238140106201172, 0.23054885864257812, 0.23728370666503906, 0.2440185546875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 3.0, 3.0, 4.0, 5.0, 13.0, 11.0, 23.0, 28.0, 47.0, 86.0, 113.0, 192.0, 351.0, 598.0, 1073.0, 2314.0, 5140.0, 13962.0, 48854.0, 276784.0, 557283.0, 102850.0, 23993.0, 8082.0, 3337.0, 1540.0, 758.0, 441.0, 259.0, 160.0, 96.0, 49.0, 30.0, 21.0, 23.0, 11.0, 10.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.11199951171875, -0.1084136962890625, -0.104827880859375, -0.1012420654296875, -0.09765625, -0.0940704345703125, -0.090484619140625, -0.0868988037109375, -0.08331298828125, -0.0797271728515625, -0.076141357421875, -0.0725555419921875, -0.0689697265625, -0.0653839111328125, -0.061798095703125, -0.0582122802734375, -0.05462646484375, -0.0510406494140625, -0.047454833984375, -0.0438690185546875, -0.040283203125, -0.0366973876953125, -0.033111572265625, -0.0295257568359375, -0.02593994140625, -0.0223541259765625, -0.018768310546875, -0.0151824951171875, -0.0115966796875, -0.0080108642578125, -0.004425048828125, -0.0008392333984375, 0.00274658203125, 0.0063323974609375, 0.009918212890625, 0.0135040283203125, 0.01708984375, 0.0206756591796875, 0.024261474609375, 0.0278472900390625, 0.03143310546875, 0.0350189208984375, 0.038604736328125, 0.0421905517578125, 0.0457763671875, 0.0493621826171875, 0.052947998046875, 0.0565338134765625, 0.06011962890625, 0.0637054443359375, 0.067291259765625, 0.0708770751953125, 0.074462890625, 0.0780487060546875, 0.081634521484375, 0.0852203369140625, 0.08880615234375, 0.0923919677734375, 0.095977783203125, 0.0995635986328125, 0.1031494140625, 0.1067352294921875, 0.110321044921875, 0.1139068603515625, 0.11749267578125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 7.0, 10.0, 17.0, 30.0, 47.0, 83.0, 108.0, 141.0, 163.0, 116.0, 101.0, 60.0, 43.0, 30.0, 23.0, 9.0, 13.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.073713302612305e-05, -5.8677978813648224e-05, -5.66188246011734e-05, -5.455967038869858e-05, -5.2500516176223755e-05, -5.044136196374893e-05, -4.838220775127411e-05, -4.6323053538799286e-05, -4.426389932632446e-05, -4.220474511384964e-05, -4.014559090137482e-05, -3.8086436688899994e-05, -3.602728247642517e-05, -3.396812826395035e-05, -3.1908974051475525e-05, -2.9849819839000702e-05, -2.779066562652588e-05, -2.5731511414051056e-05, -2.3672357201576233e-05, -2.161320298910141e-05, -1.9554048776626587e-05, -1.7494894564151764e-05, -1.543574035167694e-05, -1.3376586139202118e-05, -1.1317431926727295e-05, -9.258277714252472e-06, -7.199123501777649e-06, -5.139969289302826e-06, -3.080815076828003e-06, -1.02166086435318e-06, 1.037493348121643e-06, 3.096647560596466e-06, 5.155801773071289e-06, 7.214955985546112e-06, 9.274110198020935e-06, 1.1333264410495758e-05, 1.3392418622970581e-05, 1.5451572835445404e-05, 1.7510727047920227e-05, 1.956988126039505e-05, 2.1629035472869873e-05, 2.3688189685344696e-05, 2.574734389781952e-05, 2.7806498110294342e-05, 2.9865652322769165e-05, 3.192480653524399e-05, 3.398396074771881e-05, 3.6043114960193634e-05, 3.810226917266846e-05, 4.016142338514328e-05, 4.22205775976181e-05, 4.4279731810092926e-05, 4.633888602256775e-05, 4.839804023504257e-05, 5.0457194447517395e-05, 5.251634865999222e-05, 5.457550287246704e-05, 5.6634657084941864e-05, 5.869381129741669e-05, 6.075296550989151e-05, 6.281211972236633e-05, 6.487127393484116e-05, 6.693042814731598e-05, 6.89895823597908e-05, 7.104873657226562e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 6.0, 2.0, 3.0, 5.0, 15.0, 12.0, 24.0, 46.0, 61.0, 147.0, 304.0, 876.0, 3620.0, 32883.0, 789359.0, 207528.0, 10901.0, 1779.0, 560.0, 202.0, 92.0, 54.0, 30.0, 21.0, 7.0, 5.0, 10.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.236572265625, -0.22888565063476562, -0.22119903564453125, -0.21351242065429688, -0.2058258056640625, -0.19813919067382812, -0.19045257568359375, -0.18276596069335938, -0.175079345703125, -0.16739273071289062, -0.15970611572265625, -0.15201950073242188, -0.1443328857421875, -0.13664627075195312, -0.12895965576171875, -0.12127304077148438, -0.11358642578125, -0.10589981079101562, -0.09821319580078125, -0.09052658081054688, -0.0828399658203125, -0.07515335083007812, -0.06746673583984375, -0.059780120849609375, -0.052093505859375, -0.044406890869140625, -0.03672027587890625, -0.029033660888671875, -0.0213470458984375, -0.013660430908203125, -0.00597381591796875, 0.001712799072265625, 0.0093994140625, 0.017086029052734375, 0.02477264404296875, 0.032459259033203125, 0.0401458740234375, 0.047832489013671875, 0.05551910400390625, 0.06320571899414062, 0.070892333984375, 0.07857894897460938, 0.08626556396484375, 0.09395217895507812, 0.1016387939453125, 0.10932540893554688, 0.11701202392578125, 0.12469863891601562, 0.13238525390625, 0.14007186889648438, 0.14775848388671875, 0.15544509887695312, 0.1631317138671875, 0.17081832885742188, 0.17850494384765625, 0.18619155883789062, 0.193878173828125, 0.20156478881835938, 0.20925140380859375, 0.21693801879882812, 0.2246246337890625, 0.23231124877929688, 0.23999786376953125, 0.24768447875976562, 0.25537109375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 5.0, 6.0, 14.0, 17.0, 14.0, 34.0, 30.0, 42.0, 76.0, 86.0, 96.0, 105.0, 116.0, 90.0, 66.0, 50.0, 52.0, 27.0, 28.0, 17.0, 7.0, 10.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10528564453125, -0.10187721252441406, -0.09846878051757812, -0.09506034851074219, -0.09165191650390625, -0.08824348449707031, -0.08483505249023438, -0.08142662048339844, -0.0780181884765625, -0.07460975646972656, -0.07120132446289062, -0.06779289245605469, -0.06438446044921875, -0.06097602844238281, -0.057567596435546875, -0.05415916442871094, -0.050750732421875, -0.04734230041503906, -0.043933868408203125, -0.04052543640136719, -0.03711700439453125, -0.03370857238769531, -0.030300140380859375, -0.026891708374023438, -0.0234832763671875, -0.020074844360351562, -0.016666412353515625, -0.013257980346679688, -0.00984954833984375, -0.0064411163330078125, -0.003032684326171875, 0.0003757476806640625, 0.0037841796875, 0.0071926116943359375, 0.010601043701171875, 0.014009475708007812, 0.01741790771484375, 0.020826339721679688, 0.024234771728515625, 0.027643203735351562, 0.0310516357421875, 0.03446006774902344, 0.037868499755859375, 0.04127693176269531, 0.04468536376953125, 0.04809379577636719, 0.051502227783203125, 0.05491065979003906, 0.058319091796875, 0.06172752380371094, 0.06513595581054688, 0.06854438781738281, 0.07195281982421875, 0.07536125183105469, 0.07876968383789062, 0.08217811584472656, 0.0855865478515625, 0.08899497985839844, 0.09240341186523438, 0.09581184387207031, 0.09922027587890625, 0.10262870788574219, 0.10603713989257812, 0.10944557189941406, 0.11285400390625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 10.0, 49.0, 188.0, 385.0, 270.0, 84.0, 19.0, 8.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1447193622589111, -1.0274990797042847, -0.9102786779403687, -0.7930583953857422, -0.675838053226471, -0.5586177110671997, -0.44139742851257324, -0.324177086353302, -0.20695674419403076, -0.08973641693592072, 0.02748391032218933, 0.14470422267913818, 0.2619245648384094, 0.37914490699768066, 0.49636518955230713, 0.6135855317115784, 0.7308058738708496, 0.8480262160301208, 0.9652465581893921, 1.0824668407440186, 1.1996872425079346, 1.316907525062561, 1.4341278076171875, 1.5513482093811035, 1.66856849193573, 1.7857887744903564, 1.9030091762542725, 2.0202293395996094, 2.1374497413635254, 2.2546701431274414, 2.3718905448913574, 2.4891107082366943, 2.6063313484191895, 2.7235517501831055, 2.8407719135284424, 2.9579923152923584, 3.0752127170562744, 3.1924328804016113, 3.3096532821655273, 3.4268736839294434, 3.5440940856933594, 3.6613144874572754, 3.7785346508026123, 3.8957550525665283, 4.012975215911865, 4.130195617675781, 4.247416019439697, 4.364636421203613, 4.481856346130371, 4.599076747894287, 4.716297149658203, 4.833517074584961, 4.950737476348877, 5.067957878112793, 5.185178279876709, 5.302398681640625, 5.419619083404541, 5.536839485168457, 5.654059886932373, 5.771280288696289, 5.888500213623047, 6.005720615386963, 6.122941017150879, 6.240161418914795, 6.357381820678711]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 1.0, 7.0, 6.0, 6.0, 13.0, 14.0, 16.0, 21.0, 20.0, 19.0, 29.0, 28.0, 29.0, 36.0, 42.0, 34.0, 40.0, 58.0, 58.0, 49.0, 44.0, 42.0, 42.0, 42.0, 35.0, 38.0, 29.0, 40.0, 27.0, 22.0, 30.0, 17.0, 13.0, 7.0, 7.0, 9.0, 11.0, 4.0, 4.0, 6.0, 1.0, 2.0, 3.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.1114375591278076, -1.0776102542877197, -1.0437829494476318, -1.009955644607544, -0.976128339767456, -0.9423010349273682, -0.9084737300872803, -0.8746464252471924, -0.8408191204071045, -0.8069918155670166, -0.7731645107269287, -0.7393372058868408, -0.7055099010467529, -0.671682596206665, -0.6378552913665771, -0.6040279865264893, -0.5702007412910461, -0.5363734364509583, -0.5025461316108704, -0.46871882677078247, -0.4348915219306946, -0.4010642170906067, -0.3672369420528412, -0.3334096372127533, -0.2995823323726654, -0.2657550275325775, -0.23192772269248962, -0.19810043275356293, -0.16427312791347504, -0.13044582307338715, -0.09661853313446045, -0.06279122829437256, -0.028963923454284668, 0.004863377660512924, 0.038690678775310516, 0.07251797616481781, 0.1063452810049057, 0.1401725858449936, 0.1739998757839203, 0.20782718062400818, 0.24165448546409607, 0.27548179030418396, 0.30930909514427185, 0.34313637018203735, 0.37696367502212524, 0.41079097986221313, 0.444618284702301, 0.4784455895423889, 0.5122728943824768, 0.5461001992225647, 0.5799275040626526, 0.6137548089027405, 0.6475821137428284, 0.6814094185829163, 0.7152366638183594, 0.7490639686584473, 0.7828912734985352, 0.816718578338623, 0.8505458831787109, 0.8843731880187988, 0.9182004928588867, 0.9520277976989746, 0.9858551025390625, 1.0196824073791504, 1.0535097122192383]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 6.0, 1.0, 1.0, 5.0, 4.0, 7.0, 4.0, 4.0, 10.0, 17.0, 12.0, 25.0, 37.0, 40.0, 72.0, 115.0, 157.0, 285.0, 493.0, 860.0, 1689.0, 3745.0, 9583.0, 30725.0, 157313.0, 3653209.0, 272545.0, 42615.0, 12082.0, 4505.0, 1967.0, 944.0, 490.0, 246.0, 178.0, 99.0, 62.0, 33.0, 30.0, 20.0, 18.0, 11.0, 5.0, 9.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25048828125, -0.24280738830566406, -0.23512649536132812, -0.2274456024169922, -0.21976470947265625, -0.2120838165283203, -0.20440292358398438, -0.19672203063964844, -0.1890411376953125, -0.18136024475097656, -0.17367935180664062, -0.1659984588623047, -0.15831756591796875, -0.1506366729736328, -0.14295578002929688, -0.13527488708496094, -0.127593994140625, -0.11991310119628906, -0.11223220825195312, -0.10455131530761719, -0.09687042236328125, -0.08918952941894531, -0.08150863647460938, -0.07382774353027344, -0.0661468505859375, -0.05846595764160156, -0.050785064697265625, -0.04310417175292969, -0.03542327880859375, -0.027742385864257812, -0.020061492919921875, -0.012380599975585938, -0.00469970703125, 0.0029811859130859375, 0.010662078857421875, 0.018342971801757812, 0.02602386474609375, 0.03370475769042969, 0.041385650634765625, 0.04906654357910156, 0.0567474365234375, 0.06442832946777344, 0.07210922241210938, 0.07979011535644531, 0.08747100830078125, 0.09515190124511719, 0.10283279418945312, 0.11051368713378906, 0.118194580078125, 0.12587547302246094, 0.13355636596679688, 0.1412372589111328, 0.14891815185546875, 0.1565990447998047, 0.16427993774414062, 0.17196083068847656, 0.1796417236328125, 0.18732261657714844, 0.19500350952148438, 0.2026844024658203, 0.21036529541015625, 0.2180461883544922, 0.22572708129882812, 0.23340797424316406, 0.2410888671875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 10.0, 11.0, 8.0, 18.0, 18.0, 23.0, 40.0, 40.0, 66.0, 69.0, 57.0, 65.0, 64.0, 74.0, 70.0, 65.0, 63.0, 55.0, 48.0, 49.0, 24.0, 15.0, 12.0, 12.0, 10.0, 10.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0616455078125, -0.059771060943603516, -0.05789661407470703, -0.05602216720581055, -0.05414772033691406, -0.05227327346801758, -0.050398826599121094, -0.04852437973022461, -0.046649932861328125, -0.04477548599243164, -0.042901039123535156, -0.04102659225463867, -0.03915214538574219, -0.0372776985168457, -0.03540325164794922, -0.033528804779052734, -0.03165435791015625, -0.029779911041259766, -0.02790546417236328, -0.026031017303466797, -0.024156570434570312, -0.022282123565673828, -0.020407676696777344, -0.01853322982788086, -0.016658782958984375, -0.01478433609008789, -0.012909889221191406, -0.011035442352294922, -0.009160995483398438, -0.007286548614501953, -0.005412101745605469, -0.0035376548767089844, -0.0016632080078125, 0.00021123886108398438, 0.0020856857299804688, 0.003960132598876953, 0.0058345794677734375, 0.007709026336669922, 0.009583473205566406, 0.01145792007446289, 0.013332366943359375, 0.01520681381225586, 0.017081260681152344, 0.018955707550048828, 0.020830154418945312, 0.022704601287841797, 0.02457904815673828, 0.026453495025634766, 0.02832794189453125, 0.030202388763427734, 0.03207683563232422, 0.0339512825012207, 0.03582572937011719, 0.03770017623901367, 0.039574623107910156, 0.04144906997680664, 0.043323516845703125, 0.04519796371459961, 0.047072410583496094, 0.04894685745239258, 0.05082130432128906, 0.05269575119018555, 0.05457019805908203, 0.056444644927978516, 0.058319091796875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 6.0, 11.0, 12.0, 7.0, 16.0, 21.0, 69.0, 101.0, 185.0, 486.0, 1645.0, 7485.0, 58951.0, 3463896.0, 625782.0, 29355.0, 4460.0, 1117.0, 323.0, 152.0, 71.0, 35.0, 27.0, 21.0, 10.0, 6.0, 9.0, 6.0, 4.0, 3.0, 0.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33349609375, -0.3215217590332031, -0.30954742431640625, -0.2975730895996094, -0.2855987548828125, -0.2736244201660156, -0.26165008544921875, -0.24967575073242188, -0.237701416015625, -0.22572708129882812, -0.21375274658203125, -0.20177841186523438, -0.1898040771484375, -0.17782974243164062, -0.16585540771484375, -0.15388107299804688, -0.14190673828125, -0.12993240356445312, -0.11795806884765625, -0.10598373413085938, -0.0940093994140625, -0.08203506469726562, -0.07006072998046875, -0.058086395263671875, -0.046112060546875, -0.034137725830078125, -0.02216339111328125, -0.010189056396484375, 0.0017852783203125, 0.013759613037109375, 0.02573394775390625, 0.037708282470703125, 0.0496826171875, 0.061656951904296875, 0.07363128662109375, 0.08560562133789062, 0.0975799560546875, 0.10955429077148438, 0.12152862548828125, 0.13350296020507812, 0.145477294921875, 0.15745162963867188, 0.16942596435546875, 0.18140029907226562, 0.1933746337890625, 0.20534896850585938, 0.21732330322265625, 0.22929763793945312, 0.24127197265625, 0.2532463073730469, 0.26522064208984375, 0.2771949768066406, 0.2891693115234375, 0.3011436462402344, 0.31311798095703125, 0.3250923156738281, 0.337066650390625, 0.3490409851074219, 0.36101531982421875, 0.3729896545410156, 0.3849639892578125, 0.3969383239746094, 0.40891265869140625, 0.4208869934082031, 0.432861328125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 9.0, 12.0, 14.0, 20.0, 34.0, 44.0, 61.0, 124.0, 184.0, 441.0, 1699.0, 745.0, 279.0, 158.0, 77.0, 51.0, 37.0, 18.0, 14.0, 9.0, 10.0, 8.0, 10.0, 6.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.1416015625, -0.13812732696533203, -0.13465309143066406, -0.1311788558959961, -0.12770462036132812, -0.12423038482666016, -0.12075614929199219, -0.11728191375732422, -0.11380767822265625, -0.11033344268798828, -0.10685920715332031, -0.10338497161865234, -0.09991073608398438, -0.0964365005493164, -0.09296226501464844, -0.08948802947998047, -0.0860137939453125, -0.08253955841064453, -0.07906532287597656, -0.0755910873413086, -0.07211685180664062, -0.06864261627197266, -0.06516838073730469, -0.06169414520263672, -0.05821990966796875, -0.05474567413330078, -0.05127143859863281, -0.047797203063964844, -0.044322967529296875, -0.040848731994628906, -0.03737449645996094, -0.03390026092529297, -0.030426025390625, -0.02695178985595703, -0.023477554321289062, -0.020003318786621094, -0.016529083251953125, -0.013054847717285156, -0.009580612182617188, -0.006106376647949219, -0.00263214111328125, 0.0008420944213867188, 0.0043163299560546875, 0.007790565490722656, 0.011264801025390625, 0.014739036560058594, 0.018213272094726562, 0.02168750762939453, 0.0251617431640625, 0.02863597869873047, 0.03211021423339844, 0.035584449768066406, 0.039058685302734375, 0.042532920837402344, 0.04600715637207031, 0.04948139190673828, 0.05295562744140625, 0.05642986297607422, 0.05990409851074219, 0.06337833404541016, 0.06685256958007812, 0.0703268051147461, 0.07380104064941406, 0.07727527618408203, 0.08074951171875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 8.0, 17.0, 44.0, 64.0, 101.0, 151.0, 154.0, 160.0, 132.0, 83.0, 44.0, 21.0, 11.0, 5.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.9112545847892761, -0.8900306224822998, -0.8688066601753235, -0.8475827574729919, -0.8263587951660156, -0.8051348328590393, -0.783910870552063, -0.7626869678497314, -0.7414630055427551, -0.7202390432357788, -0.6990150809288025, -0.677791178226471, -0.6565672159194946, -0.6353432536125183, -0.614119291305542, -0.5928953886032104, -0.5716713666915894, -0.550447404384613, -0.5292234420776367, -0.5079995393753052, -0.48677557706832886, -0.46555161476135254, -0.4443276524543762, -0.4231037199497223, -0.40187978744506836, -0.38065582513809204, -0.3594318926334381, -0.3382079303264618, -0.31698399782180786, -0.29576003551483154, -0.2745360732078552, -0.2533121407032013, -0.23208820819854736, -0.21086426079273224, -0.18964031338691711, -0.1684163510799408, -0.14719241857528687, -0.12596845626831055, -0.10474450886249542, -0.0835205614566803, -0.06229661405086517, -0.04107266664505005, -0.019848715513944626, 0.0013752356171607971, 0.02259918302297592, 0.043823130428791046, 0.06504708528518677, 0.08627103269100189, 0.10749498009681702, 0.12871892750263214, 0.14994287490844727, 0.17116683721542358, 0.19239076972007751, 0.21361473202705383, 0.23483867943286896, 0.2560626268386841, 0.2772865891456604, 0.2985105514526367, 0.31973448395729065, 0.34095844626426697, 0.3621823787689209, 0.3834063410758972, 0.40463030338287354, 0.42585423588752747, 0.4470781683921814]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 3.0, 11.0, 6.0, 6.0, 14.0, 10.0, 13.0, 14.0, 26.0, 29.0, 25.0, 41.0, 19.0, 27.0, 47.0, 32.0, 45.0, 45.0, 52.0, 41.0, 47.0, 51.0, 29.0, 53.0, 33.0, 35.0, 36.0, 31.0, 27.0, 19.0, 24.0, 25.0, 27.0, 11.0, 11.0, 7.0, 8.0, 5.0, 4.0, 2.0, 2.0, 5.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27719610929489136, -0.26700854301452637, -0.25682100653648376, -0.24663344025611877, -0.23644588887691498, -0.22625833749771118, -0.21607078611850739, -0.2058832347393036, -0.1956956684589386, -0.1855081170797348, -0.175320565700531, -0.16513299942016602, -0.15494544804096222, -0.14475789666175842, -0.13457034528255463, -0.12438278645277023, -0.11419524252414703, -0.10400769114494324, -0.09382013231515884, -0.08363258093595505, -0.07344502210617065, -0.06325747072696686, -0.05306991934776306, -0.04288236051797867, -0.03269480913877487, -0.022507254034280777, -0.012319700792431831, -0.0021321475505828857, 0.008055407553911209, 0.018242962658405304, 0.0284305140376091, 0.038618072867393494, 0.04880562424659729, 0.058993179351091385, 0.06918073445558548, 0.07936828583478928, 0.08955584466457367, 0.09974339604377747, 0.10993094742298126, 0.12011850625276566, 0.13030606508255005, 0.14049361646175385, 0.15068116784095764, 0.16086873412132263, 0.17105628550052643, 0.18124383687973022, 0.19143138825893402, 0.20161893963813782, 0.2118064910173416, 0.2219940423965454, 0.2321815937757492, 0.242369145154953, 0.252556711435318, 0.2627442479133606, 0.2729318141937256, 0.2831193804740906, 0.2933069169521332, 0.30349448323249817, 0.31368201971054077, 0.32386958599090576, 0.33405712246894836, 0.34424468874931335, 0.35443222522735596, 0.36461979150772095, 0.37480735778808594]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 6.0, 14.0, 8.0, 11.0, 15.0, 28.0, 45.0, 71.0, 141.0, 236.0, 436.0, 850.0, 1739.0, 4264.0, 11946.0, 40904.0, 163083.0, 580005.0, 179512.0, 44124.0, 12952.0, 4453.0, 1820.0, 865.0, 461.0, 227.0, 126.0, 74.0, 48.0, 31.0, 19.0, 14.0, 15.0, 6.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2890625, -0.28069114685058594, -0.2723197937011719, -0.2639484405517578, -0.25557708740234375, -0.2472057342529297, -0.23883438110351562, -0.23046302795410156, -0.2220916748046875, -0.21372032165527344, -0.20534896850585938, -0.1969776153564453, -0.18860626220703125, -0.1802349090576172, -0.17186355590820312, -0.16349220275878906, -0.155120849609375, -0.14674949645996094, -0.13837814331054688, -0.1300067901611328, -0.12163543701171875, -0.11326408386230469, -0.10489273071289062, -0.09652137756347656, -0.0881500244140625, -0.07977867126464844, -0.07140731811523438, -0.06303596496582031, -0.05466461181640625, -0.04629325866699219, -0.037921905517578125, -0.029550552368164062, -0.02117919921875, -0.012807846069335938, -0.004436492919921875, 0.0039348602294921875, 0.01230621337890625, 0.020677566528320312, 0.029048919677734375, 0.03742027282714844, 0.0457916259765625, 0.05416297912597656, 0.06253433227539062, 0.07090568542480469, 0.07927703857421875, 0.08764839172363281, 0.09601974487304688, 0.10439109802246094, 0.112762451171875, 0.12113380432128906, 0.12950515747070312, 0.1378765106201172, 0.14624786376953125, 0.1546192169189453, 0.16299057006835938, 0.17136192321777344, 0.1797332763671875, 0.18810462951660156, 0.19647598266601562, 0.2048473358154297, 0.21321868896484375, 0.2215900421142578, 0.22996139526367188, 0.23833274841308594, 0.2467041015625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 4.0, 6.0, 5.0, 17.0, 20.0, 16.0, 32.0, 46.0, 39.0, 55.0, 66.0, 75.0, 83.0, 65.0, 73.0, 71.0, 66.0, 70.0, 56.0, 37.0, 21.0, 26.0, 21.0, 8.0, 11.0, 4.0, 7.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.058685302734375, -0.05675458908081055, -0.054823875427246094, -0.05289316177368164, -0.05096244812011719, -0.049031734466552734, -0.04710102081298828, -0.04517030715942383, -0.043239593505859375, -0.04130887985229492, -0.03937816619873047, -0.037447452545166016, -0.03551673889160156, -0.03358602523803711, -0.031655311584472656, -0.029724597930908203, -0.02779388427734375, -0.025863170623779297, -0.023932456970214844, -0.02200174331665039, -0.020071029663085938, -0.018140316009521484, -0.01620960235595703, -0.014278888702392578, -0.012348175048828125, -0.010417461395263672, -0.008486747741699219, -0.006556034088134766, -0.0046253204345703125, -0.0026946067810058594, -0.0007638931274414062, 0.0011668205261230469, 0.0030975341796875, 0.005028247833251953, 0.006958961486816406, 0.00888967514038086, 0.010820388793945312, 0.012751102447509766, 0.014681816101074219, 0.016612529754638672, 0.018543243408203125, 0.020473957061767578, 0.02240467071533203, 0.024335384368896484, 0.026266098022460938, 0.02819681167602539, 0.030127525329589844, 0.0320582389831543, 0.03398895263671875, 0.0359196662902832, 0.037850379943847656, 0.03978109359741211, 0.04171180725097656, 0.043642520904541016, 0.04557323455810547, 0.04750394821166992, 0.049434661865234375, 0.05136537551879883, 0.05329608917236328, 0.055226802825927734, 0.05715751647949219, 0.05908823013305664, 0.061018943786621094, 0.06294965744018555, 0.06488037109375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 5.0, 5.0, 10.0, 17.0, 24.0, 33.0, 41.0, 68.0, 108.0, 166.0, 332.0, 702.0, 1580.0, 4837.0, 22859.0, 173923.0, 720651.0, 101464.0, 15456.0, 3722.0, 1265.0, 533.0, 290.0, 182.0, 103.0, 57.0, 42.0, 25.0, 12.0, 7.0, 13.0, 7.0, 6.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.378173828125, -0.36748504638671875, -0.3567962646484375, -0.34610748291015625, -0.335418701171875, -0.32472991943359375, -0.3140411376953125, -0.30335235595703125, -0.29266357421875, -0.28197479248046875, -0.2712860107421875, -0.26059722900390625, -0.249908447265625, -0.23921966552734375, -0.2285308837890625, -0.21784210205078125, -0.2071533203125, -0.19646453857421875, -0.1857757568359375, -0.17508697509765625, -0.164398193359375, -0.15370941162109375, -0.1430206298828125, -0.13233184814453125, -0.12164306640625, -0.11095428466796875, -0.1002655029296875, -0.08957672119140625, -0.078887939453125, -0.06819915771484375, -0.0575103759765625, -0.04682159423828125, -0.0361328125, -0.02544403076171875, -0.0147552490234375, -0.00406646728515625, 0.006622314453125, 0.01731109619140625, 0.0279998779296875, 0.03868865966796875, 0.04937744140625, 0.06006622314453125, 0.0707550048828125, 0.08144378662109375, 0.092132568359375, 0.10282135009765625, 0.1135101318359375, 0.12419891357421875, 0.1348876953125, 0.14557647705078125, 0.1562652587890625, 0.16695404052734375, 0.177642822265625, 0.18833160400390625, 0.1990203857421875, 0.20970916748046875, 0.22039794921875, 0.23108673095703125, 0.2417755126953125, 0.25246429443359375, 0.263153076171875, 0.27384185791015625, 0.2845306396484375, 0.29521942138671875, 0.305908203125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 8.0, 8.0, 8.0, 7.0, 12.0, 18.0, 22.0, 26.0, 25.0, 30.0, 29.0, 42.0, 45.0, 45.0, 46.0, 50.0, 66.0, 65.0, 54.0, 53.0, 55.0, 45.0, 39.0, 30.0, 30.0, 25.0, 28.0, 17.0, 22.0, 12.0, 11.0, 11.0, 7.0, 5.0, 1.0, 6.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2491455078125, -0.24191856384277344, -0.23469161987304688, -0.2274646759033203, -0.22023773193359375, -0.2130107879638672, -0.20578384399414062, -0.19855690002441406, -0.1913299560546875, -0.18410301208496094, -0.17687606811523438, -0.1696491241455078, -0.16242218017578125, -0.1551952362060547, -0.14796829223632812, -0.14074134826660156, -0.133514404296875, -0.12628746032714844, -0.11906051635742188, -0.11183357238769531, -0.10460662841796875, -0.09737968444824219, -0.09015274047851562, -0.08292579650878906, -0.0756988525390625, -0.06847190856933594, -0.061244964599609375, -0.05401802062988281, -0.04679107666015625, -0.03956413269042969, -0.032337188720703125, -0.025110244750976562, -0.01788330078125, -0.010656356811523438, -0.003429412841796875, 0.0037975311279296875, 0.01102447509765625, 0.018251419067382812, 0.025478363037109375, 0.03270530700683594, 0.0399322509765625, 0.04715919494628906, 0.054386138916015625, 0.06161308288574219, 0.06884002685546875, 0.07606697082519531, 0.08329391479492188, 0.09052085876464844, 0.097747802734375, 0.10497474670410156, 0.11220169067382812, 0.11942863464355469, 0.12665557861328125, 0.1338825225830078, 0.14110946655273438, 0.14833641052246094, 0.1555633544921875, 0.16279029846191406, 0.17001724243164062, 0.1772441864013672, 0.18447113037109375, 0.1916980743408203, 0.19892501831054688, 0.20615196228027344, 0.21337890625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 1.0, 1.0, 5.0, 8.0, 10.0, 5.0, 16.0, 12.0, 33.0, 45.0, 65.0, 120.0, 224.0, 364.0, 616.0, 1260.0, 2518.0, 6015.0, 17809.0, 83403.0, 744466.0, 152019.0, 25216.0, 7768.0, 3122.0, 1580.0, 783.0, 430.0, 232.0, 138.0, 87.0, 59.0, 35.0, 23.0, 22.0, 12.0, 7.0, 7.0, 4.0, 1.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.2413330078125, -0.23393821716308594, -0.22654342651367188, -0.2191486358642578, -0.21175384521484375, -0.2043590545654297, -0.19696426391601562, -0.18956947326660156, -0.1821746826171875, -0.17477989196777344, -0.16738510131835938, -0.1599903106689453, -0.15259552001953125, -0.1452007293701172, -0.13780593872070312, -0.13041114807128906, -0.123016357421875, -0.11562156677246094, -0.10822677612304688, -0.10083198547363281, -0.09343719482421875, -0.08604240417480469, -0.07864761352539062, -0.07125282287597656, -0.0638580322265625, -0.05646324157714844, -0.049068450927734375, -0.04167366027832031, -0.03427886962890625, -0.026884078979492188, -0.019489288330078125, -0.012094497680664062, -0.00469970703125, 0.0026950836181640625, 0.010089874267578125, 0.017484664916992188, 0.02487945556640625, 0.03227424621582031, 0.039669036865234375, 0.04706382751464844, 0.0544586181640625, 0.06185340881347656, 0.06924819946289062, 0.07664299011230469, 0.08403778076171875, 0.09143257141113281, 0.09882736206054688, 0.10622215270996094, 0.113616943359375, 0.12101173400878906, 0.12840652465820312, 0.1358013153076172, 0.14319610595703125, 0.1505908966064453, 0.15798568725585938, 0.16538047790527344, 0.1727752685546875, 0.18017005920410156, 0.18756484985351562, 0.1949596405029297, 0.20235443115234375, 0.2097492218017578, 0.21714401245117188, 0.22453880310058594, 0.23193359375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 11.0, 7.0, 8.0, 15.0, 21.0, 28.0, 29.0, 56.0, 63.0, 104.0, 87.0, 106.0, 120.0, 102.0, 70.0, 46.0, 46.0, 24.0, 19.0, 15.0, 9.0, 7.0, 1.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3451786041259766e-05, -4.1754916310310364e-05, -4.005804657936096e-05, -3.836117684841156e-05, -3.666430711746216e-05, -3.4967437386512756e-05, -3.3270567655563354e-05, -3.157369792461395e-05, -2.987682819366455e-05, -2.817995846271515e-05, -2.6483088731765747e-05, -2.4786219000816345e-05, -2.3089349269866943e-05, -2.139247953891754e-05, -1.969560980796814e-05, -1.7998740077018738e-05, -1.6301870346069336e-05, -1.4605000615119934e-05, -1.2908130884170532e-05, -1.121126115322113e-05, -9.514391422271729e-06, -7.817521691322327e-06, -6.120651960372925e-06, -4.423782229423523e-06, -2.726912498474121e-06, -1.0300427675247192e-06, 6.668269634246826e-07, 2.3636966943740845e-06, 4.060566425323486e-06, 5.757436156272888e-06, 7.45430588722229e-06, 9.151175618171692e-06, 1.0848045349121094e-05, 1.2544915080070496e-05, 1.4241784811019897e-05, 1.59386545419693e-05, 1.76355242729187e-05, 1.9332394003868103e-05, 2.1029263734817505e-05, 2.2726133465766907e-05, 2.442300319671631e-05, 2.611987292766571e-05, 2.7816742658615112e-05, 2.9513612389564514e-05, 3.1210482120513916e-05, 3.290735185146332e-05, 3.460422158241272e-05, 3.630109131336212e-05, 3.7997961044311523e-05, 3.9694830775260925e-05, 4.139170050621033e-05, 4.308857023715973e-05, 4.478543996810913e-05, 4.648230969905853e-05, 4.8179179430007935e-05, 4.9876049160957336e-05, 5.157291889190674e-05, 5.326978862285614e-05, 5.496665835380554e-05, 5.6663528084754944e-05, 5.8360397815704346e-05, 6.005726754665375e-05, 6.175413727760315e-05, 6.345100700855255e-05, 6.514787673950195e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 10.0, 12.0, 19.0, 31.0, 53.0, 101.0, 222.0, 491.0, 1307.0, 5123.0, 46469.0, 931137.0, 55520.0, 5735.0, 1356.0, 493.0, 233.0, 114.0, 54.0, 30.0, 12.0, 16.0, 7.0, 0.0, 5.0, 0.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.45703125, -0.442535400390625, -0.42803955078125, -0.413543701171875, -0.3990478515625, -0.384552001953125, -0.37005615234375, -0.355560302734375, -0.341064453125, -0.326568603515625, -0.31207275390625, -0.297576904296875, -0.2830810546875, -0.268585205078125, -0.25408935546875, -0.239593505859375, -0.22509765625, -0.210601806640625, -0.19610595703125, -0.181610107421875, -0.1671142578125, -0.152618408203125, -0.13812255859375, -0.123626708984375, -0.109130859375, -0.094635009765625, -0.08013916015625, -0.065643310546875, -0.0511474609375, -0.036651611328125, -0.02215576171875, -0.007659912109375, 0.0068359375, 0.021331787109375, 0.03582763671875, 0.050323486328125, 0.0648193359375, 0.079315185546875, 0.09381103515625, 0.108306884765625, 0.122802734375, 0.137298583984375, 0.15179443359375, 0.166290283203125, 0.1807861328125, 0.195281982421875, 0.20977783203125, 0.224273681640625, 0.23876953125, 0.253265380859375, 0.26776123046875, 0.282257080078125, 0.2967529296875, 0.311248779296875, 0.32574462890625, 0.340240478515625, 0.354736328125, 0.369232177734375, 0.38372802734375, 0.398223876953125, 0.4127197265625, 0.427215576171875, 0.44171142578125, 0.456207275390625, 0.470703125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 6.0, 5.0, 9.0, 7.0, 16.0, 23.0, 33.0, 33.0, 91.0, 163.0, 224.0, 182.0, 83.0, 39.0, 29.0, 14.0, 17.0, 7.0, 8.0, 7.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.23779296875, -0.23044395446777344, -0.22309494018554688, -0.2157459259033203, -0.20839691162109375, -0.2010478973388672, -0.19369888305664062, -0.18634986877441406, -0.1790008544921875, -0.17165184020996094, -0.16430282592773438, -0.1569538116455078, -0.14960479736328125, -0.1422557830810547, -0.13490676879882812, -0.12755775451660156, -0.120208740234375, -0.11285972595214844, -0.10551071166992188, -0.09816169738769531, -0.09081268310546875, -0.08346366882324219, -0.07611465454101562, -0.06876564025878906, -0.0614166259765625, -0.05406761169433594, -0.046718597412109375, -0.03936958312988281, -0.03202056884765625, -0.024671554565429688, -0.017322540283203125, -0.009973526000976562, -0.00262451171875, 0.0047245025634765625, 0.012073516845703125, 0.019422531127929688, 0.02677154541015625, 0.03412055969238281, 0.041469573974609375, 0.04881858825683594, 0.0561676025390625, 0.06351661682128906, 0.07086563110351562, 0.07821464538574219, 0.08556365966796875, 0.09291267395019531, 0.10026168823242188, 0.10761070251464844, 0.114959716796875, 0.12230873107910156, 0.12965774536132812, 0.1370067596435547, 0.14435577392578125, 0.1517047882080078, 0.15905380249023438, 0.16640281677246094, 0.1737518310546875, 0.18110084533691406, 0.18844985961914062, 0.1957988739013672, 0.20314788818359375, 0.2104969024658203, 0.21784591674804688, 0.22519493103027344, 0.2325439453125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 15.0, 70.0, 262.0, 377.0, 207.0, 54.0, 15.0, 4.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4786880016326904, -1.3231526613235474, -1.1676174402236938, -1.0120820999145508, -0.8565468192100525, -0.7010115385055542, -0.5454761981964111, -0.3899409770965576, -0.23440563678741455, -0.07887034118175507, 0.07666495442390442, 0.2322002649307251, 0.3877355456352234, 0.5432708263397217, 0.6988061666488647, 0.8543413877487183, 1.0098767280578613, 1.1654120683670044, 1.320947289466858, 1.476482629776001, 1.6320178508758545, 1.7875531911849976, 1.9430885314941406, 2.098623752593994, 2.2541589736938477, 2.409694194793701, 2.565229654312134, 2.7207648754119873, 2.876300096511841, 3.0318355560302734, 3.187370777130127, 3.3429059982299805, 3.498441219329834, 3.6539764404296875, 3.80951189994812, 3.9650471210479736, 4.120582580566406, 4.27611780166626, 4.431653022766113, 4.587188243865967, 4.74272346496582, 4.898258686065674, 5.053793907165527, 5.209329605102539, 5.364864826202393, 5.520400047302246, 5.6759352684021, 5.831470489501953, 5.987006187438965, 6.142541408538818, 6.298076629638672, 6.453612327575684, 6.609147548675537, 6.764682769775391, 6.920217990875244, 7.075753211975098, 7.231288433074951, 7.386823654174805, 7.542358875274658, 7.697894096374512, 7.853429794311523, 8.008964538574219, 8.16450023651123, 8.320035934448242, 8.475570678710938]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 6.0, 2.0, 4.0, 6.0, 3.0, 9.0, 8.0, 12.0, 11.0, 14.0, 24.0, 19.0, 22.0, 24.0, 13.0, 21.0, 20.0, 37.0, 26.0, 41.0, 35.0, 37.0, 48.0, 41.0, 38.0, 40.0, 35.0, 42.0, 41.0, 42.0, 23.0, 26.0, 21.0, 31.0, 29.0, 34.0, 8.0, 18.0, 11.0, 15.0, 15.0, 9.0, 11.0, 6.0, 9.0, 6.0, 5.0, 3.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.0830885171890259, -1.0505239963531494, -1.0179593563079834, -0.9853948354721069, -0.9528303146362305, -0.920265793800354, -0.8877012133598328, -0.8551366329193115, -0.8225721120834351, -0.7900075912475586, -0.7574430108070374, -0.7248784303665161, -0.6923139095306396, -0.6597493886947632, -0.6271848082542419, -0.5946202278137207, -0.5620557069778442, -0.5294911861419678, -0.49692660570144653, -0.4643620550632477, -0.43179750442504883, -0.39923295378685, -0.3666684031486511, -0.33410385251045227, -0.3015393018722534, -0.26897475123405457, -0.2364102005958557, -0.20384564995765686, -0.171281099319458, -0.13871654868125916, -0.1061519980430603, -0.07358744740486145, -0.04102301597595215, -0.008458465337753296, 0.024106085300445557, 0.05667063593864441, 0.08923518657684326, 0.12179973721504211, 0.15436428785324097, 0.18692883849143982, 0.21949338912963867, 0.2520579397678375, 0.2846224904060364, 0.31718704104423523, 0.3497515916824341, 0.38231614232063293, 0.4148806929588318, 0.44744524359703064, 0.4800097942352295, 0.512574315071106, 0.5451388955116272, 0.5777034759521484, 0.6102679967880249, 0.6428325176239014, 0.6753970980644226, 0.7079616785049438, 0.7405261993408203, 0.7730907201766968, 0.805655300617218, 0.8382198810577393, 0.8707844018936157, 0.9033489227294922, 0.9359135031700134, 0.9684780836105347, 1.0010426044464111]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 16.0, 10.0, 19.0, 27.0, 37.0, 47.0, 89.0, 132.0, 227.0, 413.0, 744.0, 1411.0, 2945.0, 7122.0, 20595.0, 81087.0, 3133046.0, 851121.0, 65734.0, 17679.0, 6376.0, 2665.0, 1330.0, 604.0, 324.0, 177.0, 89.0, 84.0, 42.0, 39.0, 20.0, 8.0, 4.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2548828125, -0.24714279174804688, -0.23940277099609375, -0.23166275024414062, -0.2239227294921875, -0.21618270874023438, -0.20844268798828125, -0.20070266723632812, -0.192962646484375, -0.18522262573242188, -0.17748260498046875, -0.16974258422851562, -0.1620025634765625, -0.15426254272460938, -0.14652252197265625, -0.13878250122070312, -0.13104248046875, -0.12330245971679688, -0.11556243896484375, -0.10782241821289062, -0.1000823974609375, -0.09234237670898438, -0.08460235595703125, -0.07686233520507812, -0.069122314453125, -0.061382293701171875, -0.05364227294921875, -0.045902252197265625, -0.0381622314453125, -0.030422210693359375, -0.02268218994140625, -0.014942169189453125, -0.0072021484375, 0.000537872314453125, 0.00827789306640625, 0.016017913818359375, 0.0237579345703125, 0.031497955322265625, 0.03923797607421875, 0.046977996826171875, 0.054718017578125, 0.062458038330078125, 0.07019805908203125, 0.07793807983398438, 0.0856781005859375, 0.09341812133789062, 0.10115814208984375, 0.10889816284179688, 0.11663818359375, 0.12437820434570312, 0.13211822509765625, 0.13985824584960938, 0.1475982666015625, 0.15533828735351562, 0.16307830810546875, 0.17081832885742188, 0.178558349609375, 0.18629837036132812, 0.19403839111328125, 0.20177841186523438, 0.2095184326171875, 0.21725845336914062, 0.22499847412109375, 0.23273849487304688, 0.240478515625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 7.0, 3.0, 9.0, 14.0, 11.0, 24.0, 30.0, 26.0, 25.0, 42.0, 61.0, 64.0, 65.0, 65.0, 59.0, 56.0, 52.0, 65.0, 75.0, 38.0, 42.0, 41.0, 41.0, 23.0, 16.0, 10.0, 11.0, 4.0, 7.0, 7.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0625, -0.06059408187866211, -0.05868816375732422, -0.05678224563598633, -0.05487632751464844, -0.05297040939331055, -0.051064491271972656, -0.049158573150634766, -0.047252655029296875, -0.045346736907958984, -0.043440818786621094, -0.0415349006652832, -0.03962898254394531, -0.03772306442260742, -0.03581714630126953, -0.03391122817993164, -0.03200531005859375, -0.03009939193725586, -0.02819347381591797, -0.026287555694580078, -0.024381637573242188, -0.022475719451904297, -0.020569801330566406, -0.018663883209228516, -0.016757965087890625, -0.014852046966552734, -0.012946128845214844, -0.011040210723876953, -0.009134292602539062, -0.007228374481201172, -0.005322456359863281, -0.0034165382385253906, -0.0015106201171875, 0.0003952980041503906, 0.0023012161254882812, 0.004207134246826172, 0.0061130523681640625, 0.008018970489501953, 0.009924888610839844, 0.011830806732177734, 0.013736724853515625, 0.015642642974853516, 0.017548561096191406, 0.019454479217529297, 0.021360397338867188, 0.023266315460205078, 0.02517223358154297, 0.02707815170288086, 0.02898406982421875, 0.03088998794555664, 0.03279590606689453, 0.03470182418823242, 0.03660774230957031, 0.0385136604309082, 0.040419578552246094, 0.042325496673583984, 0.044231414794921875, 0.046137332916259766, 0.048043251037597656, 0.04994916915893555, 0.05185508728027344, 0.05376100540161133, 0.05566692352294922, 0.05757284164428711, 0.059478759765625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 8.0, 3.0, 7.0, 9.0, 18.0, 15.0, 36.0, 60.0, 85.0, 186.0, 353.0, 669.0, 1488.0, 3589.0, 9920.0, 34471.0, 219669.0, 3698399.0, 178694.0, 30853.0, 9491.0, 3480.0, 1394.0, 652.0, 340.0, 159.0, 97.0, 52.0, 32.0, 21.0, 20.0, 12.0, 3.0, 6.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36181640625, -0.3510017395019531, -0.34018707275390625, -0.3293724060058594, -0.3185577392578125, -0.3077430725097656, -0.29692840576171875, -0.2861137390136719, -0.275299072265625, -0.2644844055175781, -0.25366973876953125, -0.24285507202148438, -0.2320404052734375, -0.22122573852539062, -0.21041107177734375, -0.19959640502929688, -0.18878173828125, -0.17796707153320312, -0.16715240478515625, -0.15633773803710938, -0.1455230712890625, -0.13470840454101562, -0.12389373779296875, -0.11307907104492188, -0.102264404296875, -0.09144973754882812, -0.08063507080078125, -0.06982040405273438, -0.0590057373046875, -0.048191070556640625, -0.03737640380859375, -0.026561737060546875, -0.0157470703125, -0.004932403564453125, 0.00588226318359375, 0.016696929931640625, 0.0275115966796875, 0.038326263427734375, 0.04914093017578125, 0.059955596923828125, 0.070770263671875, 0.08158493041992188, 0.09239959716796875, 0.10321426391601562, 0.1140289306640625, 0.12484359741210938, 0.13565826416015625, 0.14647293090820312, 0.15728759765625, 0.16810226440429688, 0.17891693115234375, 0.18973159790039062, 0.2005462646484375, 0.21136093139648438, 0.22217559814453125, 0.23299026489257812, 0.243804931640625, 0.2546195983886719, 0.26543426513671875, 0.2762489318847656, 0.2870635986328125, 0.2978782653808594, 0.30869293212890625, 0.3195075988769531, 0.330322265625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 6.0, 6.0, 4.0, 14.0, 6.0, 16.0, 18.0, 31.0, 56.0, 82.0, 128.0, 301.0, 1533.0, 1168.0, 290.0, 141.0, 82.0, 43.0, 36.0, 23.0, 21.0, 21.0, 11.0, 15.0, 10.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1251220703125, -0.12143707275390625, -0.1177520751953125, -0.11406707763671875, -0.110382080078125, -0.10669708251953125, -0.1030120849609375, -0.09932708740234375, -0.09564208984375, -0.09195709228515625, -0.0882720947265625, -0.08458709716796875, -0.080902099609375, -0.07721710205078125, -0.0735321044921875, -0.06984710693359375, -0.066162109375, -0.06247711181640625, -0.0587921142578125, -0.05510711669921875, -0.051422119140625, -0.04773712158203125, -0.0440521240234375, -0.04036712646484375, -0.03668212890625, -0.03299713134765625, -0.0293121337890625, -0.02562713623046875, -0.021942138671875, -0.01825714111328125, -0.0145721435546875, -0.01088714599609375, -0.0072021484375, -0.00351715087890625, 0.0001678466796875, 0.00385284423828125, 0.007537841796875, 0.01122283935546875, 0.0149078369140625, 0.01859283447265625, 0.02227783203125, 0.02596282958984375, 0.0296478271484375, 0.03333282470703125, 0.037017822265625, 0.04070281982421875, 0.0443878173828125, 0.04807281494140625, 0.0517578125, 0.05544281005859375, 0.0591278076171875, 0.06281280517578125, 0.066497802734375, 0.07018280029296875, 0.0738677978515625, 0.07755279541015625, 0.08123779296875, 0.08492279052734375, 0.0886077880859375, 0.09229278564453125, 0.095977783203125, 0.09966278076171875, 0.1033477783203125, 0.10703277587890625, 0.1107177734375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 10.0, 18.0, 33.0, 85.0, 160.0, 197.0, 215.0, 144.0, 82.0, 35.0, 15.0, 8.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5483378171920776, -0.5134613513946533, -0.4785849153995514, -0.4437084496021271, -0.40883201360702515, -0.37395554780960083, -0.3390790820121765, -0.3042026162147522, -0.26932618021965027, -0.23444972932338715, -0.19957327842712402, -0.1646968126296997, -0.12982036173343658, -0.09494391083717346, -0.060067445039749146, -0.025190994143486023, 0.0096854567527771, 0.04456191137433052, 0.07943836599588394, 0.11431482434272766, 0.14919127523899078, 0.1840677261352539, 0.21894419193267822, 0.25382065773010254, 0.28869709372520447, 0.3235735595226288, 0.3584499955177307, 0.39332646131515503, 0.42820292711257935, 0.4630793631076813, 0.4979558289051056, 0.5328322649002075, 0.5677087306976318, 0.6025851964950562, 0.6374616622924805, 0.6723381280899048, 0.7072145342826843, 0.7420910000801086, 0.776967465877533, 0.8118439316749573, 0.8467203378677368, 0.8815968036651611, 0.9164732694625854, 0.9513497352600098, 0.9862261414527893, 1.0211026668548584, 1.0559790134429932, 1.0908554792404175, 1.1257319450378418, 1.1606084108352661, 1.1954848766326904, 1.2303613424301147, 1.265237808227539, 1.3001141548156738, 1.3349907398223877, 1.3698670864105225, 1.4047436714172363, 1.4396201372146606, 1.474496603012085, 1.5093730688095093, 1.5442495346069336, 1.5791258811950684, 1.6140024662017822, 1.648878812789917, 1.6837552785873413]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 1.0, 3.0, 4.0, 11.0, 5.0, 9.0, 10.0, 14.0, 18.0, 26.0, 32.0, 32.0, 22.0, 34.0, 33.0, 33.0, 45.0, 47.0, 51.0, 39.0, 37.0, 47.0, 31.0, 56.0, 38.0, 40.0, 39.0, 34.0, 32.0, 28.0, 22.0, 21.0, 18.0, 21.0, 11.0, 14.0, 10.0, 8.0, 5.0, 8.0, 5.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.37145864963531494, -0.3599833846092224, -0.3485080897808075, -0.33703282475471497, -0.32555752992630005, -0.3140822649002075, -0.302606999874115, -0.2911317050457001, -0.27965644001960754, -0.268181174993515, -0.2567058801651001, -0.24523061513900757, -0.23375533521175385, -0.22228005528450012, -0.2108047753572464, -0.19932949542999268, -0.18785421550273895, -0.17637893557548523, -0.1649036556482315, -0.15342837572097778, -0.14195311069488525, -0.13047783076763153, -0.11900255084037781, -0.10752727836370468, -0.09605199843645096, -0.08457671850919724, -0.07310144603252411, -0.061626166105270386, -0.05015088990330696, -0.038675613701343536, -0.027200333774089813, -0.015725061297416687, -0.004249781370162964, 0.007225495763123035, 0.018700772896409035, 0.03017605096101761, 0.04165132716298103, 0.05312660336494446, 0.06460188329219818, 0.07607715576887131, 0.08755243569612503, 0.09902771562337875, 0.11050298810005188, 0.1219782680273056, 0.13345354795455933, 0.14492881298065186, 0.15640410780906677, 0.1678793728351593, 0.17935465276241302, 0.19082993268966675, 0.20230521261692047, 0.2137804925441742, 0.22525575757026672, 0.23673103749752045, 0.24820631742477417, 0.2596815824508667, 0.2711568772792816, 0.28263214230537415, 0.29410743713378906, 0.3055827021598816, 0.3170579969882965, 0.32853326201438904, 0.34000855684280396, 0.3514838218688965, 0.362959086894989]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 10.0, 11.0, 25.0, 32.0, 40.0, 66.0, 96.0, 165.0, 260.0, 465.0, 746.0, 1374.0, 2547.0, 5176.0, 11158.0, 25411.0, 65155.0, 189160.0, 443216.0, 189920.0, 65793.0, 25719.0, 10900.0, 5176.0, 2557.0, 1403.0, 776.0, 435.0, 261.0, 180.0, 101.0, 81.0, 45.0, 40.0, 27.0, 8.0, 8.0, 8.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2462158203125, -0.23928070068359375, -0.2323455810546875, -0.22541046142578125, -0.218475341796875, -0.21154022216796875, -0.2046051025390625, -0.19766998291015625, -0.19073486328125, -0.18379974365234375, -0.1768646240234375, -0.16992950439453125, -0.162994384765625, -0.15605926513671875, -0.1491241455078125, -0.14218902587890625, -0.13525390625, -0.12831878662109375, -0.1213836669921875, -0.11444854736328125, -0.107513427734375, -0.10057830810546875, -0.0936431884765625, -0.08670806884765625, -0.07977294921875, -0.07283782958984375, -0.0659027099609375, -0.05896759033203125, -0.052032470703125, -0.04509735107421875, -0.0381622314453125, -0.03122711181640625, -0.0242919921875, -0.01735687255859375, -0.0104217529296875, -0.00348663330078125, 0.003448486328125, 0.01038360595703125, 0.0173187255859375, 0.02425384521484375, 0.03118896484375, 0.03812408447265625, 0.0450592041015625, 0.05199432373046875, 0.058929443359375, 0.06586456298828125, 0.0727996826171875, 0.07973480224609375, 0.086669921875, 0.09360504150390625, 0.1005401611328125, 0.10747528076171875, 0.114410400390625, 0.12134552001953125, 0.1282806396484375, 0.13521575927734375, 0.14215087890625, 0.14908599853515625, 0.1560211181640625, 0.16295623779296875, 0.169891357421875, 0.17682647705078125, 0.1837615966796875, 0.19069671630859375, 0.1976318359375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 5.0, 7.0, 7.0, 7.0, 8.0, 16.0, 16.0, 23.0, 21.0, 21.0, 31.0, 39.0, 58.0, 46.0, 63.0, 60.0, 59.0, 57.0, 46.0, 50.0, 49.0, 61.0, 46.0, 48.0, 31.0, 30.0, 23.0, 18.0, 11.0, 11.0, 12.0, 7.0, 7.0, 4.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.062255859375, -0.060442447662353516, -0.05862903594970703, -0.05681562423706055, -0.05500221252441406, -0.05318880081176758, -0.051375389099121094, -0.04956197738647461, -0.047748565673828125, -0.04593515396118164, -0.044121742248535156, -0.04230833053588867, -0.04049491882324219, -0.0386815071105957, -0.03686809539794922, -0.035054683685302734, -0.03324127197265625, -0.031427860260009766, -0.02961444854736328, -0.027801036834716797, -0.025987625122070312, -0.024174213409423828, -0.022360801696777344, -0.02054738998413086, -0.018733978271484375, -0.01692056655883789, -0.015107154846191406, -0.013293743133544922, -0.011480331420898438, -0.009666919708251953, -0.007853507995605469, -0.006040096282958984, -0.0042266845703125, -0.0024132728576660156, -0.0005998611450195312, 0.0012135505676269531, 0.0030269622802734375, 0.004840373992919922, 0.006653785705566406, 0.00846719741821289, 0.010280609130859375, 0.01209402084350586, 0.013907432556152344, 0.015720844268798828, 0.017534255981445312, 0.019347667694091797, 0.02116107940673828, 0.022974491119384766, 0.02478790283203125, 0.026601314544677734, 0.02841472625732422, 0.030228137969970703, 0.03204154968261719, 0.03385496139526367, 0.035668373107910156, 0.03748178482055664, 0.039295196533203125, 0.04110860824584961, 0.042922019958496094, 0.04473543167114258, 0.04654884338378906, 0.04836225509643555, 0.05017566680908203, 0.051989078521728516, 0.053802490234375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 9.0, 5.0, 24.0, 41.0, 51.0, 98.0, 196.0, 311.0, 630.0, 1662.0, 5582.0, 37622.0, 536430.0, 427184.0, 31050.0, 4848.0, 1455.0, 589.0, 317.0, 179.0, 105.0, 61.0, 35.0, 30.0, 14.0, 9.0, 10.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.59326171875, -0.5784149169921875, -0.563568115234375, -0.5487213134765625, -0.53387451171875, -0.5190277099609375, -0.504180908203125, -0.4893341064453125, -0.4744873046875, -0.4596405029296875, -0.444793701171875, -0.4299468994140625, -0.41510009765625, -0.4002532958984375, -0.385406494140625, -0.3705596923828125, -0.355712890625, -0.3408660888671875, -0.326019287109375, -0.3111724853515625, -0.29632568359375, -0.2814788818359375, -0.266632080078125, -0.2517852783203125, -0.2369384765625, -0.2220916748046875, -0.207244873046875, -0.1923980712890625, -0.17755126953125, -0.1627044677734375, -0.147857666015625, -0.1330108642578125, -0.1181640625, -0.1033172607421875, -0.088470458984375, -0.0736236572265625, -0.05877685546875, -0.0439300537109375, -0.029083251953125, -0.0142364501953125, 0.0006103515625, 0.0154571533203125, 0.030303955078125, 0.0451507568359375, 0.05999755859375, 0.0748443603515625, 0.089691162109375, 0.1045379638671875, 0.119384765625, 0.1342315673828125, 0.149078369140625, 0.1639251708984375, 0.17877197265625, 0.1936187744140625, 0.208465576171875, 0.2233123779296875, 0.2381591796875, 0.2530059814453125, 0.267852783203125, 0.2826995849609375, 0.29754638671875, 0.3123931884765625, 0.327239990234375, 0.3420867919921875, 0.35693359375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 13.0, 13.0, 18.0, 18.0, 21.0, 24.0, 33.0, 40.0, 41.0, 62.0, 53.0, 68.0, 64.0, 78.0, 73.0, 62.0, 63.0, 61.0, 36.0, 32.0, 24.0, 27.0, 22.0, 13.0, 17.0, 8.0, 1.0, 6.0, 2.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39111328125, -0.38060760498046875, -0.3701019287109375, -0.35959625244140625, -0.349090576171875, -0.33858489990234375, -0.3280792236328125, -0.31757354736328125, -0.30706787109375, -0.29656219482421875, -0.2860565185546875, -0.27555084228515625, -0.265045166015625, -0.25453948974609375, -0.2440338134765625, -0.23352813720703125, -0.2230224609375, -0.21251678466796875, -0.2020111083984375, -0.19150543212890625, -0.180999755859375, -0.17049407958984375, -0.1599884033203125, -0.14948272705078125, -0.13897705078125, -0.12847137451171875, -0.1179656982421875, -0.10746002197265625, -0.096954345703125, -0.08644866943359375, -0.0759429931640625, -0.06543731689453125, -0.054931640625, -0.04442596435546875, -0.0339202880859375, -0.02341461181640625, -0.012908935546875, -0.00240325927734375, 0.0081024169921875, 0.01860809326171875, 0.02911376953125, 0.03961944580078125, 0.0501251220703125, 0.06063079833984375, 0.071136474609375, 0.08164215087890625, 0.0921478271484375, 0.10265350341796875, 0.1131591796875, 0.12366485595703125, 0.1341705322265625, 0.14467620849609375, 0.155181884765625, 0.16568756103515625, 0.1761932373046875, 0.18669891357421875, 0.19720458984375, 0.20771026611328125, 0.2182159423828125, 0.22872161865234375, 0.239227294921875, 0.24973297119140625, 0.2602386474609375, 0.27074432373046875, 0.28125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 4.0, 12.0, 9.0, 19.0, 16.0, 27.0, 46.0, 53.0, 86.0, 157.0, 222.0, 376.0, 645.0, 1117.0, 2098.0, 4073.0, 8570.0, 20785.0, 59727.0, 255209.0, 528501.0, 108666.0, 33256.0, 12731.0, 5771.0, 2797.0, 1462.0, 790.0, 459.0, 299.0, 186.0, 125.0, 72.0, 56.0, 41.0, 26.0, 15.0, 19.0, 8.0, 10.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1690673828125, -0.16365432739257812, -0.15824127197265625, -0.15282821655273438, -0.1474151611328125, -0.14200210571289062, -0.13658905029296875, -0.13117599487304688, -0.125762939453125, -0.12034988403320312, -0.11493682861328125, -0.10952377319335938, -0.1041107177734375, -0.09869766235351562, -0.09328460693359375, -0.08787155151367188, -0.08245849609375, -0.07704544067382812, -0.07163238525390625, -0.06621932983398438, -0.0608062744140625, -0.055393218994140625, -0.04998016357421875, -0.044567108154296875, -0.039154052734375, -0.033740997314453125, -0.02832794189453125, -0.022914886474609375, -0.0175018310546875, -0.012088775634765625, -0.00667572021484375, -0.001262664794921875, 0.004150390625, 0.009563446044921875, 0.01497650146484375, 0.020389556884765625, 0.0258026123046875, 0.031215667724609375, 0.03662872314453125, 0.042041778564453125, 0.047454833984375, 0.052867889404296875, 0.05828094482421875, 0.06369400024414062, 0.0691070556640625, 0.07452011108398438, 0.07993316650390625, 0.08534622192382812, 0.09075927734375, 0.09617233276367188, 0.10158538818359375, 0.10699844360351562, 0.1124114990234375, 0.11782455444335938, 0.12323760986328125, 0.12865066528320312, 0.134063720703125, 0.13947677612304688, 0.14488983154296875, 0.15030288696289062, 0.1557159423828125, 0.16112899780273438, 0.16654205322265625, 0.17195510864257812, 0.1773681640625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 2.0, 3.0, 3.0, 4.0, 8.0, 9.0, 11.0, 14.0, 14.0, 15.0, 34.0, 27.0, 37.0, 45.0, 65.0, 89.0, 78.0, 93.0, 73.0, 81.0, 57.0, 46.0, 45.0, 38.0, 29.0, 16.0, 17.0, 8.0, 8.0, 5.0, 4.0, 8.0, 4.0, 1.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.6253204345703125e-05, -4.484318196773529e-05, -4.3433159589767456e-05, -4.202313721179962e-05, -4.061311483383179e-05, -3.920309245586395e-05, -3.779307007789612e-05, -3.6383047699928284e-05, -3.497302532196045e-05, -3.3563002943992615e-05, -3.215298056602478e-05, -3.0742958188056946e-05, -2.933293581008911e-05, -2.7922913432121277e-05, -2.6512891054153442e-05, -2.5102868676185608e-05, -2.3692846298217773e-05, -2.228282392024994e-05, -2.0872801542282104e-05, -1.946277916431427e-05, -1.8052756786346436e-05, -1.66427344083786e-05, -1.5232712030410767e-05, -1.3822689652442932e-05, -1.2412667274475098e-05, -1.1002644896507263e-05, -9.592622518539429e-06, -8.182600140571594e-06, -6.77257776260376e-06, -5.362555384635925e-06, -3.952533006668091e-06, -2.5425106287002563e-06, -1.1324882507324219e-06, 2.775341272354126e-07, 1.687556505203247e-06, 3.0975788831710815e-06, 4.507601261138916e-06, 5.9176236391067505e-06, 7.327646017074585e-06, 8.73766839504242e-06, 1.0147690773010254e-05, 1.1557713150978088e-05, 1.2967735528945923e-05, 1.4377757906913757e-05, 1.5787780284881592e-05, 1.7197802662849426e-05, 1.860782504081726e-05, 2.0017847418785095e-05, 2.142786979675293e-05, 2.2837892174720764e-05, 2.42479145526886e-05, 2.5657936930656433e-05, 2.7067959308624268e-05, 2.8477981686592102e-05, 2.9888004064559937e-05, 3.129802644252777e-05, 3.2708048820495605e-05, 3.411807119846344e-05, 3.5528093576431274e-05, 3.693811595439911e-05, 3.834813833236694e-05, 3.975816071033478e-05, 4.116818308830261e-05, 4.257820546627045e-05, 4.398822784423828e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 6.0, 10.0, 15.0, 12.0, 33.0, 45.0, 69.0, 128.0, 247.0, 538.0, 1144.0, 3510.0, 13660.0, 82022.0, 768987.0, 149718.0, 20816.0, 4770.0, 1505.0, 628.0, 300.0, 164.0, 78.0, 66.0, 39.0, 16.0, 7.0, 2.0, 5.0, 1.0, 4.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.279296875, -0.26918792724609375, -0.2590789794921875, -0.24897003173828125, -0.238861083984375, -0.22875213623046875, -0.2186431884765625, -0.20853424072265625, -0.19842529296875, -0.18831634521484375, -0.1782073974609375, -0.16809844970703125, -0.157989501953125, -0.14788055419921875, -0.1377716064453125, -0.12766265869140625, -0.1175537109375, -0.10744476318359375, -0.0973358154296875, -0.08722686767578125, -0.077117919921875, -0.06700897216796875, -0.0569000244140625, -0.04679107666015625, -0.03668212890625, -0.02657318115234375, -0.0164642333984375, -0.00635528564453125, 0.003753662109375, 0.01386260986328125, 0.0239715576171875, 0.03408050537109375, 0.044189453125, 0.05429840087890625, 0.0644073486328125, 0.07451629638671875, 0.084625244140625, 0.09473419189453125, 0.1048431396484375, 0.11495208740234375, 0.12506103515625, 0.13516998291015625, 0.1452789306640625, 0.15538787841796875, 0.165496826171875, 0.17560577392578125, 0.1857147216796875, 0.19582366943359375, 0.2059326171875, 0.21604156494140625, 0.2261505126953125, 0.23625946044921875, 0.246368408203125, 0.25647735595703125, 0.2665863037109375, 0.27669525146484375, 0.28680419921875, 0.29691314697265625, 0.3070220947265625, 0.31713104248046875, 0.327239990234375, 0.33734893798828125, 0.3474578857421875, 0.35756683349609375, 0.36767578125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 5.0, 4.0, 4.0, 5.0, 8.0, 3.0, 9.0, 13.0, 10.0, 8.0, 24.0, 10.0, 26.0, 30.0, 54.0, 66.0, 107.0, 130.0, 111.0, 79.0, 67.0, 45.0, 39.0, 26.0, 20.0, 16.0, 11.0, 14.0, 12.0, 11.0, 10.0, 5.0, 0.0, 2.0, 8.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.142822265625, -0.13818931579589844, -0.13355636596679688, -0.1289234161376953, -0.12429046630859375, -0.11965751647949219, -0.11502456665039062, -0.11039161682128906, -0.1057586669921875, -0.10112571716308594, -0.09649276733398438, -0.09185981750488281, -0.08722686767578125, -0.08259391784667969, -0.07796096801757812, -0.07332801818847656, -0.068695068359375, -0.06406211853027344, -0.059429168701171875, -0.05479621887207031, -0.05016326904296875, -0.04553031921386719, -0.040897369384765625, -0.03626441955566406, -0.0316314697265625, -0.026998519897460938, -0.022365570068359375, -0.017732620239257812, -0.01309967041015625, -0.008466720581054688, -0.003833770751953125, 0.0007991790771484375, 0.00543212890625, 0.010065078735351562, 0.014698028564453125, 0.019330978393554688, 0.02396392822265625, 0.028596878051757812, 0.033229827880859375, 0.03786277770996094, 0.0424957275390625, 0.04712867736816406, 0.051761627197265625, 0.05639457702636719, 0.06102752685546875, 0.06566047668457031, 0.07029342651367188, 0.07492637634277344, 0.079559326171875, 0.08419227600097656, 0.08882522583007812, 0.09345817565917969, 0.09809112548828125, 0.10272407531738281, 0.10735702514648438, 0.11198997497558594, 0.1166229248046875, 0.12125587463378906, 0.12588882446289062, 0.1305217742919922, 0.13515472412109375, 0.1397876739501953, 0.14442062377929688, 0.14905357360839844, 0.1536865234375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 11.0, 16.0, 19.0, 47.0, 67.0, 85.0, 139.0, 140.0, 141.0, 116.0, 93.0, 46.0, 38.0, 21.0, 8.0, 9.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.738926649093628, -1.6743013858795166, -1.6096762418746948, -1.5450509786605835, -1.4804257154464722, -1.4158005714416504, -1.351175308227539, -1.2865500450134277, -1.2219247817993164, -1.157299518585205, -1.0926743745803833, -1.028049111366272, -0.9634238481521606, -0.8987986445426941, -0.8341734409332275, -0.7695481777191162, -0.7049230337142944, -0.6402978301048279, -0.5756725668907166, -0.51104736328125, -0.44642212986946106, -0.3817968964576721, -0.31717169284820557, -0.2525464594364166, -0.18792122602462769, -0.12329600006341934, -0.058670774102211, 0.005954444408416748, 0.07057967782020569, 0.13520491123199463, 0.19983011484146118, 0.2644553482532501, 0.32908058166503906, 0.393705815076828, 0.45833104848861694, 0.5229562520980835, 0.5875815153121948, 0.6522067189216614, 0.7168319225311279, 0.7814571857452393, 0.8460823893547058, 0.9107075929641724, 0.9753328561782837, 1.0399580001831055, 1.1045832633972168, 1.1692085266113281, 1.2338337898254395, 1.2984589338302612, 1.3630841970443726, 1.4277094602584839, 1.4923346042633057, 1.556959867477417, 1.6215851306915283, 1.6862103939056396, 1.7508355379104614, 1.8154608011245728, 1.8800859451293945, 1.9447112083435059, 2.009336471557617, 2.0739617347717285, 2.1385867595672607, 2.203212022781372, 2.2678372859954834, 2.3324625492095947, 2.397087812423706]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 4.0, 3.0, 10.0, 7.0, 7.0, 10.0, 11.0, 19.0, 21.0, 21.0, 19.0, 27.0, 24.0, 49.0, 41.0, 50.0, 40.0, 56.0, 54.0, 48.0, 52.0, 44.0, 37.0, 58.0, 32.0, 49.0, 36.0, 35.0, 26.0, 23.0, 18.0, 20.0, 14.0, 6.0, 4.0, 4.0, 9.0, 5.0, 5.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.6430422067642212, -1.598127841949463, -1.5532134771347046, -1.5082991123199463, -1.4633848667144775, -1.4184705018997192, -1.373556137084961, -1.3286417722702026, -1.2837274074554443, -1.238813042640686, -1.1938986778259277, -1.1489843130111694, -1.1040699481964111, -1.0591557025909424, -1.014241337776184, -0.9693269729614258, -0.9244126081466675, -0.8794982433319092, -0.8345838785171509, -0.7896695733070374, -0.744755208492279, -0.6998408436775208, -0.6549265384674072, -0.6100121736526489, -0.5650978088378906, -0.5201834440231323, -0.4752691090106964, -0.4303547739982605, -0.3854404091835022, -0.3405260443687439, -0.295611709356308, -0.25069737434387207, -0.20578312873840332, -0.1608687788248062, -0.1159544289112091, -0.071040078997612, -0.026125729084014893, 0.018788620829582214, 0.06370297074317932, 0.10861730575561523, 0.15353167057037354, 0.19844602048397064, 0.24336037039756775, 0.28827470541000366, 0.33318907022476196, 0.37810343503952026, 0.4230177700519562, 0.4679321050643921, 0.5128464698791504, 0.5577608346939087, 0.602675199508667, 0.6475895047187805, 0.6925038695335388, 0.7374182343482971, 0.7823325395584106, 0.827246904373169, 0.8721612691879272, 0.9170756340026855, 0.9619899988174438, 1.0069043636322021, 1.051818609237671, 1.0967329740524292, 1.1416473388671875, 1.1865617036819458, 1.231476068496704]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 3.0, 9.0, 10.0, 11.0, 15.0, 23.0, 35.0, 49.0, 84.0, 128.0, 211.0, 324.0, 555.0, 1033.0, 1958.0, 4029.0, 9137.0, 25165.0, 91019.0, 2496218.0, 1437920.0, 85717.0, 23669.0, 8874.0, 3799.0, 1866.0, 978.0, 557.0, 303.0, 182.0, 125.0, 81.0, 58.0, 36.0, 31.0, 19.0, 15.0, 13.0, 5.0, 6.0, 7.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2452392578125, -0.2370586395263672, -0.22887802124023438, -0.22069740295410156, -0.21251678466796875, -0.20433616638183594, -0.19615554809570312, -0.1879749298095703, -0.1797943115234375, -0.1716136932373047, -0.16343307495117188, -0.15525245666503906, -0.14707183837890625, -0.13889122009277344, -0.13071060180664062, -0.12252998352050781, -0.114349365234375, -0.10616874694824219, -0.09798812866210938, -0.08980751037597656, -0.08162689208984375, -0.07344627380371094, -0.06526565551757812, -0.05708503723144531, -0.0489044189453125, -0.04072380065917969, -0.032543182373046875, -0.024362564086914062, -0.01618194580078125, -0.008001327514648438, 0.000179290771484375, 0.008359909057617188, 0.01654052734375, 0.024721145629882812, 0.032901763916015625, 0.04108238220214844, 0.04926300048828125, 0.05744361877441406, 0.06562423706054688, 0.07380485534667969, 0.0819854736328125, 0.09016609191894531, 0.09834671020507812, 0.10652732849121094, 0.11470794677734375, 0.12288856506347656, 0.13106918334960938, 0.1392498016357422, 0.147430419921875, 0.1556110382080078, 0.16379165649414062, 0.17197227478027344, 0.18015289306640625, 0.18833351135253906, 0.19651412963867188, 0.2046947479248047, 0.2128753662109375, 0.2210559844970703, 0.22923660278320312, 0.23741722106933594, 0.24559783935546875, 0.25377845764160156, 0.2619590759277344, 0.2701396942138672, 0.2783203125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 10.0, 17.0, 14.0, 18.0, 22.0, 24.0, 25.0, 32.0, 49.0, 47.0, 54.0, 55.0, 77.0, 58.0, 63.0, 68.0, 60.0, 53.0, 58.0, 46.0, 29.0, 25.0, 29.0, 21.0, 13.0, 7.0, 7.0, 3.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06298828125, -0.06085777282714844, -0.058727264404296875, -0.05659675598144531, -0.05446624755859375, -0.05233573913574219, -0.050205230712890625, -0.04807472229003906, -0.0459442138671875, -0.04381370544433594, -0.041683197021484375, -0.03955268859863281, -0.03742218017578125, -0.03529167175292969, -0.033161163330078125, -0.031030654907226562, -0.028900146484375, -0.026769638061523438, -0.024639129638671875, -0.022508621215820312, -0.02037811279296875, -0.018247604370117188, -0.016117095947265625, -0.013986587524414062, -0.0118560791015625, -0.009725570678710938, -0.007595062255859375, -0.0054645538330078125, -0.00333404541015625, -0.0012035369873046875, 0.000926971435546875, 0.0030574798583984375, 0.00518798828125, 0.0073184967041015625, 0.009449005126953125, 0.011579513549804688, 0.01371002197265625, 0.015840530395507812, 0.017971038818359375, 0.020101547241210938, 0.0222320556640625, 0.024362564086914062, 0.026493072509765625, 0.028623580932617188, 0.03075408935546875, 0.03288459777832031, 0.035015106201171875, 0.03714561462402344, 0.039276123046875, 0.04140663146972656, 0.043537139892578125, 0.04566764831542969, 0.04779815673828125, 0.04992866516113281, 0.052059173583984375, 0.05418968200683594, 0.0563201904296875, 0.05845069885253906, 0.060581207275390625, 0.06271171569824219, 0.06484222412109375, 0.06697273254394531, 0.06910324096679688, 0.07123374938964844, 0.0733642578125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 4.0, 6.0, 16.0, 11.0, 17.0, 36.0, 46.0, 66.0, 86.0, 183.0, 391.0, 783.0, 1946.0, 5259.0, 16393.0, 67744.0, 599282.0, 3329645.0, 131783.0, 27636.0, 8037.0, 2818.0, 1079.0, 431.0, 225.0, 139.0, 71.0, 46.0, 35.0, 24.0, 10.0, 11.0, 6.0, 5.0, 8.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.430908203125, -0.41991424560546875, -0.4089202880859375, -0.39792633056640625, -0.386932373046875, -0.37593841552734375, -0.3649444580078125, -0.35395050048828125, -0.34295654296875, -0.33196258544921875, -0.3209686279296875, -0.30997467041015625, -0.298980712890625, -0.28798675537109375, -0.2769927978515625, -0.26599884033203125, -0.2550048828125, -0.24401092529296875, -0.2330169677734375, -0.22202301025390625, -0.211029052734375, -0.20003509521484375, -0.1890411376953125, -0.17804718017578125, -0.16705322265625, -0.15605926513671875, -0.1450653076171875, -0.13407135009765625, -0.123077392578125, -0.11208343505859375, -0.1010894775390625, -0.09009552001953125, -0.0791015625, -0.06810760498046875, -0.0571136474609375, -0.04611968994140625, -0.035125732421875, -0.02413177490234375, -0.0131378173828125, -0.00214385986328125, 0.00885009765625, 0.01984405517578125, 0.0308380126953125, 0.04183197021484375, 0.052825927734375, 0.06381988525390625, 0.0748138427734375, 0.08580780029296875, 0.0968017578125, 0.10779571533203125, 0.1187896728515625, 0.12978363037109375, 0.140777587890625, 0.15177154541015625, 0.1627655029296875, 0.17375946044921875, 0.18475341796875, 0.19574737548828125, 0.2067413330078125, 0.21773529052734375, 0.228729248046875, 0.23972320556640625, 0.2507171630859375, 0.26171112060546875, 0.272705078125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 6.0, 2.0, 4.0, 8.0, 6.0, 10.0, 15.0, 14.0, 34.0, 38.0, 72.0, 102.0, 163.0, 369.0, 1721.0, 845.0, 288.0, 114.0, 88.0, 58.0, 34.0, 21.0, 25.0, 16.0, 10.0, 7.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2093505859375, -0.20434284210205078, -0.19933509826660156, -0.19432735443115234, -0.18931961059570312, -0.1843118667602539, -0.1793041229248047, -0.17429637908935547, -0.16928863525390625, -0.16428089141845703, -0.1592731475830078, -0.1542654037475586, -0.14925765991210938, -0.14424991607666016, -0.13924217224121094, -0.13423442840576172, -0.1292266845703125, -0.12421894073486328, -0.11921119689941406, -0.11420345306396484, -0.10919570922851562, -0.1041879653930664, -0.09918022155761719, -0.09417247772216797, -0.08916473388671875, -0.08415699005126953, -0.07914924621582031, -0.0741415023803711, -0.06913375854492188, -0.06412601470947266, -0.05911827087402344, -0.05411052703857422, -0.049102783203125, -0.04409503936767578, -0.03908729553222656, -0.034079551696777344, -0.029071807861328125, -0.024064064025878906, -0.019056320190429688, -0.014048576354980469, -0.00904083251953125, -0.004033088684082031, 0.0009746551513671875, 0.005982398986816406, 0.010990142822265625, 0.015997886657714844, 0.021005630493164062, 0.02601337432861328, 0.0310211181640625, 0.03602886199951172, 0.04103660583496094, 0.046044349670410156, 0.051052093505859375, 0.056059837341308594, 0.06106758117675781, 0.06607532501220703, 0.07108306884765625, 0.07609081268310547, 0.08109855651855469, 0.0861063003540039, 0.09111404418945312, 0.09612178802490234, 0.10112953186035156, 0.10613727569580078, 0.11114501953125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 4.0, 11.0, 16.0, 55.0, 148.0, 283.0, 251.0, 156.0, 54.0, 23.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.73797869682312, -2.681168556213379, -2.6243584156036377, -2.5675482749938965, -2.5107381343841553, -2.453927993774414, -2.397117853164673, -2.3403077125549316, -2.2834973335266113, -2.22668719291687, -2.169877052307129, -2.1130669116973877, -2.0562567710876465, -1.9994466304779053, -1.9426363706588745, -1.8858262300491333, -1.8290162086486816, -1.7722060680389404, -1.7153959274291992, -1.658585786819458, -1.6017756462097168, -1.5449655055999756, -1.4881552457809448, -1.4313451051712036, -1.3745349645614624, -1.3177248239517212, -1.26091468334198, -1.2041045427322388, -1.147294282913208, -1.0904841423034668, -1.0336740016937256, -0.9768638610839844, -0.9200537800788879, -0.8632436394691467, -0.8064334392547607, -0.7496232986450195, -0.6928131580352783, -0.6360030174255371, -0.5791928768157959, -0.5223826766014099, -0.4655725359916687, -0.4087623953819275, -0.3519522249698639, -0.2951420545578003, -0.23833191394805908, -0.18152177333831787, -0.12471160292625427, -0.06790143251419067, -0.011091291904449463, 0.04571886360645294, 0.10252901911735535, 0.15933917462825775, 0.21614933013916016, 0.27295947074890137, 0.32976964116096497, 0.38657981157302856, 0.4433899521827698, 0.500200092792511, 0.557010293006897, 0.6138204336166382, 0.6706305742263794, 0.7274407148361206, 0.7842508554458618, 0.8410610556602478, 0.897871196269989]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 4.0, 6.0, 9.0, 16.0, 22.0, 33.0, 42.0, 41.0, 54.0, 58.0, 70.0, 70.0, 65.0, 64.0, 68.0, 63.0, 59.0, 56.0, 48.0, 42.0, 24.0, 31.0, 28.0, 11.0, 11.0, 4.0, 7.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8174375295639038, -0.7941892743110657, -0.7709410190582275, -0.7476927042007446, -0.7244444489479065, -0.7011961936950684, -0.6779479384422302, -0.6546996831893921, -0.6314513683319092, -0.608203113079071, -0.5849548578262329, -0.56170654296875, -0.5384582877159119, -0.5152100324630737, -0.4919617772102356, -0.46871352195739746, -0.4454652667045593, -0.4222170114517212, -0.39896872639656067, -0.37572047114372253, -0.352472186088562, -0.3292239308357239, -0.30597567558288574, -0.2827274203300476, -0.2594791352748871, -0.23623086512088776, -0.21298259496688843, -0.1897343397140503, -0.16648606956005096, -0.14323779940605164, -0.1199895441532135, -0.09674127399921417, -0.07349306344985962, -0.05024479702115059, -0.02699653059244156, -0.003748267889022827, 0.0195000022649765, 0.04274827241897583, 0.06599652767181396, 0.0892447978258133, 0.11249306797981262, 0.13574133813381195, 0.15898960828781128, 0.18223786354064941, 0.20548613369464874, 0.22873440384864807, 0.2519826591014862, 0.27523094415664673, 0.29847919940948486, 0.321727454662323, 0.3449757397174835, 0.36822399497032166, 0.3914722800254822, 0.4147205352783203, 0.43796879053115845, 0.4612170457839966, 0.4844653308391571, 0.5077136158943176, 0.5309618711471558, 0.5542101263999939, 0.577458381652832, 0.6007066965103149, 0.6239548921585083, 0.6472032070159912, 0.6704514622688293]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 6.0, 6.0, 7.0, 15.0, 31.0, 27.0, 56.0, 90.0, 114.0, 163.0, 292.0, 446.0, 800.0, 1294.0, 2353.0, 4379.0, 8584.0, 17701.0, 38781.0, 102292.0, 524241.0, 233138.0, 61435.0, 26391.0, 12223.0, 6098.0, 3234.0, 1790.0, 987.0, 567.0, 361.0, 246.0, 124.0, 84.0, 63.0, 51.0, 34.0, 19.0, 5.0, 12.0, 5.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.220458984375, -0.21329116821289062, -0.20612335205078125, -0.19895553588867188, -0.1917877197265625, -0.18461990356445312, -0.17745208740234375, -0.17028427124023438, -0.163116455078125, -0.15594863891601562, -0.14878082275390625, -0.14161300659179688, -0.1344451904296875, -0.12727737426757812, -0.12010955810546875, -0.11294174194335938, -0.10577392578125, -0.09860610961914062, -0.09143829345703125, -0.08427047729492188, -0.0771026611328125, -0.06993484497070312, -0.06276702880859375, -0.055599212646484375, -0.048431396484375, -0.041263580322265625, -0.03409576416015625, -0.026927947998046875, -0.0197601318359375, -0.012592315673828125, -0.00542449951171875, 0.001743316650390625, 0.0089111328125, 0.016078948974609375, 0.02324676513671875, 0.030414581298828125, 0.0375823974609375, 0.044750213623046875, 0.05191802978515625, 0.059085845947265625, 0.066253662109375, 0.07342147827148438, 0.08058929443359375, 0.08775711059570312, 0.0949249267578125, 0.10209274291992188, 0.10926055908203125, 0.11642837524414062, 0.12359619140625, 0.13076400756835938, 0.13793182373046875, 0.14509963989257812, 0.1522674560546875, 0.15943527221679688, 0.16660308837890625, 0.17377090454101562, 0.180938720703125, 0.18810653686523438, 0.19527435302734375, 0.20244216918945312, 0.2096099853515625, 0.21677780151367188, 0.22394561767578125, 0.23111343383789062, 0.23828125]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 3.0, 2.0, 4.0, 1.0, 5.0, 5.0, 8.0, 6.0, 16.0, 10.0, 23.0, 14.0, 19.0, 25.0, 32.0, 27.0, 31.0, 34.0, 41.0, 50.0, 42.0, 46.0, 47.0, 66.0, 43.0, 39.0, 53.0, 45.0, 40.0, 49.0, 35.0, 26.0, 30.0, 17.0, 13.0, 15.0, 10.0, 10.0, 7.0, 6.0, 2.0, 2.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.056243896484375, -0.0545191764831543, -0.052794456481933594, -0.05106973648071289, -0.04934501647949219, -0.047620296478271484, -0.04589557647705078, -0.04417085647583008, -0.042446136474609375, -0.04072141647338867, -0.03899669647216797, -0.037271976470947266, -0.03554725646972656, -0.03382253646850586, -0.032097816467285156, -0.030373096466064453, -0.02864837646484375, -0.026923656463623047, -0.025198936462402344, -0.02347421646118164, -0.021749496459960938, -0.020024776458740234, -0.01830005645751953, -0.016575336456298828, -0.014850616455078125, -0.013125896453857422, -0.011401176452636719, -0.009676456451416016, -0.007951736450195312, -0.006227016448974609, -0.004502296447753906, -0.002777576446533203, -0.0010528564453125, 0.0006718635559082031, 0.0023965835571289062, 0.004121303558349609, 0.0058460235595703125, 0.007570743560791016, 0.009295463562011719, 0.011020183563232422, 0.012744903564453125, 0.014469623565673828, 0.01619434356689453, 0.017919063568115234, 0.019643783569335938, 0.02136850357055664, 0.023093223571777344, 0.024817943572998047, 0.02654266357421875, 0.028267383575439453, 0.029992103576660156, 0.03171682357788086, 0.03344154357910156, 0.035166263580322266, 0.03689098358154297, 0.03861570358276367, 0.040340423583984375, 0.04206514358520508, 0.04378986358642578, 0.045514583587646484, 0.04723930358886719, 0.04896402359008789, 0.050688743591308594, 0.0524134635925293, 0.05413818359375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 5.0, 8.0, 9.0, 16.0, 18.0, 43.0, 58.0, 92.0, 173.0, 344.0, 617.0, 1440.0, 5368.0, 30667.0, 480709.0, 489801.0, 30995.0, 5350.0, 1374.0, 688.0, 322.0, 183.0, 127.0, 57.0, 32.0, 23.0, 17.0, 13.0, 5.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52685546875, -0.5108909606933594, -0.49492645263671875, -0.4789619445800781, -0.4629974365234375, -0.4470329284667969, -0.43106842041015625, -0.4151039123535156, -0.399139404296875, -0.3831748962402344, -0.36721038818359375, -0.3512458801269531, -0.3352813720703125, -0.3193168640136719, -0.30335235595703125, -0.2873878479003906, -0.27142333984375, -0.2554588317871094, -0.23949432373046875, -0.22352981567382812, -0.2075653076171875, -0.19160079956054688, -0.17563629150390625, -0.15967178344726562, -0.143707275390625, -0.12774276733398438, -0.11177825927734375, -0.09581375122070312, -0.0798492431640625, -0.06388473510742188, -0.04792022705078125, -0.031955718994140625, -0.0159912109375, -2.6702880859375e-05, 0.01593780517578125, 0.031902313232421875, 0.0478668212890625, 0.06383132934570312, 0.07979583740234375, 0.09576034545898438, 0.111724853515625, 0.12768936157226562, 0.14365386962890625, 0.15961837768554688, 0.1755828857421875, 0.19154739379882812, 0.20751190185546875, 0.22347640991210938, 0.23944091796875, 0.2554054260253906, 0.27136993408203125, 0.2873344421386719, 0.3032989501953125, 0.3192634582519531, 0.33522796630859375, 0.3511924743652344, 0.367156982421875, 0.3831214904785156, 0.39908599853515625, 0.4150505065917969, 0.4310150146484375, 0.4469795227050781, 0.46294403076171875, 0.4789085388183594, 0.494873046875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 8.0, 5.0, 5.0, 7.0, 14.0, 18.0, 18.0, 21.0, 26.0, 41.0, 62.0, 56.0, 74.0, 70.0, 70.0, 79.0, 72.0, 72.0, 52.0, 66.0, 40.0, 30.0, 23.0, 17.0, 16.0, 12.0, 11.0, 10.0, 7.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.423828125, -0.4123382568359375, -0.400848388671875, -0.3893585205078125, -0.37786865234375, -0.3663787841796875, -0.354888916015625, -0.3433990478515625, -0.3319091796875, -0.3204193115234375, -0.308929443359375, -0.2974395751953125, -0.28594970703125, -0.2744598388671875, -0.262969970703125, -0.2514801025390625, -0.239990234375, -0.2285003662109375, -0.217010498046875, -0.2055206298828125, -0.19403076171875, -0.1825408935546875, -0.171051025390625, -0.1595611572265625, -0.1480712890625, -0.1365814208984375, -0.125091552734375, -0.1136016845703125, -0.10211181640625, -0.0906219482421875, -0.079132080078125, -0.0676422119140625, -0.05615234375, -0.0446624755859375, -0.033172607421875, -0.0216827392578125, -0.01019287109375, 0.0012969970703125, 0.012786865234375, 0.0242767333984375, 0.0357666015625, 0.0472564697265625, 0.058746337890625, 0.0702362060546875, 0.08172607421875, 0.0932159423828125, 0.104705810546875, 0.1161956787109375, 0.127685546875, 0.1391754150390625, 0.150665283203125, 0.1621551513671875, 0.17364501953125, 0.1851348876953125, 0.196624755859375, 0.2081146240234375, 0.2196044921875, 0.2310943603515625, 0.242584228515625, 0.2540740966796875, 0.26556396484375, 0.2770538330078125, 0.288543701171875, 0.3000335693359375, 0.3115234375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 9.0, 10.0, 17.0, 16.0, 30.0, 69.0, 111.0, 163.0, 339.0, 757.0, 1920.0, 5371.0, 19654.0, 590198.0, 403358.0, 18164.0, 5005.0, 1809.0, 732.0, 351.0, 190.0, 109.0, 59.0, 26.0, 43.0, 15.0, 6.0, 2.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.52001953125, -0.5047149658203125, -0.489410400390625, -0.4741058349609375, -0.45880126953125, -0.4434967041015625, -0.428192138671875, -0.4128875732421875, -0.3975830078125, -0.3822784423828125, -0.366973876953125, -0.3516693115234375, -0.33636474609375, -0.3210601806640625, -0.305755615234375, -0.2904510498046875, -0.275146484375, -0.2598419189453125, -0.244537353515625, -0.2292327880859375, -0.21392822265625, -0.1986236572265625, -0.183319091796875, -0.1680145263671875, -0.1527099609375, -0.1374053955078125, -0.122100830078125, -0.1067962646484375, -0.09149169921875, -0.0761871337890625, -0.060882568359375, -0.0455780029296875, -0.0302734375, -0.0149688720703125, 0.000335693359375, 0.0156402587890625, 0.03094482421875, 0.0462493896484375, 0.061553955078125, 0.0768585205078125, 0.0921630859375, 0.1074676513671875, 0.122772216796875, 0.1380767822265625, 0.15338134765625, 0.1686859130859375, 0.183990478515625, 0.1992950439453125, 0.214599609375, 0.2299041748046875, 0.245208740234375, 0.2605133056640625, 0.27581787109375, 0.2911224365234375, 0.306427001953125, 0.3217315673828125, 0.3370361328125, 0.3523406982421875, 0.367645263671875, 0.3829498291015625, 0.39825439453125, 0.4135589599609375, 0.428863525390625, 0.4441680908203125, 0.45947265625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 3.0, 1.0, 2.0, 5.0, 2.0, 11.0, 18.0, 31.0, 61.0, 117.0, 218.0, 213.0, 148.0, 73.0, 43.0, 21.0, 13.0, 11.0, 9.0, 9.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.161233901977539e-05, -8.811336010694504e-05, -8.461438119411469e-05, -8.111540228128433e-05, -7.761642336845398e-05, -7.411744445562363e-05, -7.061846554279327e-05, -6.711948662996292e-05, -6.362050771713257e-05, -6.0121528804302216e-05, -5.662254989147186e-05, -5.312357097864151e-05, -4.962459206581116e-05, -4.6125613152980804e-05, -4.262663424015045e-05, -3.91276553273201e-05, -3.5628676414489746e-05, -3.212969750165939e-05, -2.863071858882904e-05, -2.5131739675998688e-05, -2.1632760763168335e-05, -1.8133781850337982e-05, -1.463480293750763e-05, -1.1135824024677277e-05, -7.636845111846924e-06, -4.137866199016571e-06, -6.388872861862183e-07, 2.8600916266441345e-06, 6.359070539474487e-06, 9.85804945230484e-06, 1.3357028365135193e-05, 1.6856007277965546e-05, 2.03549861907959e-05, 2.385396510362625e-05, 2.7352944016456604e-05, 3.085192292928696e-05, 3.435090184211731e-05, 3.784988075494766e-05, 4.1348859667778015e-05, 4.484783858060837e-05, 4.834681749343872e-05, 5.1845796406269073e-05, 5.5344775319099426e-05, 5.884375423192978e-05, 6.234273314476013e-05, 6.584171205759048e-05, 6.934069097042084e-05, 7.283966988325119e-05, 7.633864879608154e-05, 7.98376277089119e-05, 8.333660662174225e-05, 8.68355855345726e-05, 9.033456444740295e-05, 9.383354336023331e-05, 9.733252227306366e-05, 0.00010083150118589401, 0.00010433048009872437, 0.00010782945901155472, 0.00011132843792438507, 0.00011482741683721542, 0.00011832639575004578, 0.00012182537466287613, 0.00012532435357570648, 0.00012882333248853683, 0.0001323223114013672]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 1.0, 8.0, 7.0, 11.0, 12.0, 27.0, 27.0, 58.0, 71.0, 127.0, 223.0, 419.0, 795.0, 1909.0, 5176.0, 17029.0, 225274.0, 764033.0, 22752.0, 6262.0, 2294.0, 945.0, 447.0, 261.0, 135.0, 86.0, 45.0, 33.0, 25.0, 24.0, 7.0, 8.0, 5.0, 5.0, 6.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.5693359375, -0.5543899536132812, -0.5394439697265625, -0.5244979858398438, -0.509552001953125, -0.49460601806640625, -0.4796600341796875, -0.46471405029296875, -0.44976806640625, -0.43482208251953125, -0.4198760986328125, -0.40493011474609375, -0.389984130859375, -0.37503814697265625, -0.3600921630859375, -0.34514617919921875, -0.3302001953125, -0.31525421142578125, -0.3003082275390625, -0.28536224365234375, -0.270416259765625, -0.25547027587890625, -0.2405242919921875, -0.22557830810546875, -0.21063232421875, -0.19568634033203125, -0.1807403564453125, -0.16579437255859375, -0.150848388671875, -0.13590240478515625, -0.1209564208984375, -0.10601043701171875, -0.091064453125, -0.07611846923828125, -0.0611724853515625, -0.04622650146484375, -0.031280517578125, -0.01633453369140625, -0.0013885498046875, 0.01355743408203125, 0.02850341796875, 0.04344940185546875, 0.0583953857421875, 0.07334136962890625, 0.088287353515625, 0.10323333740234375, 0.1181793212890625, 0.13312530517578125, 0.1480712890625, 0.16301727294921875, 0.1779632568359375, 0.19290924072265625, 0.207855224609375, 0.22280120849609375, 0.2377471923828125, 0.25269317626953125, 0.26763916015625, 0.28258514404296875, 0.2975311279296875, 0.31247711181640625, 0.327423095703125, 0.34236907958984375, 0.3573150634765625, 0.37226104736328125, 0.38720703125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 6.0, 4.0, 3.0, 11.0, 11.0, 14.0, 21.0, 27.0, 49.0, 122.0, 444.0, 139.0, 54.0, 38.0, 18.0, 12.0, 6.0, 8.0, 8.0, 6.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4052734375, -0.3944816589355469, -0.38368988037109375, -0.3728981018066406, -0.3621063232421875, -0.3513145446777344, -0.34052276611328125, -0.3297309875488281, -0.318939208984375, -0.3081474304199219, -0.29735565185546875, -0.2865638732910156, -0.2757720947265625, -0.2649803161621094, -0.25418853759765625, -0.24339675903320312, -0.23260498046875, -0.22181320190429688, -0.21102142333984375, -0.20022964477539062, -0.1894378662109375, -0.17864608764648438, -0.16785430908203125, -0.15706253051757812, -0.146270751953125, -0.13547897338867188, -0.12468719482421875, -0.11389541625976562, -0.1031036376953125, -0.09231185913085938, -0.08152008056640625, -0.07072830200195312, -0.0599365234375, -0.049144744873046875, -0.03835296630859375, -0.027561187744140625, -0.0167694091796875, -0.005977630615234375, 0.00481414794921875, 0.015605926513671875, 0.026397705078125, 0.037189483642578125, 0.04798126220703125, 0.058773040771484375, 0.0695648193359375, 0.08035659790039062, 0.09114837646484375, 0.10194015502929688, 0.11273193359375, 0.12352371215820312, 0.13431549072265625, 0.14510726928710938, 0.1558990478515625, 0.16669082641601562, 0.17748260498046875, 0.18827438354492188, 0.199066162109375, 0.20985794067382812, 0.22064971923828125, 0.23144149780273438, 0.2422332763671875, 0.2530250549316406, 0.26381683349609375, 0.2746086120605469, 0.285400390625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 14.0, 23.0, 79.0, 121.0, 255.0, 217.0, 168.0, 77.0, 29.0, 10.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.621408939361572, -5.481589317321777, -5.341769695281982, -5.201949596405029, -5.062129974365234, -4.9223103523254395, -4.7824907302856445, -4.64267110824585, -4.502851486206055, -4.36303186416626, -4.223212242126465, -4.083392143249512, -3.943572521209717, -3.803752899169922, -3.663933277130127, -3.524113655090332, -3.384293556213379, -3.244473934173584, -3.10465407371521, -2.964834451675415, -2.825014591217041, -2.685194969177246, -2.545375347137451, -2.4055557250976562, -2.2657358646392822, -2.1259162425994873, -1.9860963821411133, -1.8462767601013184, -1.7064570188522339, -1.5666372776031494, -1.4268176555633545, -1.28699791431427, -1.1471786499023438, -1.0073589086532593, -0.8675392270088196, -0.7277195453643799, -0.5878998041152954, -0.44808006286621094, -0.30826038122177124, -0.16844069957733154, -0.02862095832824707, 0.11119875311851501, 0.2510184645652771, 0.3908381760120392, 0.5306578874588013, 0.6704776287078857, 0.8102973103523254, 0.9501169919967651, 1.0899367332458496, 1.229756474494934, 1.3695762157440186, 1.5093958377838135, 1.649215579032898, 1.7890353202819824, 1.9288549423217773, 2.0686745643615723, 2.2084944248199463, 2.348314046859741, 2.4881339073181152, 2.62795352935791, 2.767773151397705, 2.907593011856079, 3.047412633895874, 3.187232494354248, 3.327052116394043]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 6.0, 1.0, 7.0, 6.0, 12.0, 6.0, 8.0, 15.0, 15.0, 16.0, 20.0, 27.0, 21.0, 21.0, 27.0, 40.0, 28.0, 38.0, 39.0, 46.0, 48.0, 29.0, 50.0, 38.0, 37.0, 33.0, 38.0, 35.0, 39.0, 36.0, 34.0, 31.0, 15.0, 23.0, 9.0, 17.0, 13.0, 13.0, 23.0, 10.0, 5.0, 11.0, 3.0, 4.0, 4.0, 2.0, 2.0, 2.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.2642617225646973, -1.2237061262130737, -1.1831506490707397, -1.1425950527191162, -1.1020395755767822, -1.0614839792251587, -1.0209285020828247, -0.9803729057312012, -0.9398173689842224, -0.8992618322372437, -0.8587062954902649, -0.8181507587432861, -0.7775951623916626, -0.7370396852493286, -0.6964840888977051, -0.6559285521507263, -0.6153730154037476, -0.5748174786567688, -0.53426194190979, -0.4937063753604889, -0.45315083861351013, -0.41259530186653137, -0.3720397353172302, -0.33148419857025146, -0.2909286618232727, -0.25037312507629395, -0.209817573428154, -0.16926202178001404, -0.12870648503303528, -0.08815094828605652, -0.047595396637916565, -0.007039844989776611, 0.03351569175720215, 0.0740712359547615, 0.11462678015232086, 0.15518233180046082, 0.19573786854743958, 0.23629340529441833, 0.2768489718437195, 0.31740450859069824, 0.357960045337677, 0.39851558208465576, 0.4390711188316345, 0.47962668538093567, 0.5201822519302368, 0.5607377290725708, 0.6012933254241943, 0.6418488621711731, 0.6824043989181519, 0.7229599356651306, 0.7635154724121094, 0.8040710091590881, 0.8446265459060669, 0.8851821422576904, 0.9257376790046692, 0.966293215751648, 1.0068488121032715, 1.047404408454895, 1.087959885597229, 1.1285154819488525, 1.1690709590911865, 1.20962655544281, 1.250182032585144, 1.2907376289367676, 1.3312931060791016]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 9.0, 13.0, 9.0, 11.0, 14.0, 17.0, 27.0, 42.0, 51.0, 59.0, 96.0, 115.0, 210.0, 371.0, 546.0, 843.0, 1457.0, 2537.0, 4800.0, 10310.0, 24374.0, 75655.0, 810517.0, 3114533.0, 94877.0, 28500.0, 11608.0, 5564.0, 2919.0, 1621.0, 947.0, 556.0, 371.0, 229.0, 151.0, 100.0, 60.0, 35.0, 40.0, 21.0, 29.0, 10.0, 8.0, 9.0, 5.0, 7.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.279541015625, -0.2715721130371094, -0.26360321044921875, -0.2556343078613281, -0.2476654052734375, -0.23969650268554688, -0.23172760009765625, -0.22375869750976562, -0.215789794921875, -0.20782089233398438, -0.19985198974609375, -0.19188308715820312, -0.1839141845703125, -0.17594528198242188, -0.16797637939453125, -0.16000747680664062, -0.15203857421875, -0.14406967163085938, -0.13610076904296875, -0.12813186645507812, -0.1201629638671875, -0.11219406127929688, -0.10422515869140625, -0.09625625610351562, -0.088287353515625, -0.08031845092773438, -0.07234954833984375, -0.06438064575195312, -0.0564117431640625, -0.048442840576171875, -0.04047393798828125, -0.032505035400390625, -0.0245361328125, -0.016567230224609375, -0.00859832763671875, -0.000629425048828125, 0.0073394775390625, 0.015308380126953125, 0.02327728271484375, 0.031246185302734375, 0.039215087890625, 0.047183990478515625, 0.05515289306640625, 0.06312179565429688, 0.0710906982421875, 0.07905960083007812, 0.08702850341796875, 0.09499740600585938, 0.10296630859375, 0.11093521118164062, 0.11890411376953125, 0.12687301635742188, 0.1348419189453125, 0.14281082153320312, 0.15077972412109375, 0.15874862670898438, 0.166717529296875, 0.17468643188476562, 0.18265533447265625, 0.19062423706054688, 0.1985931396484375, 0.20656204223632812, 0.21453094482421875, 0.22249984741210938, 0.23046875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 4.0, 2.0, 2.0, 4.0, 5.0, 10.0, 9.0, 8.0, 17.0, 17.0, 20.0, 16.0, 26.0, 28.0, 34.0, 44.0, 41.0, 39.0, 48.0, 52.0, 47.0, 46.0, 32.0, 51.0, 39.0, 58.0, 45.0, 40.0, 32.0, 31.0, 31.0, 36.0, 22.0, 13.0, 14.0, 6.0, 10.0, 7.0, 8.0, 1.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06640625, -0.06442022323608398, -0.06243419647216797, -0.06044816970825195, -0.05846214294433594, -0.05647611618041992, -0.054490089416503906, -0.05250406265258789, -0.050518035888671875, -0.04853200912475586, -0.046545982360839844, -0.04455995559692383, -0.04257392883300781, -0.0405879020690918, -0.03860187530517578, -0.036615848541259766, -0.03462982177734375, -0.032643795013427734, -0.03065776824951172, -0.028671741485595703, -0.026685714721679688, -0.024699687957763672, -0.022713661193847656, -0.02072763442993164, -0.018741607666015625, -0.01675558090209961, -0.014769554138183594, -0.012783527374267578, -0.010797500610351562, -0.008811473846435547, -0.006825447082519531, -0.004839420318603516, -0.0028533935546875, -0.0008673667907714844, 0.0011186599731445312, 0.003104686737060547, 0.0050907135009765625, 0.007076740264892578, 0.009062767028808594, 0.01104879379272461, 0.013034820556640625, 0.01502084732055664, 0.017006874084472656, 0.018992900848388672, 0.020978927612304688, 0.022964954376220703, 0.02495098114013672, 0.026937007904052734, 0.02892303466796875, 0.030909061431884766, 0.03289508819580078, 0.0348811149597168, 0.03686714172363281, 0.03885316848754883, 0.040839195251464844, 0.04282522201538086, 0.044811248779296875, 0.04679727554321289, 0.048783302307128906, 0.05076932907104492, 0.05275535583496094, 0.05474138259887695, 0.05672740936279297, 0.058713436126708984, 0.060699462890625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 6.0, 2.0, 5.0, 7.0, 7.0, 9.0, 12.0, 22.0, 32.0, 45.0, 76.0, 103.0, 125.0, 232.0, 357.0, 616.0, 1223.0, 2294.0, 5417.0, 14938.0, 51274.0, 342935.0, 3589827.0, 137256.0, 30023.0, 9574.0, 3787.0, 1772.0, 947.0, 523.0, 303.0, 177.0, 112.0, 71.0, 62.0, 34.0, 19.0, 12.0, 18.0, 11.0, 9.0, 7.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.457275390625, -0.44467926025390625, -0.4320831298828125, -0.41948699951171875, -0.406890869140625, -0.39429473876953125, -0.3816986083984375, -0.36910247802734375, -0.35650634765625, -0.34391021728515625, -0.3313140869140625, -0.31871795654296875, -0.306121826171875, -0.29352569580078125, -0.2809295654296875, -0.26833343505859375, -0.2557373046875, -0.24314117431640625, -0.2305450439453125, -0.21794891357421875, -0.205352783203125, -0.19275665283203125, -0.1801605224609375, -0.16756439208984375, -0.15496826171875, -0.14237213134765625, -0.1297760009765625, -0.11717987060546875, -0.104583740234375, -0.09198760986328125, -0.0793914794921875, -0.06679534912109375, -0.05419921875, -0.04160308837890625, -0.0290069580078125, -0.01641082763671875, -0.003814697265625, 0.00878143310546875, 0.0213775634765625, 0.03397369384765625, 0.04656982421875, 0.05916595458984375, 0.0717620849609375, 0.08435821533203125, 0.096954345703125, 0.10955047607421875, 0.1221466064453125, 0.13474273681640625, 0.1473388671875, 0.15993499755859375, 0.1725311279296875, 0.18512725830078125, 0.197723388671875, 0.21031951904296875, 0.2229156494140625, 0.23551177978515625, 0.24810791015625, 0.26070404052734375, 0.2733001708984375, 0.28589630126953125, 0.298492431640625, 0.31108856201171875, 0.3236846923828125, 0.33628082275390625, 0.348876953125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 10.0, 4.0, 10.0, 14.0, 30.0, 33.0, 60.0, 84.0, 154.0, 580.0, 2321.0, 381.0, 153.0, 82.0, 50.0, 36.0, 21.0, 21.0, 4.0, 6.0, 4.0, 4.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2244873046875, -0.21848106384277344, -0.21247482299804688, -0.2064685821533203, -0.20046234130859375, -0.1944561004638672, -0.18844985961914062, -0.18244361877441406, -0.1764373779296875, -0.17043113708496094, -0.16442489624023438, -0.1584186553955078, -0.15241241455078125, -0.1464061737060547, -0.14039993286132812, -0.13439369201660156, -0.128387451171875, -0.12238121032714844, -0.11637496948242188, -0.11036872863769531, -0.10436248779296875, -0.09835624694824219, -0.09235000610351562, -0.08634376525878906, -0.0803375244140625, -0.07433128356933594, -0.06832504272460938, -0.06231880187988281, -0.05631256103515625, -0.05030632019042969, -0.044300079345703125, -0.03829383850097656, -0.03228759765625, -0.026281356811523438, -0.020275115966796875, -0.014268875122070312, -0.00826263427734375, -0.0022563934326171875, 0.003749847412109375, 0.009756088256835938, 0.0157623291015625, 0.021768569946289062, 0.027774810791015625, 0.03378105163574219, 0.03978729248046875, 0.04579353332519531, 0.051799774169921875, 0.05780601501464844, 0.063812255859375, 0.06981849670410156, 0.07582473754882812, 0.08183097839355469, 0.08783721923828125, 0.09384346008300781, 0.09984970092773438, 0.10585594177246094, 0.1118621826171875, 0.11786842346191406, 0.12387466430664062, 0.1298809051513672, 0.13588714599609375, 0.1418933868408203, 0.14789962768554688, 0.15390586853027344, 0.159912109375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 7.0, 10.0, 11.0, 14.0, 36.0, 42.0, 56.0, 113.0, 103.0, 129.0, 110.0, 125.0, 96.0, 51.0, 40.0, 18.0, 26.0, 7.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0710904598236084, -1.042158603668213, -1.0132266283035278, -0.9842947125434875, -0.9553627967834473, -0.9264309406280518, -0.8974990248680115, -0.8685671091079712, -0.8396351933479309, -0.8107032775878906, -0.7817713618278503, -0.7528394460678101, -0.7239075899124146, -0.6949756145477295, -0.666043758392334, -0.6371118426322937, -0.6081799268722534, -0.5792480111122131, -0.5503160953521729, -0.5213841795921326, -0.4924522936344147, -0.4635203778743744, -0.4345884919166565, -0.4056565761566162, -0.3767246603965759, -0.34779274463653564, -0.31886082887649536, -0.28992894291877747, -0.2609970271587372, -0.2320651113986969, -0.2031332105398178, -0.17420130968093872, -0.14526933431625366, -0.11633742600679398, -0.08740551769733429, -0.0584736093878746, -0.029541701078414917, -0.0006097853183746338, 0.028322115540504456, 0.057254016399383545, 0.08618593215942383, 0.11511784046888351, 0.1440497487783432, 0.1729816496372223, 0.20191356539726257, 0.23084548115730286, 0.25977736711502075, 0.28870928287506104, 0.3176411986351013, 0.3465731143951416, 0.3755050301551819, 0.4044369161128998, 0.43336883187294006, 0.46230074763298035, 0.49123263359069824, 0.5201645493507385, 0.5490964651107788, 0.5780283808708191, 0.6069602966308594, 0.6358922123908997, 0.6648241281509399, 0.6937559843063354, 0.7226879000663757, 0.751619815826416, 0.7805517315864563]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 7.0, 6.0, 7.0, 9.0, 10.0, 12.0, 10.0, 14.0, 29.0, 23.0, 24.0, 20.0, 27.0, 30.0, 29.0, 30.0, 30.0, 34.0, 28.0, 40.0, 38.0, 44.0, 40.0, 30.0, 45.0, 34.0, 35.0, 26.0, 25.0, 30.0, 25.0, 26.0, 15.0, 25.0, 19.0, 28.0, 19.0, 18.0, 11.0, 8.0, 10.0, 7.0, 8.0, 7.0, 4.0, 0.0, 0.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.42418307065963745, -0.41092607378959656, -0.3976690471172333, -0.3844120502471924, -0.3711550533771515, -0.3578980267047882, -0.3446410298347473, -0.33138400316238403, -0.31812700629234314, -0.30487000942230225, -0.29161298274993896, -0.27835598587989807, -0.2650989890098572, -0.2518419623374939, -0.238584965467453, -0.22532795369625092, -0.21207095682621002, -0.19881394505500793, -0.18555694818496704, -0.17229993641376495, -0.15904292464256287, -0.14578592777252197, -0.13252891600131989, -0.1192719042301178, -0.10601489990949631, -0.09275789558887482, -0.07950088381767273, -0.06624387949705124, -0.05298687145113945, -0.03972986340522766, -0.02647285908460617, -0.013215847313404083, 4.1157007217407227e-05, 0.013298164121806622, 0.026555171236395836, 0.039812177419662476, 0.053069185465574265, 0.06632619351148605, 0.07958319783210754, 0.09284020960330963, 0.10609721392393112, 0.11935421824455261, 0.1326112300157547, 0.1458682417869568, 0.15912523865699768, 0.17238225042819977, 0.18563926219940186, 0.19889625906944275, 0.21215327084064484, 0.22541028261184692, 0.23866727948188782, 0.2519242763519287, 0.265181303024292, 0.2784382998943329, 0.2916952967643738, 0.30495232343673706, 0.31820932030677795, 0.33146631717681885, 0.34472334384918213, 0.357980340719223, 0.3712373375892639, 0.3844943642616272, 0.3977513611316681, 0.411008358001709, 0.42426538467407227]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 2.0, 9.0, 11.0, 10.0, 12.0, 15.0, 14.0, 27.0, 44.0, 60.0, 94.0, 135.0, 212.0, 372.0, 598.0, 994.0, 1760.0, 3241.0, 6365.0, 12656.0, 26285.0, 61200.0, 219200.0, 493876.0, 134307.0, 45022.0, 20501.0, 10103.0, 5020.0, 2801.0, 1449.0, 767.0, 505.0, 293.0, 196.0, 113.0, 95.0, 55.0, 45.0, 23.0, 24.0, 16.0, 12.0, 11.0, 3.0, 2.0, 1.0, 1.0, 3.0], "bins": [-0.23486328125, -0.22873687744140625, -0.2226104736328125, -0.21648406982421875, -0.210357666015625, -0.20423126220703125, -0.1981048583984375, -0.19197845458984375, -0.18585205078125, -0.17972564697265625, -0.1735992431640625, -0.16747283935546875, -0.161346435546875, -0.15522003173828125, -0.1490936279296875, -0.14296722412109375, -0.1368408203125, -0.13071441650390625, -0.1245880126953125, -0.11846160888671875, -0.112335205078125, -0.10620880126953125, -0.1000823974609375, -0.09395599365234375, -0.08782958984375, -0.08170318603515625, -0.0755767822265625, -0.06945037841796875, -0.063323974609375, -0.05719757080078125, -0.0510711669921875, -0.04494476318359375, -0.038818359375, -0.03269195556640625, -0.0265655517578125, -0.02043914794921875, -0.014312744140625, -0.00818634033203125, -0.0020599365234375, 0.00406646728515625, 0.01019287109375, 0.01631927490234375, 0.0224456787109375, 0.02857208251953125, 0.034698486328125, 0.04082489013671875, 0.0469512939453125, 0.05307769775390625, 0.0592041015625, 0.06533050537109375, 0.0714569091796875, 0.07758331298828125, 0.083709716796875, 0.08983612060546875, 0.0959625244140625, 0.10208892822265625, 0.10821533203125, 0.11434173583984375, 0.1204681396484375, 0.12659454345703125, 0.132720947265625, 0.13884735107421875, 0.1449737548828125, 0.15110015869140625, 0.1572265625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 4.0, 3.0, 7.0, 3.0, 9.0, 8.0, 14.0, 19.0, 15.0, 26.0, 25.0, 31.0, 35.0, 39.0, 31.0, 46.0, 45.0, 50.0, 47.0, 61.0, 50.0, 49.0, 41.0, 42.0, 51.0, 38.0, 47.0, 31.0, 33.0, 18.0, 31.0, 11.0, 9.0, 13.0, 6.0, 5.0, 5.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08038330078125, -0.07811260223388672, -0.07584190368652344, -0.07357120513916016, -0.07130050659179688, -0.0690298080444336, -0.06675910949707031, -0.06448841094970703, -0.06221771240234375, -0.05994701385498047, -0.05767631530761719, -0.055405616760253906, -0.053134918212890625, -0.050864219665527344, -0.04859352111816406, -0.04632282257080078, -0.0440521240234375, -0.04178142547607422, -0.03951072692871094, -0.037240028381347656, -0.034969329833984375, -0.032698631286621094, -0.030427932739257812, -0.02815723419189453, -0.02588653564453125, -0.02361583709716797, -0.021345138549804688, -0.019074440002441406, -0.016803741455078125, -0.014533042907714844, -0.012262344360351562, -0.009991645812988281, -0.007720947265625, -0.005450248718261719, -0.0031795501708984375, -0.0009088516235351562, 0.001361846923828125, 0.0036325454711914062, 0.0059032440185546875, 0.008173942565917969, 0.01044464111328125, 0.012715339660644531, 0.014986038208007812, 0.017256736755371094, 0.019527435302734375, 0.021798133850097656, 0.024068832397460938, 0.02633953094482422, 0.0286102294921875, 0.03088092803955078, 0.03315162658691406, 0.035422325134277344, 0.037693023681640625, 0.039963722229003906, 0.04223442077636719, 0.04450511932373047, 0.04677581787109375, 0.04904651641845703, 0.05131721496582031, 0.053587913513183594, 0.055858612060546875, 0.058129310607910156, 0.06040000915527344, 0.06267070770263672, 0.06494140625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 6.0, 5.0, 5.0, 12.0, 17.0, 24.0, 28.0, 57.0, 78.0, 202.0, 301.0, 608.0, 1536.0, 4370.0, 13719.0, 53823.0, 783424.0, 152811.0, 25639.0, 7392.0, 2545.0, 980.0, 439.0, 221.0, 117.0, 65.0, 41.0, 23.0, 29.0, 15.0, 10.0, 3.0, 7.0, 6.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.54345703125, -0.5273513793945312, -0.5112457275390625, -0.49514007568359375, -0.479034423828125, -0.46292877197265625, -0.4468231201171875, -0.43071746826171875, -0.41461181640625, -0.39850616455078125, -0.3824005126953125, -0.36629486083984375, -0.350189208984375, -0.33408355712890625, -0.3179779052734375, -0.30187225341796875, -0.2857666015625, -0.26966094970703125, -0.2535552978515625, -0.23744964599609375, -0.221343994140625, -0.20523834228515625, -0.1891326904296875, -0.17302703857421875, -0.15692138671875, -0.14081573486328125, -0.1247100830078125, -0.10860443115234375, -0.092498779296875, -0.07639312744140625, -0.0602874755859375, -0.04418182373046875, -0.028076171875, -0.01197052001953125, 0.0041351318359375, 0.02024078369140625, 0.036346435546875, 0.05245208740234375, 0.0685577392578125, 0.08466339111328125, 0.10076904296875, 0.11687469482421875, 0.1329803466796875, 0.14908599853515625, 0.165191650390625, 0.18129730224609375, 0.1974029541015625, 0.21350860595703125, 0.2296142578125, 0.24571990966796875, 0.2618255615234375, 0.27793121337890625, 0.294036865234375, 0.31014251708984375, 0.3262481689453125, 0.34235382080078125, 0.35845947265625, 0.37456512451171875, 0.3906707763671875, 0.40677642822265625, 0.422882080078125, 0.43898773193359375, 0.4550933837890625, 0.47119903564453125, 0.4873046875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 4.0, 8.0, 4.0, 7.0, 12.0, 17.0, 19.0, 36.0, 52.0, 55.0, 60.0, 89.0, 73.0, 93.0, 93.0, 80.0, 64.0, 54.0, 45.0, 38.0, 27.0, 20.0, 10.0, 5.0, 12.0, 6.0, 1.0, 5.0, 2.0, 2.0, 3.0, 3.0, 0.0, 4.0, 1.0, 1.0, 1.0], "bins": [-0.65087890625, -0.6347808837890625, -0.618682861328125, -0.6025848388671875, -0.58648681640625, -0.5703887939453125, -0.554290771484375, -0.5381927490234375, -0.5220947265625, -0.5059967041015625, -0.489898681640625, -0.4738006591796875, -0.45770263671875, -0.4416046142578125, -0.425506591796875, -0.4094085693359375, -0.393310546875, -0.3772125244140625, -0.361114501953125, -0.3450164794921875, -0.32891845703125, -0.3128204345703125, -0.296722412109375, -0.2806243896484375, -0.2645263671875, -0.2484283447265625, -0.232330322265625, -0.2162322998046875, -0.20013427734375, -0.1840362548828125, -0.167938232421875, -0.1518402099609375, -0.1357421875, -0.1196441650390625, -0.103546142578125, -0.0874481201171875, -0.07135009765625, -0.0552520751953125, -0.039154052734375, -0.0230560302734375, -0.0069580078125, 0.0091400146484375, 0.025238037109375, 0.0413360595703125, 0.05743408203125, 0.0735321044921875, 0.089630126953125, 0.1057281494140625, 0.121826171875, 0.1379241943359375, 0.154022216796875, 0.1701202392578125, 0.18621826171875, 0.2023162841796875, 0.218414306640625, 0.2345123291015625, 0.2506103515625, 0.2667083740234375, 0.282806396484375, 0.2989044189453125, 0.31500244140625, 0.3311004638671875, 0.347198486328125, 0.3632965087890625, 0.37939453125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 6.0, 3.0, 6.0, 3.0, 8.0, 21.0, 13.0, 36.0, 45.0, 46.0, 87.0, 119.0, 157.0, 267.0, 401.0, 609.0, 1069.0, 1887.0, 3883.0, 10519.0, 37420.0, 688278.0, 258670.0, 28580.0, 8676.0, 3415.0, 1688.0, 931.0, 566.0, 371.0, 247.0, 158.0, 115.0, 87.0, 49.0, 38.0, 27.0, 14.0, 11.0, 7.0, 9.0, 11.0, 7.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.369384765625, -0.358489990234375, -0.34759521484375, -0.336700439453125, -0.3258056640625, -0.314910888671875, -0.30401611328125, -0.293121337890625, -0.2822265625, -0.271331787109375, -0.26043701171875, -0.249542236328125, -0.2386474609375, -0.227752685546875, -0.21685791015625, -0.205963134765625, -0.195068359375, -0.184173583984375, -0.17327880859375, -0.162384033203125, -0.1514892578125, -0.140594482421875, -0.12969970703125, -0.118804931640625, -0.10791015625, -0.097015380859375, -0.08612060546875, -0.075225830078125, -0.0643310546875, -0.053436279296875, -0.04254150390625, -0.031646728515625, -0.020751953125, -0.009857177734375, 0.00103759765625, 0.011932373046875, 0.0228271484375, 0.033721923828125, 0.04461669921875, 0.055511474609375, 0.06640625, 0.077301025390625, 0.08819580078125, 0.099090576171875, 0.1099853515625, 0.120880126953125, 0.13177490234375, 0.142669677734375, 0.153564453125, 0.164459228515625, 0.17535400390625, 0.186248779296875, 0.1971435546875, 0.208038330078125, 0.21893310546875, 0.229827880859375, 0.24072265625, 0.251617431640625, 0.26251220703125, 0.273406982421875, 0.2843017578125, 0.295196533203125, 0.30609130859375, 0.316986083984375, 0.327880859375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 5.0, 5.0, 7.0, 4.0, 11.0, 16.0, 26.0, 34.0, 109.0, 311.0, 288.0, 89.0, 39.0, 18.0, 14.0, 13.0, 8.0, 6.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001456737518310547, -0.00014095008373260498, -0.00013622641563415527, -0.00013150274753570557, -0.00012677907943725586, -0.00012205541133880615, -0.00011733174324035645, -0.00011260807514190674, -0.00010788440704345703, -0.00010316073894500732, -9.843707084655762e-05, -9.371340274810791e-05, -8.89897346496582e-05, -8.42660665512085e-05, -7.954239845275879e-05, -7.481873035430908e-05, -7.009506225585938e-05, -6.537139415740967e-05, -6.064772605895996e-05, -5.5924057960510254e-05, -5.120038986206055e-05, -4.647672176361084e-05, -4.175305366516113e-05, -3.7029385566711426e-05, -3.230571746826172e-05, -2.7582049369812012e-05, -2.2858381271362305e-05, -1.8134713172912598e-05, -1.341104507446289e-05, -8.687376976013184e-06, -3.9637088775634766e-06, 7.599592208862305e-07, 5.4836273193359375e-06, 1.0207295417785645e-05, 1.4930963516235352e-05, 1.965463161468506e-05, 2.4378299713134766e-05, 2.9101967811584473e-05, 3.382563591003418e-05, 3.854930400848389e-05, 4.3272972106933594e-05, 4.79966402053833e-05, 5.272030830383301e-05, 5.7443976402282715e-05, 6.216764450073242e-05, 6.689131259918213e-05, 7.161498069763184e-05, 7.633864879608154e-05, 8.106231689453125e-05, 8.578598499298096e-05, 9.050965309143066e-05, 9.523332118988037e-05, 9.995698928833008e-05, 0.00010468065738677979, 0.00010940432548522949, 0.0001141279935836792, 0.0001188516616821289, 0.0001235753297805786, 0.00012829899787902832, 0.00013302266597747803, 0.00013774633407592773, 0.00014247000217437744, 0.00014719367027282715, 0.00015191733837127686, 0.00015664100646972656]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 7.0, 2.0, 6.0, 3.0, 6.0, 10.0, 12.0, 12.0, 32.0, 34.0, 88.0, 84.0, 154.0, 238.0, 362.0, 512.0, 740.0, 1026.0, 1720.0, 3059.0, 6684.0, 17857.0, 74302.0, 829378.0, 78661.0, 18521.0, 6735.0, 3167.0, 1743.0, 1088.0, 699.0, 500.0, 368.0, 202.0, 175.0, 102.0, 83.0, 49.0, 44.0, 16.0, 18.0, 20.0, 10.0, 4.0, 0.0, 6.0, 1.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.34033203125, -0.3295326232910156, -0.31873321533203125, -0.3079338073730469, -0.2971343994140625, -0.2863349914550781, -0.27553558349609375, -0.2647361755371094, -0.253936767578125, -0.24313735961914062, -0.23233795166015625, -0.22153854370117188, -0.2107391357421875, -0.19993972778320312, -0.18914031982421875, -0.17834091186523438, -0.16754150390625, -0.15674209594726562, -0.14594268798828125, -0.13514328002929688, -0.1243438720703125, -0.11354446411132812, -0.10274505615234375, -0.09194564819335938, -0.081146240234375, -0.07034683227539062, -0.05954742431640625, -0.048748016357421875, -0.0379486083984375, -0.027149200439453125, -0.01634979248046875, -0.005550384521484375, 0.0052490234375, 0.016048431396484375, 0.02684783935546875, 0.037647247314453125, 0.0484466552734375, 0.059246063232421875, 0.07004547119140625, 0.08084487915039062, 0.091644287109375, 0.10244369506835938, 0.11324310302734375, 0.12404251098632812, 0.1348419189453125, 0.14564132690429688, 0.15644073486328125, 0.16724014282226562, 0.17803955078125, 0.18883895874023438, 0.19963836669921875, 0.21043777465820312, 0.2212371826171875, 0.23203659057617188, 0.24283599853515625, 0.2536354064941406, 0.264434814453125, 0.2752342224121094, 0.28603363037109375, 0.2968330383300781, 0.3076324462890625, 0.3184318542480469, 0.32923126220703125, 0.3400306701660156, 0.350830078125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 4.0, 8.0, 5.0, 10.0, 14.0, 14.0, 14.0, 32.0, 62.0, 178.0, 328.0, 139.0, 62.0, 35.0, 17.0, 16.0, 10.0, 14.0, 4.0, 5.0, 4.0, 8.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.36865234375, -0.3587989807128906, -0.34894561767578125, -0.3390922546386719, -0.3292388916015625, -0.3193855285644531, -0.30953216552734375, -0.2996788024902344, -0.289825439453125, -0.2799720764160156, -0.27011871337890625, -0.2602653503417969, -0.2504119873046875, -0.24055862426757812, -0.23070526123046875, -0.22085189819335938, -0.21099853515625, -0.20114517211914062, -0.19129180908203125, -0.18143844604492188, -0.1715850830078125, -0.16173171997070312, -0.15187835693359375, -0.14202499389648438, -0.132171630859375, -0.12231826782226562, -0.11246490478515625, -0.10261154174804688, -0.0927581787109375, -0.08290481567382812, -0.07305145263671875, -0.06319808959960938, -0.0533447265625, -0.043491363525390625, -0.03363800048828125, -0.023784637451171875, -0.0139312744140625, -0.004077911376953125, 0.00577545166015625, 0.015628814697265625, 0.025482177734375, 0.035335540771484375, 0.04518890380859375, 0.055042266845703125, 0.0648956298828125, 0.07474899291992188, 0.08460235595703125, 0.09445571899414062, 0.10430908203125, 0.11416244506835938, 0.12401580810546875, 0.13386917114257812, 0.1437225341796875, 0.15357589721679688, 0.16342926025390625, 0.17328262329101562, 0.183135986328125, 0.19298934936523438, 0.20284271240234375, 0.21269607543945312, 0.2225494384765625, 0.23240280151367188, 0.24225616455078125, 0.2521095275878906, 0.261962890625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 6.0, 5.0, 28.0, 37.0, 90.0, 139.0, 206.0, 215.0, 141.0, 74.0, 29.0, 26.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.804680109024048, -3.663499355316162, -3.5223186016082764, -3.3811378479003906, -3.239956855773926, -3.098776340484619, -2.9575953483581543, -2.8164145946502686, -2.675233840942383, -2.534053087234497, -2.3928723335266113, -2.2516915798187256, -2.11051082611084, -1.9693299531936646, -1.8281490802764893, -1.6869683265686035, -1.5457875728607178, -1.404606819152832, -1.2634260654449463, -1.122245192527771, -0.9810644388198853, -0.8398836851119995, -0.698702871799469, -0.5575220584869385, -0.41634130477905273, -0.2751605212688446, -0.13397973775863647, 0.007201045751571655, 0.14838182926177979, 0.2895625829696655, 0.43074339628219604, 0.5719242095947266, 0.7131052017211914, 0.8542859554290771, 0.9954667687416077, 1.1366475820541382, 1.277828335762024, 1.4190090894699097, 1.560189962387085, 1.7013707160949707, 1.8425514698028564, 1.9837322235107422, 2.124912977218628, 2.2660937309265137, 2.4072747230529785, 2.548455238342285, 2.68963623046875, 2.8308169841766357, 2.9719977378845215, 3.1131784915924072, 3.254359245300293, 3.3955399990081787, 3.5367207527160645, 3.6779017448425293, 3.819082498550415, 3.960263252258301, 4.101444244384766, 4.2426252365112305, 4.383805751800537, 4.524986743927002, 4.666167259216309, 4.807348251342773, 4.94852876663208, 5.089709758758545, 5.230890274047852]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 3.0, 5.0, 5.0, 9.0, 11.0, 8.0, 12.0, 16.0, 22.0, 27.0, 24.0, 22.0, 30.0, 35.0, 37.0, 33.0, 31.0, 38.0, 47.0, 41.0, 58.0, 42.0, 42.0, 38.0, 49.0, 35.0, 34.0, 33.0, 33.0, 28.0, 26.0, 18.0, 11.0, 22.0, 12.0, 15.0, 5.0, 10.0, 6.0, 4.0, 8.0, 6.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5043754577636719, -1.4553288221359253, -1.4062821865081787, -1.3572355508804321, -1.3081889152526855, -1.259142279624939, -1.2100956439971924, -1.1610491275787354, -1.1120023727416992, -1.0629557371139526, -1.013909101486206, -0.9648624658584595, -0.9158158302307129, -0.8667691946029663, -0.8177226185798645, -0.7686759829521179, -0.7196294069290161, -0.6705827713012695, -0.621536135673523, -0.5724895000457764, -0.5234428644180298, -0.4743962585926056, -0.4253496527671814, -0.3763030171394348, -0.32725638151168823, -0.27820974588394165, -0.22916312515735626, -0.18011650443077087, -0.1310698688030243, -0.08202323317527771, -0.032976627349853516, 0.016070008277893066, 0.06511664390563965, 0.11416327208280563, 0.16320990025997162, 0.212256520986557, 0.2613031566143036, 0.31034979224205017, 0.35939639806747437, 0.40844303369522095, 0.45748966932296753, 0.5065363049507141, 0.5555829405784607, 0.6046295166015625, 0.6536761522293091, 0.7027227878570557, 0.7517694234848022, 0.8008160591125488, 0.8498626947402954, 0.898909330368042, 0.9479559659957886, 0.9970026016235352, 1.0460492372512817, 1.0950958728790283, 1.1441423892974854, 1.1931891441345215, 1.2422356605529785, 1.291282296180725, 1.3403289318084717, 1.3893755674362183, 1.4384222030639648, 1.4874688386917114, 1.536515474319458, 1.585561990737915, 1.6346087455749512]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 1.0, 11.0, 10.0, 14.0, 23.0, 26.0, 37.0, 65.0, 83.0, 156.0, 215.0, 354.0, 674.0, 1249.0, 2543.0, 5499.0, 14515.0, 51157.0, 692791.0, 3331799.0, 64389.0, 16950.0, 6213.0, 2601.0, 1332.0, 651.0, 357.0, 191.0, 136.0, 81.0, 53.0, 39.0, 23.0, 12.0, 7.0, 11.0, 4.0, 3.0, 2.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.525390625, -0.5108261108398438, -0.4962615966796875, -0.48169708251953125, -0.467132568359375, -0.45256805419921875, -0.4380035400390625, -0.42343902587890625, -0.40887451171875, -0.39430999755859375, -0.3797454833984375, -0.36518096923828125, -0.350616455078125, -0.33605194091796875, -0.3214874267578125, -0.30692291259765625, -0.2923583984375, -0.27779388427734375, -0.2632293701171875, -0.24866485595703125, -0.234100341796875, -0.21953582763671875, -0.2049713134765625, -0.19040679931640625, -0.17584228515625, -0.16127777099609375, -0.1467132568359375, -0.13214874267578125, -0.117584228515625, -0.10301971435546875, -0.0884552001953125, -0.07389068603515625, -0.059326171875, -0.04476165771484375, -0.0301971435546875, -0.01563262939453125, -0.001068115234375, 0.01349639892578125, 0.0280609130859375, 0.04262542724609375, 0.05718994140625, 0.07175445556640625, 0.0863189697265625, 0.10088348388671875, 0.115447998046875, 0.13001251220703125, 0.1445770263671875, 0.15914154052734375, 0.1737060546875, 0.18827056884765625, 0.2028350830078125, 0.21739959716796875, 0.231964111328125, 0.24652862548828125, 0.2610931396484375, 0.27565765380859375, 0.29022216796875, 0.30478668212890625, 0.3193511962890625, 0.33391571044921875, 0.348480224609375, 0.36304473876953125, 0.3776092529296875, 0.39217376708984375, 0.40673828125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 6.0, 3.0, 4.0, 8.0, 14.0, 15.0, 12.0, 13.0, 21.0, 25.0, 25.0, 38.0, 36.0, 38.0, 51.0, 55.0, 44.0, 45.0, 40.0, 56.0, 36.0, 58.0, 39.0, 46.0, 49.0, 38.0, 30.0, 38.0, 23.0, 22.0, 23.0, 13.0, 4.0, 11.0, 13.0, 5.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.08831787109375, -0.08587169647216797, -0.08342552185058594, -0.0809793472290039, -0.07853317260742188, -0.07608699798583984, -0.07364082336425781, -0.07119464874267578, -0.06874847412109375, -0.06630229949951172, -0.06385612487792969, -0.061409950256347656, -0.058963775634765625, -0.056517601013183594, -0.05407142639160156, -0.05162525177001953, -0.0491790771484375, -0.04673290252685547, -0.04428672790527344, -0.041840553283691406, -0.039394378662109375, -0.036948204040527344, -0.03450202941894531, -0.03205585479736328, -0.02960968017578125, -0.02716350555419922, -0.024717330932617188, -0.022271156311035156, -0.019824981689453125, -0.017378807067871094, -0.014932632446289062, -0.012486457824707031, -0.010040283203125, -0.007594108581542969, -0.0051479339599609375, -0.0027017593383789062, -0.000255584716796875, 0.0021905899047851562, 0.0046367645263671875, 0.007082939147949219, 0.00952911376953125, 0.011975288391113281, 0.014421463012695312, 0.016867637634277344, 0.019313812255859375, 0.021759986877441406, 0.024206161499023438, 0.02665233612060547, 0.0290985107421875, 0.03154468536376953, 0.03399085998535156, 0.036437034606933594, 0.038883209228515625, 0.041329383850097656, 0.04377555847167969, 0.04622173309326172, 0.04866790771484375, 0.05111408233642578, 0.05356025695800781, 0.056006431579589844, 0.058452606201171875, 0.060898780822753906, 0.06334495544433594, 0.06579113006591797, 0.0682373046875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 14.0, 20.0, 23.0, 28.0, 48.0, 62.0, 76.0, 121.0, 200.0, 286.0, 448.0, 639.0, 972.0, 1637.0, 2577.0, 4430.0, 8439.0, 18132.0, 48368.0, 219672.0, 3604008.0, 200659.0, 46226.0, 17715.0, 8248.0, 4358.0, 2551.0, 1518.0, 966.0, 551.0, 400.0, 288.0, 170.0, 125.0, 93.0, 73.0, 45.0, 39.0, 22.0, 14.0, 8.0, 8.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44970703125, -0.4349517822265625, -0.420196533203125, -0.4054412841796875, -0.39068603515625, -0.3759307861328125, -0.361175537109375, -0.3464202880859375, -0.3316650390625, -0.3169097900390625, -0.302154541015625, -0.2873992919921875, -0.27264404296875, -0.2578887939453125, -0.243133544921875, -0.2283782958984375, -0.213623046875, -0.1988677978515625, -0.184112548828125, -0.1693572998046875, -0.15460205078125, -0.1398468017578125, -0.125091552734375, -0.1103363037109375, -0.0955810546875, -0.0808258056640625, -0.066070556640625, -0.0513153076171875, -0.03656005859375, -0.0218048095703125, -0.007049560546875, 0.0077056884765625, 0.0224609375, 0.0372161865234375, 0.051971435546875, 0.0667266845703125, 0.08148193359375, 0.0962371826171875, 0.110992431640625, 0.1257476806640625, 0.1405029296875, 0.1552581787109375, 0.170013427734375, 0.1847686767578125, 0.19952392578125, 0.2142791748046875, 0.229034423828125, 0.2437896728515625, 0.258544921875, 0.2733001708984375, 0.288055419921875, 0.3028106689453125, 0.31756591796875, 0.3323211669921875, 0.347076416015625, 0.3618316650390625, 0.3765869140625, 0.3913421630859375, 0.406097412109375, 0.4208526611328125, 0.43560791015625, 0.4503631591796875, 0.465118408203125, 0.4798736572265625, 0.49462890625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 2.0, 3.0, 5.0, 1.0, 4.0, 3.0, 9.0, 10.0, 9.0, 12.0, 22.0, 30.0, 33.0, 61.0, 108.0, 304.0, 2340.0, 643.0, 196.0, 96.0, 55.0, 37.0, 23.0, 15.0, 14.0, 12.0, 8.0, 2.0, 3.0, 4.0, 7.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2193603515625, -0.21198463439941406, -0.20460891723632812, -0.1972332000732422, -0.18985748291015625, -0.1824817657470703, -0.17510604858398438, -0.16773033142089844, -0.1603546142578125, -0.15297889709472656, -0.14560317993164062, -0.1382274627685547, -0.13085174560546875, -0.12347602844238281, -0.11610031127929688, -0.10872459411621094, -0.101348876953125, -0.09397315979003906, -0.08659744262695312, -0.07922172546386719, -0.07184600830078125, -0.06447029113769531, -0.057094573974609375, -0.04971885681152344, -0.0423431396484375, -0.03496742248535156, -0.027591705322265625, -0.020215988159179688, -0.01284027099609375, -0.0054645538330078125, 0.001911163330078125, 0.009286880493164062, 0.01666259765625, 0.024038314819335938, 0.031414031982421875, 0.03878974914550781, 0.04616546630859375, 0.05354118347167969, 0.060916900634765625, 0.06829261779785156, 0.0756683349609375, 0.08304405212402344, 0.09041976928710938, 0.09779548645019531, 0.10517120361328125, 0.11254692077636719, 0.11992263793945312, 0.12729835510253906, 0.134674072265625, 0.14204978942871094, 0.14942550659179688, 0.1568012237548828, 0.16417694091796875, 0.1715526580810547, 0.17892837524414062, 0.18630409240722656, 0.1936798095703125, 0.20105552673339844, 0.20843124389648438, 0.2158069610595703, 0.22318267822265625, 0.2305583953857422, 0.23793411254882812, 0.24530982971191406, 0.252685546875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 6.0, 10.0, 21.0, 41.0, 69.0, 87.0, 124.0, 144.0, 156.0, 110.0, 86.0, 62.0, 34.0, 25.0, 14.0, 5.0, 1.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8972572684288025, -0.8539426922798157, -0.8106281757354736, -0.7673135995864868, -0.7239990234375, -0.6806844472885132, -0.6373698711395264, -0.5940553545951843, -0.5507407784461975, -0.5074262022972107, -0.46411165595054626, -0.42079710960388184, -0.377482533454895, -0.3341679573059082, -0.2908534109592438, -0.24753886461257935, -0.20422428846359253, -0.1609097272157669, -0.11759516596794128, -0.07428060472011566, -0.03096604347229004, 0.012348517775535583, 0.055663079023361206, 0.09897762537002563, 0.14229220151901245, 0.18560676276683807, 0.2289213240146637, 0.2722358703613281, 0.31555044651031494, 0.35886502265930176, 0.4021795690059662, 0.4454941153526306, 0.48880863189697266, 0.5321232080459595, 0.5754377841949463, 0.6187523007392883, 0.6620668768882751, 0.705381453037262, 0.748695969581604, 0.7920105457305908, 0.8353251218795776, 0.8786396980285645, 0.9219542741775513, 0.9652687907218933, 1.0085833072662354, 1.0518978834152222, 1.095212459564209, 1.1385270357131958, 1.1818416118621826, 1.2251561880111694, 1.2684707641601562, 1.311785340309143, 1.3550999164581299, 1.3984143733978271, 1.441728949546814, 1.4850435256958008, 1.5283581018447876, 1.5716726779937744, 1.6149872541427612, 1.658301830291748, 1.7016162872314453, 1.7449308633804321, 1.788245439529419, 1.8315600156784058, 1.8748745918273926]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 7.0, 9.0, 11.0, 11.0, 11.0, 12.0, 10.0, 16.0, 20.0, 11.0, 25.0, 21.0, 30.0, 33.0, 27.0, 30.0, 53.0, 39.0, 40.0, 39.0, 45.0, 48.0, 32.0, 35.0, 33.0, 35.0, 35.0, 36.0, 19.0, 27.0, 26.0, 30.0, 17.0, 19.0, 23.0, 16.0, 13.0, 16.0, 10.0, 5.0, 8.0, 4.0, 2.0, 7.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.5524599552154541, -0.5349141359329224, -0.5173683166503906, -0.4998224973678589, -0.48227664828300476, -0.464730829000473, -0.4471850097179413, -0.42963919043540955, -0.4120933413505554, -0.3945475220680237, -0.37700170278549194, -0.3594558835029602, -0.3419100344181061, -0.32436421513557434, -0.3068183958530426, -0.28927257657051086, -0.2717267572879791, -0.2541809380054474, -0.23663510382175446, -0.21908928453922272, -0.20154345035552979, -0.18399763107299805, -0.1664518117904663, -0.14890599250793457, -0.13136015832424164, -0.1138143315911293, -0.09626850485801697, -0.07872268557548523, -0.061176858842372894, -0.04363103210926056, -0.02608521282672882, -0.008539386093616486, 0.00900644063949585, 0.026552265509963036, 0.04409809038043022, 0.06164391338825226, 0.0791897401213646, 0.09673556685447693, 0.11428138613700867, 0.1318272054195404, 0.14937303960323334, 0.16691885888576508, 0.184464693069458, 0.20201051235198975, 0.21955633163452148, 0.23710216581821442, 0.25464797019958496, 0.2721938192844391, 0.2897396385669708, 0.30728545784950256, 0.3248312771320343, 0.3423771262168884, 0.35992294549942017, 0.3774687647819519, 0.39501458406448364, 0.4125604033470154, 0.4301062226295471, 0.44765204191207886, 0.4651978611946106, 0.48274368047714233, 0.5002894997596741, 0.5178353786468506, 0.5353811979293823, 0.5529270172119141, 0.5704728364944458]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 6.0, 4.0, 4.0, 2.0, 7.0, 6.0, 14.0, 24.0, 19.0, 46.0, 49.0, 93.0, 91.0, 185.0, 257.0, 436.0, 651.0, 1039.0, 1705.0, 2930.0, 4793.0, 8325.0, 14451.0, 25542.0, 46654.0, 88678.0, 190621.0, 312192.0, 169476.0, 80725.0, 43242.0, 23781.0, 13584.0, 7601.0, 4408.0, 2596.0, 1556.0, 973.0, 647.0, 372.0, 269.0, 164.0, 103.0, 80.0, 43.0, 46.0, 22.0, 18.0, 10.0, 9.0, 3.0, 6.0, 3.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1846923828125, -0.17862319946289062, -0.17255401611328125, -0.16648483276367188, -0.1604156494140625, -0.15434646606445312, -0.14827728271484375, -0.14220809936523438, -0.136138916015625, -0.13006973266601562, -0.12400054931640625, -0.11793136596679688, -0.1118621826171875, -0.10579299926757812, -0.09972381591796875, -0.09365463256835938, -0.08758544921875, -0.08151626586914062, -0.07544708251953125, -0.06937789916992188, -0.0633087158203125, -0.057239532470703125, -0.05117034912109375, -0.045101165771484375, -0.039031982421875, -0.032962799072265625, -0.02689361572265625, -0.020824432373046875, -0.0147552490234375, -0.008686065673828125, -0.00261688232421875, 0.003452301025390625, 0.009521484375, 0.015590667724609375, 0.02165985107421875, 0.027729034423828125, 0.0337982177734375, 0.039867401123046875, 0.04593658447265625, 0.052005767822265625, 0.058074951171875, 0.06414413452148438, 0.07021331787109375, 0.07628250122070312, 0.0823516845703125, 0.08842086791992188, 0.09449005126953125, 0.10055923461914062, 0.10662841796875, 0.11269760131835938, 0.11876678466796875, 0.12483596801757812, 0.1309051513671875, 0.13697433471679688, 0.14304351806640625, 0.14911270141601562, 0.155181884765625, 0.16125106811523438, 0.16732025146484375, 0.17338943481445312, 0.1794586181640625, 0.18552780151367188, 0.19159698486328125, 0.19766616821289062, 0.2037353515625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 6.0, 9.0, 7.0, 8.0, 9.0, 15.0, 10.0, 18.0, 19.0, 24.0, 24.0, 18.0, 36.0, 29.0, 33.0, 50.0, 52.0, 40.0, 51.0, 37.0, 31.0, 41.0, 44.0, 33.0, 40.0, 41.0, 50.0, 38.0, 31.0, 22.0, 27.0, 21.0, 18.0, 22.0, 9.0, 9.0, 11.0, 7.0, 5.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0819091796875, -0.07945442199707031, -0.07699966430664062, -0.07454490661621094, -0.07209014892578125, -0.06963539123535156, -0.06718063354492188, -0.06472587585449219, -0.0622711181640625, -0.05981636047363281, -0.057361602783203125, -0.05490684509277344, -0.05245208740234375, -0.04999732971191406, -0.047542572021484375, -0.04508781433105469, -0.042633056640625, -0.04017829895019531, -0.037723541259765625, -0.03526878356933594, -0.03281402587890625, -0.030359268188476562, -0.027904510498046875, -0.025449752807617188, -0.0229949951171875, -0.020540237426757812, -0.018085479736328125, -0.015630722045898438, -0.01317596435546875, -0.010721206665039062, -0.008266448974609375, -0.0058116912841796875, -0.00335693359375, -0.0009021759033203125, 0.001552581787109375, 0.0040073394775390625, 0.00646209716796875, 0.008916854858398438, 0.011371612548828125, 0.013826370239257812, 0.0162811279296875, 0.018735885620117188, 0.021190643310546875, 0.023645401000976562, 0.02610015869140625, 0.028554916381835938, 0.031009674072265625, 0.03346443176269531, 0.035919189453125, 0.03837394714355469, 0.040828704833984375, 0.04328346252441406, 0.04573822021484375, 0.04819297790527344, 0.050647735595703125, 0.05310249328613281, 0.0555572509765625, 0.05801200866699219, 0.060466766357421875, 0.06292152404785156, 0.06537628173828125, 0.06783103942871094, 0.07028579711914062, 0.07274055480957031, 0.0751953125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 9.0, 3.0, 9.0, 23.0, 16.0, 29.0, 28.0, 39.0, 59.0, 97.0, 161.0, 215.0, 307.0, 489.0, 837.0, 1556.0, 3521.0, 8939.0, 26640.0, 89165.0, 437279.0, 361724.0, 78566.0, 23545.0, 8218.0, 3346.0, 1545.0, 766.0, 471.0, 291.0, 181.0, 138.0, 94.0, 86.0, 36.0, 32.0, 28.0, 17.0, 15.0, 10.0, 4.0, 7.0, 4.0, 5.0, 1.0, 1.0, 0.0, 3.0, 3.0], "bins": [-0.455322265625, -0.442657470703125, -0.42999267578125, -0.417327880859375, -0.4046630859375, -0.391998291015625, -0.37933349609375, -0.366668701171875, -0.35400390625, -0.341339111328125, -0.32867431640625, -0.316009521484375, -0.3033447265625, -0.290679931640625, -0.27801513671875, -0.265350341796875, -0.252685546875, -0.240020751953125, -0.22735595703125, -0.214691162109375, -0.2020263671875, -0.189361572265625, -0.17669677734375, -0.164031982421875, -0.1513671875, -0.138702392578125, -0.12603759765625, -0.113372802734375, -0.1007080078125, -0.088043212890625, -0.07537841796875, -0.062713623046875, -0.050048828125, -0.037384033203125, -0.02471923828125, -0.012054443359375, 0.0006103515625, 0.013275146484375, 0.02593994140625, 0.038604736328125, 0.05126953125, 0.063934326171875, 0.07659912109375, 0.089263916015625, 0.1019287109375, 0.114593505859375, 0.12725830078125, 0.139923095703125, 0.152587890625, 0.165252685546875, 0.17791748046875, 0.190582275390625, 0.2032470703125, 0.215911865234375, 0.22857666015625, 0.241241455078125, 0.25390625, 0.266571044921875, 0.27923583984375, 0.291900634765625, 0.3045654296875, 0.317230224609375, 0.32989501953125, 0.342559814453125, 0.355224609375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 5.0, 7.0, 10.0, 5.0, 18.0, 10.0, 16.0, 20.0, 22.0, 31.0, 27.0, 39.0, 44.0, 34.0, 49.0, 55.0, 50.0, 58.0, 49.0, 41.0, 45.0, 41.0, 48.0, 39.0, 37.0, 31.0, 25.0, 24.0, 26.0, 24.0, 16.0, 10.0, 11.0, 4.0, 9.0, 9.0, 3.0, 5.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.379638671875, -0.3658714294433594, -0.35210418701171875, -0.3383369445800781, -0.3245697021484375, -0.3108024597167969, -0.29703521728515625, -0.2832679748535156, -0.269500732421875, -0.2557334899902344, -0.24196624755859375, -0.22819900512695312, -0.2144317626953125, -0.20066452026367188, -0.18689727783203125, -0.17313003540039062, -0.15936279296875, -0.14559555053710938, -0.13182830810546875, -0.11806106567382812, -0.1042938232421875, -0.09052658081054688, -0.07675933837890625, -0.06299209594726562, -0.049224853515625, -0.035457611083984375, -0.02169036865234375, -0.007923126220703125, 0.0058441162109375, 0.019611358642578125, 0.03337860107421875, 0.047145843505859375, 0.0609130859375, 0.07468032836914062, 0.08844757080078125, 0.10221481323242188, 0.1159820556640625, 0.12974929809570312, 0.14351654052734375, 0.15728378295898438, 0.171051025390625, 0.18481826782226562, 0.19858551025390625, 0.21235275268554688, 0.2261199951171875, 0.23988723754882812, 0.25365447998046875, 0.2674217224121094, 0.28118896484375, 0.2949562072753906, 0.30872344970703125, 0.3224906921386719, 0.3362579345703125, 0.3500251770019531, 0.36379241943359375, 0.3775596618652344, 0.391326904296875, 0.4050941467285156, 0.41886138916015625, 0.4326286315917969, 0.4463958740234375, 0.4601631164550781, 0.47393035888671875, 0.4876976013183594, 0.50146484375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 11.0, 9.0, 16.0, 21.0, 27.0, 48.0, 61.0, 80.0, 147.0, 221.0, 275.0, 453.0, 858.0, 1643.0, 3606.0, 10581.0, 43776.0, 343158.0, 564245.0, 57702.0, 13039.0, 4306.0, 1844.0, 878.0, 561.0, 340.0, 199.0, 138.0, 111.0, 66.0, 45.0, 22.0, 25.0, 17.0, 7.0, 12.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.302490234375, -0.29132080078125, -0.2801513671875, -0.26898193359375, -0.2578125, -0.24664306640625, -0.2354736328125, -0.22430419921875, -0.213134765625, -0.20196533203125, -0.1907958984375, -0.17962646484375, -0.16845703125, -0.15728759765625, -0.1461181640625, -0.13494873046875, -0.123779296875, -0.11260986328125, -0.1014404296875, -0.09027099609375, -0.0791015625, -0.06793212890625, -0.0567626953125, -0.04559326171875, -0.034423828125, -0.02325439453125, -0.0120849609375, -0.00091552734375, 0.01025390625, 0.02142333984375, 0.0325927734375, 0.04376220703125, 0.054931640625, 0.06610107421875, 0.0772705078125, 0.08843994140625, 0.099609375, 0.11077880859375, 0.1219482421875, 0.13311767578125, 0.144287109375, 0.15545654296875, 0.1666259765625, 0.17779541015625, 0.18896484375, 0.20013427734375, 0.2113037109375, 0.22247314453125, 0.233642578125, 0.24481201171875, 0.2559814453125, 0.26715087890625, 0.2783203125, 0.28948974609375, 0.3006591796875, 0.31182861328125, 0.322998046875, 0.33416748046875, 0.3453369140625, 0.35650634765625, 0.36767578125, 0.37884521484375, 0.3900146484375, 0.40118408203125, 0.412353515625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 5.0, 6.0, 8.0, 13.0, 27.0, 41.0, 55.0, 98.0, 150.0, 243.0, 150.0, 89.0, 49.0, 31.0, 17.0, 5.0, 6.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014066696166992188, -0.00013689789921045303, -0.0001331288367509842, -0.00012935977429151535, -0.0001255907118320465, -0.00012182164937257767, -0.00011805258691310883, -0.00011428352445363998, -0.00011051446199417114, -0.0001067453995347023, -0.00010297633707523346, -9.920727461576462e-05, -9.543821215629578e-05, -9.166914969682693e-05, -8.79000872373581e-05, -8.413102477788925e-05, -8.036196231842041e-05, -7.659289985895157e-05, -7.282383739948273e-05, -6.905477494001389e-05, -6.528571248054504e-05, -6.15166500210762e-05, -5.774758756160736e-05, -5.397852510213852e-05, -5.020946264266968e-05, -4.6440400183200836e-05, -4.2671337723731995e-05, -3.890227526426315e-05, -3.513321280479431e-05, -3.136415034532547e-05, -2.759508788585663e-05, -2.3826025426387787e-05, -2.0056962966918945e-05, -1.6287900507450104e-05, -1.2518838047981262e-05, -8.74977558851242e-06, -4.980713129043579e-06, -1.2116506695747375e-06, 2.557411789894104e-06, 6.3264742493629456e-06, 1.0095536708831787e-05, 1.3864599168300629e-05, 1.763366162776947e-05, 2.1402724087238312e-05, 2.5171786546707153e-05, 2.8940849006175995e-05, 3.2709911465644836e-05, 3.647897392511368e-05, 4.024803638458252e-05, 4.401709884405136e-05, 4.77861613035202e-05, 5.1555223762989044e-05, 5.5324286222457886e-05, 5.909334868192673e-05, 6.286241114139557e-05, 6.663147360086441e-05, 7.040053606033325e-05, 7.41695985198021e-05, 7.793866097927094e-05, 8.170772343873978e-05, 8.547678589820862e-05, 8.924584835767746e-05, 9.30149108171463e-05, 9.678397327661514e-05, 0.00010055303573608398]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 1.0, 8.0, 4.0, 4.0, 8.0, 8.0, 10.0, 15.0, 29.0, 46.0, 63.0, 117.0, 209.0, 349.0, 626.0, 1273.0, 2605.0, 6917.0, 23644.0, 130796.0, 714788.0, 130835.0, 23705.0, 7060.0, 2647.0, 1220.0, 664.0, 378.0, 190.0, 129.0, 77.0, 45.0, 25.0, 15.0, 14.0, 11.0, 6.0, 2.0, 4.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.377197265625, -0.36483001708984375, -0.3524627685546875, -0.34009552001953125, -0.327728271484375, -0.31536102294921875, -0.3029937744140625, -0.29062652587890625, -0.27825927734375, -0.26589202880859375, -0.2535247802734375, -0.24115753173828125, -0.228790283203125, -0.21642303466796875, -0.2040557861328125, -0.19168853759765625, -0.1793212890625, -0.16695404052734375, -0.1545867919921875, -0.14221954345703125, -0.129852294921875, -0.11748504638671875, -0.1051177978515625, -0.09275054931640625, -0.08038330078125, -0.06801605224609375, -0.0556488037109375, -0.04328155517578125, -0.030914306640625, -0.01854705810546875, -0.0061798095703125, 0.00618743896484375, 0.0185546875, 0.03092193603515625, 0.0432891845703125, 0.05565643310546875, 0.068023681640625, 0.08039093017578125, 0.0927581787109375, 0.10512542724609375, 0.11749267578125, 0.12985992431640625, 0.1422271728515625, 0.15459442138671875, 0.166961669921875, 0.17932891845703125, 0.1916961669921875, 0.20406341552734375, 0.2164306640625, 0.22879791259765625, 0.2411651611328125, 0.25353240966796875, 0.265899658203125, 0.27826690673828125, 0.2906341552734375, 0.30300140380859375, 0.31536865234375, 0.32773590087890625, 0.3401031494140625, 0.35247039794921875, 0.364837646484375, 0.37720489501953125, 0.3895721435546875, 0.40193939208984375, 0.414306640625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 5.0, 7.0, 11.0, 4.0, 20.0, 10.0, 25.0, 32.0, 44.0, 61.0, 88.0, 131.0, 137.0, 122.0, 77.0, 59.0, 43.0, 37.0, 25.0, 12.0, 14.0, 7.0, 7.0, 7.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25390625, -0.24465560913085938, -0.23540496826171875, -0.22615432739257812, -0.2169036865234375, -0.20765304565429688, -0.19840240478515625, -0.18915176391601562, -0.179901123046875, -0.17065048217773438, -0.16139984130859375, -0.15214920043945312, -0.1428985595703125, -0.13364791870117188, -0.12439727783203125, -0.11514663696289062, -0.10589599609375, -0.09664535522460938, -0.08739471435546875, -0.07814407348632812, -0.0688934326171875, -0.059642791748046875, -0.05039215087890625, -0.041141510009765625, -0.031890869140625, -0.022640228271484375, -0.01338958740234375, -0.004138946533203125, 0.0051116943359375, 0.014362335205078125, 0.02361297607421875, 0.032863616943359375, 0.0421142578125, 0.051364898681640625, 0.06061553955078125, 0.06986618041992188, 0.0791168212890625, 0.08836746215820312, 0.09761810302734375, 0.10686874389648438, 0.116119384765625, 0.12537002563476562, 0.13462066650390625, 0.14387130737304688, 0.1531219482421875, 0.16237258911132812, 0.17162322998046875, 0.18087387084960938, 0.19012451171875, 0.19937515258789062, 0.20862579345703125, 0.21787643432617188, 0.2271270751953125, 0.23637771606445312, 0.24562835693359375, 0.2548789978027344, 0.264129638671875, 0.2733802795410156, 0.28263092041015625, 0.2918815612792969, 0.3011322021484375, 0.3103828430175781, 0.31963348388671875, 0.3288841247558594, 0.338134765625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 7.0, 13.0, 84.0, 165.0, 313.0, 268.0, 105.0, 37.0, 8.0, 5.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7446107864379883, -3.470951795578003, -3.1972928047180176, -2.9236338138580322, -2.649974822998047, -2.3763158321380615, -2.102656841278076, -1.8289978504180908, -1.5553388595581055, -1.2816798686981201, -1.0080208778381348, -0.7343618869781494, -0.46070289611816406, -0.1870439052581787, 0.08661508560180664, 0.360274076461792, 0.6339330673217773, 0.9075920581817627, 1.181251049041748, 1.4549100399017334, 1.7285690307617188, 2.002228021621704, 2.2758870124816895, 2.549546003341675, 2.82320499420166, 3.0968639850616455, 3.370522975921631, 3.644181966781616, 3.9178409576416016, 4.191499710083008, 4.465158939361572, 4.738818168640137, 5.012475967407227, 5.286134719848633, 5.559793949127197, 5.833453178405762, 6.107111930847168, 6.380770683288574, 6.654429912567139, 6.928089141845703, 7.201747894287109, 7.475406646728516, 7.74906587600708, 8.022725105285645, 8.29638385772705, 8.570042610168457, 8.84370231628418, 9.117361068725586, 9.391019821166992, 9.664678573608398, 9.938337326049805, 10.211997032165527, 10.485655784606934, 10.75931453704834, 11.032974243164062, 11.306632995605469, 11.580291748046875, 11.853950500488281, 12.127609252929688, 12.40126895904541, 12.674927711486816, 12.948586463928223, 13.222246170043945, 13.495904922485352, 13.769563674926758]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 1.0, 6.0, 4.0, 4.0, 7.0, 12.0, 9.0, 9.0, 20.0, 15.0, 16.0, 17.0, 27.0, 32.0, 31.0, 36.0, 50.0, 47.0, 50.0, 49.0, 40.0, 51.0, 35.0, 39.0, 31.0, 45.0, 33.0, 37.0, 40.0, 29.0, 37.0, 26.0, 22.0, 21.0, 18.0, 20.0, 9.0, 5.0, 7.0, 4.0, 3.0, 6.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.277494430541992, -2.2030272483825684, -2.1285598278045654, -2.0540926456451416, -1.9796253442764282, -1.9051580429077148, -1.830690860748291, -1.7562235593795776, -1.6817562580108643, -1.6072889566421509, -1.532821774482727, -1.4583544731140137, -1.3838871717453003, -1.309419870376587, -1.234952688217163, -1.1604853868484497, -1.0860182046890259, -1.0115509033203125, -0.9370836615562439, -0.8626164197921753, -0.7881491184234619, -0.7136818766593933, -0.6392146348953247, -0.5647473335266113, -0.4902800917625427, -0.41581282019615173, -0.34134554862976074, -0.26687830686569214, -0.19241103529930115, -0.11794376373291016, -0.04347652196884155, 0.030990779399871826, 0.10545802116394043, 0.17992529273033142, 0.2543925642967224, 0.328859806060791, 0.403327077627182, 0.477794349193573, 0.5522615909576416, 0.626728892326355, 0.7011961340904236, 0.7756633758544922, 0.8501306772232056, 0.9245979189872742, 0.9990651607513428, 1.0735324621200562, 1.1479997634887695, 1.2224669456481934, 1.2969342470169067, 1.3714015483856201, 1.445868730545044, 1.5203360319137573, 1.5948033332824707, 1.6692705154418945, 1.743737816810608, 1.8182051181793213, 1.8926723003387451, 1.9671396017074585, 2.041606903076172, 2.1160740852355957, 2.1905412673950195, 2.2650086879730225, 2.3394758701324463, 2.413943290710449, 2.488410472869873]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 6.0, 8.0, 9.0, 6.0, 14.0, 14.0, 20.0, 29.0, 38.0, 52.0, 92.0, 106.0, 181.0, 213.0, 310.0, 424.0, 680.0, 1043.0, 1646.0, 2768.0, 4803.0, 9031.0, 19490.0, 52281.0, 239593.0, 3558583.0, 212822.0, 50300.0, 19098.0, 8816.0, 4683.0, 2631.0, 1512.0, 983.0, 686.0, 442.0, 285.0, 172.0, 132.0, 77.0, 59.0, 50.0, 34.0, 25.0, 13.0, 12.0, 7.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.40283203125, -0.3914756774902344, -0.38011932373046875, -0.3687629699707031, -0.3574066162109375, -0.3460502624511719, -0.33469390869140625, -0.3233375549316406, -0.311981201171875, -0.3006248474121094, -0.28926849365234375, -0.2779121398925781, -0.2665557861328125, -0.2551994323730469, -0.24384307861328125, -0.23248672485351562, -0.22113037109375, -0.20977401733398438, -0.19841766357421875, -0.18706130981445312, -0.1757049560546875, -0.16434860229492188, -0.15299224853515625, -0.14163589477539062, -0.130279541015625, -0.11892318725585938, -0.10756683349609375, -0.09621047973632812, -0.0848541259765625, -0.07349777221679688, -0.06214141845703125, -0.050785064697265625, -0.0394287109375, -0.028072357177734375, -0.01671600341796875, -0.005359649658203125, 0.0059967041015625, 0.017353057861328125, 0.02870941162109375, 0.040065765380859375, 0.051422119140625, 0.06277847290039062, 0.07413482666015625, 0.08549118041992188, 0.0968475341796875, 0.10820388793945312, 0.11956024169921875, 0.13091659545898438, 0.14227294921875, 0.15362930297851562, 0.16498565673828125, 0.17634201049804688, 0.1876983642578125, 0.19905471801757812, 0.21041107177734375, 0.22176742553710938, 0.233123779296875, 0.24448013305664062, 0.25583648681640625, 0.2671928405761719, 0.2785491943359375, 0.2899055480957031, 0.30126190185546875, 0.3126182556152344, 0.323974609375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 5.0, 3.0, 1.0, 4.0, 4.0, 6.0, 5.0, 5.0, 9.0, 8.0, 7.0, 19.0, 19.0, 13.0, 28.0, 19.0, 24.0, 29.0, 44.0, 32.0, 37.0, 39.0, 39.0, 46.0, 35.0, 39.0, 48.0, 30.0, 30.0, 40.0, 35.0, 41.0, 38.0, 41.0, 26.0, 18.0, 24.0, 15.0, 25.0, 14.0, 7.0, 13.0, 8.0, 10.0, 10.0, 3.0, 3.0, 4.0, 5.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.08551025390625, -0.08304214477539062, -0.08057403564453125, -0.07810592651367188, -0.0756378173828125, -0.07316970825195312, -0.07070159912109375, -0.06823348999023438, -0.065765380859375, -0.06329727172851562, -0.06082916259765625, -0.058361053466796875, -0.0558929443359375, -0.053424835205078125, -0.05095672607421875, -0.048488616943359375, -0.0460205078125, -0.043552398681640625, -0.04108428955078125, -0.038616180419921875, -0.0361480712890625, -0.033679962158203125, -0.03121185302734375, -0.028743743896484375, -0.026275634765625, -0.023807525634765625, -0.02133941650390625, -0.018871307373046875, -0.0164031982421875, -0.013935089111328125, -0.01146697998046875, -0.008998870849609375, -0.00653076171875, -0.004062652587890625, -0.00159454345703125, 0.000873565673828125, 0.0033416748046875, 0.005809783935546875, 0.00827789306640625, 0.010746002197265625, 0.013214111328125, 0.015682220458984375, 0.01815032958984375, 0.020618438720703125, 0.0230865478515625, 0.025554656982421875, 0.02802276611328125, 0.030490875244140625, 0.032958984375, 0.035427093505859375, 0.03789520263671875, 0.040363311767578125, 0.0428314208984375, 0.045299530029296875, 0.04776763916015625, 0.050235748291015625, 0.052703857421875, 0.055171966552734375, 0.05764007568359375, 0.060108184814453125, 0.0625762939453125, 0.06504440307617188, 0.06751251220703125, 0.06998062133789062, 0.07244873046875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 8.0, 1.0, 8.0, 2.0, 8.0, 11.0, 12.0, 20.0, 21.0, 37.0, 33.0, 47.0, 74.0, 120.0, 168.0, 267.0, 465.0, 622.0, 1116.0, 2008.0, 3811.0, 8433.0, 22410.0, 86781.0, 2497476.0, 1450241.0, 81340.0, 21879.0, 8166.0, 3832.0, 1854.0, 1089.0, 719.0, 412.0, 261.0, 156.0, 110.0, 80.0, 54.0, 42.0, 17.0, 17.0, 17.0, 14.0, 10.0, 6.0, 2.0, 5.0, 3.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.677734375, -0.6551284790039062, -0.6325225830078125, -0.6099166870117188, -0.587310791015625, -0.5647048950195312, -0.5420989990234375, -0.5194931030273438, -0.49688720703125, -0.47428131103515625, -0.4516754150390625, -0.42906951904296875, -0.406463623046875, -0.38385772705078125, -0.3612518310546875, -0.33864593505859375, -0.3160400390625, -0.29343414306640625, -0.2708282470703125, -0.24822235107421875, -0.225616455078125, -0.20301055908203125, -0.1804046630859375, -0.15779876708984375, -0.13519287109375, -0.11258697509765625, -0.0899810791015625, -0.06737518310546875, -0.044769287109375, -0.02216339111328125, 0.0004425048828125, 0.02304840087890625, 0.045654296875, 0.06826019287109375, 0.0908660888671875, 0.11347198486328125, 0.136077880859375, 0.15868377685546875, 0.1812896728515625, 0.20389556884765625, 0.22650146484375, 0.24910736083984375, 0.2717132568359375, 0.29431915283203125, 0.316925048828125, 0.33953094482421875, 0.3621368408203125, 0.38474273681640625, 0.4073486328125, 0.42995452880859375, 0.4525604248046875, 0.47516632080078125, 0.497772216796875, 0.5203781127929688, 0.5429840087890625, 0.5655899047851562, 0.58819580078125, 0.6108016967773438, 0.6334075927734375, 0.6560134887695312, 0.678619384765625, 0.7012252807617188, 0.7238311767578125, 0.7464370727539062, 0.76904296875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 1.0, 3.0, 5.0, 7.0, 11.0, 21.0, 27.0, 43.0, 73.0, 134.0, 356.0, 2337.0, 658.0, 168.0, 98.0, 47.0, 23.0, 23.0, 10.0, 7.0, 6.0, 5.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4443359375, -0.4303131103515625, -0.416290283203125, -0.4022674560546875, -0.38824462890625, -0.3742218017578125, -0.360198974609375, -0.3461761474609375, -0.3321533203125, -0.3181304931640625, -0.304107666015625, -0.2900848388671875, -0.27606201171875, -0.2620391845703125, -0.248016357421875, -0.2339935302734375, -0.219970703125, -0.2059478759765625, -0.191925048828125, -0.1779022216796875, -0.16387939453125, -0.1498565673828125, -0.135833740234375, -0.1218109130859375, -0.1077880859375, -0.0937652587890625, -0.079742431640625, -0.0657196044921875, -0.05169677734375, -0.0376739501953125, -0.023651123046875, -0.0096282958984375, 0.00439453125, 0.0184173583984375, 0.032440185546875, 0.0464630126953125, 0.06048583984375, 0.0745086669921875, 0.088531494140625, 0.1025543212890625, 0.1165771484375, 0.1305999755859375, 0.144622802734375, 0.1586456298828125, 0.17266845703125, 0.1866912841796875, 0.200714111328125, 0.2147369384765625, 0.228759765625, 0.2427825927734375, 0.256805419921875, 0.2708282470703125, 0.28485107421875, 0.2988739013671875, 0.312896728515625, 0.3269195556640625, 0.3409423828125, 0.3549652099609375, 0.368988037109375, 0.3830108642578125, 0.39703369140625, 0.4110565185546875, 0.425079345703125, 0.4391021728515625, 0.453125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 10.0, 6.0, 11.0, 33.0, 45.0, 64.0, 121.0, 162.0, 165.0, 154.0, 107.0, 49.0, 33.0, 21.0, 13.0, 4.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.4327988624572754, -3.3454413414001465, -3.2580835819244385, -3.1707260608673096, -3.0833685398101807, -2.9960107803344727, -2.9086532592773438, -2.821295738220215, -2.733938217163086, -2.646580696105957, -2.559222936630249, -2.47186541557312, -2.384507894515991, -2.297150135040283, -2.2097926139831543, -2.1224350929260254, -2.0350773334503174, -1.947719693183899, -1.86036217212677, -1.7730045318603516, -1.6856470108032227, -1.5982893705368042, -1.5109317302703857, -1.4235742092132568, -1.3362165689468384, -1.24885892868042, -1.161501407623291, -1.0741437673568726, -0.9867861866950989, -0.8994286060333252, -0.8120709657669067, -0.7247133851051331, -0.6373560428619385, -0.5499984622001648, -0.4626408517360687, -0.37528324127197266, -0.287925660610199, -0.2005680799484253, -0.11321043968200684, -0.025852859020233154, 0.06150472164154053, 0.1488623172044754, 0.23621991276741028, 0.32357752323150635, 0.41093510389328003, 0.4982926845550537, 0.5856503248214722, 0.6730079054832458, 0.7603654861450195, 0.8477230668067932, 0.9350806474685669, 1.0224382877349854, 1.1097958087921143, 1.1971534490585327, 1.2845110893249512, 1.37186861038208, 1.4592262506484985, 1.546583890914917, 1.633941411972046, 1.7212990522384644, 1.8086566925048828, 1.8960142135620117, 1.9833718538284302, 2.0707294940948486, 2.1580870151519775]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 4.0, 5.0, 9.0, 5.0, 9.0, 8.0, 9.0, 14.0, 15.0, 9.0, 23.0, 23.0, 26.0, 29.0, 35.0, 33.0, 43.0, 40.0, 54.0, 47.0, 34.0, 37.0, 44.0, 45.0, 38.0, 26.0, 46.0, 45.0, 45.0, 25.0, 26.0, 30.0, 26.0, 16.0, 20.0, 7.0, 8.0, 14.0, 11.0, 5.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.1031018495559692, -1.0700597763061523, -1.037017822265625, -1.0039758682250977, -0.9709337949752808, -0.9378917813301086, -0.9048497676849365, -0.8718077540397644, -0.8387657403945923, -0.8057237267494202, -0.772681713104248, -0.7396396994590759, -0.7065976858139038, -0.6735556721687317, -0.6405136585235596, -0.6074716448783875, -0.5744296312332153, -0.5413876175880432, -0.5083456039428711, -0.475303590297699, -0.44226157665252686, -0.40921956300735474, -0.3761775493621826, -0.3431355357170105, -0.3100935220718384, -0.27705150842666626, -0.24400949478149414, -0.21096748113632202, -0.1779254674911499, -0.14488345384597778, -0.11184144020080566, -0.07879942655563354, -0.045757293701171875, -0.012715280055999756, 0.020326733589172363, 0.05336874723434448, 0.0864107608795166, 0.11945277452468872, 0.15249478816986084, 0.18553680181503296, 0.21857881546020508, 0.2516208291053772, 0.2846628427505493, 0.31770485639572144, 0.35074687004089355, 0.3837888836860657, 0.4168308973312378, 0.4498729109764099, 0.48291492462158203, 0.5159569382667542, 0.5489989519119263, 0.5820409655570984, 0.6150829792022705, 0.6481249928474426, 0.6811670064926147, 0.7142090201377869, 0.747251033782959, 0.7802930474281311, 0.8133350610733032, 0.8463770747184753, 0.8794190883636475, 0.9124611020088196, 0.9455031156539917, 0.9785451292991638, 1.011587142944336]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 11.0, 8.0, 17.0, 18.0, 29.0, 35.0, 55.0, 108.0, 134.0, 190.0, 332.0, 501.0, 793.0, 1214.0, 2054.0, 3435.0, 5803.0, 10425.0, 20567.0, 42894.0, 104386.0, 258389.0, 325445.0, 152079.0, 60587.0, 27226.0, 13575.0, 7475.0, 4185.0, 2441.0, 1474.0, 974.0, 559.0, 386.0, 254.0, 153.0, 94.0, 75.0, 54.0, 38.0, 33.0, 16.0, 11.0, 10.0, 8.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29541015625, -0.28594207763671875, -0.2764739990234375, -0.26700592041015625, -0.257537841796875, -0.24806976318359375, -0.2386016845703125, -0.22913360595703125, -0.21966552734375, -0.21019744873046875, -0.2007293701171875, -0.19126129150390625, -0.181793212890625, -0.17232513427734375, -0.1628570556640625, -0.15338897705078125, -0.1439208984375, -0.13445281982421875, -0.1249847412109375, -0.11551666259765625, -0.106048583984375, -0.09658050537109375, -0.0871124267578125, -0.07764434814453125, -0.06817626953125, -0.05870819091796875, -0.0492401123046875, -0.03977203369140625, -0.030303955078125, -0.02083587646484375, -0.0113677978515625, -0.00189971923828125, 0.007568359375, 0.01703643798828125, 0.0265045166015625, 0.03597259521484375, 0.045440673828125, 0.05490875244140625, 0.0643768310546875, 0.07384490966796875, 0.08331298828125, 0.09278106689453125, 0.1022491455078125, 0.11171722412109375, 0.121185302734375, 0.13065338134765625, 0.1401214599609375, 0.14958953857421875, 0.1590576171875, 0.16852569580078125, 0.1779937744140625, 0.18746185302734375, 0.196929931640625, 0.20639801025390625, 0.2158660888671875, 0.22533416748046875, 0.23480224609375, 0.24427032470703125, 0.2537384033203125, 0.26320648193359375, 0.272674560546875, 0.28214263916015625, 0.2916107177734375, 0.30107879638671875, 0.310546875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 5.0, 4.0, 9.0, 14.0, 12.0, 14.0, 12.0, 23.0, 19.0, 22.0, 38.0, 27.0, 41.0, 39.0, 42.0, 47.0, 52.0, 57.0, 42.0, 53.0, 36.0, 65.0, 50.0, 46.0, 33.0, 34.0, 21.0, 25.0, 27.0, 17.0, 14.0, 14.0, 19.0, 10.0, 4.0, 5.0, 2.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10546875, -0.10201168060302734, -0.09855461120605469, -0.09509754180908203, -0.09164047241210938, -0.08818340301513672, -0.08472633361816406, -0.0812692642211914, -0.07781219482421875, -0.0743551254272461, -0.07089805603027344, -0.06744098663330078, -0.06398391723632812, -0.06052684783935547, -0.05706977844238281, -0.053612709045410156, -0.0501556396484375, -0.046698570251464844, -0.04324150085449219, -0.03978443145751953, -0.036327362060546875, -0.03287029266357422, -0.029413223266601562, -0.025956153869628906, -0.02249908447265625, -0.019042015075683594, -0.015584945678710938, -0.012127876281738281, -0.008670806884765625, -0.005213737487792969, -0.0017566680908203125, 0.0017004013061523438, 0.005157470703125, 0.008614540100097656, 0.012071609497070312, 0.015528678894042969, 0.018985748291015625, 0.02244281768798828, 0.025899887084960938, 0.029356956481933594, 0.03281402587890625, 0.036271095275878906, 0.03972816467285156, 0.04318523406982422, 0.046642303466796875, 0.05009937286376953, 0.05355644226074219, 0.057013511657714844, 0.0604705810546875, 0.06392765045166016, 0.06738471984863281, 0.07084178924560547, 0.07429885864257812, 0.07775592803955078, 0.08121299743652344, 0.0846700668334961, 0.08812713623046875, 0.0915842056274414, 0.09504127502441406, 0.09849834442138672, 0.10195541381835938, 0.10541248321533203, 0.10886955261230469, 0.11232662200927734, 0.11578369140625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 1.0, 1.0, 4.0, 4.0, 1.0, 4.0, 9.0, 10.0, 8.0, 15.0, 26.0, 29.0, 41.0, 71.0, 118.0, 204.0, 370.0, 868.0, 2330.0, 8798.0, 44156.0, 380054.0, 532958.0, 61980.0, 11372.0, 3094.0, 1011.0, 440.0, 202.0, 124.0, 72.0, 53.0, 35.0, 18.0, 24.0, 9.0, 10.0, 10.0, 5.0, 4.0, 2.0, 4.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6845703125, -0.6618194580078125, -0.639068603515625, -0.6163177490234375, -0.59356689453125, -0.5708160400390625, -0.548065185546875, -0.5253143310546875, -0.5025634765625, -0.4798126220703125, -0.457061767578125, -0.4343109130859375, -0.41156005859375, -0.3888092041015625, -0.366058349609375, -0.3433074951171875, -0.320556640625, -0.2978057861328125, -0.275054931640625, -0.2523040771484375, -0.22955322265625, -0.2068023681640625, -0.184051513671875, -0.1613006591796875, -0.1385498046875, -0.1157989501953125, -0.093048095703125, -0.0702972412109375, -0.04754638671875, -0.0247955322265625, -0.002044677734375, 0.0207061767578125, 0.04345703125, 0.0662078857421875, 0.088958740234375, 0.1117095947265625, 0.13446044921875, 0.1572113037109375, 0.179962158203125, 0.2027130126953125, 0.2254638671875, 0.2482147216796875, 0.270965576171875, 0.2937164306640625, 0.31646728515625, 0.3392181396484375, 0.361968994140625, 0.3847198486328125, 0.407470703125, 0.4302215576171875, 0.452972412109375, 0.4757232666015625, 0.49847412109375, 0.5212249755859375, 0.543975830078125, 0.5667266845703125, 0.5894775390625, 0.6122283935546875, 0.634979248046875, 0.6577301025390625, 0.68048095703125, 0.7032318115234375, 0.725982666015625, 0.7487335205078125, 0.771484375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 2.0, 4.0, 4.0, 5.0, 2.0, 3.0, 8.0, 7.0, 15.0, 14.0, 12.0, 23.0, 31.0, 25.0, 23.0, 22.0, 28.0, 43.0, 36.0, 35.0, 47.0, 40.0, 44.0, 55.0, 46.0, 47.0, 33.0, 32.0, 38.0, 40.0, 33.0, 21.0, 34.0, 20.0, 25.0, 26.0, 10.0, 18.0, 9.0, 9.0, 10.0, 5.0, 6.0, 7.0, 5.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5419921875, -0.5248336791992188, -0.5076751708984375, -0.49051666259765625, -0.473358154296875, -0.45619964599609375, -0.4390411376953125, -0.42188262939453125, -0.40472412109375, -0.38756561279296875, -0.3704071044921875, -0.35324859619140625, -0.336090087890625, -0.31893157958984375, -0.3017730712890625, -0.28461456298828125, -0.2674560546875, -0.25029754638671875, -0.2331390380859375, -0.21598052978515625, -0.198822021484375, -0.18166351318359375, -0.1645050048828125, -0.14734649658203125, -0.13018798828125, -0.11302947998046875, -0.0958709716796875, -0.07871246337890625, -0.061553955078125, -0.04439544677734375, -0.0272369384765625, -0.01007843017578125, 0.007080078125, 0.02423858642578125, 0.0413970947265625, 0.05855560302734375, 0.075714111328125, 0.09287261962890625, 0.1100311279296875, 0.12718963623046875, 0.14434814453125, 0.16150665283203125, 0.1786651611328125, 0.19582366943359375, 0.212982177734375, 0.23014068603515625, 0.2472991943359375, 0.26445770263671875, 0.2816162109375, 0.29877471923828125, 0.3159332275390625, 0.33309173583984375, 0.350250244140625, 0.36740875244140625, 0.3845672607421875, 0.40172576904296875, 0.41888427734375, 0.43604278564453125, 0.4532012939453125, 0.47035980224609375, 0.487518310546875, 0.5046768188476562, 0.5218353271484375, 0.5389938354492188, 0.55615234375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 6.0, 3.0, 6.0, 6.0, 14.0, 21.0, 31.0, 66.0, 129.0, 222.0, 543.0, 1503.0, 5319.0, 24280.0, 234395.0, 693604.0, 72556.0, 11369.0, 2818.0, 923.0, 376.0, 168.0, 74.0, 42.0, 24.0, 21.0, 16.0, 9.0, 4.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36572265625, -0.35124969482421875, -0.3367767333984375, -0.32230377197265625, -0.307830810546875, -0.29335784912109375, -0.2788848876953125, -0.26441192626953125, -0.24993896484375, -0.23546600341796875, -0.2209930419921875, -0.20652008056640625, -0.192047119140625, -0.17757415771484375, -0.1631011962890625, -0.14862823486328125, -0.1341552734375, -0.11968231201171875, -0.1052093505859375, -0.09073638916015625, -0.076263427734375, -0.06179046630859375, -0.0473175048828125, -0.03284454345703125, -0.01837158203125, -0.00389862060546875, 0.0105743408203125, 0.02504730224609375, 0.039520263671875, 0.05399322509765625, 0.0684661865234375, 0.08293914794921875, 0.097412109375, 0.11188507080078125, 0.1263580322265625, 0.14083099365234375, 0.155303955078125, 0.16977691650390625, 0.1842498779296875, 0.19872283935546875, 0.21319580078125, 0.22766876220703125, 0.2421417236328125, 0.25661468505859375, 0.271087646484375, 0.28556060791015625, 0.3000335693359375, 0.31450653076171875, 0.3289794921875, 0.34345245361328125, 0.3579254150390625, 0.37239837646484375, 0.386871337890625, 0.40134429931640625, 0.4158172607421875, 0.43029022216796875, 0.44476318359375, 0.45923614501953125, 0.4737091064453125, 0.48818206787109375, 0.502655029296875, 0.5171279907226562, 0.5316009521484375, 0.5460739135742188, 0.560546875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 2.0, 5.0, 4.0, 5.0, 9.0, 13.0, 23.0, 27.0, 49.0, 57.0, 74.0, 109.0, 138.0, 146.0, 94.0, 87.0, 53.0, 38.0, 14.0, 19.0, 9.0, 9.0, 10.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.328126907348633e-05, -9.015202522277832e-05, -8.702278137207031e-05, -8.38935375213623e-05, -8.07642936706543e-05, -7.763504981994629e-05, -7.450580596923828e-05, -7.137656211853027e-05, -6.824731826782227e-05, -6.511807441711426e-05, -6.198883056640625e-05, -5.885958671569824e-05, -5.5730342864990234e-05, -5.2601099014282227e-05, -4.947185516357422e-05, -4.634261131286621e-05, -4.32133674621582e-05, -4.0084123611450195e-05, -3.695487976074219e-05, -3.382563591003418e-05, -3.069639205932617e-05, -2.7567148208618164e-05, -2.4437904357910156e-05, -2.130866050720215e-05, -1.817941665649414e-05, -1.5050172805786133e-05, -1.1920928955078125e-05, -8.791685104370117e-06, -5.662441253662109e-06, -2.5331974029541016e-06, 5.960464477539062e-07, 3.725290298461914e-06, 6.854534149169922e-06, 9.98377799987793e-06, 1.3113021850585938e-05, 1.6242265701293945e-05, 1.9371509552001953e-05, 2.250075340270996e-05, 2.562999725341797e-05, 2.8759241104125977e-05, 3.1888484954833984e-05, 3.501772880554199e-05, 3.814697265625e-05, 4.127621650695801e-05, 4.4405460357666016e-05, 4.7534704208374023e-05, 5.066394805908203e-05, 5.379319190979004e-05, 5.692243576049805e-05, 6.0051679611206055e-05, 6.318092346191406e-05, 6.631016731262207e-05, 6.943941116333008e-05, 7.256865501403809e-05, 7.56978988647461e-05, 7.88271427154541e-05, 8.195638656616211e-05, 8.508563041687012e-05, 8.821487426757812e-05, 9.134411811828613e-05, 9.447336196899414e-05, 9.760260581970215e-05, 0.00010073184967041016, 0.00010386109352111816, 0.00010699033737182617]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 2.0, 6.0, 8.0, 5.0, 5.0, 6.0, 16.0, 31.0, 45.0, 53.0, 78.0, 103.0, 164.0, 303.0, 426.0, 825.0, 1509.0, 3065.0, 6448.0, 16102.0, 46941.0, 174048.0, 485243.0, 221205.0, 57728.0, 19089.0, 7536.0, 3400.0, 1773.0, 960.0, 516.0, 339.0, 198.0, 124.0, 81.0, 41.0, 34.0, 39.0, 15.0, 18.0, 7.0, 4.0, 5.0, 8.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.264404296875, -0.2562904357910156, -0.24817657470703125, -0.24006271362304688, -0.2319488525390625, -0.22383499145507812, -0.21572113037109375, -0.20760726928710938, -0.199493408203125, -0.19137954711914062, -0.18326568603515625, -0.17515182495117188, -0.1670379638671875, -0.15892410278320312, -0.15081024169921875, -0.14269638061523438, -0.13458251953125, -0.12646865844726562, -0.11835479736328125, -0.11024093627929688, -0.1021270751953125, -0.09401321411132812, -0.08589935302734375, -0.07778549194335938, -0.069671630859375, -0.061557769775390625, -0.05344390869140625, -0.045330047607421875, -0.0372161865234375, -0.029102325439453125, -0.02098846435546875, -0.012874603271484375, -0.0047607421875, 0.003353118896484375, 0.01146697998046875, 0.019580841064453125, 0.0276947021484375, 0.035808563232421875, 0.04392242431640625, 0.052036285400390625, 0.060150146484375, 0.06826400756835938, 0.07637786865234375, 0.08449172973632812, 0.0926055908203125, 0.10071945190429688, 0.10883331298828125, 0.11694717407226562, 0.12506103515625, 0.13317489624023438, 0.14128875732421875, 0.14940261840820312, 0.1575164794921875, 0.16563034057617188, 0.17374420166015625, 0.18185806274414062, 0.189971923828125, 0.19808578491210938, 0.20619964599609375, 0.21431350708007812, 0.2224273681640625, 0.23054122924804688, 0.23865509033203125, 0.24676895141601562, 0.2548828125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 9.0, 20.0, 26.0, 26.0, 41.0, 73.0, 68.0, 105.0, 139.0, 125.0, 113.0, 94.0, 54.0, 33.0, 23.0, 11.0, 14.0, 7.0, 8.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.273193359375, -0.26171875, -0.250244140625, -0.23876953125, -0.227294921875, -0.2158203125, -0.204345703125, -0.19287109375, -0.181396484375, -0.169921875, -0.158447265625, -0.14697265625, -0.135498046875, -0.1240234375, -0.112548828125, -0.10107421875, -0.089599609375, -0.078125, -0.066650390625, -0.05517578125, -0.043701171875, -0.0322265625, -0.020751953125, -0.00927734375, 0.002197265625, 0.013671875, 0.025146484375, 0.03662109375, 0.048095703125, 0.0595703125, 0.071044921875, 0.08251953125, 0.093994140625, 0.10546875, 0.116943359375, 0.12841796875, 0.139892578125, 0.1513671875, 0.162841796875, 0.17431640625, 0.185791015625, 0.197265625, 0.208740234375, 0.22021484375, 0.231689453125, 0.2431640625, 0.254638671875, 0.26611328125, 0.277587890625, 0.2890625, 0.300537109375, 0.31201171875, 0.323486328125, 0.3349609375, 0.346435546875, 0.35791015625, 0.369384765625, 0.380859375, 0.392333984375, 0.40380859375, 0.415283203125, 0.4267578125, 0.438232421875, 0.44970703125, 0.461181640625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 7.0, 15.0, 33.0, 68.0, 120.0, 216.0, 215.0, 155.0, 109.0, 38.0, 22.0, 11.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.987802028656006, -2.7788026332855225, -2.569803237915039, -2.3608040809631348, -2.1518044471740723, -1.9428051710128784, -1.7338058948516846, -1.5248064994812012, -1.3158071041107178, -1.1068077087402344, -0.8978083729743958, -0.6888090372085571, -0.47980964183807373, -0.27081024646759033, -0.061810970306396484, 0.14718842506408691, 0.3561878204345703, 0.5651872158050537, 0.7741865515708923, 0.983185887336731, 1.1921852827072144, 1.4011846780776978, 1.6101839542388916, 1.819183349609375, 2.0281827449798584, 2.237182140350342, 2.446181535720825, 2.6551809310913086, 2.864180088043213, 3.0731797218322754, 3.2821788787841797, 3.491178274154663, 3.7001771926879883, 3.9091765880584717, 4.118175983428955, 4.327175140380859, 4.536174774169922, 4.745173931121826, 4.9541730880737305, 5.163172721862793, 5.3721723556518555, 5.58117151260376, 5.790171146392822, 5.999170303344727, 6.208169937133789, 6.417169094085693, 6.626168251037598, 6.83516788482666, 7.0441670417785645, 7.253166198730469, 7.462165832519531, 7.6711649894714355, 7.880164623260498, 8.089163780212402, 8.298163414001465, 8.507162094116211, 8.716161727905273, 8.925161361694336, 9.134160041809082, 9.343159675598145, 9.552159309387207, 9.76115894317627, 9.970157623291016, 10.179157257080078, 10.38815689086914]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 4.0, 1.0, 7.0, 11.0, 10.0, 13.0, 17.0, 14.0, 18.0, 21.0, 23.0, 14.0, 25.0, 41.0, 37.0, 40.0, 33.0, 33.0, 41.0, 44.0, 42.0, 52.0, 31.0, 43.0, 35.0, 39.0, 43.0, 38.0, 32.0, 27.0, 36.0, 20.0, 19.0, 23.0, 19.0, 7.0, 9.0, 8.0, 5.0, 3.0, 8.0, 4.0, 4.0, 4.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3804855346679688, -2.2952613830566406, -2.2100374698638916, -2.1248135566711426, -2.0395894050598145, -1.9543653726577759, -1.8691413402557373, -1.7839173078536987, -1.6986932754516602, -1.6134692430496216, -1.528245210647583, -1.4430211782455444, -1.3577971458435059, -1.2725731134414673, -1.1873490810394287, -1.1021250486373901, -1.0169010162353516, -0.931676983833313, -0.8464529514312744, -0.7612289190292358, -0.6760048866271973, -0.5907808542251587, -0.5055568218231201, -0.42033278942108154, -0.33510875701904297, -0.2498847246170044, -0.16466069221496582, -0.07943665981292725, 0.005787372589111328, 0.0910114049911499, 0.17623543739318848, 0.26145946979522705, 0.3466835021972656, 0.4319075345993042, 0.5171315670013428, 0.6023555994033813, 0.6875796318054199, 0.7728036642074585, 0.8580276966094971, 0.9432517290115356, 1.0284757614135742, 1.1136997938156128, 1.1989238262176514, 1.28414785861969, 1.3693718910217285, 1.454595923423767, 1.5398199558258057, 1.6250439882278442, 1.7102680206298828, 1.7954920530319214, 1.88071608543396, 1.9659401178359985, 2.051164150238037, 2.1363883018493652, 2.2216122150421143, 2.3068361282348633, 2.3920602798461914, 2.4772844314575195, 2.5625083446502686, 2.6477322578430176, 2.7329564094543457, 2.818180561065674, 2.903404474258423, 2.988628387451172, 3.0738525390625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 1.0, 4.0, 8.0, 5.0, 12.0, 17.0, 9.0, 22.0, 35.0, 43.0, 50.0, 70.0, 86.0, 133.0, 188.0, 274.0, 468.0, 751.0, 1324.0, 2525.0, 6502.0, 34900.0, 4116277.0, 20235.0, 5024.0, 2191.0, 1123.0, 719.0, 411.0, 229.0, 169.0, 116.0, 93.0, 60.0, 53.0, 34.0, 35.0, 27.0, 14.0, 16.0, 6.0, 6.0, 6.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0], "bins": [-1.244140625, -1.208984375, -1.173828125, -1.138671875, -1.103515625, -1.068359375, -1.033203125, -0.998046875, -0.962890625, -0.927734375, -0.892578125, -0.857421875, -0.822265625, -0.787109375, -0.751953125, -0.716796875, -0.681640625, -0.646484375, -0.611328125, -0.576171875, -0.541015625, -0.505859375, -0.470703125, -0.435546875, -0.400390625, -0.365234375, -0.330078125, -0.294921875, -0.259765625, -0.224609375, -0.189453125, -0.154296875, -0.119140625, -0.083984375, -0.048828125, -0.013671875, 0.021484375, 0.056640625, 0.091796875, 0.126953125, 0.162109375, 0.197265625, 0.232421875, 0.267578125, 0.302734375, 0.337890625, 0.373046875, 0.408203125, 0.443359375, 0.478515625, 0.513671875, 0.548828125, 0.583984375, 0.619140625, 0.654296875, 0.689453125, 0.724609375, 0.759765625, 0.794921875, 0.830078125, 0.865234375, 0.900390625, 0.935546875, 0.970703125, 1.005859375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 7.0, 7.0, 11.0, 11.0, 13.0, 15.0, 21.0, 20.0, 26.0, 19.0, 32.0, 44.0, 47.0, 49.0, 47.0, 50.0, 40.0, 60.0, 51.0, 55.0, 56.0, 41.0, 35.0, 43.0, 34.0, 29.0, 24.0, 19.0, 29.0, 12.0, 13.0, 9.0, 8.0, 3.0, 7.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11187744140625, -0.10806751251220703, -0.10425758361816406, -0.1004476547241211, -0.09663772583007812, -0.09282779693603516, -0.08901786804199219, -0.08520793914794922, -0.08139801025390625, -0.07758808135986328, -0.07377815246582031, -0.06996822357177734, -0.06615829467773438, -0.062348365783691406, -0.05853843688964844, -0.05472850799560547, -0.0509185791015625, -0.04710865020751953, -0.04329872131347656, -0.039488792419433594, -0.035678863525390625, -0.031868934631347656, -0.028059005737304688, -0.02424907684326172, -0.02043914794921875, -0.01662921905517578, -0.012819290161132812, -0.009009361267089844, -0.005199432373046875, -0.0013895034790039062, 0.0024204254150390625, 0.006230354309082031, 0.010040283203125, 0.013850212097167969, 0.017660140991210938, 0.021470069885253906, 0.025279998779296875, 0.029089927673339844, 0.03289985656738281, 0.03670978546142578, 0.04051971435546875, 0.04432964324951172, 0.04813957214355469, 0.051949501037597656, 0.055759429931640625, 0.059569358825683594, 0.06337928771972656, 0.06718921661376953, 0.0709991455078125, 0.07480907440185547, 0.07861900329589844, 0.0824289321899414, 0.08623886108398438, 0.09004878997802734, 0.09385871887207031, 0.09766864776611328, 0.10147857666015625, 0.10528850555419922, 0.10909843444824219, 0.11290836334228516, 0.11671829223632812, 0.1205282211303711, 0.12433815002441406, 0.12814807891845703, 0.1319580078125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 6.0, 7.0, 8.0, 11.0, 16.0, 19.0, 19.0, 29.0, 45.0, 53.0, 53.0, 61.0, 89.0, 109.0, 163.0, 228.0, 351.0, 613.0, 1298.0, 2966.0, 8976.0, 77439.0, 4074369.0, 18222.0, 4843.0, 1885.0, 892.0, 435.0, 272.0, 208.0, 137.0, 99.0, 82.0, 61.0, 41.0, 48.0, 29.0, 26.0, 20.0, 14.0, 8.0, 12.0, 6.0, 1.0, 5.0, 1.0, 5.0, 1.0, 2.0, 4.0, 5.0], "bins": [-1.6728515625, -1.6253662109375, -1.577880859375, -1.5303955078125, -1.48291015625, -1.4354248046875, -1.387939453125, -1.3404541015625, -1.29296875, -1.2454833984375, -1.197998046875, -1.1505126953125, -1.10302734375, -1.0555419921875, -1.008056640625, -0.9605712890625, -0.9130859375, -0.8656005859375, -0.818115234375, -0.7706298828125, -0.72314453125, -0.6756591796875, -0.628173828125, -0.5806884765625, -0.533203125, -0.4857177734375, -0.438232421875, -0.3907470703125, -0.34326171875, -0.2957763671875, -0.248291015625, -0.2008056640625, -0.1533203125, -0.1058349609375, -0.058349609375, -0.0108642578125, 0.03662109375, 0.0841064453125, 0.131591796875, 0.1790771484375, 0.2265625, 0.2740478515625, 0.321533203125, 0.3690185546875, 0.41650390625, 0.4639892578125, 0.511474609375, 0.5589599609375, 0.6064453125, 0.6539306640625, 0.701416015625, 0.7489013671875, 0.79638671875, 0.8438720703125, 0.891357421875, 0.9388427734375, 0.986328125, 1.0338134765625, 1.081298828125, 1.1287841796875, 1.17626953125, 1.2237548828125, 1.271240234375, 1.3187255859375, 1.3662109375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 8.0, 21.0, 26.0, 266.0, 3634.0, 55.0, 35.0, 10.0, 6.0, 7.0, 3.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.421875, -0.41082000732421875, -0.3997650146484375, -0.38871002197265625, -0.377655029296875, -0.36660003662109375, -0.3555450439453125, -0.34449005126953125, -0.33343505859375, -0.32238006591796875, -0.3113250732421875, -0.30027008056640625, -0.289215087890625, -0.27816009521484375, -0.2671051025390625, -0.25605010986328125, -0.2449951171875, -0.23394012451171875, -0.2228851318359375, -0.21183013916015625, -0.200775146484375, -0.18972015380859375, -0.1786651611328125, -0.16761016845703125, -0.15655517578125, -0.14550018310546875, -0.1344451904296875, -0.12339019775390625, -0.112335205078125, -0.10128021240234375, -0.0902252197265625, -0.07917022705078125, -0.068115234375, -0.05706024169921875, -0.0460052490234375, -0.03495025634765625, -0.023895263671875, -0.01284027099609375, -0.0017852783203125, 0.00926971435546875, 0.02032470703125, 0.03137969970703125, 0.0424346923828125, 0.05348968505859375, 0.064544677734375, 0.07559967041015625, 0.0866546630859375, 0.09770965576171875, 0.1087646484375, 0.11981964111328125, 0.1308746337890625, 0.14192962646484375, 0.152984619140625, 0.16403961181640625, 0.1750946044921875, 0.18614959716796875, 0.19720458984375, 0.20825958251953125, 0.2193145751953125, 0.23036956787109375, 0.241424560546875, 0.25247955322265625, 0.2635345458984375, 0.27458953857421875, 0.28564453125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 8.0, 5.0, 15.0, 21.0, 40.0, 50.0, 101.0, 126.0, 126.0, 155.0, 102.0, 55.0, 63.0, 40.0, 34.0, 23.0, 17.0, 7.0, 5.0, 6.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.322012186050415, -1.2915350198745728, -1.26105797290802, -1.2305808067321777, -1.200103759765625, -1.1696265935897827, -1.1391494274139404, -1.1086723804473877, -1.0781952142715454, -1.0477180480957031, -1.0172410011291504, -0.9867638349533081, -0.9562867283821106, -0.9258096218109131, -0.8953325152397156, -0.8648554086685181, -0.8343782424926758, -0.8039011359214783, -0.7734240293502808, -0.7429468631744385, -0.712469756603241, -0.6819926500320435, -0.651515543460846, -0.6210384368896484, -0.5905613303184509, -0.5600842237472534, -0.5296071171760559, -0.499129980802536, -0.4686528444290161, -0.4381757378578186, -0.4076986312866211, -0.3772214949131012, -0.3467443585395813, -0.3162672519683838, -0.2857901155948639, -0.2553130090236664, -0.22483587265014648, -0.19435876607894897, -0.16388164460659027, -0.13340452313423157, -0.10292740166187286, -0.07245028018951416, -0.041973162442445755, -0.01149604469537735, 0.018981076776981354, 0.04945819079875946, 0.07993531227111816, 0.11041243374347687, 0.14088955521583557, 0.17136667668819427, 0.20184379816055298, 0.2323209047317505, 0.2627980411052704, 0.2932751476764679, 0.3237522840499878, 0.3542293906211853, 0.3847064971923828, 0.4151836037635803, 0.4456607401371002, 0.47613784670829773, 0.5066149830818176, 0.5370920896530151, 0.5675691962242126, 0.5980463027954102, 0.6285234689712524]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 5.0, 5.0, 10.0, 9.0, 15.0, 16.0, 17.0, 20.0, 26.0, 19.0, 39.0, 39.0, 39.0, 24.0, 36.0, 44.0, 39.0, 43.0, 30.0, 38.0, 29.0, 37.0, 32.0, 41.0, 37.0, 38.0, 34.0, 36.0, 29.0, 32.0, 27.0, 26.0, 25.0, 13.0, 17.0, 8.0, 7.0, 4.0, 5.0, 5.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5178878903388977, -0.5019795298576355, -0.4860711693763733, -0.47016283869743347, -0.45425447821617126, -0.43834611773490906, -0.42243778705596924, -0.40652942657470703, -0.3906210660934448, -0.3747127056121826, -0.3588043451309204, -0.3428960144519806, -0.3269876539707184, -0.3110792934894562, -0.29517096281051636, -0.27926260232925415, -0.26335424184799194, -0.24744588136672974, -0.23153753578662872, -0.2156291902065277, -0.1997208297252655, -0.1838124692440033, -0.16790412366390228, -0.15199577808380127, -0.13608741760253906, -0.12017906457185745, -0.10427071154117584, -0.08836235851049423, -0.07245400547981262, -0.05654565244913101, -0.0406372994184494, -0.024728946387767792, -0.008820533752441406, 0.007087819278240204, 0.022996172308921814, 0.038904525339603424, 0.054812878370285034, 0.07072123140096664, 0.08662958443164825, 0.10253793746232986, 0.11844629049301147, 0.13435465097427368, 0.1502629965543747, 0.1661713421344757, 0.18207970261573792, 0.19798806309700012, 0.21389640867710114, 0.22980475425720215, 0.24571311473846436, 0.26162147521972656, 0.27752983570098877, 0.2934381663799286, 0.3093465268611908, 0.325254887342453, 0.3411632180213928, 0.35707157850265503, 0.37297993898391724, 0.38888829946517944, 0.40479665994644165, 0.42070499062538147, 0.4366133511066437, 0.4525217115879059, 0.4684300422668457, 0.4843384027481079, 0.5002467632293701]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 4.0, 16.0, 19.0, 16.0, 33.0, 63.0, 75.0, 120.0, 191.0, 289.0, 495.0, 830.0, 1393.0, 2509.0, 4797.0, 9345.0, 19601.0, 47541.0, 133874.0, 362436.0, 295145.0, 99701.0, 37069.0, 15934.0, 7808.0, 4028.0, 2152.0, 1209.0, 723.0, 405.0, 245.0, 162.0, 112.0, 59.0, 47.0, 30.0, 20.0, 16.0, 12.0, 17.0, 4.0, 3.0, 2.0, 2.0, 5.0, 1.0, 0.0, 1.0], "bins": [-0.52880859375, -0.5140647888183594, -0.49932098388671875, -0.4845771789550781, -0.4698333740234375, -0.4550895690917969, -0.44034576416015625, -0.4256019592285156, -0.410858154296875, -0.3961143493652344, -0.38137054443359375, -0.3666267395019531, -0.3518829345703125, -0.3371391296386719, -0.32239532470703125, -0.3076515197753906, -0.29290771484375, -0.2781639099121094, -0.26342010498046875, -0.24867630004882812, -0.2339324951171875, -0.21918869018554688, -0.20444488525390625, -0.18970108032226562, -0.174957275390625, -0.16021347045898438, -0.14546966552734375, -0.13072586059570312, -0.1159820556640625, -0.10123825073242188, -0.08649444580078125, -0.07175064086914062, -0.0570068359375, -0.042263031005859375, -0.02751922607421875, -0.012775421142578125, 0.0019683837890625, 0.016712188720703125, 0.03145599365234375, 0.046199798583984375, 0.060943603515625, 0.07568740844726562, 0.09043121337890625, 0.10517501831054688, 0.1199188232421875, 0.13466262817382812, 0.14940643310546875, 0.16415023803710938, 0.17889404296875, 0.19363784790039062, 0.20838165283203125, 0.22312545776367188, 0.2378692626953125, 0.2526130676269531, 0.26735687255859375, 0.2821006774902344, 0.296844482421875, 0.3115882873535156, 0.32633209228515625, 0.3410758972167969, 0.3558197021484375, 0.3705635070800781, 0.38530731201171875, 0.4000511169433594, 0.414794921875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 7.0, 2.0, 9.0, 12.0, 9.0, 14.0, 14.0, 16.0, 19.0, 24.0, 16.0, 27.0, 37.0, 36.0, 35.0, 38.0, 38.0, 46.0, 43.0, 37.0, 50.0, 45.0, 46.0, 43.0, 44.0, 38.0, 43.0, 34.0, 24.0, 27.0, 27.0, 27.0, 15.0, 14.0, 9.0, 3.0, 9.0, 4.0, 8.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1260986328125, -0.12201881408691406, -0.11793899536132812, -0.11385917663574219, -0.10977935791015625, -0.10569953918457031, -0.10161972045898438, -0.09753990173339844, -0.0934600830078125, -0.08938026428222656, -0.08530044555664062, -0.08122062683105469, -0.07714080810546875, -0.07306098937988281, -0.06898117065429688, -0.06490135192871094, -0.060821533203125, -0.05674171447753906, -0.052661895751953125, -0.04858207702636719, -0.04450225830078125, -0.04042243957519531, -0.036342620849609375, -0.03226280212402344, -0.0281829833984375, -0.024103164672851562, -0.020023345947265625, -0.015943527221679688, -0.01186370849609375, -0.0077838897705078125, -0.003704071044921875, 0.0003757476806640625, 0.00445556640625, 0.008535385131835938, 0.012615203857421875, 0.016695022583007812, 0.02077484130859375, 0.024854660034179688, 0.028934478759765625, 0.03301429748535156, 0.0370941162109375, 0.04117393493652344, 0.045253753662109375, 0.04933357238769531, 0.05341339111328125, 0.05749320983886719, 0.061573028564453125, 0.06565284729003906, 0.069732666015625, 0.07381248474121094, 0.07789230346679688, 0.08197212219238281, 0.08605194091796875, 0.09013175964355469, 0.09421157836914062, 0.09829139709472656, 0.1023712158203125, 0.10645103454589844, 0.11053085327148438, 0.11461067199707031, 0.11869049072265625, 0.12277030944824219, 0.12685012817382812, 0.13092994689941406, 0.135009765625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 6.0, 5.0, 11.0, 10.0, 13.0, 17.0, 24.0, 42.0, 50.0, 61.0, 102.0, 149.0, 227.0, 339.0, 511.0, 864.0, 1501.0, 2480.0, 5107.0, 11059.0, 28469.0, 89941.0, 332654.0, 404642.0, 110637.0, 33801.0, 13031.0, 5753.0, 2872.0, 1511.0, 899.0, 542.0, 401.0, 247.0, 180.0, 98.0, 76.0, 66.0, 37.0, 27.0, 22.0, 15.0, 17.0, 10.0, 7.0, 6.0, 5.0, 4.0, 2.0, 5.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.433837890625, -0.4198799133300781, -0.40592193603515625, -0.3919639587402344, -0.3780059814453125, -0.3640480041503906, -0.35009002685546875, -0.3361320495605469, -0.322174072265625, -0.3082160949707031, -0.29425811767578125, -0.2803001403808594, -0.2663421630859375, -0.2523841857910156, -0.23842620849609375, -0.22446823120117188, -0.21051025390625, -0.19655227661132812, -0.18259429931640625, -0.16863632202148438, -0.1546783447265625, -0.14072036743164062, -0.12676239013671875, -0.11280441284179688, -0.098846435546875, -0.08488845825195312, -0.07093048095703125, -0.056972503662109375, -0.0430145263671875, -0.029056549072265625, -0.01509857177734375, -0.001140594482421875, 0.0128173828125, 0.026775360107421875, 0.04073333740234375, 0.054691314697265625, 0.0686492919921875, 0.08260726928710938, 0.09656524658203125, 0.11052322387695312, 0.124481201171875, 0.13843917846679688, 0.15239715576171875, 0.16635513305664062, 0.1803131103515625, 0.19427108764648438, 0.20822906494140625, 0.22218704223632812, 0.23614501953125, 0.2501029968261719, 0.26406097412109375, 0.2780189514160156, 0.2919769287109375, 0.3059349060058594, 0.31989288330078125, 0.3338508605957031, 0.347808837890625, 0.3617668151855469, 0.37572479248046875, 0.3896827697753906, 0.4036407470703125, 0.4175987243652344, 0.43155670166015625, 0.4455146789550781, 0.45947265625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 1.0, 4.0, 5.0, 6.0, 9.0, 12.0, 19.0, 18.0, 35.0, 15.0, 44.0, 37.0, 50.0, 48.0, 41.0, 51.0, 61.0, 50.0, 51.0, 50.0, 52.0, 42.0, 42.0, 57.0, 31.0, 36.0, 30.0, 24.0, 18.0, 22.0, 10.0, 12.0, 10.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.642578125, -0.617431640625, -0.59228515625, -0.567138671875, -0.5419921875, -0.516845703125, -0.49169921875, -0.466552734375, -0.44140625, -0.416259765625, -0.39111328125, -0.365966796875, -0.3408203125, -0.315673828125, -0.29052734375, -0.265380859375, -0.240234375, -0.215087890625, -0.18994140625, -0.164794921875, -0.1396484375, -0.114501953125, -0.08935546875, -0.064208984375, -0.0390625, -0.013916015625, 0.01123046875, 0.036376953125, 0.0615234375, 0.086669921875, 0.11181640625, 0.136962890625, 0.162109375, 0.187255859375, 0.21240234375, 0.237548828125, 0.2626953125, 0.287841796875, 0.31298828125, 0.338134765625, 0.36328125, 0.388427734375, 0.41357421875, 0.438720703125, 0.4638671875, 0.489013671875, 0.51416015625, 0.539306640625, 0.564453125, 0.589599609375, 0.61474609375, 0.639892578125, 0.6650390625, 0.690185546875, 0.71533203125, 0.740478515625, 0.765625, 0.790771484375, 0.81591796875, 0.841064453125, 0.8662109375, 0.891357421875, 0.91650390625, 0.941650390625, 0.966796875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 7.0, 4.0, 6.0, 4.0, 11.0, 18.0, 20.0, 29.0, 35.0, 58.0, 86.0, 120.0, 172.0, 282.0, 478.0, 851.0, 1786.0, 3753.0, 9491.0, 31748.0, 179988.0, 644234.0, 133647.0, 26105.0, 8497.0, 3401.0, 1633.0, 848.0, 465.0, 272.0, 155.0, 102.0, 65.0, 50.0, 31.0, 27.0, 23.0, 10.0, 14.0, 5.0, 7.0, 4.0, 2.0, 4.0, 4.0, 1.0, 1.0, 2.0], "bins": [-0.43603515625, -0.42438507080078125, -0.4127349853515625, -0.40108489990234375, -0.389434814453125, -0.37778472900390625, -0.3661346435546875, -0.35448455810546875, -0.34283447265625, -0.33118438720703125, -0.3195343017578125, -0.30788421630859375, -0.296234130859375, -0.28458404541015625, -0.2729339599609375, -0.26128387451171875, -0.2496337890625, -0.23798370361328125, -0.2263336181640625, -0.21468353271484375, -0.203033447265625, -0.19138336181640625, -0.1797332763671875, -0.16808319091796875, -0.15643310546875, -0.14478302001953125, -0.1331329345703125, -0.12148284912109375, -0.109832763671875, -0.09818267822265625, -0.0865325927734375, -0.07488250732421875, -0.063232421875, -0.05158233642578125, -0.0399322509765625, -0.02828216552734375, -0.016632080078125, -0.00498199462890625, 0.0066680908203125, 0.01831817626953125, 0.02996826171875, 0.04161834716796875, 0.0532684326171875, 0.06491851806640625, 0.076568603515625, 0.08821868896484375, 0.0998687744140625, 0.11151885986328125, 0.1231689453125, 0.13481903076171875, 0.1464691162109375, 0.15811920166015625, 0.169769287109375, 0.18141937255859375, 0.1930694580078125, 0.20471954345703125, 0.21636962890625, 0.22801971435546875, 0.2396697998046875, 0.25131988525390625, 0.262969970703125, 0.27462005615234375, 0.2862701416015625, 0.29792022705078125, 0.3095703125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 6.0, 7.0, 2.0, 14.0, 17.0, 26.0, 35.0, 36.0, 46.0, 72.0, 95.0, 96.0, 110.0, 105.0, 86.0, 65.0, 56.0, 34.0, 30.0, 17.0, 14.0, 10.0, 6.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.343292236328125e-05, -7.093511521816254e-05, -6.843730807304382e-05, -6.593950092792511e-05, -6.34416937828064e-05, -6.094388663768768e-05, -5.844607949256897e-05, -5.5948272347450256e-05, -5.345046520233154e-05, -5.095265805721283e-05, -4.8454850912094116e-05, -4.59570437669754e-05, -4.345923662185669e-05, -4.0961429476737976e-05, -3.846362233161926e-05, -3.596581518650055e-05, -3.3468008041381836e-05, -3.097020089626312e-05, -2.847239375114441e-05, -2.5974586606025696e-05, -2.3476779460906982e-05, -2.097897231578827e-05, -1.8481165170669556e-05, -1.5983358025550842e-05, -1.3485550880432129e-05, -1.0987743735313416e-05, -8.489936590194702e-06, -5.992129445075989e-06, -3.4943222999572754e-06, -9.96515154838562e-07, 1.5012919902801514e-06, 3.999099135398865e-06, 6.496906280517578e-06, 8.994713425636292e-06, 1.1492520570755005e-05, 1.3990327715873718e-05, 1.648813486099243e-05, 1.8985942006111145e-05, 2.148374915122986e-05, 2.3981556296348572e-05, 2.6479363441467285e-05, 2.8977170586586e-05, 3.147497773170471e-05, 3.3972784876823425e-05, 3.647059202194214e-05, 3.896839916706085e-05, 4.1466206312179565e-05, 4.396401345729828e-05, 4.646182060241699e-05, 4.8959627747535706e-05, 5.145743489265442e-05, 5.395524203777313e-05, 5.6453049182891846e-05, 5.895085632801056e-05, 6.144866347312927e-05, 6.394647061824799e-05, 6.64442777633667e-05, 6.894208490848541e-05, 7.143989205360413e-05, 7.393769919872284e-05, 7.643550634384155e-05, 7.893331348896027e-05, 8.143112063407898e-05, 8.392892777919769e-05, 8.64267349243164e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 3.0, 1.0, 4.0, 8.0, 10.0, 24.0, 28.0, 51.0, 73.0, 106.0, 210.0, 322.0, 753.0, 1645.0, 4920.0, 19530.0, 171505.0, 749913.0, 81004.0, 12441.0, 3440.0, 1294.0, 510.0, 331.0, 183.0, 91.0, 55.0, 36.0, 26.0, 15.0, 6.0, 6.0, 5.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.625, -0.6073226928710938, -0.5896453857421875, -0.5719680786132812, -0.554290771484375, -0.5366134643554688, -0.5189361572265625, -0.5012588500976562, -0.48358154296875, -0.46590423583984375, -0.4482269287109375, -0.43054962158203125, -0.412872314453125, -0.39519500732421875, -0.3775177001953125, -0.35984039306640625, -0.3421630859375, -0.32448577880859375, -0.3068084716796875, -0.28913116455078125, -0.271453857421875, -0.25377655029296875, -0.2360992431640625, -0.21842193603515625, -0.20074462890625, -0.18306732177734375, -0.1653900146484375, -0.14771270751953125, -0.130035400390625, -0.11235809326171875, -0.0946807861328125, -0.07700347900390625, -0.059326171875, -0.04164886474609375, -0.0239715576171875, -0.00629425048828125, 0.011383056640625, 0.02906036376953125, 0.0467376708984375, 0.06441497802734375, 0.08209228515625, 0.09976959228515625, 0.1174468994140625, 0.13512420654296875, 0.152801513671875, 0.17047882080078125, 0.1881561279296875, 0.20583343505859375, 0.2235107421875, 0.24118804931640625, 0.2588653564453125, 0.27654266357421875, 0.294219970703125, 0.31189727783203125, 0.3295745849609375, 0.34725189208984375, 0.36492919921875, 0.38260650634765625, 0.4002838134765625, 0.41796112060546875, 0.435638427734375, 0.45331573486328125, 0.4709930419921875, 0.48867034912109375, 0.50634765625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 5.0, 4.0, 14.0, 28.0, 30.0, 53.0, 96.0, 141.0, 159.0, 154.0, 131.0, 82.0, 41.0, 28.0, 14.0, 12.0, 6.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.8369140625, -0.8194084167480469, -0.8019027709960938, -0.7843971252441406, -0.7668914794921875, -0.7493858337402344, -0.7318801879882812, -0.7143745422363281, -0.696868896484375, -0.6793632507324219, -0.6618576049804688, -0.6443519592285156, -0.6268463134765625, -0.6093406677246094, -0.5918350219726562, -0.5743293762207031, -0.55682373046875, -0.5393180847167969, -0.5218124389648438, -0.5043067932128906, -0.4868011474609375, -0.4692955017089844, -0.45178985595703125, -0.4342842102050781, -0.416778564453125, -0.3992729187011719, -0.38176727294921875, -0.3642616271972656, -0.3467559814453125, -0.3292503356933594, -0.31174468994140625, -0.2942390441894531, -0.2767333984375, -0.2592277526855469, -0.24172210693359375, -0.22421646118164062, -0.2067108154296875, -0.18920516967773438, -0.17169952392578125, -0.15419387817382812, -0.136688232421875, -0.11918258666992188, -0.10167694091796875, -0.08417129516601562, -0.0666656494140625, -0.049160003662109375, -0.03165435791015625, -0.014148712158203125, 0.00335693359375, 0.020862579345703125, 0.03836822509765625, 0.055873870849609375, 0.0733795166015625, 0.09088516235351562, 0.10839080810546875, 0.12589645385742188, 0.143402099609375, 0.16090774536132812, 0.17841339111328125, 0.19591903686523438, 0.2134246826171875, 0.23093032836914062, 0.24843597412109375, 0.2659416198730469, 0.283447265625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 8.0, 15.0, 13.0, 25.0, 53.0, 75.0, 98.0, 143.0, 132.0, 118.0, 90.0, 86.0, 61.0, 30.0, 10.0, 17.0, 9.0, 6.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.910872220993042, -3.7437593936920166, -3.576646566390991, -3.409533739089966, -3.2424209117889404, -3.075308084487915, -2.9081954956054688, -2.7410826683044434, -2.573969841003418, -2.4068570137023926, -2.239744186401367, -2.072631359100342, -1.9055185317993164, -1.738405704498291, -1.5712929964065552, -1.4041801691055298, -1.2370672225952148, -1.0699543952941895, -0.9028415679931641, -0.7357288002967834, -0.5686159729957581, -0.40150314569473267, -0.23439037799835205, -0.06727755069732666, 0.09983527660369873, 0.2669481039047241, 0.4340609014034271, 0.6011736989021301, 0.7682865262031555, 0.9353993535041809, 1.1025121212005615, 1.269624948501587, 1.4367375373840332, 1.6038503646850586, 1.770963191986084, 1.9380760192871094, 2.1051888465881348, 2.27230167388916, 2.4394145011901855, 2.606527328491211, 2.7736401557922363, 2.9407529830932617, 3.107865810394287, 3.2749786376953125, 3.442091464996338, 3.6092042922973633, 3.7763171195983887, 3.943429946899414, 4.110542297363281, 4.277655124664307, 4.444767951965332, 4.611880779266357, 4.778993606567383, 4.946106433868408, 5.113219261169434, 5.280332088470459, 5.447444915771484, 5.61455774307251, 5.781670570373535, 5.9487833976745605, 6.115896224975586, 6.283009052276611, 6.450121879577637, 6.617234706878662, 6.7843475341796875]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 5.0, 2.0, 5.0, 6.0, 6.0, 4.0, 7.0, 11.0, 8.0, 19.0, 13.0, 17.0, 26.0, 26.0, 31.0, 31.0, 32.0, 36.0, 33.0, 47.0, 41.0, 34.0, 50.0, 53.0, 50.0, 43.0, 53.0, 37.0, 36.0, 34.0, 26.0, 31.0, 18.0, 20.0, 23.0, 11.0, 11.0, 8.0, 11.0, 13.0, 8.0, 11.0, 3.0, 9.0, 2.0, 2.0, 2.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.3878402709960938, -3.2825968265533447, -3.1773533821105957, -3.072110176086426, -2.9668667316436768, -2.8616232872009277, -2.7563798427581787, -2.6511363983154297, -2.5458931922912598, -2.4406497478485107, -2.3354063034057617, -2.230163097381592, -2.1249196529388428, -2.0196762084960938, -1.9144327640533447, -1.8091894388198853, -1.7039459943771362, -1.5987025499343872, -1.4934592247009277, -1.3882157802581787, -1.2829724550247192, -1.1777290105819702, -1.0724856853485107, -0.9672422409057617, -0.8619988560676575, -0.7567554712295532, -0.651512086391449, -0.5462687015533447, -0.4410252869129181, -0.33578187227249146, -0.2305384874343872, -0.12529510259628296, -0.02005171775817871, 0.08519167453050613, 0.19043506681919098, 0.2956784665584564, 0.40092185139656067, 0.5061652660369873, 0.6114086508750916, 0.7166520357131958, 0.8218954205513, 0.9271388053894043, 1.0323822498321533, 1.1376255750656128, 1.2428690195083618, 1.3481123447418213, 1.4533557891845703, 1.5585992336273193, 1.6638425588607788, 1.7690860033035278, 1.8743293285369873, 1.9795727729797363, 2.0848162174224854, 2.1900596618652344, 2.2953028678894043, 2.4005463123321533, 2.5057897567749023, 2.6110332012176514, 2.7162766456604004, 2.8215198516845703, 2.9267632961273193, 3.0320067405700684, 3.1372501850128174, 3.2424936294555664, 3.3477368354797363]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 9.0, 9.0, 6.0, 12.0, 11.0, 12.0, 31.0, 25.0, 39.0, 46.0, 57.0, 78.0, 109.0, 141.0, 255.0, 375.0, 590.0, 963.0, 1684.0, 3071.0, 6573.0, 20916.0, 3949820.0, 180957.0, 16214.0, 5651.0, 2691.0, 1400.0, 901.0, 486.0, 361.0, 252.0, 123.0, 103.0, 78.0, 62.0, 48.0, 29.0, 25.0, 29.0, 10.0, 8.0, 8.0, 8.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.87451171875, -0.8487167358398438, -0.8229217529296875, -0.7971267700195312, -0.771331787109375, -0.7455368041992188, -0.7197418212890625, -0.6939468383789062, -0.66815185546875, -0.6423568725585938, -0.6165618896484375, -0.5907669067382812, -0.564971923828125, -0.5391769409179688, -0.5133819580078125, -0.48758697509765625, -0.4617919921875, -0.43599700927734375, -0.4102020263671875, -0.38440704345703125, -0.358612060546875, -0.33281707763671875, -0.3070220947265625, -0.28122711181640625, -0.25543212890625, -0.22963714599609375, -0.2038421630859375, -0.17804718017578125, -0.152252197265625, -0.12645721435546875, -0.1006622314453125, -0.07486724853515625, -0.049072265625, -0.02327728271484375, 0.0025177001953125, 0.02831268310546875, 0.054107666015625, 0.07990264892578125, 0.1056976318359375, 0.13149261474609375, 0.15728759765625, 0.18308258056640625, 0.2088775634765625, 0.23467254638671875, 0.260467529296875, 0.28626251220703125, 0.3120574951171875, 0.33785247802734375, 0.3636474609375, 0.38944244384765625, 0.4152374267578125, 0.44103240966796875, 0.466827392578125, 0.49262237548828125, 0.5184173583984375, 0.5442123413085938, 0.57000732421875, 0.5958023071289062, 0.6215972900390625, 0.6473922729492188, 0.673187255859375, 0.6989822387695312, 0.7247772216796875, 0.7505722045898438, 0.7763671875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 3.0, 1.0, 1.0, 3.0, 5.0, 4.0, 5.0, 7.0, 9.0, 17.0, 15.0, 11.0, 24.0, 24.0, 35.0, 34.0, 38.0, 43.0, 43.0, 52.0, 55.0, 42.0, 57.0, 57.0, 51.0, 52.0, 59.0, 42.0, 45.0, 26.0, 26.0, 21.0, 23.0, 15.0, 19.0, 10.0, 8.0, 3.0, 5.0, 3.0, 3.0, 4.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1492919921875, -0.14480018615722656, -0.14030838012695312, -0.1358165740966797, -0.13132476806640625, -0.1268329620361328, -0.12234115600585938, -0.11784934997558594, -0.1133575439453125, -0.10886573791503906, -0.10437393188476562, -0.09988212585449219, -0.09539031982421875, -0.09089851379394531, -0.08640670776367188, -0.08191490173339844, -0.077423095703125, -0.07293128967285156, -0.06843948364257812, -0.06394767761230469, -0.05945587158203125, -0.05496406555175781, -0.050472259521484375, -0.04598045349121094, -0.0414886474609375, -0.03699684143066406, -0.032505035400390625, -0.028013229370117188, -0.02352142333984375, -0.019029617309570312, -0.014537811279296875, -0.010046005249023438, -0.00555419921875, -0.0010623931884765625, 0.003429412841796875, 0.007921218872070312, 0.01241302490234375, 0.016904830932617188, 0.021396636962890625, 0.025888442993164062, 0.0303802490234375, 0.03487205505371094, 0.039363861083984375, 0.04385566711425781, 0.04834747314453125, 0.05283927917480469, 0.057331085205078125, 0.06182289123535156, 0.066314697265625, 0.07080650329589844, 0.07529830932617188, 0.07979011535644531, 0.08428192138671875, 0.08877372741699219, 0.09326553344726562, 0.09775733947753906, 0.1022491455078125, 0.10674095153808594, 0.11123275756835938, 0.11572456359863281, 0.12021636962890625, 0.12470817565917969, 0.12919998168945312, 0.13369178771972656, 0.13818359375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 6.0, 9.0, 11.0, 10.0, 12.0, 22.0, 34.0, 29.0, 46.0, 54.0, 75.0, 134.0, 171.0, 343.0, 701.0, 1316.0, 2972.0, 8733.0, 44805.0, 4093357.0, 29494.0, 6811.0, 2550.0, 1142.0, 561.0, 320.0, 155.0, 106.0, 79.0, 53.0, 45.0, 29.0, 26.0, 15.0, 14.0, 9.0, 10.0, 13.0, 4.0, 2.0, 3.0, 0.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.90234375, -1.8486175537109375, -1.794891357421875, -1.7411651611328125, -1.68743896484375, -1.6337127685546875, -1.579986572265625, -1.5262603759765625, -1.4725341796875, -1.4188079833984375, -1.365081787109375, -1.3113555908203125, -1.25762939453125, -1.2039031982421875, -1.150177001953125, -1.0964508056640625, -1.042724609375, -0.9889984130859375, -0.935272216796875, -0.8815460205078125, -0.82781982421875, -0.7740936279296875, -0.720367431640625, -0.6666412353515625, -0.6129150390625, -0.5591888427734375, -0.505462646484375, -0.4517364501953125, -0.39801025390625, -0.3442840576171875, -0.290557861328125, -0.2368316650390625, -0.18310546875, -0.1293792724609375, -0.075653076171875, -0.0219268798828125, 0.03179931640625, 0.0855255126953125, 0.139251708984375, 0.1929779052734375, 0.2467041015625, 0.3004302978515625, 0.354156494140625, 0.4078826904296875, 0.46160888671875, 0.5153350830078125, 0.569061279296875, 0.6227874755859375, 0.676513671875, 0.7302398681640625, 0.783966064453125, 0.8376922607421875, 0.89141845703125, 0.9451446533203125, 0.998870849609375, 1.0525970458984375, 1.1063232421875, 1.1600494384765625, 1.213775634765625, 1.2675018310546875, 1.32122802734375, 1.3749542236328125, 1.428680419921875, 1.4824066162109375, 1.5361328125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 1.0, 7.0, 9.0, 18.0, 20.0, 85.0, 3673.0, 189.0, 30.0, 18.0, 7.0, 8.0, 3.0, 3.0, 2.0, 6.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53271484375, -0.517791748046875, -0.50286865234375, -0.487945556640625, -0.4730224609375, -0.458099365234375, -0.44317626953125, -0.428253173828125, -0.413330078125, -0.398406982421875, -0.38348388671875, -0.368560791015625, -0.3536376953125, -0.338714599609375, -0.32379150390625, -0.308868408203125, -0.2939453125, -0.279022216796875, -0.26409912109375, -0.249176025390625, -0.2342529296875, -0.219329833984375, -0.20440673828125, -0.189483642578125, -0.174560546875, -0.159637451171875, -0.14471435546875, -0.129791259765625, -0.1148681640625, -0.099945068359375, -0.08502197265625, -0.070098876953125, -0.05517578125, -0.040252685546875, -0.02532958984375, -0.010406494140625, 0.0045166015625, 0.019439697265625, 0.03436279296875, 0.049285888671875, 0.064208984375, 0.079132080078125, 0.09405517578125, 0.108978271484375, 0.1239013671875, 0.138824462890625, 0.15374755859375, 0.168670654296875, 0.18359375, 0.198516845703125, 0.21343994140625, 0.228363037109375, 0.2432861328125, 0.258209228515625, 0.27313232421875, 0.288055419921875, 0.302978515625, 0.317901611328125, 0.33282470703125, 0.347747802734375, 0.3626708984375, 0.377593994140625, 0.39251708984375, 0.407440185546875, 0.42236328125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 8.0, 5.0, 10.0, 8.0, 18.0, 27.0, 24.0, 44.0, 73.0, 90.0, 93.0, 109.0, 131.0, 84.0, 87.0, 50.0, 36.0, 32.0, 24.0, 16.0, 8.0, 6.0, 7.0, 6.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0571504831314087, -1.0264272689819336, -0.9957041144371033, -0.964980959892273, -0.9342578053474426, -0.9035346508026123, -0.8728114366531372, -0.8420882821083069, -0.8113651275634766, -0.7806419730186462, -0.7499187588691711, -0.7191956043243408, -0.6884724497795105, -0.6577492952346802, -0.6270260810852051, -0.5963029265403748, -0.5655797719955444, -0.5348566174507141, -0.504133403301239, -0.4734102487564087, -0.44268709421157837, -0.41196390986442566, -0.38124072551727295, -0.3505175709724426, -0.31979435682296753, -0.2890711724758148, -0.2583480179309845, -0.2276248335838318, -0.19690167903900146, -0.16617849469184875, -0.13545532524585724, -0.10473215579986572, -0.0740090012550354, -0.043285831809043884, -0.01256265863776207, 0.018160514533519745, 0.04888368397951126, 0.07960686087608337, 0.11033003032207489, 0.1410531997680664, 0.17177636921405792, 0.20249953866004944, 0.23322270810604095, 0.26394587755203247, 0.2946690618991852, 0.3253922462463379, 0.3561154007911682, 0.38683855533599854, 0.41756173968315125, 0.44828492403030396, 0.4790080785751343, 0.5097312331199646, 0.5404544472694397, 0.57117760181427, 0.6019007563591003, 0.6326239109039307, 0.6633471250534058, 0.6940702795982361, 0.7247934937477112, 0.7555166482925415, 0.7862398028373718, 0.8169629573822021, 0.8476861715316772, 0.8784093260765076, 0.9091324806213379]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 7.0, 3.0, 7.0, 5.0, 12.0, 10.0, 9.0, 14.0, 12.0, 14.0, 28.0, 29.0, 16.0, 27.0, 32.0, 29.0, 43.0, 27.0, 38.0, 40.0, 40.0, 34.0, 48.0, 52.0, 35.0, 43.0, 40.0, 33.0, 43.0, 39.0, 24.0, 30.0, 23.0, 22.0, 13.0, 20.0, 19.0, 11.0, 8.0, 11.0, 3.0, 7.0, 3.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.5670897960662842, -0.5485234260559082, -0.5299570560455322, -0.5113906860351562, -0.4928243160247803, -0.4742579460144043, -0.45569154620170593, -0.43712517619132996, -0.418558806180954, -0.399992436170578, -0.381426066160202, -0.36285969614982605, -0.3442932963371277, -0.3257269263267517, -0.30716055631637573, -0.28859418630599976, -0.2700278162956238, -0.2514614462852478, -0.23289507627487183, -0.21432869136333466, -0.19576232135295868, -0.1771959513425827, -0.15862956643104553, -0.14006319642066956, -0.12149682641029358, -0.1029304563999176, -0.08436407893896103, -0.06579770147800446, -0.04723133146762848, -0.028664961457252502, -0.010098583996295929, 0.008467793464660645, 0.027034103870391846, 0.04560047760605812, 0.0641668513417244, 0.08273322880268097, 0.10129959881305695, 0.11986596882343292, 0.1384323537349701, 0.15699872374534607, 0.17556509375572205, 0.19413146376609802, 0.212697833776474, 0.23126421868801117, 0.24983058869838715, 0.2683969736099243, 0.2869633436203003, 0.30552971363067627, 0.32409608364105225, 0.3426624536514282, 0.3612288236618042, 0.3797951936721802, 0.39836156368255615, 0.41692793369293213, 0.4354943335056305, 0.45406070351600647, 0.47262707352638245, 0.4911934435367584, 0.5097598433494568, 0.5283262133598328, 0.5468925833702087, 0.5654589533805847, 0.5840253233909607, 0.6025916934013367, 0.6211580634117126]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 5.0, 6.0, 9.0, 15.0, 30.0, 34.0, 58.0, 89.0, 181.0, 347.0, 560.0, 1013.0, 1973.0, 4013.0, 8240.0, 18621.0, 47117.0, 144742.0, 395093.0, 282105.0, 88009.0, 31174.0, 12979.0, 5871.0, 2983.0, 1486.0, 800.0, 451.0, 219.0, 138.0, 73.0, 41.0, 38.0, 16.0, 10.0, 8.0, 6.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4248046875, -0.4110069274902344, -0.39720916748046875, -0.3834114074707031, -0.3696136474609375, -0.3558158874511719, -0.34201812744140625, -0.3282203674316406, -0.314422607421875, -0.3006248474121094, -0.28682708740234375, -0.2730293273925781, -0.2592315673828125, -0.24543380737304688, -0.23163604736328125, -0.21783828735351562, -0.20404052734375, -0.19024276733398438, -0.17644500732421875, -0.16264724731445312, -0.1488494873046875, -0.13505172729492188, -0.12125396728515625, -0.10745620727539062, -0.093658447265625, -0.07986068725585938, -0.06606292724609375, -0.052265167236328125, -0.0384674072265625, -0.024669647216796875, -0.01087188720703125, 0.002925872802734375, 0.0167236328125, 0.030521392822265625, 0.04431915283203125, 0.058116912841796875, 0.0719146728515625, 0.08571243286132812, 0.09951019287109375, 0.11330795288085938, 0.127105712890625, 0.14090347290039062, 0.15470123291015625, 0.16849899291992188, 0.1822967529296875, 0.19609451293945312, 0.20989227294921875, 0.22369003295898438, 0.23748779296875, 0.2512855529785156, 0.26508331298828125, 0.2788810729980469, 0.2926788330078125, 0.3064765930175781, 0.32027435302734375, 0.3340721130371094, 0.347869873046875, 0.3616676330566406, 0.37546539306640625, 0.3892631530761719, 0.4030609130859375, 0.4168586730957031, 0.43065643310546875, 0.4444541931152344, 0.458251953125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 2.0, 3.0, 10.0, 8.0, 7.0, 17.0, 13.0, 22.0, 32.0, 13.0, 31.0, 42.0, 48.0, 43.0, 45.0, 44.0, 57.0, 55.0, 58.0, 52.0, 52.0, 67.0, 47.0, 62.0, 33.0, 26.0, 21.0, 21.0, 14.0, 17.0, 13.0, 9.0, 1.0, 7.0, 4.0, 4.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.2374267578125, -0.23132705688476562, -0.22522735595703125, -0.21912765502929688, -0.2130279541015625, -0.20692825317382812, -0.20082855224609375, -0.19472885131835938, -0.188629150390625, -0.18252944946289062, -0.17642974853515625, -0.17033004760742188, -0.1642303466796875, -0.15813064575195312, -0.15203094482421875, -0.14593124389648438, -0.13983154296875, -0.13373184204101562, -0.12763214111328125, -0.12153244018554688, -0.1154327392578125, -0.10933303833007812, -0.10323333740234375, -0.09713363647460938, -0.091033935546875, -0.08493423461914062, -0.07883453369140625, -0.07273483276367188, -0.0666351318359375, -0.060535430908203125, -0.05443572998046875, -0.048336029052734375, -0.042236328125, -0.036136627197265625, -0.03003692626953125, -0.023937225341796875, -0.0178375244140625, -0.011737823486328125, -0.00563812255859375, 0.000461578369140625, 0.006561279296875, 0.012660980224609375, 0.01876068115234375, 0.024860382080078125, 0.0309600830078125, 0.037059783935546875, 0.04315948486328125, 0.049259185791015625, 0.05535888671875, 0.061458587646484375, 0.06755828857421875, 0.07365798950195312, 0.0797576904296875, 0.08585739135742188, 0.09195709228515625, 0.09805679321289062, 0.104156494140625, 0.11025619506835938, 0.11635589599609375, 0.12245559692382812, 0.1285552978515625, 0.13465499877929688, 0.14075469970703125, 0.14685440063476562, 0.1529541015625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 6.0, 7.0, 3.0, 11.0, 14.0, 14.0, 20.0, 34.0, 60.0, 101.0, 116.0, 241.0, 370.0, 662.0, 1615.0, 4415.0, 17222.0, 130962.0, 765196.0, 105614.0, 14859.0, 3981.0, 1505.0, 644.0, 337.0, 193.0, 119.0, 60.0, 54.0, 35.0, 20.0, 19.0, 12.0, 8.0, 8.0, 3.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.748046875, -0.7208023071289062, -0.6935577392578125, -0.6663131713867188, -0.639068603515625, -0.6118240356445312, -0.5845794677734375, -0.5573348999023438, -0.53009033203125, -0.5028457641601562, -0.4756011962890625, -0.44835662841796875, -0.421112060546875, -0.39386749267578125, -0.3666229248046875, -0.33937835693359375, -0.3121337890625, -0.28488922119140625, -0.2576446533203125, -0.23040008544921875, -0.203155517578125, -0.17591094970703125, -0.1486663818359375, -0.12142181396484375, -0.09417724609375, -0.06693267822265625, -0.0396881103515625, -0.01244354248046875, 0.014801025390625, 0.04204559326171875, 0.0692901611328125, 0.09653472900390625, 0.123779296875, 0.15102386474609375, 0.1782684326171875, 0.20551300048828125, 0.232757568359375, 0.26000213623046875, 0.2872467041015625, 0.31449127197265625, 0.34173583984375, 0.36898040771484375, 0.3962249755859375, 0.42346954345703125, 0.450714111328125, 0.47795867919921875, 0.5052032470703125, 0.5324478149414062, 0.5596923828125, 0.5869369506835938, 0.6141815185546875, 0.6414260864257812, 0.668670654296875, 0.6959152221679688, 0.7231597900390625, 0.7504043579101562, 0.77764892578125, 0.8048934936523438, 0.8321380615234375, 0.8593826293945312, 0.886627197265625, 0.9138717651367188, 0.9411163330078125, 0.9683609008789062, 0.99560546875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 7.0, 6.0, 11.0, 12.0, 15.0, 16.0, 13.0, 31.0, 25.0, 24.0, 41.0, 36.0, 45.0, 47.0, 49.0, 71.0, 57.0, 52.0, 59.0, 61.0, 45.0, 45.0, 54.0, 27.0, 25.0, 27.0, 28.0, 17.0, 19.0, 10.0, 8.0, 5.0, 8.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.1357421875, -1.1058578491210938, -1.0759735107421875, -1.0460891723632812, -1.016204833984375, -0.9863204956054688, -0.9564361572265625, -0.9265518188476562, -0.89666748046875, -0.8667831420898438, -0.8368988037109375, -0.8070144653320312, -0.777130126953125, -0.7472457885742188, -0.7173614501953125, -0.6874771118164062, -0.6575927734375, -0.6277084350585938, -0.5978240966796875, -0.5679397583007812, -0.538055419921875, -0.5081710815429688, -0.4782867431640625, -0.44840240478515625, -0.41851806640625, -0.38863372802734375, -0.3587493896484375, -0.32886505126953125, -0.298980712890625, -0.26909637451171875, -0.2392120361328125, -0.20932769775390625, -0.179443359375, -0.14955902099609375, -0.1196746826171875, -0.08979034423828125, -0.059906005859375, -0.03002166748046875, -0.0001373291015625, 0.02974700927734375, 0.05963134765625, 0.08951568603515625, 0.1194000244140625, 0.14928436279296875, 0.179168701171875, 0.20905303955078125, 0.2389373779296875, 0.26882171630859375, 0.2987060546875, 0.32859039306640625, 0.3584747314453125, 0.38835906982421875, 0.418243408203125, 0.44812774658203125, 0.4780120849609375, 0.5078964233398438, 0.53778076171875, 0.5676651000976562, 0.5975494384765625, 0.6274337768554688, 0.657318115234375, 0.6872024536132812, 0.7170867919921875, 0.7469711303710938, 0.77685546875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 8.0, 11.0, 10.0, 17.0, 26.0, 51.0, 67.0, 109.0, 169.0, 247.0, 406.0, 814.0, 1728.0, 4718.0, 18604.0, 134708.0, 730058.0, 130443.0, 17943.0, 4717.0, 1695.0, 823.0, 437.0, 251.0, 166.0, 121.0, 65.0, 29.0, 14.0, 29.0, 29.0, 12.0, 15.0, 2.0, 3.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.394775390625, -0.3813896179199219, -0.36800384521484375, -0.3546180725097656, -0.3412322998046875, -0.3278465270996094, -0.31446075439453125, -0.3010749816894531, -0.287689208984375, -0.2743034362792969, -0.26091766357421875, -0.24753189086914062, -0.2341461181640625, -0.22076034545898438, -0.20737457275390625, -0.19398880004882812, -0.18060302734375, -0.16721725463867188, -0.15383148193359375, -0.14044570922851562, -0.1270599365234375, -0.11367416381835938, -0.10028839111328125, -0.08690261840820312, -0.073516845703125, -0.060131072998046875, -0.04674530029296875, -0.033359527587890625, -0.0199737548828125, -0.006587982177734375, 0.00679779052734375, 0.020183563232421875, 0.0335693359375, 0.046955108642578125, 0.06034088134765625, 0.07372665405273438, 0.0871124267578125, 0.10049819946289062, 0.11388397216796875, 0.12726974487304688, 0.140655517578125, 0.15404129028320312, 0.16742706298828125, 0.18081283569335938, 0.1941986083984375, 0.20758438110351562, 0.22097015380859375, 0.23435592651367188, 0.24774169921875, 0.2611274719238281, 0.27451324462890625, 0.2878990173339844, 0.3012847900390625, 0.3146705627441406, 0.32805633544921875, 0.3414421081542969, 0.354827880859375, 0.3682136535644531, 0.38159942626953125, 0.3949851989746094, 0.4083709716796875, 0.4217567443847656, 0.43514251708984375, 0.4485282897949219, 0.4619140625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 8.0, 2.0, 9.0, 10.0, 16.0, 39.0, 45.0, 72.0, 96.0, 119.0, 150.0, 103.0, 102.0, 70.0, 45.0, 32.0, 35.0, 17.0, 9.0, 8.0, 3.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00010126829147338867, -9.826663881540298e-05, -9.52649861574173e-05, -9.226333349943161e-05, -8.926168084144592e-05, -8.626002818346024e-05, -8.325837552547455e-05, -8.025672286748886e-05, -7.725507020950317e-05, -7.425341755151749e-05, -7.12517648935318e-05, -6.825011223554611e-05, -6.524845957756042e-05, -6.224680691957474e-05, -5.924515426158905e-05, -5.624350160360336e-05, -5.3241848945617676e-05, -5.024019628763199e-05, -4.72385436296463e-05, -4.4236890971660614e-05, -4.123523831367493e-05, -3.823358565568924e-05, -3.523193299770355e-05, -3.2230280339717865e-05, -2.9228627681732178e-05, -2.622697502374649e-05, -2.3225322365760803e-05, -2.0223669707775116e-05, -1.722201704978943e-05, -1.4220364391803741e-05, -1.1218711733818054e-05, -8.217059075832367e-06, -5.21540641784668e-06, -2.2137537598609924e-06, 7.878988981246948e-07, 3.789551556110382e-06, 6.791204214096069e-06, 9.792856872081757e-06, 1.2794509530067444e-05, 1.579616218805313e-05, 1.879781484603882e-05, 2.1799467504024506e-05, 2.4801120162010193e-05, 2.780277281999588e-05, 3.080442547798157e-05, 3.3806078135967255e-05, 3.680773079395294e-05, 3.980938345193863e-05, 4.2811036109924316e-05, 4.5812688767910004e-05, 4.881434142589569e-05, 5.181599408388138e-05, 5.4817646741867065e-05, 5.781929939985275e-05, 6.082095205783844e-05, 6.382260471582413e-05, 6.682425737380981e-05, 6.98259100317955e-05, 7.282756268978119e-05, 7.582921534776688e-05, 7.883086800575256e-05, 8.183252066373825e-05, 8.483417332172394e-05, 8.783582597970963e-05, 9.083747863769531e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 3.0, 1.0, 3.0, 7.0, 13.0, 15.0, 25.0, 31.0, 39.0, 94.0, 103.0, 214.0, 372.0, 693.0, 1408.0, 3473.0, 12579.0, 80242.0, 712014.0, 205298.0, 22494.0, 5440.0, 1934.0, 938.0, 444.0, 268.0, 143.0, 87.0, 54.0, 38.0, 36.0, 16.0, 13.0, 8.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.455078125, -0.44024658203125, -0.4254150390625, -0.41058349609375, -0.395751953125, -0.38092041015625, -0.3660888671875, -0.35125732421875, -0.33642578125, -0.32159423828125, -0.3067626953125, -0.29193115234375, -0.277099609375, -0.26226806640625, -0.2474365234375, -0.23260498046875, -0.2177734375, -0.20294189453125, -0.1881103515625, -0.17327880859375, -0.158447265625, -0.14361572265625, -0.1287841796875, -0.11395263671875, -0.09912109375, -0.08428955078125, -0.0694580078125, -0.05462646484375, -0.039794921875, -0.02496337890625, -0.0101318359375, 0.00469970703125, 0.01953125, 0.03436279296875, 0.0491943359375, 0.06402587890625, 0.078857421875, 0.09368896484375, 0.1085205078125, 0.12335205078125, 0.13818359375, 0.15301513671875, 0.1678466796875, 0.18267822265625, 0.197509765625, 0.21234130859375, 0.2271728515625, 0.24200439453125, 0.2568359375, 0.27166748046875, 0.2864990234375, 0.30133056640625, 0.316162109375, 0.33099365234375, 0.3458251953125, 0.36065673828125, 0.37548828125, 0.39031982421875, 0.4051513671875, 0.41998291015625, 0.434814453125, 0.44964599609375, 0.4644775390625, 0.47930908203125, 0.494140625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 8.0, 11.0, 19.0, 25.0, 25.0, 61.0, 82.0, 103.0, 128.0, 132.0, 118.0, 92.0, 67.0, 45.0, 36.0, 17.0, 12.0, 11.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.460693359375, -0.4444541931152344, -0.42821502685546875, -0.4119758605957031, -0.3957366943359375, -0.3794975280761719, -0.36325836181640625, -0.3470191955566406, -0.330780029296875, -0.3145408630371094, -0.29830169677734375, -0.2820625305175781, -0.2658233642578125, -0.24958419799804688, -0.23334503173828125, -0.21710586547851562, -0.20086669921875, -0.18462753295898438, -0.16838836669921875, -0.15214920043945312, -0.1359100341796875, -0.11967086791992188, -0.10343170166015625, -0.08719253540039062, -0.070953369140625, -0.054714202880859375, -0.03847503662109375, -0.022235870361328125, -0.0059967041015625, 0.010242462158203125, 0.02648162841796875, 0.042720794677734375, 0.0589599609375, 0.07519912719726562, 0.09143829345703125, 0.10767745971679688, 0.1239166259765625, 0.14015579223632812, 0.15639495849609375, 0.17263412475585938, 0.188873291015625, 0.20511245727539062, 0.22135162353515625, 0.23759078979492188, 0.2538299560546875, 0.2700691223144531, 0.28630828857421875, 0.3025474548339844, 0.31878662109375, 0.3350257873535156, 0.35126495361328125, 0.3675041198730469, 0.3837432861328125, 0.3999824523925781, 0.41622161865234375, 0.4324607849121094, 0.448699951171875, 0.4649391174316406, 0.48117828369140625, 0.4974174499511719, 0.5136566162109375, 0.5298957824707031, 0.5461349487304688, 0.5623741149902344, 0.57861328125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 8.0, 20.0, 87.0, 272.0, 361.0, 193.0, 51.0, 14.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.31913423538208, -3.7977378368377686, -3.276341438293457, -2.7549452781677246, -2.233548879623413, -1.7121524810791016, -1.1907563209533691, -0.6693599224090576, -0.1479635238647461, 0.37343281507492065, 0.8948291540145874, 1.4162254333496094, 1.937621831893921, 2.4590182304382324, 2.980414390563965, 3.5018107891082764, 4.023207187652588, 4.54460334777832, 5.065999984741211, 5.587396144866943, 6.108792304992676, 6.630188941955566, 7.151585102081299, 7.672981262207031, 8.194377899169922, 8.715774536132812, 9.237170219421387, 9.758566856384277, 10.279963493347168, 10.801359176635742, 11.322755813598633, 11.844152450561523, 12.365547180175781, 12.886943817138672, 13.408339500427246, 13.929736137390137, 14.451132774353027, 14.972528457641602, 15.493925094604492, 16.015321731567383, 16.536718368530273, 17.058115005493164, 17.579511642456055, 18.100906372070312, 18.622303009033203, 19.143699645996094, 19.665096282958984, 20.186492919921875, 20.707889556884766, 21.229286193847656, 21.750682830810547, 22.272079467773438, 22.793474197387695, 23.314870834350586, 23.836267471313477, 24.357664108276367, 24.879058837890625, 25.400455474853516, 25.921852111816406, 26.443248748779297, 26.964643478393555, 27.486040115356445, 28.007436752319336, 28.528833389282227, 29.050230026245117]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 8.0, 4.0, 8.0, 8.0, 17.0, 17.0, 26.0, 18.0, 30.0, 27.0, 28.0, 45.0, 39.0, 70.0, 54.0, 52.0, 60.0, 60.0, 44.0, 55.0, 48.0, 40.0, 38.0, 31.0, 32.0, 27.0, 20.0, 19.0, 16.0, 12.0, 14.0, 8.0, 5.0, 3.0, 7.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-5.067383766174316, -4.918712615966797, -4.770041465759277, -4.621370315551758, -4.472699165344238, -4.3240275382995605, -4.175356388092041, -4.0266852378845215, -3.878014087677002, -3.7293429374694824, -3.580671787261963, -3.4320003986358643, -3.2833292484283447, -3.134658098220825, -2.9859867095947266, -2.837315559387207, -2.6886444091796875, -2.539973258972168, -2.3913021087646484, -2.24263072013855, -2.0939595699310303, -1.9452884197235107, -1.7966171503067017, -1.6479458808898926, -1.499274730682373, -1.3506035804748535, -1.2019323110580444, -1.0532610416412354, -0.9045898914337158, -0.7559186816215515, -0.6072474718093872, -0.4585762023925781, -0.3099050521850586, -0.1612338423728943, -0.01256263256072998, 0.13610857725143433, 0.28477978706359863, 0.43345099687576294, 0.5821222066879272, 0.7307934761047363, 0.8794646263122559, 1.0281357765197754, 1.1768070459365845, 1.3254783153533936, 1.474149465560913, 1.6228206157684326, 1.7714918851852417, 1.9201631546020508, 2.0688343048095703, 2.21750545501709, 2.3661766052246094, 2.514847993850708, 2.6635191440582275, 2.812190294265747, 2.9608616828918457, 3.1095328330993652, 3.2582039833068848, 3.4068751335144043, 3.555546283721924, 3.7042176723480225, 3.852888822555542, 4.001560211181641, 4.15023136138916, 4.29890251159668, 4.447573661804199]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 7.0, 10.0, 10.0, 7.0, 19.0, 23.0, 37.0, 36.0, 64.0, 123.0, 151.0, 245.0, 433.0, 739.0, 1639.0, 4853.0, 44110.0, 4126263.0, 10418.0, 2590.0, 1060.0, 527.0, 310.0, 194.0, 115.0, 88.0, 64.0, 50.0, 31.0, 25.0, 17.0, 14.0, 5.0, 6.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2314453125, -1.1907196044921875, -1.149993896484375, -1.1092681884765625, -1.06854248046875, -1.0278167724609375, -0.987091064453125, -0.9463653564453125, -0.9056396484375, -0.8649139404296875, -0.824188232421875, -0.7834625244140625, -0.74273681640625, -0.7020111083984375, -0.661285400390625, -0.6205596923828125, -0.579833984375, -0.5391082763671875, -0.498382568359375, -0.4576568603515625, -0.41693115234375, -0.3762054443359375, -0.335479736328125, -0.2947540283203125, -0.2540283203125, -0.2133026123046875, -0.172576904296875, -0.1318511962890625, -0.09112548828125, -0.0503997802734375, -0.009674072265625, 0.0310516357421875, 0.07177734375, 0.1125030517578125, 0.153228759765625, 0.1939544677734375, 0.23468017578125, 0.2754058837890625, 0.316131591796875, 0.3568572998046875, 0.3975830078125, 0.4383087158203125, 0.479034423828125, 0.5197601318359375, 0.56048583984375, 0.6012115478515625, 0.641937255859375, 0.6826629638671875, 0.723388671875, 0.7641143798828125, 0.804840087890625, 0.8455657958984375, 0.88629150390625, 0.9270172119140625, 0.967742919921875, 1.0084686279296875, 1.0491943359375, 1.0899200439453125, 1.130645751953125, 1.1713714599609375, 1.21209716796875, 1.2528228759765625, 1.293548583984375, 1.3342742919921875, 1.375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 1.0, 5.0, 2.0, 7.0, 1.0, 5.0, 6.0, 8.0, 20.0, 14.0, 18.0, 17.0, 33.0, 28.0, 40.0, 32.0, 53.0, 43.0, 62.0, 61.0, 64.0, 48.0, 45.0, 61.0, 52.0, 48.0, 51.0, 36.0, 27.0, 25.0, 22.0, 14.0, 12.0, 10.0, 6.0, 12.0, 5.0, 4.0, 4.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.20703125, -0.2007007598876953, -0.19437026977539062, -0.18803977966308594, -0.18170928955078125, -0.17537879943847656, -0.16904830932617188, -0.1627178192138672, -0.1563873291015625, -0.1500568389892578, -0.14372634887695312, -0.13739585876464844, -0.13106536865234375, -0.12473487854003906, -0.11840438842773438, -0.11207389831542969, -0.105743408203125, -0.09941291809082031, -0.09308242797851562, -0.08675193786621094, -0.08042144775390625, -0.07409095764160156, -0.06776046752929688, -0.06142997741699219, -0.0550994873046875, -0.04876899719238281, -0.042438507080078125, -0.03610801696777344, -0.02977752685546875, -0.023447036743164062, -0.017116546630859375, -0.010786056518554688, -0.00445556640625, 0.0018749237060546875, 0.008205413818359375, 0.014535903930664062, 0.02086639404296875, 0.027196884155273438, 0.033527374267578125, 0.03985786437988281, 0.0461883544921875, 0.05251884460449219, 0.058849334716796875, 0.06517982482910156, 0.07151031494140625, 0.07784080505371094, 0.08417129516601562, 0.09050178527832031, 0.096832275390625, 0.10316276550292969, 0.10949325561523438, 0.11582374572753906, 0.12215423583984375, 0.12848472595214844, 0.13481521606445312, 0.1411457061767578, 0.1474761962890625, 0.1538066864013672, 0.16013717651367188, 0.16646766662597656, 0.17279815673828125, 0.17912864685058594, 0.18545913696289062, 0.1917896270751953, 0.1981201171875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 6.0, 13.0, 24.0, 13.0, 39.0, 44.0, 68.0, 132.0, 154.0, 257.0, 360.0, 552.0, 869.0, 1260.0, 2133.0, 3649.0, 7864.0, 30385.0, 4072336.0, 53173.0, 10068.0, 4238.0, 2381.0, 1428.0, 942.0, 610.0, 452.0, 279.0, 173.0, 116.0, 101.0, 60.0, 30.0, 29.0, 13.0, 14.0, 7.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.0625, -1.0326690673828125, -1.002838134765625, -0.9730072021484375, -0.94317626953125, -0.9133453369140625, -0.883514404296875, -0.8536834716796875, -0.8238525390625, -0.7940216064453125, -0.764190673828125, -0.7343597412109375, -0.70452880859375, -0.6746978759765625, -0.644866943359375, -0.6150360107421875, -0.585205078125, -0.5553741455078125, -0.525543212890625, -0.4957122802734375, -0.46588134765625, -0.4360504150390625, -0.406219482421875, -0.3763885498046875, -0.3465576171875, -0.3167266845703125, -0.286895751953125, -0.2570648193359375, -0.22723388671875, -0.1974029541015625, -0.167572021484375, -0.1377410888671875, -0.10791015625, -0.0780792236328125, -0.048248291015625, -0.0184173583984375, 0.01141357421875, 0.0412445068359375, 0.071075439453125, 0.1009063720703125, 0.1307373046875, 0.1605682373046875, 0.190399169921875, 0.2202301025390625, 0.25006103515625, 0.2798919677734375, 0.309722900390625, 0.3395538330078125, 0.369384765625, 0.3992156982421875, 0.429046630859375, 0.4588775634765625, 0.48870849609375, 0.5185394287109375, 0.548370361328125, 0.5782012939453125, 0.6080322265625, 0.6378631591796875, 0.667694091796875, 0.6975250244140625, 0.72735595703125, 0.7571868896484375, 0.787017822265625, 0.8168487548828125, 0.8466796875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 6.0, 4.0, 5.0, 10.0, 25.0, 29.0, 222.0, 3597.0, 79.0, 32.0, 15.0, 16.0, 4.0, 7.0, 1.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.248779296875, -0.24190711975097656, -0.23503494262695312, -0.2281627655029297, -0.22129058837890625, -0.2144184112548828, -0.20754623413085938, -0.20067405700683594, -0.1938018798828125, -0.18692970275878906, -0.18005752563476562, -0.1731853485107422, -0.16631317138671875, -0.1594409942626953, -0.15256881713867188, -0.14569664001464844, -0.138824462890625, -0.13195228576660156, -0.12508010864257812, -0.11820793151855469, -0.11133575439453125, -0.10446357727050781, -0.09759140014648438, -0.09071922302246094, -0.0838470458984375, -0.07697486877441406, -0.07010269165039062, -0.06323051452636719, -0.05635833740234375, -0.04948616027832031, -0.042613983154296875, -0.03574180603027344, -0.02886962890625, -0.021997451782226562, -0.015125274658203125, -0.008253097534179688, -0.00138092041015625, 0.0054912567138671875, 0.012363433837890625, 0.019235610961914062, 0.0261077880859375, 0.03297996520996094, 0.039852142333984375, 0.04672431945800781, 0.05359649658203125, 0.06046867370605469, 0.06734085083007812, 0.07421302795410156, 0.081085205078125, 0.08795738220214844, 0.09482955932617188, 0.10170173645019531, 0.10857391357421875, 0.11544609069824219, 0.12231826782226562, 0.12919044494628906, 0.1360626220703125, 0.14293479919433594, 0.14980697631835938, 0.1566791534423828, 0.16355133056640625, 0.1704235076904297, 0.17729568481445312, 0.18416786193847656, 0.1910400390625]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 4.0, 8.0, 12.0, 25.0, 23.0, 33.0, 53.0, 70.0, 71.0, 96.0, 114.0, 121.0, 84.0, 80.0, 68.0, 47.0, 34.0, 27.0, 9.0, 4.0, 4.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6498937010765076, -0.624650239944458, -0.5994067788124084, -0.5741633176803589, -0.5489199161529541, -0.5236764550209045, -0.498432993888855, -0.4731895327568054, -0.44794610142707825, -0.4227026402950287, -0.3974592089653015, -0.37221574783325195, -0.3469722867012024, -0.3217288553714752, -0.29648539423942566, -0.2712419629096985, -0.24599850177764893, -0.22075505554676056, -0.1955116093158722, -0.17026814818382263, -0.14502470195293427, -0.1197812557220459, -0.09453779458999634, -0.06929434835910797, -0.044050902128219604, -0.01880745217204094, 0.006435997784137726, 0.03167945146560669, 0.056922897696495056, 0.08216634392738342, 0.10740980505943298, 0.13265325129032135, 0.15789663791656494, 0.1831400841474533, 0.20838353037834167, 0.23362699151039124, 0.2588704228401184, 0.28411388397216797, 0.30935734510421753, 0.3346008062362671, 0.35984423756599426, 0.3850876986980438, 0.410331130027771, 0.43557459115982056, 0.4608180522918701, 0.4860614836215973, 0.5113049745559692, 0.536548376083374, 0.5617918372154236, 0.5870352983474731, 0.6122787594795227, 0.6375222206115723, 0.662765622138977, 0.6880090832710266, 0.7132525444030762, 0.7384960055351257, 0.7637394666671753, 0.7889829277992249, 0.8142263889312744, 0.8394697904586792, 0.8647132515907288, 0.8899567127227783, 0.9152001738548279, 0.9404436349868774, 0.9656870365142822]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 4.0, 3.0, 4.0, 4.0, 8.0, 4.0, 16.0, 19.0, 13.0, 9.0, 13.0, 13.0, 24.0, 23.0, 23.0, 17.0, 33.0, 43.0, 33.0, 36.0, 34.0, 40.0, 37.0, 49.0, 41.0, 39.0, 38.0, 27.0, 33.0, 33.0, 38.0, 33.0, 34.0, 25.0, 19.0, 22.0, 15.0, 20.0, 13.0, 11.0, 12.0, 13.0, 7.0, 8.0, 5.0, 7.0, 1.0, 6.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.3959835171699524, -0.38427460193634033, -0.37256571650505066, -0.360856831073761, -0.3491479158401489, -0.33743900060653687, -0.3257301151752472, -0.3140212297439575, -0.30231231451034546, -0.2906033992767334, -0.2788945138454437, -0.26718562841415405, -0.255476713180542, -0.24376781284809113, -0.23205891251564026, -0.2203500121831894, -0.20864111185073853, -0.19693221151828766, -0.1852233111858368, -0.17351441085338593, -0.16180551052093506, -0.1500966101884842, -0.13838770985603333, -0.12667880952358246, -0.11496990919113159, -0.10326100885868073, -0.09155210852622986, -0.07984320819377899, -0.06813430786132812, -0.05642540752887726, -0.04471650719642639, -0.033007606863975525, -0.021298706531524658, -0.009589806199073792, 0.002119094133377075, 0.013827994465827942, 0.02553689479827881, 0.037245795130729675, 0.04895469546318054, 0.06066359579563141, 0.07237249612808228, 0.08408139646053314, 0.09579029679298401, 0.10749919712543488, 0.11920809745788574, 0.1309169977903366, 0.14262589812278748, 0.15433479845523834, 0.1660436987876892, 0.17775259912014008, 0.18946149945259094, 0.2011703997850418, 0.21287930011749268, 0.22458820044994354, 0.2362971007823944, 0.24800600111484528, 0.25971490144729614, 0.2714238166809082, 0.2831327021121979, 0.29484158754348755, 0.3065505027770996, 0.31825941801071167, 0.32996830344200134, 0.341677188873291, 0.3533861041069031]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 5.0, 4.0, 4.0, 12.0, 6.0, 13.0, 18.0, 22.0, 24.0, 35.0, 51.0, 73.0, 95.0, 160.0, 235.0, 354.0, 612.0, 1013.0, 1840.0, 3624.0, 7221.0, 16232.0, 39815.0, 103427.0, 267419.0, 350156.0, 153904.0, 58530.0, 23257.0, 9990.0, 4711.0, 2399.0, 1292.0, 730.0, 441.0, 273.0, 183.0, 107.0, 76.0, 56.0, 40.0, 30.0, 22.0, 15.0, 10.0, 7.0, 7.0, 4.0, 6.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.363525390625, -0.35257720947265625, -0.3416290283203125, -0.33068084716796875, -0.319732666015625, -0.30878448486328125, -0.2978363037109375, -0.28688812255859375, -0.27593994140625, -0.26499176025390625, -0.2540435791015625, -0.24309539794921875, -0.232147216796875, -0.22119903564453125, -0.2102508544921875, -0.19930267333984375, -0.1883544921875, -0.17740631103515625, -0.1664581298828125, -0.15550994873046875, -0.144561767578125, -0.13361358642578125, -0.1226654052734375, -0.11171722412109375, -0.10076904296875, -0.08982086181640625, -0.0788726806640625, -0.06792449951171875, -0.056976318359375, -0.04602813720703125, -0.0350799560546875, -0.02413177490234375, -0.01318359375, -0.00223541259765625, 0.0087127685546875, 0.01966094970703125, 0.030609130859375, 0.04155731201171875, 0.0525054931640625, 0.06345367431640625, 0.07440185546875, 0.08535003662109375, 0.0962982177734375, 0.10724639892578125, 0.118194580078125, 0.12914276123046875, 0.1400909423828125, 0.15103912353515625, 0.1619873046875, 0.17293548583984375, 0.1838836669921875, 0.19483184814453125, 0.205780029296875, 0.21672821044921875, 0.2276763916015625, 0.23862457275390625, 0.24957275390625, 0.26052093505859375, 0.2714691162109375, 0.28241729736328125, 0.293365478515625, 0.30431365966796875, 0.3152618408203125, 0.32621002197265625, 0.337158203125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 6.0, 2.0, 5.0, 5.0, 5.0, 6.0, 10.0, 12.0, 11.0, 12.0, 12.0, 15.0, 21.0, 23.0, 27.0, 33.0, 28.0, 31.0, 32.0, 54.0, 58.0, 46.0, 45.0, 38.0, 58.0, 46.0, 42.0, 47.0, 41.0, 32.0, 29.0, 29.0, 20.0, 21.0, 16.0, 13.0, 13.0, 12.0, 14.0, 5.0, 11.0, 6.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1837158203125, -0.17815017700195312, -0.17258453369140625, -0.16701889038085938, -0.1614532470703125, -0.15588760375976562, -0.15032196044921875, -0.14475631713867188, -0.139190673828125, -0.13362503051757812, -0.12805938720703125, -0.12249374389648438, -0.1169281005859375, -0.11136245727539062, -0.10579681396484375, -0.10023117065429688, -0.09466552734375, -0.08909988403320312, -0.08353424072265625, -0.07796859741210938, -0.0724029541015625, -0.06683731079101562, -0.06127166748046875, -0.055706024169921875, -0.050140380859375, -0.044574737548828125, -0.03900909423828125, -0.033443450927734375, -0.0278778076171875, -0.022312164306640625, -0.01674652099609375, -0.011180877685546875, -0.005615234375, -4.9591064453125e-05, 0.00551605224609375, 0.011081695556640625, 0.0166473388671875, 0.022212982177734375, 0.02777862548828125, 0.033344268798828125, 0.038909912109375, 0.044475555419921875, 0.05004119873046875, 0.055606842041015625, 0.0611724853515625, 0.06673812866210938, 0.07230377197265625, 0.07786941528320312, 0.08343505859375, 0.08900070190429688, 0.09456634521484375, 0.10013198852539062, 0.1056976318359375, 0.11126327514648438, 0.11682891845703125, 0.12239456176757812, 0.127960205078125, 0.13352584838867188, 0.13909149169921875, 0.14465713500976562, 0.1502227783203125, 0.15578842163085938, 0.16135406494140625, 0.16691970825195312, 0.1724853515625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 3.0, 6.0, 6.0, 8.0, 7.0, 8.0, 9.0, 22.0, 25.0, 29.0, 39.0, 49.0, 96.0, 102.0, 194.0, 288.0, 450.0, 731.0, 1457.0, 3450.0, 10922.0, 56817.0, 546957.0, 371302.0, 40953.0, 8539.0, 2812.0, 1307.0, 662.0, 457.0, 267.0, 163.0, 117.0, 74.0, 68.0, 37.0, 24.0, 23.0, 11.0, 11.0, 17.0, 10.0, 5.0, 9.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 4.0], "bins": [-0.5830078125, -0.56414794921875, -0.5452880859375, -0.52642822265625, -0.507568359375, -0.48870849609375, -0.4698486328125, -0.45098876953125, -0.43212890625, -0.41326904296875, -0.3944091796875, -0.37554931640625, -0.356689453125, -0.33782958984375, -0.3189697265625, -0.30010986328125, -0.28125, -0.26239013671875, -0.2435302734375, -0.22467041015625, -0.205810546875, -0.18695068359375, -0.1680908203125, -0.14923095703125, -0.13037109375, -0.11151123046875, -0.0926513671875, -0.07379150390625, -0.054931640625, -0.03607177734375, -0.0172119140625, 0.00164794921875, 0.0205078125, 0.03936767578125, 0.0582275390625, 0.07708740234375, 0.095947265625, 0.11480712890625, 0.1336669921875, 0.15252685546875, 0.17138671875, 0.19024658203125, 0.2091064453125, 0.22796630859375, 0.246826171875, 0.26568603515625, 0.2845458984375, 0.30340576171875, 0.322265625, 0.34112548828125, 0.3599853515625, 0.37884521484375, 0.397705078125, 0.41656494140625, 0.4354248046875, 0.45428466796875, 0.47314453125, 0.49200439453125, 0.5108642578125, 0.52972412109375, 0.548583984375, 0.56744384765625, 0.5863037109375, 0.60516357421875, 0.6240234375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 7.0, 4.0, 4.0, 10.0, 13.0, 14.0, 10.0, 18.0, 21.0, 24.0, 24.0, 42.0, 40.0, 42.0, 36.0, 49.0, 38.0, 49.0, 42.0, 51.0, 53.0, 53.0, 42.0, 32.0, 38.0, 32.0, 42.0, 31.0, 24.0, 25.0, 13.0, 18.0, 14.0, 11.0, 6.0, 10.0, 5.0, 4.0, 5.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.837890625, -0.8110275268554688, -0.7841644287109375, -0.7573013305664062, -0.730438232421875, -0.7035751342773438, -0.6767120361328125, -0.6498489379882812, -0.62298583984375, -0.5961227416992188, -0.5692596435546875, -0.5423965454101562, -0.515533447265625, -0.48867034912109375, -0.4618072509765625, -0.43494415283203125, -0.4080810546875, -0.38121795654296875, -0.3543548583984375, -0.32749176025390625, -0.300628662109375, -0.27376556396484375, -0.2469024658203125, -0.22003936767578125, -0.19317626953125, -0.16631317138671875, -0.1394500732421875, -0.11258697509765625, -0.085723876953125, -0.05886077880859375, -0.0319976806640625, -0.00513458251953125, 0.021728515625, 0.04859161376953125, 0.0754547119140625, 0.10231781005859375, 0.129180908203125, 0.15604400634765625, 0.1829071044921875, 0.20977020263671875, 0.23663330078125, 0.26349639892578125, 0.2903594970703125, 0.31722259521484375, 0.344085693359375, 0.37094879150390625, 0.3978118896484375, 0.42467498779296875, 0.4515380859375, 0.47840118408203125, 0.5052642822265625, 0.5321273803710938, 0.558990478515625, 0.5858535766601562, 0.6127166748046875, 0.6395797729492188, 0.66644287109375, 0.6933059692382812, 0.7201690673828125, 0.7470321655273438, 0.773895263671875, 0.8007583618164062, 0.8276214599609375, 0.8544845581054688, 0.88134765625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 2.0, 5.0, 9.0, 10.0, 13.0, 26.0, 41.0, 93.0, 134.0, 316.0, 889.0, 3959.0, 48595.0, 967921.0, 22551.0, 2726.0, 673.0, 273.0, 126.0, 75.0, 39.0, 26.0, 10.0, 15.0, 9.0, 4.0, 6.0, 1.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-1.4541015625, -1.4180984497070312, -1.3820953369140625, -1.3460922241210938, -1.310089111328125, -1.2740859985351562, -1.2380828857421875, -1.2020797729492188, -1.16607666015625, -1.1300735473632812, -1.0940704345703125, -1.0580673217773438, -1.022064208984375, -0.9860610961914062, -0.9500579833984375, -0.9140548706054688, -0.8780517578125, -0.8420486450195312, -0.8060455322265625, -0.7700424194335938, -0.734039306640625, -0.6980361938476562, -0.6620330810546875, -0.6260299682617188, -0.59002685546875, -0.5540237426757812, -0.5180206298828125, -0.48201751708984375, -0.446014404296875, -0.41001129150390625, -0.3740081787109375, -0.33800506591796875, -0.302001953125, -0.26599884033203125, -0.2299957275390625, -0.19399261474609375, -0.157989501953125, -0.12198638916015625, -0.0859832763671875, -0.04998016357421875, -0.01397705078125, 0.02202606201171875, 0.0580291748046875, 0.09403228759765625, 0.130035400390625, 0.16603851318359375, 0.2020416259765625, 0.23804473876953125, 0.2740478515625, 0.31005096435546875, 0.3460540771484375, 0.38205718994140625, 0.418060302734375, 0.45406341552734375, 0.4900665283203125, 0.5260696411132812, 0.56207275390625, 0.5980758666992188, 0.6340789794921875, 0.6700820922851562, 0.706085205078125, 0.7420883178710938, 0.7780914306640625, 0.8140945434570312, 0.85009765625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 11.0, 15.0, 27.0, 45.0, 68.0, 132.0, 161.0, 192.0, 138.0, 86.0, 51.0, 32.0, 24.0, 10.0, 5.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014579296112060547, -0.00014187581837177277, -0.00013795867562294006, -0.00013404153287410736, -0.00013012439012527466, -0.00012620724737644196, -0.00012229010462760925, -0.00011837296187877655, -0.00011445581912994385, -0.00011053867638111115, -0.00010662153363227844, -0.00010270439088344574, -9.878724813461304e-05, -9.487010538578033e-05, -9.095296263694763e-05, -8.703581988811493e-05, -8.311867713928223e-05, -7.920153439044952e-05, -7.528439164161682e-05, -7.136724889278412e-05, -6.745010614395142e-05, -6.353296339511871e-05, -5.961582064628601e-05, -5.569867789745331e-05, -5.1781535148620605e-05, -4.78643923997879e-05, -4.39472496509552e-05, -4.00301069021225e-05, -3.6112964153289795e-05, -3.219582140445709e-05, -2.827867865562439e-05, -2.4361535906791687e-05, -2.0444393157958984e-05, -1.6527250409126282e-05, -1.2610107660293579e-05, -8.692964911460876e-06, -4.775822162628174e-06, -8.586794137954712e-07, 3.0584633350372314e-06, 6.975606083869934e-06, 1.0892748832702637e-05, 1.480989158153534e-05, 1.8727034330368042e-05, 2.2644177079200745e-05, 2.6561319828033447e-05, 3.047846257686615e-05, 3.439560532569885e-05, 3.8312748074531555e-05, 4.222989082336426e-05, 4.614703357219696e-05, 5.006417632102966e-05, 5.3981319069862366e-05, 5.789846181869507e-05, 6.181560456752777e-05, 6.573274731636047e-05, 6.964989006519318e-05, 7.356703281402588e-05, 7.748417556285858e-05, 8.140131831169128e-05, 8.531846106052399e-05, 8.923560380935669e-05, 9.315274655818939e-05, 9.70698893070221e-05, 0.0001009870320558548, 0.0001049041748046875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 5.0, 8.0, 12.0, 27.0, 36.0, 59.0, 113.0, 185.0, 384.0, 1074.0, 4561.0, 54405.0, 946373.0, 35794.0, 3795.0, 946.0, 370.0, 165.0, 101.0, 47.0, 32.0, 17.0, 17.0, 10.0, 6.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.1748046875, -1.1416549682617188, -1.1085052490234375, -1.0753555297851562, -1.042205810546875, -1.0090560913085938, -0.9759063720703125, -0.9427566528320312, -0.90960693359375, -0.8764572143554688, -0.8433074951171875, -0.8101577758789062, -0.777008056640625, -0.7438583374023438, -0.7107086181640625, -0.6775588989257812, -0.6444091796875, -0.6112594604492188, -0.5781097412109375, -0.5449600219726562, -0.511810302734375, -0.47866058349609375, -0.4455108642578125, -0.41236114501953125, -0.37921142578125, -0.34606170654296875, -0.3129119873046875, -0.27976226806640625, -0.246612548828125, -0.21346282958984375, -0.1803131103515625, -0.14716339111328125, -0.114013671875, -0.08086395263671875, -0.0477142333984375, -0.01456451416015625, 0.018585205078125, 0.05173492431640625, 0.0848846435546875, 0.11803436279296875, 0.15118408203125, 0.18433380126953125, 0.2174835205078125, 0.25063323974609375, 0.283782958984375, 0.31693267822265625, 0.3500823974609375, 0.38323211669921875, 0.4163818359375, 0.44953155517578125, 0.4826812744140625, 0.5158309936523438, 0.548980712890625, 0.5821304321289062, 0.6152801513671875, 0.6484298706054688, 0.68157958984375, 0.7147293090820312, 0.7478790283203125, 0.7810287475585938, 0.814178466796875, 0.8473281860351562, 0.8804779052734375, 0.9136276245117188, 0.94677734375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 2.0, 4.0, 7.0, 5.0, 17.0, 12.0, 32.0, 50.0, 96.0, 174.0, 210.0, 175.0, 90.0, 59.0, 19.0, 17.0, 9.0, 3.0, 9.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60498046875, -0.5792770385742188, -0.5535736083984375, -0.5278701782226562, -0.502166748046875, -0.47646331787109375, -0.4507598876953125, -0.42505645751953125, -0.39935302734375, -0.37364959716796875, -0.3479461669921875, -0.32224273681640625, -0.296539306640625, -0.27083587646484375, -0.2451324462890625, -0.21942901611328125, -0.1937255859375, -0.16802215576171875, -0.1423187255859375, -0.11661529541015625, -0.090911865234375, -0.06520843505859375, -0.0395050048828125, -0.01380157470703125, 0.01190185546875, 0.03760528564453125, 0.0633087158203125, 0.08901214599609375, 0.114715576171875, 0.14041900634765625, 0.1661224365234375, 0.19182586669921875, 0.217529296875, 0.24323272705078125, 0.2689361572265625, 0.29463958740234375, 0.320343017578125, 0.34604644775390625, 0.3717498779296875, 0.39745330810546875, 0.42315673828125, 0.44886016845703125, 0.4745635986328125, 0.5002670288085938, 0.525970458984375, 0.5516738891601562, 0.5773773193359375, 0.6030807495117188, 0.6287841796875, 0.6544876098632812, 0.6801910400390625, 0.7058944702148438, 0.731597900390625, 0.7573013305664062, 0.7830047607421875, 0.8087081909179688, 0.83441162109375, 0.8601150512695312, 0.8858184814453125, 0.9115219116210938, 0.937225341796875, 0.9629287719726562, 0.9886322021484375, 1.0143356323242188, 1.0400390625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 2.0, 3.0, 5.0, 16.0, 30.0, 59.0, 96.0, 188.0, 247.0, 160.0, 92.0, 51.0, 23.0, 13.0, 4.0, 5.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.260588645935059, -11.970691680908203, -11.680793762207031, -11.390896797180176, -11.10099983215332, -10.811101913452148, -10.521204948425293, -10.231307983398438, -9.941410064697266, -9.65151309967041, -9.361615180969238, -9.071718215942383, -8.781820297241211, -8.491923332214355, -8.2020263671875, -7.912128925323486, -7.622231483459473, -7.332334041595459, -7.042436599731445, -6.75253963470459, -6.462642192840576, -6.1727447509765625, -5.882847785949707, -5.592950344085693, -5.30305290222168, -5.013155460357666, -4.723258018493652, -4.433361053466797, -4.143463611602783, -3.8535661697387695, -3.563668966293335, -3.2737717628479004, -2.9838733673095703, -2.6939759254455566, -2.404078722000122, -2.1141815185546875, -1.8242840766906738, -1.5343867540359497, -1.2444894313812256, -0.954592227935791, -0.6646947860717773, -0.3747974634170532, -0.0849001407623291, 0.20499718189239502, 0.49489450454711914, 0.7847918272018433, 1.0746891498565674, 1.364586353302002, 1.6544837951660156, 1.9443811178207397, 2.234278440475464, 2.5241756439208984, 2.814073085784912, 3.103970527648926, 3.3938677310943604, 3.683764934539795, 3.9736623764038086, 4.263559818267822, 4.553457260131836, 4.843354225158691, 5.133251667022705, 5.423149108886719, 5.713046073913574, 6.002943515777588, 6.292840957641602]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 3.0, 5.0, 7.0, 10.0, 5.0, 12.0, 11.0, 14.0, 22.0, 22.0, 25.0, 28.0, 24.0, 38.0, 37.0, 36.0, 49.0, 44.0, 44.0, 50.0, 43.0, 54.0, 47.0, 49.0, 36.0, 37.0, 44.0, 24.0, 28.0, 21.0, 24.0, 20.0, 19.0, 16.0, 16.0, 6.0, 7.0, 10.0, 4.0, 5.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.166521072387695, -4.029800891876221, -3.893080949783325, -3.7563610076904297, -3.619640827178955, -3.4829208850860596, -3.346200942993164, -3.2094807624816895, -3.072760581970215, -2.9360406398773193, -2.7993204593658447, -2.662600517272949, -2.5258803367614746, -2.389160394668579, -2.2524404525756836, -2.115720272064209, -1.9790003299713135, -1.8422802686691284, -1.7055602073669434, -1.5688402652740479, -1.4321200847625732, -1.2954001426696777, -1.1586800813674927, -1.0219600200653076, -0.8852399587631226, -0.7485198974609375, -0.6117998361587524, -0.47507983446121216, -0.3383597731590271, -0.20163971185684204, -0.06491971015930176, 0.0718003511428833, 0.20852041244506836, 0.3452404737472534, 0.4819605052471161, 0.6186805367469788, 0.7554005980491638, 0.8921206593513489, 1.0288406610488892, 1.1655607223510742, 1.3022807836532593, 1.4390008449554443, 1.5757209062576294, 1.7124409675598145, 1.84916090965271, 1.9858810901641846, 2.12260103225708, 2.2593212127685547, 2.39604115486145, 2.5327610969543457, 2.6694812774658203, 2.806201219558716, 2.9429214000701904, 3.079641342163086, 3.2163615226745605, 3.353081464767456, 3.4898014068603516, 3.626521348953247, 3.7632415294647217, 3.899961471557617, 4.036681652069092, 4.173401832580566, 4.310121536254883, 4.446841716766357, 4.583561897277832]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 4.0, 6.0, 5.0, 16.0, 16.0, 29.0, 65.0, 72.0, 102.0, 169.0, 297.0, 475.0, 850.0, 1513.0, 3107.0, 6960.0, 22890.0, 3744290.0, 380744.0, 19848.0, 6531.0, 2931.0, 1427.0, 781.0, 455.0, 269.0, 157.0, 107.0, 46.0, 36.0, 21.0, 18.0, 18.0, 7.0, 7.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.71728515625, -0.691619873046875, -0.66595458984375, -0.640289306640625, -0.6146240234375, -0.588958740234375, -0.56329345703125, -0.537628173828125, -0.511962890625, -0.486297607421875, -0.46063232421875, -0.434967041015625, -0.4093017578125, -0.383636474609375, -0.35797119140625, -0.332305908203125, -0.306640625, -0.280975341796875, -0.25531005859375, -0.229644775390625, -0.2039794921875, -0.178314208984375, -0.15264892578125, -0.126983642578125, -0.101318359375, -0.075653076171875, -0.04998779296875, -0.024322509765625, 0.0013427734375, 0.027008056640625, 0.05267333984375, 0.078338623046875, 0.10400390625, 0.129669189453125, 0.15533447265625, 0.180999755859375, 0.2066650390625, 0.232330322265625, 0.25799560546875, 0.283660888671875, 0.309326171875, 0.334991455078125, 0.36065673828125, 0.386322021484375, 0.4119873046875, 0.437652587890625, 0.46331787109375, 0.488983154296875, 0.5146484375, 0.540313720703125, 0.56597900390625, 0.591644287109375, 0.6173095703125, 0.642974853515625, 0.66864013671875, 0.694305419921875, 0.719970703125, 0.745635986328125, 0.77130126953125, 0.796966552734375, 0.8226318359375, 0.848297119140625, 0.87396240234375, 0.899627685546875, 0.92529296875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 6.0, 2.0, 3.0, 7.0, 10.0, 8.0, 18.0, 16.0, 23.0, 30.0, 32.0, 36.0, 31.0, 48.0, 48.0, 55.0, 52.0, 57.0, 69.0, 59.0, 66.0, 65.0, 40.0, 50.0, 46.0, 24.0, 22.0, 22.0, 13.0, 7.0, 13.0, 7.0, 6.0, 4.0, 3.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.21484375, -0.20786666870117188, -0.20088958740234375, -0.19391250610351562, -0.1869354248046875, -0.17995834350585938, -0.17298126220703125, -0.16600418090820312, -0.159027099609375, -0.15205001831054688, -0.14507293701171875, -0.13809585571289062, -0.1311187744140625, -0.12414169311523438, -0.11716461181640625, -0.11018753051757812, -0.10321044921875, -0.09623336791992188, -0.08925628662109375, -0.08227920532226562, -0.0753021240234375, -0.06832504272460938, -0.06134796142578125, -0.054370880126953125, -0.047393798828125, -0.040416717529296875, -0.03343963623046875, -0.026462554931640625, -0.0194854736328125, -0.012508392333984375, -0.00553131103515625, 0.001445770263671875, 0.0084228515625, 0.015399932861328125, 0.02237701416015625, 0.029354095458984375, 0.0363311767578125, 0.043308258056640625, 0.05028533935546875, 0.057262420654296875, 0.064239501953125, 0.07121658325195312, 0.07819366455078125, 0.08517074584960938, 0.0921478271484375, 0.09912490844726562, 0.10610198974609375, 0.11307907104492188, 0.12005615234375, 0.12703323364257812, 0.13401031494140625, 0.14098739624023438, 0.1479644775390625, 0.15494155883789062, 0.16191864013671875, 0.16889572143554688, 0.175872802734375, 0.18284988403320312, 0.18982696533203125, 0.19680404663085938, 0.2037811279296875, 0.21075820922851562, 0.21773529052734375, 0.22471237182617188, 0.231689453125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 6.0, 12.0, 17.0, 18.0, 48.0, 62.0, 120.0, 185.0, 324.0, 617.0, 1297.0, 2959.0, 8225.0, 32494.0, 3843624.0, 272007.0, 21347.0, 6236.0, 2390.0, 1112.0, 506.0, 255.0, 149.0, 98.0, 63.0, 35.0, 22.0, 18.0, 10.0, 8.0, 3.0, 4.0, 3.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.02734375, -0.992950439453125, -0.95855712890625, -0.924163818359375, -0.8897705078125, -0.855377197265625, -0.82098388671875, -0.786590576171875, -0.752197265625, -0.717803955078125, -0.68341064453125, -0.649017333984375, -0.6146240234375, -0.580230712890625, -0.54583740234375, -0.511444091796875, -0.47705078125, -0.442657470703125, -0.40826416015625, -0.373870849609375, -0.3394775390625, -0.305084228515625, -0.27069091796875, -0.236297607421875, -0.201904296875, -0.167510986328125, -0.13311767578125, -0.098724365234375, -0.0643310546875, -0.029937744140625, 0.00445556640625, 0.038848876953125, 0.0732421875, 0.107635498046875, 0.14202880859375, 0.176422119140625, 0.2108154296875, 0.245208740234375, 0.27960205078125, 0.313995361328125, 0.348388671875, 0.382781982421875, 0.41717529296875, 0.451568603515625, 0.4859619140625, 0.520355224609375, 0.55474853515625, 0.589141845703125, 0.62353515625, 0.657928466796875, 0.69232177734375, 0.726715087890625, 0.7611083984375, 0.795501708984375, 0.82989501953125, 0.864288330078125, 0.898681640625, 0.933074951171875, 0.96746826171875, 1.001861572265625, 1.0362548828125, 1.070648193359375, 1.10504150390625, 1.139434814453125, 1.173828125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 4.0, 7.0, 9.0, 18.0, 22.0, 30.0, 86.0, 252.0, 3271.0, 213.0, 53.0, 43.0, 18.0, 14.0, 6.0, 8.0, 5.0, 1.0, 5.0, 4.0, 4.0, 1.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39306640625, -0.3781890869140625, -0.363311767578125, -0.3484344482421875, -0.33355712890625, -0.3186798095703125, -0.303802490234375, -0.2889251708984375, -0.2740478515625, -0.2591705322265625, -0.244293212890625, -0.2294158935546875, -0.21453857421875, -0.1996612548828125, -0.184783935546875, -0.1699066162109375, -0.155029296875, -0.1401519775390625, -0.125274658203125, -0.1103973388671875, -0.09552001953125, -0.0806427001953125, -0.065765380859375, -0.0508880615234375, -0.0360107421875, -0.0211334228515625, -0.006256103515625, 0.0086212158203125, 0.02349853515625, 0.0383758544921875, 0.053253173828125, 0.0681304931640625, 0.0830078125, 0.0978851318359375, 0.112762451171875, 0.1276397705078125, 0.14251708984375, 0.1573944091796875, 0.172271728515625, 0.1871490478515625, 0.2020263671875, 0.2169036865234375, 0.231781005859375, 0.2466583251953125, 0.26153564453125, 0.2764129638671875, 0.291290283203125, 0.3061676025390625, 0.321044921875, 0.3359222412109375, 0.350799560546875, 0.3656768798828125, 0.38055419921875, 0.3954315185546875, 0.410308837890625, 0.4251861572265625, 0.4400634765625, 0.4549407958984375, 0.469818115234375, 0.4846954345703125, 0.49957275390625, 0.5144500732421875, 0.529327392578125, 0.5442047119140625, 0.55908203125]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 10.0, 7.0, 17.0, 22.0, 52.0, 71.0, 103.0, 142.0, 137.0, 114.0, 86.0, 73.0, 48.0, 31.0, 32.0, 14.0, 9.0, 9.0, 5.0, 5.0, 5.0, 6.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.506753921508789, -1.4527078866958618, -1.3986618518829346, -1.3446158170700073, -1.29056978225708, -1.2365237474441528, -1.1824777126312256, -1.1284316778182983, -1.074385643005371, -1.0203396081924438, -0.9662935733795166, -0.9122475385665894, -0.8582015037536621, -0.8041554689407349, -0.7501094341278076, -0.6960633993148804, -0.6420173048973083, -0.5879712700843811, -0.5339252352714539, -0.4798792004585266, -0.42583316564559937, -0.37178710103034973, -0.3177410662174225, -0.26369503140449524, -0.209648996591568, -0.15560296177864075, -0.1015569195151329, -0.04751087725162506, 0.006535157561302185, 0.060581207275390625, 0.11462724208831787, 0.16867327690124512, 0.22271931171417236, 0.2767653465270996, 0.33081138134002686, 0.3848574161529541, 0.43890345096588135, 0.492949515581131, 0.5469955205917358, 0.6010415554046631, 0.6550875902175903, 0.7091336250305176, 0.7631796598434448, 0.8172256946563721, 0.8712717294692993, 0.9253177642822266, 0.9793637990951538, 1.033409833908081, 1.0874559879302979, 1.141502022743225, 1.1955480575561523, 1.2495940923690796, 1.3036401271820068, 1.357686161994934, 1.4117321968078613, 1.4657782316207886, 1.5198242664337158, 1.573870301246643, 1.6279163360595703, 1.6819623708724976, 1.7360084056854248, 1.790054440498352, 1.8441004753112793, 1.8981465101242065, 1.9521925449371338]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 7.0, 9.0, 9.0, 10.0, 12.0, 21.0, 29.0, 19.0, 20.0, 32.0, 29.0, 27.0, 40.0, 46.0, 34.0, 46.0, 44.0, 40.0, 41.0, 41.0, 43.0, 48.0, 45.0, 38.0, 33.0, 41.0, 34.0, 27.0, 29.0, 16.0, 20.0, 16.0, 12.0, 7.0, 11.0, 8.0, 5.0, 4.0, 3.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.1297924518585205, -1.098103404045105, -1.0664143562316895, -1.0347254276275635, -1.003036379814148, -0.9713473320007324, -0.9396582841873169, -0.9079692363739014, -0.8762801885604858, -0.8445911407470703, -0.8129021525382996, -0.781213104724884, -0.7495240569114685, -0.7178350687026978, -0.6861460208892822, -0.6544569730758667, -0.622767984867096, -0.5910789370536804, -0.5593899488449097, -0.5277009010314941, -0.4960118532180786, -0.4643228352069855, -0.43263381719589233, -0.4009447693824768, -0.36925575137138367, -0.3375667333602905, -0.305877685546875, -0.27418866753578186, -0.24249963462352753, -0.2108106017112732, -0.17912158370018005, -0.14743255078792572, -0.11574351787567139, -0.08405448496341705, -0.05236545950174332, -0.02067643404006958, 0.011012598872184753, 0.04270163178443909, 0.07439064979553223, 0.10607968270778656, 0.1377687156200409, 0.16945774853229523, 0.20114678144454956, 0.2328357994556427, 0.26452481746673584, 0.29621386528015137, 0.3279028832912445, 0.35959190130233765, 0.3912809491157532, 0.4229699671268463, 0.45465901494026184, 0.486348032951355, 0.5180370807647705, 0.549726128578186, 0.5814151167869568, 0.6131041646003723, 0.6447931528091431, 0.6764822006225586, 0.7081711888313293, 0.7398602366447449, 0.7715492844581604, 0.8032382726669312, 0.8349273204803467, 0.8666163682937622, 0.8983054161071777]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 1.0, 6.0, 3.0, 8.0, 12.0, 9.0, 23.0, 27.0, 40.0, 50.0, 82.0, 109.0, 172.0, 230.0, 374.0, 564.0, 893.0, 1474.0, 2404.0, 4112.0, 7825.0, 15552.0, 33230.0, 73323.0, 173120.0, 361926.0, 209085.0, 86504.0, 38444.0, 18116.0, 8926.0, 4817.0, 2691.0, 1546.0, 1014.0, 592.0, 426.0, 258.0, 176.0, 139.0, 75.0, 53.0, 36.0, 29.0, 18.0, 11.0, 18.0, 7.0, 2.0, 6.0, 4.0, 2.0, 2.0], "bins": [-0.488525390625, -0.4751777648925781, -0.46183013916015625, -0.4484825134277344, -0.4351348876953125, -0.4217872619628906, -0.40843963623046875, -0.3950920104980469, -0.381744384765625, -0.3683967590332031, -0.35504913330078125, -0.3417015075683594, -0.3283538818359375, -0.3150062561035156, -0.30165863037109375, -0.2883110046386719, -0.27496337890625, -0.2616157531738281, -0.24826812744140625, -0.23492050170898438, -0.2215728759765625, -0.20822525024414062, -0.19487762451171875, -0.18152999877929688, -0.168182373046875, -0.15483474731445312, -0.14148712158203125, -0.12813949584960938, -0.1147918701171875, -0.10144424438476562, -0.08809661865234375, -0.07474899291992188, -0.0614013671875, -0.048053741455078125, -0.03470611572265625, -0.021358489990234375, -0.0080108642578125, 0.005336761474609375, 0.01868438720703125, 0.032032012939453125, 0.045379638671875, 0.058727264404296875, 0.07207489013671875, 0.08542251586914062, 0.0987701416015625, 0.11211776733398438, 0.12546539306640625, 0.13881301879882812, 0.15216064453125, 0.16550827026367188, 0.17885589599609375, 0.19220352172851562, 0.2055511474609375, 0.21889877319335938, 0.23224639892578125, 0.24559402465820312, 0.258941650390625, 0.2722892761230469, 0.28563690185546875, 0.2989845275878906, 0.3123321533203125, 0.3256797790527344, 0.33902740478515625, 0.3523750305175781, 0.36572265625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 8.0, 7.0, 6.0, 8.0, 14.0, 17.0, 23.0, 21.0, 29.0, 42.0, 42.0, 44.0, 46.0, 46.0, 62.0, 66.0, 57.0, 51.0, 48.0, 60.0, 45.0, 45.0, 40.0, 38.0, 25.0, 24.0, 18.0, 20.0, 11.0, 9.0, 5.0, 7.0, 3.0, 1.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2469482421875, -0.23929405212402344, -0.23163986206054688, -0.2239856719970703, -0.21633148193359375, -0.2086772918701172, -0.20102310180664062, -0.19336891174316406, -0.1857147216796875, -0.17806053161621094, -0.17040634155273438, -0.1627521514892578, -0.15509796142578125, -0.1474437713623047, -0.13978958129882812, -0.13213539123535156, -0.124481201171875, -0.11682701110839844, -0.10917282104492188, -0.10151863098144531, -0.09386444091796875, -0.08621025085449219, -0.07855606079101562, -0.07090187072753906, -0.0632476806640625, -0.05559349060058594, -0.047939300537109375, -0.04028511047363281, -0.03263092041015625, -0.024976730346679688, -0.017322540283203125, -0.009668350219726562, -0.00201416015625, 0.0056400299072265625, 0.013294219970703125, 0.020948410034179688, 0.02860260009765625, 0.03625679016113281, 0.043910980224609375, 0.05156517028808594, 0.0592193603515625, 0.06687355041503906, 0.07452774047851562, 0.08218193054199219, 0.08983612060546875, 0.09749031066894531, 0.10514450073242188, 0.11279869079589844, 0.120452880859375, 0.12810707092285156, 0.13576126098632812, 0.1434154510498047, 0.15106964111328125, 0.1587238311767578, 0.16637802124023438, 0.17403221130371094, 0.1816864013671875, 0.18934059143066406, 0.19699478149414062, 0.2046489715576172, 0.21230316162109375, 0.2199573516845703, 0.22761154174804688, 0.23526573181152344, 0.242919921875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 4.0, 6.0, 5.0, 14.0, 22.0, 42.0, 61.0, 81.0, 117.0, 190.0, 250.0, 435.0, 703.0, 1128.0, 2485.0, 7198.0, 35315.0, 377298.0, 560090.0, 48357.0, 8575.0, 2820.0, 1367.0, 674.0, 420.0, 264.0, 191.0, 132.0, 87.0, 62.0, 49.0, 38.0, 18.0, 20.0, 7.0, 10.0, 7.0, 4.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0380859375, -1.0066986083984375, -0.975311279296875, -0.9439239501953125, -0.91253662109375, -0.8811492919921875, -0.849761962890625, -0.8183746337890625, -0.7869873046875, -0.7555999755859375, -0.724212646484375, -0.6928253173828125, -0.66143798828125, -0.6300506591796875, -0.598663330078125, -0.5672760009765625, -0.535888671875, -0.5045013427734375, -0.473114013671875, -0.4417266845703125, -0.41033935546875, -0.3789520263671875, -0.347564697265625, -0.3161773681640625, -0.2847900390625, -0.2534027099609375, -0.222015380859375, -0.1906280517578125, -0.15924072265625, -0.1278533935546875, -0.096466064453125, -0.0650787353515625, -0.03369140625, -0.0023040771484375, 0.029083251953125, 0.0604705810546875, 0.09185791015625, 0.1232452392578125, 0.154632568359375, 0.1860198974609375, 0.2174072265625, 0.2487945556640625, 0.280181884765625, 0.3115692138671875, 0.34295654296875, 0.3743438720703125, 0.405731201171875, 0.4371185302734375, 0.468505859375, 0.4998931884765625, 0.531280517578125, 0.5626678466796875, 0.59405517578125, 0.6254425048828125, 0.656829833984375, 0.6882171630859375, 0.7196044921875, 0.7509918212890625, 0.782379150390625, 0.8137664794921875, 0.84515380859375, 0.8765411376953125, 0.907928466796875, 0.9393157958984375, 0.970703125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 3.0, 2.0, 6.0, 10.0, 15.0, 11.0, 15.0, 19.0, 25.0, 16.0, 27.0, 26.0, 40.0, 44.0, 39.0, 54.0, 50.0, 44.0, 49.0, 53.0, 31.0, 53.0, 44.0, 47.0, 39.0, 41.0, 28.0, 27.0, 23.0, 19.0, 16.0, 21.0, 15.0, 13.0, 8.0, 6.0, 8.0, 6.0, 5.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.974609375, -0.94317626953125, -0.9117431640625, -0.88031005859375, -0.848876953125, -0.81744384765625, -0.7860107421875, -0.75457763671875, -0.72314453125, -0.69171142578125, -0.6602783203125, -0.62884521484375, -0.597412109375, -0.56597900390625, -0.5345458984375, -0.50311279296875, -0.4716796875, -0.44024658203125, -0.4088134765625, -0.37738037109375, -0.345947265625, -0.31451416015625, -0.2830810546875, -0.25164794921875, -0.22021484375, -0.18878173828125, -0.1573486328125, -0.12591552734375, -0.094482421875, -0.06304931640625, -0.0316162109375, -0.00018310546875, 0.03125, 0.06268310546875, 0.0941162109375, 0.12554931640625, 0.156982421875, 0.18841552734375, 0.2198486328125, 0.25128173828125, 0.28271484375, 0.31414794921875, 0.3455810546875, 0.37701416015625, 0.408447265625, 0.43988037109375, 0.4713134765625, 0.50274658203125, 0.5341796875, 0.56561279296875, 0.5970458984375, 0.62847900390625, 0.659912109375, 0.69134521484375, 0.7227783203125, 0.75421142578125, 0.78564453125, 0.81707763671875, 0.8485107421875, 0.87994384765625, 0.911376953125, 0.94281005859375, 0.9742431640625, 1.00567626953125, 1.037109375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 7.0, 9.0, 5.0, 9.0, 9.0, 9.0, 18.0, 17.0, 41.0, 37.0, 59.0, 87.0, 110.0, 210.0, 337.0, 775.0, 1659.0, 4715.0, 20415.0, 231242.0, 724721.0, 50774.0, 8440.0, 2530.0, 999.0, 502.0, 286.0, 180.0, 116.0, 79.0, 41.0, 32.0, 22.0, 18.0, 15.0, 5.0, 4.0, 3.0, 4.0, 2.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.449951171875, -0.4350624084472656, -0.42017364501953125, -0.4052848815917969, -0.3903961181640625, -0.3755073547363281, -0.36061859130859375, -0.3457298278808594, -0.330841064453125, -0.3159523010253906, -0.30106353759765625, -0.2861747741699219, -0.2712860107421875, -0.2563972473144531, -0.24150848388671875, -0.22661972045898438, -0.21173095703125, -0.19684219360351562, -0.18195343017578125, -0.16706466674804688, -0.1521759033203125, -0.13728713989257812, -0.12239837646484375, -0.10750961303710938, -0.092620849609375, -0.07773208618164062, -0.06284332275390625, -0.047954559326171875, -0.0330657958984375, -0.018177032470703125, -0.00328826904296875, 0.011600494384765625, 0.0264892578125, 0.041378021240234375, 0.05626678466796875, 0.07115554809570312, 0.0860443115234375, 0.10093307495117188, 0.11582183837890625, 0.13071060180664062, 0.145599365234375, 0.16048812866210938, 0.17537689208984375, 0.19026565551757812, 0.2051544189453125, 0.22004318237304688, 0.23493194580078125, 0.24982070922851562, 0.26470947265625, 0.2795982360839844, 0.29448699951171875, 0.3093757629394531, 0.3242645263671875, 0.3391532897949219, 0.35404205322265625, 0.3689308166503906, 0.383819580078125, 0.3987083435058594, 0.41359710693359375, 0.4284858703613281, 0.4433746337890625, 0.4582633972167969, 0.47315216064453125, 0.4880409240722656, 0.5029296875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 4.0, 5.0, 6.0, 4.0, 14.0, 14.0, 21.0, 33.0, 46.0, 68.0, 90.0, 134.0, 176.0, 127.0, 73.0, 44.0, 44.0, 27.0, 13.0, 12.0, 18.0, 5.0, 5.0, 4.0, 2.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.423494338989258e-05, -9.020697325468063e-05, -8.617900311946869e-05, -8.215103298425674e-05, -7.81230628490448e-05, -7.409509271383286e-05, -7.006712257862091e-05, -6.603915244340897e-05, -6.201118230819702e-05, -5.798321217298508e-05, -5.395524203777313e-05, -4.992727190256119e-05, -4.589930176734924e-05, -4.18713316321373e-05, -3.7843361496925354e-05, -3.381539136171341e-05, -2.9787421226501465e-05, -2.575945109128952e-05, -2.1731480956077576e-05, -1.770351082086563e-05, -1.3675540685653687e-05, -9.647570550441742e-06, -5.619600415229797e-06, -1.5916302800178528e-06, 2.436339855194092e-06, 6.464309990406036e-06, 1.0492280125617981e-05, 1.4520250260829926e-05, 1.854822039604187e-05, 2.2576190531253815e-05, 2.660416066646576e-05, 3.0632130801677704e-05, 3.466010093688965e-05, 3.868807107210159e-05, 4.271604120731354e-05, 4.674401134252548e-05, 5.077198147773743e-05, 5.479995161294937e-05, 5.8827921748161316e-05, 6.285589188337326e-05, 6.68838620185852e-05, 7.091183215379715e-05, 7.49398022890091e-05, 7.896777242422104e-05, 8.299574255943298e-05, 8.702371269464493e-05, 9.105168282985687e-05, 9.507965296506882e-05, 9.910762310028076e-05, 0.0001031355932354927, 0.00010716356337070465, 0.0001111915335059166, 0.00011521950364112854, 0.00011924747377634048, 0.00012327544391155243, 0.00012730341404676437, 0.00013133138418197632, 0.00013535935431718826, 0.0001393873244524002, 0.00014341529458761215, 0.0001474432647228241, 0.00015147123485803604, 0.00015549920499324799, 0.00015952717512845993, 0.00016355514526367188]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 1.0, 4.0, 11.0, 6.0, 16.0, 15.0, 27.0, 40.0, 45.0, 74.0, 102.0, 168.0, 258.0, 493.0, 976.0, 2311.0, 7116.0, 36179.0, 542531.0, 416807.0, 30599.0, 6524.0, 2120.0, 924.0, 459.0, 233.0, 174.0, 108.0, 69.0, 52.0, 37.0, 22.0, 23.0, 7.0, 10.0, 9.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.427490234375, -0.4136810302734375, -0.399871826171875, -0.3860626220703125, -0.37225341796875, -0.3584442138671875, -0.344635009765625, -0.3308258056640625, -0.3170166015625, -0.3032073974609375, -0.289398193359375, -0.2755889892578125, -0.26177978515625, -0.2479705810546875, -0.234161376953125, -0.2203521728515625, -0.20654296875, -0.1927337646484375, -0.178924560546875, -0.1651153564453125, -0.15130615234375, -0.1374969482421875, -0.123687744140625, -0.1098785400390625, -0.0960693359375, -0.0822601318359375, -0.068450927734375, -0.0546417236328125, -0.04083251953125, -0.0270233154296875, -0.013214111328125, 0.0005950927734375, 0.014404296875, 0.0282135009765625, 0.042022705078125, 0.0558319091796875, 0.06964111328125, 0.0834503173828125, 0.097259521484375, 0.1110687255859375, 0.1248779296875, 0.1386871337890625, 0.152496337890625, 0.1663055419921875, 0.18011474609375, 0.1939239501953125, 0.207733154296875, 0.2215423583984375, 0.2353515625, 0.2491607666015625, 0.262969970703125, 0.2767791748046875, 0.29058837890625, 0.3043975830078125, 0.318206787109375, 0.3320159912109375, 0.3458251953125, 0.3596343994140625, 0.373443603515625, 0.3872528076171875, 0.40106201171875, 0.4148712158203125, 0.428680419921875, 0.4424896240234375, 0.456298828125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 6.0, 8.0, 3.0, 8.0, 14.0, 15.0, 25.0, 35.0, 53.0, 66.0, 107.0, 96.0, 116.0, 109.0, 79.0, 79.0, 47.0, 37.0, 24.0, 19.0, 12.0, 9.0, 8.0, 11.0, 9.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48974609375, -0.475921630859375, -0.46209716796875, -0.448272705078125, -0.4344482421875, -0.420623779296875, -0.40679931640625, -0.392974853515625, -0.379150390625, -0.365325927734375, -0.35150146484375, -0.337677001953125, -0.3238525390625, -0.310028076171875, -0.29620361328125, -0.282379150390625, -0.2685546875, -0.254730224609375, -0.24090576171875, -0.227081298828125, -0.2132568359375, -0.199432373046875, -0.18560791015625, -0.171783447265625, -0.157958984375, -0.144134521484375, -0.13031005859375, -0.116485595703125, -0.1026611328125, -0.088836669921875, -0.07501220703125, -0.061187744140625, -0.04736328125, -0.033538818359375, -0.01971435546875, -0.005889892578125, 0.0079345703125, 0.021759033203125, 0.03558349609375, 0.049407958984375, 0.063232421875, 0.077056884765625, 0.09088134765625, 0.104705810546875, 0.1185302734375, 0.132354736328125, 0.14617919921875, 0.160003662109375, 0.173828125, 0.187652587890625, 0.20147705078125, 0.215301513671875, 0.2291259765625, 0.242950439453125, 0.25677490234375, 0.270599365234375, 0.284423828125, 0.298248291015625, 0.31207275390625, 0.325897216796875, 0.3397216796875, 0.353546142578125, 0.36737060546875, 0.381195068359375, 0.39501953125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 5.0, 13.0, 39.0, 143.0, 399.0, 300.0, 80.0, 21.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.629871368408203, -14.041703224182129, -13.453536033630371, -12.865367889404297, -12.277200698852539, -11.689032554626465, -11.10086441040039, -10.512697219848633, -9.924530029296875, -9.3363618850708, -8.748194694519043, -8.160026550292969, -7.571859359741211, -6.983691215515137, -6.395523548126221, -5.807355880737305, -5.2191877365112305, -4.6310200691223145, -4.042852401733398, -3.4546844959259033, -2.8665168285369873, -2.2783491611480713, -1.6901812553405762, -1.1020135879516602, -0.5138459205627441, 0.07432180643081665, 0.6624895334243774, 1.250657320022583, 1.838824987411499, 2.426992654800415, 3.01516056060791, 3.603328227996826, 4.191495895385742, 4.779663562774658, 5.367831230163574, 5.955999374389648, 6.544166564941406, 7.1323347091674805, 7.7205023765563965, 8.308670043945312, 8.89683723449707, 9.485005378723145, 10.073172569274902, 10.661340713500977, 11.249507904052734, 11.837676048278809, 12.425844192504883, 13.01401138305664, 13.602179527282715, 14.190347671508789, 14.778514862060547, 15.366683006286621, 15.954850196838379, 16.543018341064453, 17.13118553161621, 17.71935272216797, 18.30752182006836, 18.895689010620117, 19.483858108520508, 20.072025299072266, 20.660192489624023, 21.24835968017578, 21.836528778076172, 22.42469596862793, 23.012863159179688]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 4.0, 4.0, 3.0, 8.0, 8.0, 21.0, 17.0, 13.0, 17.0, 19.0, 33.0, 29.0, 27.0, 45.0, 39.0, 50.0, 51.0, 49.0, 52.0, 50.0, 47.0, 59.0, 38.0, 47.0, 35.0, 37.0, 29.0, 19.0, 24.0, 26.0, 18.0, 12.0, 15.0, 10.0, 13.0, 9.0, 5.0, 7.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.276425838470459, -4.143445014953613, -4.010463714599609, -3.8774826526641846, -3.7445015907287598, -3.611520528793335, -3.47853946685791, -3.3455584049224854, -3.2125773429870605, -3.0795962810516357, -2.946615219116211, -2.813634157180786, -2.6806530952453613, -2.5476720333099365, -2.4146909713745117, -2.281709909439087, -2.148728847503662, -2.0157477855682373, -1.8827667236328125, -1.7497856616973877, -1.616804599761963, -1.483823537826538, -1.3508424758911133, -1.2178614139556885, -1.0848803520202637, -0.9518992900848389, -0.8189182281494141, -0.6859371662139893, -0.5529561042785645, -0.41997504234313965, -0.28699398040771484, -0.15401291847229004, -0.02103137969970703, 0.11194968223571777, 0.24493074417114258, 0.3779118061065674, 0.5108928680419922, 0.643873929977417, 0.7768549919128418, 0.9098360538482666, 1.0428171157836914, 1.1757981777191162, 1.308779239654541, 1.4417603015899658, 1.5747413635253906, 1.7077224254608154, 1.8407034873962402, 1.973684549331665, 2.10666561126709, 2.2396466732025146, 2.3726277351379395, 2.5056087970733643, 2.638589859008789, 2.771570920944214, 2.9045519828796387, 3.0375330448150635, 3.1705141067504883, 3.303495168685913, 3.436476230621338, 3.5694572925567627, 3.7024383544921875, 3.8354194164276123, 3.968400478363037, 4.101381301879883, 4.234362602233887]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 4.0, 4.0, 11.0, 6.0, 9.0, 6.0, 15.0, 12.0, 12.0, 27.0, 29.0, 46.0, 61.0, 94.0, 142.0, 206.0, 311.0, 552.0, 963.0, 1695.0, 2953.0, 5955.0, 12699.0, 34459.0, 149941.0, 2067632.0, 1722704.0, 135134.0, 33464.0, 12736.0, 5604.0, 2906.0, 1544.0, 877.0, 499.0, 325.0, 228.0, 153.0, 69.0, 61.0, 43.0, 29.0, 19.0, 15.0, 9.0, 7.0, 8.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.43505859375, -0.4226188659667969, -0.41017913818359375, -0.3977394104003906, -0.3852996826171875, -0.3728599548339844, -0.36042022705078125, -0.3479804992675781, -0.335540771484375, -0.3231010437011719, -0.31066131591796875, -0.2982215881347656, -0.2857818603515625, -0.2733421325683594, -0.26090240478515625, -0.24846267700195312, -0.23602294921875, -0.22358322143554688, -0.21114349365234375, -0.19870376586914062, -0.1862640380859375, -0.17382431030273438, -0.16138458251953125, -0.14894485473632812, -0.136505126953125, -0.12406539916992188, -0.11162567138671875, -0.09918594360351562, -0.0867462158203125, -0.07430648803710938, -0.06186676025390625, -0.049427032470703125, -0.0369873046875, -0.024547576904296875, -0.01210784912109375, 0.000331878662109375, 0.0127716064453125, 0.025211334228515625, 0.03765106201171875, 0.050090789794921875, 0.062530517578125, 0.07497024536132812, 0.08740997314453125, 0.09984970092773438, 0.1122894287109375, 0.12472915649414062, 0.13716888427734375, 0.14960861206054688, 0.16204833984375, 0.17448806762695312, 0.18692779541015625, 0.19936752319335938, 0.2118072509765625, 0.22424697875976562, 0.23668670654296875, 0.24912643432617188, 0.261566162109375, 0.2740058898925781, 0.28644561767578125, 0.2988853454589844, 0.3113250732421875, 0.3237648010253906, 0.33620452880859375, 0.3486442565917969, 0.361083984375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 6.0, 5.0, 4.0, 7.0, 15.0, 22.0, 28.0, 55.0, 65.0, 82.0, 95.0, 77.0, 101.0, 103.0, 90.0, 57.0, 63.0, 51.0, 28.0, 25.0, 11.0, 9.0, 7.0, 5.0, 3.0, 2.0, 1.0], "bins": [-0.5966796875, -0.5845756530761719, -0.5724716186523438, -0.5603675842285156, -0.5482635498046875, -0.5361595153808594, -0.5240554809570312, -0.5119514465332031, -0.499847412109375, -0.4877433776855469, -0.47563934326171875, -0.4635353088378906, -0.4514312744140625, -0.4393272399902344, -0.42722320556640625, -0.4151191711425781, -0.40301513671875, -0.3909111022949219, -0.37880706787109375, -0.3667030334472656, -0.3545989990234375, -0.3424949645996094, -0.33039093017578125, -0.3182868957519531, -0.306182861328125, -0.2940788269042969, -0.28197479248046875, -0.2698707580566406, -0.2577667236328125, -0.24566268920898438, -0.23355865478515625, -0.22145462036132812, -0.2093505859375, -0.19724655151367188, -0.18514251708984375, -0.17303848266601562, -0.1609344482421875, -0.14883041381835938, -0.13672637939453125, -0.12462234497070312, -0.112518310546875, -0.10041427612304688, -0.08831024169921875, -0.07620620727539062, -0.0641021728515625, -0.051998138427734375, -0.03989410400390625, -0.027790069580078125, -0.01568603515625, -0.003582000732421875, 0.00852203369140625, 0.020626068115234375, 0.0327301025390625, 0.044834136962890625, 0.05693817138671875, 0.06904220581054688, 0.081146240234375, 0.09325027465820312, 0.10535430908203125, 0.11745834350585938, 0.1295623779296875, 0.14166641235351562, 0.15377044677734375, 0.16587448120117188, 0.177978515625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 6.0, 1.0, 1.0, 6.0, 7.0, 7.0, 10.0, 12.0, 27.0, 43.0, 41.0, 75.0, 113.0, 225.0, 466.0, 876.0, 1866.0, 4726.0, 13872.0, 53293.0, 449267.0, 3443797.0, 179175.0, 31229.0, 9025.0, 3225.0, 1351.0, 703.0, 314.0, 185.0, 104.0, 82.0, 38.0, 38.0, 20.0, 24.0, 17.0, 4.0, 5.0, 7.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6943359375, -0.6728591918945312, -0.6513824462890625, -0.6299057006835938, -0.608428955078125, -0.5869522094726562, -0.5654754638671875, -0.5439987182617188, -0.52252197265625, -0.5010452270507812, -0.4795684814453125, -0.45809173583984375, -0.436614990234375, -0.41513824462890625, -0.3936614990234375, -0.37218475341796875, -0.3507080078125, -0.32923126220703125, -0.3077545166015625, -0.28627777099609375, -0.264801025390625, -0.24332427978515625, -0.2218475341796875, -0.20037078857421875, -0.17889404296875, -0.15741729736328125, -0.1359405517578125, -0.11446380615234375, -0.092987060546875, -0.07151031494140625, -0.0500335693359375, -0.02855682373046875, -0.007080078125, 0.01439666748046875, 0.0358734130859375, 0.05735015869140625, 0.078826904296875, 0.10030364990234375, 0.1217803955078125, 0.14325714111328125, 0.16473388671875, 0.18621063232421875, 0.2076873779296875, 0.22916412353515625, 0.250640869140625, 0.27211761474609375, 0.2935943603515625, 0.31507110595703125, 0.3365478515625, 0.35802459716796875, 0.3795013427734375, 0.40097808837890625, 0.422454833984375, 0.44393157958984375, 0.4654083251953125, 0.48688507080078125, 0.50836181640625, 0.5298385620117188, 0.5513153076171875, 0.5727920532226562, 0.594268798828125, 0.6157455444335938, 0.6372222900390625, 0.6586990356445312, 0.68017578125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 3.0, 7.0, 5.0, 6.0, 9.0, 18.0, 16.0, 25.0, 24.0, 53.0, 47.0, 78.0, 113.0, 137.0, 295.0, 615.0, 1070.0, 717.0, 353.0, 164.0, 100.0, 60.0, 41.0, 26.0, 22.0, 15.0, 11.0, 16.0, 6.0, 3.0, 4.0, 3.0, 1.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.7373046875, -0.7152328491210938, -0.6931610107421875, -0.6710891723632812, -0.649017333984375, -0.6269454956054688, -0.6048736572265625, -0.5828018188476562, -0.56072998046875, -0.5386581420898438, -0.5165863037109375, -0.49451446533203125, -0.472442626953125, -0.45037078857421875, -0.4282989501953125, -0.40622711181640625, -0.3841552734375, -0.36208343505859375, -0.3400115966796875, -0.31793975830078125, -0.295867919921875, -0.27379608154296875, -0.2517242431640625, -0.22965240478515625, -0.20758056640625, -0.18550872802734375, -0.1634368896484375, -0.14136505126953125, -0.119293212890625, -0.09722137451171875, -0.0751495361328125, -0.05307769775390625, -0.031005859375, -0.00893402099609375, 0.0131378173828125, 0.03520965576171875, 0.057281494140625, 0.07935333251953125, 0.1014251708984375, 0.12349700927734375, 0.14556884765625, 0.16764068603515625, 0.1897125244140625, 0.21178436279296875, 0.233856201171875, 0.25592803955078125, 0.2779998779296875, 0.30007171630859375, 0.3221435546875, 0.34421539306640625, 0.3662872314453125, 0.38835906982421875, 0.410430908203125, 0.43250274658203125, 0.4545745849609375, 0.47664642333984375, 0.49871826171875, 0.5207901000976562, 0.5428619384765625, 0.5649337768554688, 0.587005615234375, 0.6090774536132812, 0.6311492919921875, 0.6532211303710938, 0.67529296875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 3.0, 3.0, 24.0, 45.0, 119.0, 287.0, 295.0, 162.0, 46.0, 13.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.010629653930664, -9.642141342163086, -9.273652076721191, -8.905163764953613, -8.536675453186035, -8.16818618774414, -7.7996978759765625, -7.431209564208984, -7.062720775604248, -6.694231986999512, -6.325743675231934, -5.957254886627197, -5.588766098022461, -5.220277786254883, -4.8517889976501465, -4.48330020904541, -4.114811897277832, -3.746323347091675, -3.3778347969055176, -3.0093460083007812, -2.640857458114624, -2.272368907928467, -1.9038801193237305, -1.5353915691375732, -1.166903018951416, -0.798414409160614, -0.429925799369812, -0.061437129974365234, 0.307051420211792, 0.6755399703979492, 1.0440287590026855, 1.4125173091888428, 1.781005859375, 2.1494944095611572, 2.5179829597473145, 2.886471748352051, 3.254960298538208, 3.6234488487243652, 3.9919376373291016, 4.36042594909668, 4.728914737701416, 5.097403526306152, 5.4658918380737305, 5.834380626678467, 6.202869415283203, 6.571357727050781, 6.939846515655518, 7.308335304260254, 7.676823616027832, 8.04531192779541, 8.413801193237305, 8.782289505004883, 9.150777816772461, 9.519266128540039, 9.887755393981934, 10.256243705749512, 10.624732971191406, 10.993221282958984, 11.361710548400879, 11.730198860168457, 12.098687171936035, 12.46717643737793, 12.835664749145508, 13.204153060913086, 13.572641372680664]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 6.0, 8.0, 10.0, 9.0, 12.0, 11.0, 16.0, 31.0, 35.0, 44.0, 45.0, 49.0, 58.0, 60.0, 64.0, 62.0, 67.0, 50.0, 57.0, 44.0, 40.0, 51.0, 40.0, 35.0, 26.0, 15.0, 19.0, 14.0, 3.0, 8.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.513559341430664, -3.3802833557128906, -3.247007369995117, -3.1137313842773438, -2.9804553985595703, -2.847179412841797, -2.7139036655426025, -2.580627679824829, -2.4473516941070557, -2.3140757083892822, -2.180799722671509, -2.0475237369537354, -1.9142478704452515, -1.780971884727478, -1.6476960182189941, -1.5144200325012207, -1.3811440467834473, -1.2478680610656738, -1.1145920753479004, -0.9813162088394165, -0.8480402231216431, -0.7147642374038696, -0.581488311290741, -0.4482123851776123, -0.31493639945983887, -0.18166044354438782, -0.04838448762893677, 0.08489146828651428, 0.21816742420196533, 0.35144340991973877, 0.48471933603286743, 0.6179952621459961, 0.7512707710266113, 0.8845467567443848, 1.0178227424621582, 1.151098608970642, 1.2843745946884155, 1.417650580406189, 1.5509264469146729, 1.6842024326324463, 1.8174784183502197, 1.9507544040679932, 2.0840303897857666, 2.21730637550354, 2.3505821228027344, 2.483858108520508, 2.6171340942382812, 2.7504100799560547, 2.883686065673828, 3.0169620513916016, 3.150238037109375, 3.2835140228271484, 3.416790008544922, 3.5500659942626953, 3.6833417415618896, 3.816617727279663, 3.9498937129974365, 4.083169460296631, 4.216445446014404, 4.349721431732178, 4.482997417449951, 4.616273403167725, 4.749549388885498, 4.8828253746032715, 5.016101360321045]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 7.0, 10.0, 15.0, 21.0, 31.0, 55.0, 113.0, 163.0, 358.0, 731.0, 1732.0, 4244.0, 12245.0, 45587.0, 285128.0, 588577.0, 80181.0, 19118.0, 5972.0, 2303.0, 963.0, 463.0, 228.0, 115.0, 68.0, 35.0, 29.0, 15.0, 13.0, 10.0, 6.0, 7.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.60693359375, -0.5818328857421875, -0.556732177734375, -0.5316314697265625, -0.50653076171875, -0.4814300537109375, -0.456329345703125, -0.4312286376953125, -0.4061279296875, -0.3810272216796875, -0.355926513671875, -0.3308258056640625, -0.30572509765625, -0.2806243896484375, -0.255523681640625, -0.2304229736328125, -0.205322265625, -0.1802215576171875, -0.155120849609375, -0.1300201416015625, -0.10491943359375, -0.0798187255859375, -0.054718017578125, -0.0296173095703125, -0.0045166015625, 0.0205841064453125, 0.045684814453125, 0.0707855224609375, 0.09588623046875, 0.1209869384765625, 0.146087646484375, 0.1711883544921875, 0.1962890625, 0.2213897705078125, 0.246490478515625, 0.2715911865234375, 0.29669189453125, 0.3217926025390625, 0.346893310546875, 0.3719940185546875, 0.3970947265625, 0.4221954345703125, 0.447296142578125, 0.4723968505859375, 0.49749755859375, 0.5225982666015625, 0.547698974609375, 0.5727996826171875, 0.597900390625, 0.6230010986328125, 0.648101806640625, 0.6732025146484375, 0.69830322265625, 0.7234039306640625, 0.748504638671875, 0.7736053466796875, 0.7987060546875, 0.8238067626953125, 0.848907470703125, 0.8740081787109375, 0.89910888671875, 0.9242095947265625, 0.949310302734375, 0.9744110107421875, 0.99951171875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 8.0, 3.0, 11.0, 9.0, 4.0, 28.0, 25.0, 24.0, 35.0, 38.0, 53.0, 62.0, 75.0, 62.0, 66.0, 71.0, 67.0, 56.0, 61.0, 51.0, 32.0, 40.0, 34.0, 20.0, 22.0, 18.0, 10.0, 4.0, 7.0, 5.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.365478515625, -0.3565330505371094, -0.34758758544921875, -0.3386421203613281, -0.3296966552734375, -0.3207511901855469, -0.31180572509765625, -0.3028602600097656, -0.293914794921875, -0.2849693298339844, -0.27602386474609375, -0.2670783996582031, -0.2581329345703125, -0.24918746948242188, -0.24024200439453125, -0.23129653930664062, -0.22235107421875, -0.21340560913085938, -0.20446014404296875, -0.19551467895507812, -0.1865692138671875, -0.17762374877929688, -0.16867828369140625, -0.15973281860351562, -0.150787353515625, -0.14184188842773438, -0.13289642333984375, -0.12395095825195312, -0.1150054931640625, -0.10606002807617188, -0.09711456298828125, -0.08816909790039062, -0.0792236328125, -0.07027816772460938, -0.06133270263671875, -0.052387237548828125, -0.0434417724609375, -0.034496307373046875, -0.02555084228515625, -0.016605377197265625, -0.007659912109375, 0.001285552978515625, 0.01023101806640625, 0.019176483154296875, 0.0281219482421875, 0.037067413330078125, 0.04601287841796875, 0.054958343505859375, 0.06390380859375, 0.07284927368164062, 0.08179473876953125, 0.09074020385742188, 0.0996856689453125, 0.10863113403320312, 0.11757659912109375, 0.12652206420898438, 0.135467529296875, 0.14441299438476562, 0.15335845947265625, 0.16230392456054688, 0.1712493896484375, 0.18019485473632812, 0.18914031982421875, 0.19808578491210938, 0.20703125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 1.0, 7.0, 17.0, 6.0, 14.0, 22.0, 29.0, 36.0, 53.0, 67.0, 113.0, 163.0, 260.0, 410.0, 775.0, 1710.0, 4584.0, 19113.0, 258453.0, 720479.0, 31742.0, 6153.0, 2064.0, 910.0, 471.0, 288.0, 190.0, 142.0, 92.0, 65.0, 30.0, 26.0, 15.0, 16.0, 11.0, 9.0, 8.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0712890625, -1.03179931640625, -0.9923095703125, -0.95281982421875, -0.913330078125, -0.87384033203125, -0.8343505859375, -0.79486083984375, -0.75537109375, -0.71588134765625, -0.6763916015625, -0.63690185546875, -0.597412109375, -0.55792236328125, -0.5184326171875, -0.47894287109375, -0.439453125, -0.39996337890625, -0.3604736328125, -0.32098388671875, -0.281494140625, -0.24200439453125, -0.2025146484375, -0.16302490234375, -0.12353515625, -0.08404541015625, -0.0445556640625, -0.00506591796875, 0.034423828125, 0.07391357421875, 0.1134033203125, 0.15289306640625, 0.1923828125, 0.23187255859375, 0.2713623046875, 0.31085205078125, 0.350341796875, 0.38983154296875, 0.4293212890625, 0.46881103515625, 0.50830078125, 0.54779052734375, 0.5872802734375, 0.62677001953125, 0.666259765625, 0.70574951171875, 0.7452392578125, 0.78472900390625, 0.82421875, 0.86370849609375, 0.9031982421875, 0.94268798828125, 0.982177734375, 1.02166748046875, 1.0611572265625, 1.10064697265625, 1.14013671875, 1.17962646484375, 1.2191162109375, 1.25860595703125, 1.298095703125, 1.33758544921875, 1.3770751953125, 1.41656494140625, 1.4560546875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 6.0, 9.0, 7.0, 10.0, 11.0, 13.0, 20.0, 20.0, 33.0, 36.0, 31.0, 51.0, 39.0, 46.0, 53.0, 41.0, 52.0, 61.0, 48.0, 50.0, 47.0, 54.0, 39.0, 29.0, 32.0, 30.0, 21.0, 22.0, 10.0, 10.0, 14.0, 10.0, 11.0, 10.0, 4.0, 3.0, 5.0, 6.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.982421875, -0.949920654296875, -0.91741943359375, -0.884918212890625, -0.8524169921875, -0.819915771484375, -0.78741455078125, -0.754913330078125, -0.722412109375, -0.689910888671875, -0.65740966796875, -0.624908447265625, -0.5924072265625, -0.559906005859375, -0.52740478515625, -0.494903564453125, -0.46240234375, -0.429901123046875, -0.39739990234375, -0.364898681640625, -0.3323974609375, -0.299896240234375, -0.26739501953125, -0.234893798828125, -0.202392578125, -0.169891357421875, -0.13739013671875, -0.104888916015625, -0.0723876953125, -0.039886474609375, -0.00738525390625, 0.025115966796875, 0.0576171875, 0.090118408203125, 0.12261962890625, 0.155120849609375, 0.1876220703125, 0.220123291015625, 0.25262451171875, 0.285125732421875, 0.317626953125, 0.350128173828125, 0.38262939453125, 0.415130615234375, 0.4476318359375, 0.480133056640625, 0.51263427734375, 0.545135498046875, 0.57763671875, 0.610137939453125, 0.64263916015625, 0.675140380859375, 0.7076416015625, 0.740142822265625, 0.77264404296875, 0.805145263671875, 0.837646484375, 0.870147705078125, 0.90264892578125, 0.935150146484375, 0.9676513671875, 1.000152587890625, 1.03265380859375, 1.065155029296875, 1.09765625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 8.0, 6.0, 6.0, 10.0, 18.0, 34.0, 43.0, 74.0, 73.0, 176.0, 310.0, 607.0, 1566.0, 4492.0, 19866.0, 203253.0, 755706.0, 49621.0, 8347.0, 2442.0, 876.0, 393.0, 225.0, 139.0, 91.0, 59.0, 34.0, 19.0, 19.0, 10.0, 4.0, 8.0, 5.0, 3.0, 2.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.425537109375, -0.4123344421386719, -0.39913177490234375, -0.3859291076660156, -0.3727264404296875, -0.3595237731933594, -0.34632110595703125, -0.3331184387207031, -0.319915771484375, -0.3067131042480469, -0.29351043701171875, -0.2803077697753906, -0.2671051025390625, -0.2539024353027344, -0.24069976806640625, -0.22749710083007812, -0.21429443359375, -0.20109176635742188, -0.18788909912109375, -0.17468643188476562, -0.1614837646484375, -0.14828109741210938, -0.13507843017578125, -0.12187576293945312, -0.108673095703125, -0.09547042846679688, -0.08226776123046875, -0.06906509399414062, -0.0558624267578125, -0.042659759521484375, -0.02945709228515625, -0.016254425048828125, -0.0030517578125, 0.010150909423828125, 0.02335357666015625, 0.036556243896484375, 0.0497589111328125, 0.06296157836914062, 0.07616424560546875, 0.08936691284179688, 0.102569580078125, 0.11577224731445312, 0.12897491455078125, 0.14217758178710938, 0.1553802490234375, 0.16858291625976562, 0.18178558349609375, 0.19498825073242188, 0.20819091796875, 0.22139358520507812, 0.23459625244140625, 0.24779891967773438, 0.2610015869140625, 0.2742042541503906, 0.28740692138671875, 0.3006095886230469, 0.313812255859375, 0.3270149230957031, 0.34021759033203125, 0.3534202575683594, 0.3666229248046875, 0.3798255920410156, 0.39302825927734375, 0.4062309265136719, 0.41943359375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0, 4.0, 4.0, 9.0, 14.0, 20.0, 16.0, 29.0, 38.0, 61.0, 97.0, 149.0, 164.0, 136.0, 66.0, 60.0, 35.0, 26.0, 14.0, 12.0, 11.0, 7.0, 2.0, 7.0, 3.0, 7.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0001131296157836914, -0.00011009536683559418, -0.00010706111788749695, -0.00010402686893939972, -0.00010099261999130249, -9.795837104320526e-05, -9.492412209510803e-05, -9.18898731470108e-05, -8.885562419891357e-05, -8.582137525081635e-05, -8.278712630271912e-05, -7.975287735462189e-05, -7.671862840652466e-05, -7.368437945842743e-05, -7.06501305103302e-05, -6.761588156223297e-05, -6.458163261413574e-05, -6.154738366603851e-05, -5.8513134717941284e-05, -5.5478885769844055e-05, -5.2444636821746826e-05, -4.94103878736496e-05, -4.637613892555237e-05, -4.334188997745514e-05, -4.030764102935791e-05, -3.727339208126068e-05, -3.423914313316345e-05, -3.120489418506622e-05, -2.8170645236968994e-05, -2.5136396288871765e-05, -2.2102147340774536e-05, -1.9067898392677307e-05, -1.6033649444580078e-05, -1.2999400496482849e-05, -9.96515154838562e-06, -6.930902600288391e-06, -3.896653652191162e-06, -8.624047040939331e-07, 2.171844244003296e-06, 5.206093192100525e-06, 8.240342140197754e-06, 1.1274591088294983e-05, 1.4308840036392212e-05, 1.734308898448944e-05, 2.037733793258667e-05, 2.34115868806839e-05, 2.6445835828781128e-05, 2.9480084776878357e-05, 3.2514333724975586e-05, 3.5548582673072815e-05, 3.8582831621170044e-05, 4.161708056926727e-05, 4.46513295173645e-05, 4.768557846546173e-05, 5.071982741355896e-05, 5.375407636165619e-05, 5.678832530975342e-05, 5.982257425785065e-05, 6.285682320594788e-05, 6.58910721540451e-05, 6.892532110214233e-05, 7.195957005023956e-05, 7.499381899833679e-05, 7.802806794643402e-05, 8.106231689453125e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 7.0, 10.0, 10.0, 8.0, 11.0, 34.0, 28.0, 42.0, 73.0, 95.0, 125.0, 190.0, 330.0, 545.0, 1017.0, 2182.0, 5759.0, 24874.0, 228758.0, 704347.0, 62658.0, 10870.0, 3288.0, 1476.0, 684.0, 402.0, 238.0, 140.0, 98.0, 65.0, 54.0, 35.0, 32.0, 17.0, 11.0, 10.0, 7.0, 4.0, 10.0, 7.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.326416015625, -0.31562042236328125, -0.3048248291015625, -0.29402923583984375, -0.283233642578125, -0.27243804931640625, -0.2616424560546875, -0.25084686279296875, -0.24005126953125, -0.22925567626953125, -0.2184600830078125, -0.20766448974609375, -0.196868896484375, -0.18607330322265625, -0.1752777099609375, -0.16448211669921875, -0.1536865234375, -0.14289093017578125, -0.1320953369140625, -0.12129974365234375, -0.110504150390625, -0.09970855712890625, -0.0889129638671875, -0.07811737060546875, -0.06732177734375, -0.05652618408203125, -0.0457305908203125, -0.03493499755859375, -0.024139404296875, -0.01334381103515625, -0.0025482177734375, 0.00824737548828125, 0.01904296875, 0.02983856201171875, 0.0406341552734375, 0.05142974853515625, 0.062225341796875, 0.07302093505859375, 0.0838165283203125, 0.09461212158203125, 0.10540771484375, 0.11620330810546875, 0.1269989013671875, 0.13779449462890625, 0.148590087890625, 0.15938568115234375, 0.1701812744140625, 0.18097686767578125, 0.1917724609375, 0.20256805419921875, 0.2133636474609375, 0.22415924072265625, 0.234954833984375, 0.24575042724609375, 0.2565460205078125, 0.26734161376953125, 0.27813720703125, 0.28893280029296875, 0.2997283935546875, 0.31052398681640625, 0.321319580078125, 0.33211517333984375, 0.3429107666015625, 0.35370635986328125, 0.364501953125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 5.0, 3.0, 4.0, 6.0, 5.0, 8.0, 11.0, 10.0, 20.0, 15.0, 17.0, 23.0, 42.0, 40.0, 44.0, 53.0, 59.0, 76.0, 76.0, 81.0, 83.0, 50.0, 39.0, 40.0, 36.0, 33.0, 22.0, 28.0, 16.0, 8.0, 9.0, 7.0, 2.0, 5.0, 5.0, 4.0, 4.0, 3.0, 6.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.28076171875, -0.2729034423828125, -0.265045166015625, -0.2571868896484375, -0.24932861328125, -0.2414703369140625, -0.233612060546875, -0.2257537841796875, -0.2178955078125, -0.2100372314453125, -0.202178955078125, -0.1943206787109375, -0.18646240234375, -0.1786041259765625, -0.170745849609375, -0.1628875732421875, -0.155029296875, -0.1471710205078125, -0.139312744140625, -0.1314544677734375, -0.12359619140625, -0.1157379150390625, -0.107879638671875, -0.1000213623046875, -0.0921630859375, -0.0843048095703125, -0.076446533203125, -0.0685882568359375, -0.06072998046875, -0.0528717041015625, -0.045013427734375, -0.0371551513671875, -0.029296875, -0.0214385986328125, -0.013580322265625, -0.0057220458984375, 0.00213623046875, 0.0099945068359375, 0.017852783203125, 0.0257110595703125, 0.0335693359375, 0.0414276123046875, 0.049285888671875, 0.0571441650390625, 0.06500244140625, 0.0728607177734375, 0.080718994140625, 0.0885772705078125, 0.096435546875, 0.1042938232421875, 0.112152099609375, 0.1200103759765625, 0.12786865234375, 0.1357269287109375, 0.143585205078125, 0.1514434814453125, 0.1593017578125, 0.1671600341796875, 0.175018310546875, 0.1828765869140625, 0.19073486328125, 0.1985931396484375, 0.206451416015625, 0.2143096923828125, 0.22216796875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 7.0, 2.0, 11.0, 23.0, 59.0, 108.0, 201.0, 241.0, 173.0, 97.0, 44.0, 15.0, 8.0, 1.0, 4.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.356454849243164, -10.087518692016602, -9.818582534790039, -9.549646377563477, -9.280710220336914, -9.011774063110352, -8.742837905883789, -8.473901748657227, -8.204965591430664, -7.936029434204102, -7.667093276977539, -7.398157119750977, -7.129220962524414, -6.860284805297852, -6.591349124908447, -6.322412967681885, -6.0534772872924805, -5.784541130065918, -5.5156049728393555, -5.246668815612793, -4.9777326583862305, -4.708796501159668, -4.439860820770264, -4.170924663543701, -3.9019885063171387, -3.633052349090576, -3.3641161918640137, -3.0951802730560303, -2.8262441158294678, -2.5573079586029053, -2.288372039794922, -2.0194358825683594, -1.7505006790161133, -1.4815645217895508, -1.2126284837722778, -0.9436923861503601, -0.6747562885284424, -0.4058201313018799, -0.13688409328460693, 0.13205194473266602, 0.4009881019592285, 0.6699241995811462, 0.938860297203064, 1.207796335220337, 1.4767324924468994, 1.745668649673462, 2.0146045684814453, 2.283540725708008, 2.5524768829345703, 2.821413040161133, 3.0903491973876953, 3.3592851161956787, 3.628221273422241, 3.8971574306488037, 4.166093349456787, 4.43502950668335, 4.703965663909912, 4.972901821136475, 5.241837978363037, 5.5107741355896, 5.779709815979004, 6.048645973205566, 6.317582130432129, 6.586518287658691, 6.855454444885254]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 6.0, 12.0, 13.0, 8.0, 12.0, 22.0, 13.0, 17.0, 27.0, 29.0, 24.0, 36.0, 39.0, 54.0, 51.0, 68.0, 71.0, 73.0, 67.0, 49.0, 46.0, 44.0, 26.0, 31.0, 31.0, 31.0, 19.0, 19.0, 11.0, 14.0, 11.0, 6.0, 7.0, 6.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.709228277206421, -3.574207067489624, -3.439185857772827, -3.3041646480560303, -3.1691434383392334, -3.0341222286224365, -2.8991007804870605, -2.7640795707702637, -2.629058361053467, -2.49403715133667, -2.359015941619873, -2.223994731903076, -2.0889735221862793, -1.9539523124694824, -1.818930983543396, -1.6839097738265991, -1.5488886833190918, -1.413867473602295, -1.278846263885498, -1.1438250541687012, -1.0088038444519043, -0.8737825751304626, -0.738761305809021, -0.6037400960922241, -0.46871888637542725, -0.33369767665863037, -0.1986764371395111, -0.06365519762039185, 0.07136601209640503, 0.2063872218132019, 0.34140849113464355, 0.47642970085144043, 0.6114506721496582, 0.7464718818664551, 0.881493091583252, 1.0165143013000488, 1.1515355110168457, 1.2865567207336426, 1.421578049659729, 1.5565992593765259, 1.6916204690933228, 1.8266416788101196, 1.9616628885269165, 2.096684217453003, 2.2317054271698, 2.3667266368865967, 2.5017478466033936, 2.6367690563201904, 2.7717902660369873, 2.906811475753784, 3.041832685470581, 3.176853895187378, 3.311875104904175, 3.4468963146209717, 3.5819177627563477, 3.7169389724731445, 3.8519601821899414, 3.9869813919067383, 4.122002601623535, 4.257023811340332, 4.392045021057129, 4.527066230773926, 4.662087440490723, 4.7971086502075195, 4.932129859924316]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 5.0, 3.0, 10.0, 9.0, 18.0, 13.0, 24.0, 42.0, 51.0, 72.0, 123.0, 226.0, 778.0, 7441.0, 2378182.0, 1798728.0, 7054.0, 856.0, 265.0, 130.0, 65.0, 69.0, 42.0, 19.0, 19.0, 10.0, 12.0, 5.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6806640625, -1.6281280517578125, -1.575592041015625, -1.5230560302734375, -1.47052001953125, -1.4179840087890625, -1.365447998046875, -1.3129119873046875, -1.2603759765625, -1.2078399658203125, -1.155303955078125, -1.1027679443359375, -1.05023193359375, -0.9976959228515625, -0.945159912109375, -0.8926239013671875, -0.840087890625, -0.7875518798828125, -0.735015869140625, -0.6824798583984375, -0.62994384765625, -0.5774078369140625, -0.524871826171875, -0.4723358154296875, -0.4197998046875, -0.3672637939453125, -0.314727783203125, -0.2621917724609375, -0.20965576171875, -0.1571197509765625, -0.104583740234375, -0.0520477294921875, 0.00048828125, 0.0530242919921875, 0.105560302734375, 0.1580963134765625, 0.21063232421875, 0.2631683349609375, 0.315704345703125, 0.3682403564453125, 0.4207763671875, 0.4733123779296875, 0.525848388671875, 0.5783843994140625, 0.63092041015625, 0.6834564208984375, 0.735992431640625, 0.7885284423828125, 0.841064453125, 0.8936004638671875, 0.946136474609375, 0.9986724853515625, 1.05120849609375, 1.1037445068359375, 1.156280517578125, 1.2088165283203125, 1.2613525390625, 1.3138885498046875, 1.366424560546875, 1.4189605712890625, 1.47149658203125, 1.5240325927734375, 1.576568603515625, 1.6291046142578125, 1.681640625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 6.0, 7.0, 8.0, 12.0, 14.0, 17.0, 27.0, 32.0, 46.0, 59.0, 49.0, 60.0, 58.0, 67.0, 66.0, 61.0, 74.0, 55.0, 53.0, 50.0, 36.0, 33.0, 27.0, 28.0, 18.0, 11.0, 10.0, 8.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.217529296875, -0.20933151245117188, -0.20113372802734375, -0.19293594360351562, -0.1847381591796875, -0.17654037475585938, -0.16834259033203125, -0.16014480590820312, -0.151947021484375, -0.14374923706054688, -0.13555145263671875, -0.12735366821289062, -0.1191558837890625, -0.11095809936523438, -0.10276031494140625, -0.09456253051757812, -0.08636474609375, -0.07816696166992188, -0.06996917724609375, -0.061771392822265625, -0.0535736083984375, -0.045375823974609375, -0.03717803955078125, -0.028980255126953125, -0.020782470703125, -0.012584686279296875, -0.00438690185546875, 0.003810882568359375, 0.0120086669921875, 0.020206451416015625, 0.02840423583984375, 0.036602020263671875, 0.0447998046875, 0.052997589111328125, 0.06119537353515625, 0.06939315795898438, 0.0775909423828125, 0.08578872680664062, 0.09398651123046875, 0.10218429565429688, 0.110382080078125, 0.11857986450195312, 0.12677764892578125, 0.13497543334960938, 0.1431732177734375, 0.15137100219726562, 0.15956878662109375, 0.16776657104492188, 0.17596435546875, 0.18416213989257812, 0.19235992431640625, 0.20055770874023438, 0.2087554931640625, 0.21695327758789062, 0.22515106201171875, 0.23334884643554688, 0.241546630859375, 0.24974441528320312, 0.25794219970703125, 0.2661399841308594, 0.2743377685546875, 0.2825355529785156, 0.29073333740234375, 0.2989311218261719, 0.30712890625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 1.0, 8.0, 4.0, 14.0, 13.0, 30.0, 22.0, 29.0, 51.0, 99.0, 165.0, 293.0, 608.0, 1219.0, 2736.0, 6349.0, 15554.0, 43774.0, 189702.0, 2945377.0, 850390.0, 92443.0, 26969.0, 10156.0, 4333.0, 1910.0, 921.0, 462.0, 237.0, 150.0, 88.0, 53.0, 36.0, 22.0, 15.0, 9.0, 7.0, 12.0, 6.0, 8.0, 3.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5205078125, -0.5046310424804688, -0.4887542724609375, -0.47287750244140625, -0.457000732421875, -0.44112396240234375, -0.4252471923828125, -0.40937042236328125, -0.39349365234375, -0.37761688232421875, -0.3617401123046875, -0.34586334228515625, -0.329986572265625, -0.31410980224609375, -0.2982330322265625, -0.28235626220703125, -0.2664794921875, -0.25060272216796875, -0.2347259521484375, -0.21884918212890625, -0.202972412109375, -0.18709564208984375, -0.1712188720703125, -0.15534210205078125, -0.13946533203125, -0.12358856201171875, -0.1077117919921875, -0.09183502197265625, -0.075958251953125, -0.06008148193359375, -0.0442047119140625, -0.02832794189453125, -0.012451171875, 0.00342559814453125, 0.0193023681640625, 0.03517913818359375, 0.051055908203125, 0.06693267822265625, 0.0828094482421875, 0.09868621826171875, 0.11456298828125, 0.13043975830078125, 0.1463165283203125, 0.16219329833984375, 0.178070068359375, 0.19394683837890625, 0.2098236083984375, 0.22570037841796875, 0.2415771484375, 0.25745391845703125, 0.2733306884765625, 0.28920745849609375, 0.305084228515625, 0.32096099853515625, 0.3368377685546875, 0.35271453857421875, 0.36859130859375, 0.38446807861328125, 0.4003448486328125, 0.41622161865234375, 0.432098388671875, 0.44797515869140625, 0.4638519287109375, 0.47972869873046875, 0.49560546875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 5.0, 5.0, 5.0, 8.0, 6.0, 7.0, 9.0, 10.0, 20.0, 24.0, 24.0, 28.0, 43.0, 75.0, 108.0, 164.0, 314.0, 630.0, 993.0, 686.0, 319.0, 191.0, 106.0, 85.0, 52.0, 34.0, 27.0, 17.0, 16.0, 16.0, 6.0, 9.0, 7.0, 4.0, 9.0, 5.0, 3.0, 3.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.55908203125, -0.5419082641601562, -0.5247344970703125, -0.5075607299804688, -0.490386962890625, -0.47321319580078125, -0.4560394287109375, -0.43886566162109375, -0.42169189453125, -0.40451812744140625, -0.3873443603515625, -0.37017059326171875, -0.352996826171875, -0.33582305908203125, -0.3186492919921875, -0.30147552490234375, -0.2843017578125, -0.26712799072265625, -0.2499542236328125, -0.23278045654296875, -0.215606689453125, -0.19843292236328125, -0.1812591552734375, -0.16408538818359375, -0.14691162109375, -0.12973785400390625, -0.1125640869140625, -0.09539031982421875, -0.078216552734375, -0.06104278564453125, -0.0438690185546875, -0.02669525146484375, -0.009521484375, 0.00765228271484375, 0.0248260498046875, 0.04199981689453125, 0.059173583984375, 0.07634735107421875, 0.0935211181640625, 0.11069488525390625, 0.12786865234375, 0.14504241943359375, 0.1622161865234375, 0.17938995361328125, 0.196563720703125, 0.21373748779296875, 0.2309112548828125, 0.24808502197265625, 0.2652587890625, 0.28243255615234375, 0.2996063232421875, 0.31678009033203125, 0.333953857421875, 0.35112762451171875, 0.3683013916015625, 0.38547515869140625, 0.40264892578125, 0.41982269287109375, 0.4369964599609375, 0.45417022705078125, 0.471343994140625, 0.48851776123046875, 0.5056915283203125, 0.5228652954101562, 0.5400390625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 13.0, 18.0, 54.0, 129.0, 260.0, 243.0, 162.0, 54.0, 28.0, 10.0, 10.0, 5.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.792000770568848, -7.556621551513672, -7.321242809295654, -7.0858635902404785, -6.850484371185303, -6.615105628967285, -6.379726409912109, -6.144347190856934, -5.908967971801758, -5.673588752746582, -5.4382100105285645, -5.202830791473389, -4.967451572418213, -4.732072830200195, -4.4966936111450195, -4.261314392089844, -4.025935649871826, -3.7905566692352295, -3.5551774501800537, -3.319798469543457, -3.0844192504882812, -2.8490402698516846, -2.613661289215088, -2.378282070159912, -2.1429030895233154, -1.9075239896774292, -1.672144889831543, -1.4367659091949463, -1.20138680934906, -0.9660077095031738, -0.7306287288665771, -0.4952496290206909, -0.2598705291748047, -0.024491459131240845, 0.210887610912323, 0.44626665115356445, 0.6816457509994507, 0.9170248508453369, 1.1524038314819336, 1.3877829313278198, 1.623162031173706, 1.8585411310195923, 2.0939202308654785, 2.329299211502075, 2.564678192138672, 2.8000574111938477, 3.0354363918304443, 3.270815372467041, 3.506194591522217, 3.7415735721588135, 3.9769527912139893, 4.212331771850586, 4.447710990905762, 4.6830902099609375, 4.918468952178955, 5.153848171234131, 5.389226913452148, 5.624606132507324, 5.859984874725342, 6.095364093780518, 6.330743312835693, 6.566122055053711, 6.801501274108887, 7.0368804931640625, 7.272259712219238]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 3.0, 2.0, 2.0, 3.0, 2.0, 7.0, 2.0, 4.0, 6.0, 12.0, 11.0, 10.0, 11.0, 5.0, 11.0, 22.0, 21.0, 30.0, 22.0, 26.0, 36.0, 36.0, 29.0, 32.0, 37.0, 40.0, 44.0, 46.0, 37.0, 41.0, 40.0, 40.0, 31.0, 41.0, 31.0, 29.0, 30.0, 19.0, 22.0, 26.0, 17.0, 14.0, 8.0, 16.0, 8.0, 9.0, 2.0, 6.0, 9.0, 3.0, 6.0, 4.0, 4.0, 1.0, 1.0, 3.0, 5.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.027822256088257, -1.9634045362472534, -1.89898681640625, -1.8345690965652466, -1.7701513767242432, -1.7057336568832397, -1.6413159370422363, -1.576898217201233, -1.5124804973602295, -1.448062777519226, -1.3836450576782227, -1.3192273378372192, -1.2548096179962158, -1.1903918981552124, -1.125974178314209, -1.0615564584732056, -0.9971387386322021, -0.9327210187911987, -0.8683032989501953, -0.8038855791091919, -0.7394678592681885, -0.6750501394271851, -0.6106324195861816, -0.5462146997451782, -0.4817969799041748, -0.4173792600631714, -0.35296154022216797, -0.28854382038116455, -0.22412610054016113, -0.15970838069915771, -0.0952906608581543, -0.03087294101715088, 0.03354454040527344, 0.09796226024627686, 0.16237998008728027, 0.2267976999282837, 0.2912154197692871, 0.3556331396102905, 0.42005085945129395, 0.48446857929229736, 0.5488862991333008, 0.6133040189743042, 0.6777217388153076, 0.742139458656311, 0.8065571784973145, 0.8709748983383179, 0.9353926181793213, 0.9998103380203247, 1.0642280578613281, 1.1286457777023315, 1.193063497543335, 1.2574812173843384, 1.3218989372253418, 1.3863166570663452, 1.4507343769073486, 1.515152096748352, 1.5795698165893555, 1.6439875364303589, 1.7084052562713623, 1.7728229761123657, 1.8372406959533691, 1.9016584157943726, 1.966076135635376, 2.03049373626709, 2.094911575317383]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 7.0, 3.0, 4.0, 11.0, 9.0, 20.0, 30.0, 40.0, 71.0, 88.0, 148.0, 258.0, 387.0, 605.0, 1158.0, 1998.0, 3731.0, 7177.0, 14897.0, 34069.0, 95264.0, 326651.0, 377093.0, 111514.0, 39534.0, 16713.0, 7827.0, 3956.0, 2143.0, 1217.0, 733.0, 454.0, 313.0, 135.0, 111.0, 59.0, 51.0, 30.0, 18.0, 10.0, 9.0, 5.0, 3.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.3876953125, -0.3752174377441406, -0.36273956298828125, -0.3502616882324219, -0.3377838134765625, -0.3253059387207031, -0.31282806396484375, -0.3003501892089844, -0.287872314453125, -0.2753944396972656, -0.26291656494140625, -0.2504386901855469, -0.2379608154296875, -0.22548294067382812, -0.21300506591796875, -0.20052719116210938, -0.18804931640625, -0.17557144165039062, -0.16309356689453125, -0.15061569213867188, -0.1381378173828125, -0.12565994262695312, -0.11318206787109375, -0.10070419311523438, -0.088226318359375, -0.07574844360351562, -0.06327056884765625, -0.050792694091796875, -0.0383148193359375, -0.025836944580078125, -0.01335906982421875, -0.000881195068359375, 0.0115966796875, 0.024074554443359375, 0.03655242919921875, 0.049030303955078125, 0.0615081787109375, 0.07398605346679688, 0.08646392822265625, 0.09894180297851562, 0.111419677734375, 0.12389755249023438, 0.13637542724609375, 0.14885330200195312, 0.1613311767578125, 0.17380905151367188, 0.18628692626953125, 0.19876480102539062, 0.21124267578125, 0.22372055053710938, 0.23619842529296875, 0.24867630004882812, 0.2611541748046875, 0.2736320495605469, 0.28610992431640625, 0.2985877990722656, 0.311065673828125, 0.3235435485839844, 0.33602142333984375, 0.3484992980957031, 0.3609771728515625, 0.3734550476074219, 0.38593292236328125, 0.3984107971191406, 0.410888671875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 8.0, 7.0, 7.0, 11.0, 24.0, 21.0, 22.0, 24.0, 31.0, 27.0, 40.0, 49.0, 60.0, 55.0, 59.0, 56.0, 54.0, 50.0, 54.0, 51.0, 52.0, 33.0, 33.0, 36.0, 23.0, 17.0, 26.0, 14.0, 10.0, 15.0, 8.0, 5.0, 5.0, 6.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2440185546875, -0.23657608032226562, -0.22913360595703125, -0.22169113159179688, -0.2142486572265625, -0.20680618286132812, -0.19936370849609375, -0.19192123413085938, -0.184478759765625, -0.17703628540039062, -0.16959381103515625, -0.16215133666992188, -0.1547088623046875, -0.14726638793945312, -0.13982391357421875, -0.13238143920898438, -0.12493896484375, -0.11749649047851562, -0.11005401611328125, -0.10261154174804688, -0.0951690673828125, -0.08772659301757812, -0.08028411865234375, -0.07284164428710938, -0.065399169921875, -0.057956695556640625, -0.05051422119140625, -0.043071746826171875, -0.0356292724609375, -0.028186798095703125, -0.02074432373046875, -0.013301849365234375, -0.005859375, 0.001583099365234375, 0.00902557373046875, 0.016468048095703125, 0.0239105224609375, 0.031352996826171875, 0.03879547119140625, 0.046237945556640625, 0.053680419921875, 0.061122894287109375, 0.06856536865234375, 0.07600784301757812, 0.0834503173828125, 0.09089279174804688, 0.09833526611328125, 0.10577774047851562, 0.11322021484375, 0.12066268920898438, 0.12810516357421875, 0.13554763793945312, 0.1429901123046875, 0.15043258666992188, 0.15787506103515625, 0.16531753540039062, 0.172760009765625, 0.18020248413085938, 0.18764495849609375, 0.19508743286132812, 0.2025299072265625, 0.20997238159179688, 0.21741485595703125, 0.22485733032226562, 0.2322998046875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 3.0, 7.0, 7.0, 17.0, 14.0, 22.0, 25.0, 34.0, 51.0, 78.0, 97.0, 159.0, 274.0, 451.0, 865.0, 1593.0, 4513.0, 18232.0, 133195.0, 787923.0, 81025.0, 13095.0, 3645.0, 1441.0, 693.0, 422.0, 220.0, 151.0, 86.0, 51.0, 38.0, 33.0, 22.0, 21.0, 16.0, 13.0, 4.0, 5.0, 2.0, 2.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.77392578125, -0.7446060180664062, -0.7152862548828125, -0.6859664916992188, -0.656646728515625, -0.6273269653320312, -0.5980072021484375, -0.5686874389648438, -0.53936767578125, -0.5100479125976562, -0.4807281494140625, -0.45140838623046875, -0.422088623046875, -0.39276885986328125, -0.3634490966796875, -0.33412933349609375, -0.3048095703125, -0.27548980712890625, -0.2461700439453125, -0.21685028076171875, -0.187530517578125, -0.15821075439453125, -0.1288909912109375, -0.09957122802734375, -0.07025146484375, -0.04093170166015625, -0.0116119384765625, 0.01770782470703125, 0.047027587890625, 0.07634735107421875, 0.1056671142578125, 0.13498687744140625, 0.164306640625, 0.19362640380859375, 0.2229461669921875, 0.25226593017578125, 0.281585693359375, 0.31090545654296875, 0.3402252197265625, 0.36954498291015625, 0.39886474609375, 0.42818450927734375, 0.4575042724609375, 0.48682403564453125, 0.516143798828125, 0.5454635620117188, 0.5747833251953125, 0.6041030883789062, 0.6334228515625, 0.6627426147460938, 0.6920623779296875, 0.7213821411132812, 0.750701904296875, 0.7800216674804688, 0.8093414306640625, 0.8386611938476562, 0.86798095703125, 0.8973007202148438, 0.9266204833984375, 0.9559402465820312, 0.985260009765625, 1.0145797729492188, 1.0438995361328125, 1.0732192993164062, 1.1025390625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 5.0, 3.0, 4.0, 1.0, 5.0, 8.0, 10.0, 4.0, 18.0, 19.0, 12.0, 26.0, 28.0, 22.0, 37.0, 42.0, 42.0, 52.0, 62.0, 56.0, 59.0, 61.0, 69.0, 56.0, 46.0, 51.0, 37.0, 36.0, 28.0, 21.0, 24.0, 13.0, 6.0, 16.0, 14.0, 7.0, 4.0, 6.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2587890625, -1.2254409790039062, -1.1920928955078125, -1.1587448120117188, -1.125396728515625, -1.0920486450195312, -1.0587005615234375, -1.0253524780273438, -0.99200439453125, -0.9586563110351562, -0.9253082275390625, -0.8919601440429688, -0.858612060546875, -0.8252639770507812, -0.7919158935546875, -0.7585678100585938, -0.7252197265625, -0.6918716430664062, -0.6585235595703125, -0.6251754760742188, -0.591827392578125, -0.5584793090820312, -0.5251312255859375, -0.49178314208984375, -0.45843505859375, -0.42508697509765625, -0.3917388916015625, -0.35839080810546875, -0.325042724609375, -0.29169464111328125, -0.2583465576171875, -0.22499847412109375, -0.191650390625, -0.15830230712890625, -0.1249542236328125, -0.09160614013671875, -0.058258056640625, -0.02490997314453125, 0.0084381103515625, 0.04178619384765625, 0.07513427734375, 0.10848236083984375, 0.1418304443359375, 0.17517852783203125, 0.208526611328125, 0.24187469482421875, 0.2752227783203125, 0.30857086181640625, 0.3419189453125, 0.37526702880859375, 0.4086151123046875, 0.44196319580078125, 0.475311279296875, 0.5086593627929688, 0.5420074462890625, 0.5753555297851562, 0.60870361328125, 0.6420516967773438, 0.6753997802734375, 0.7087478637695312, 0.742095947265625, 0.7754440307617188, 0.8087921142578125, 0.8421401977539062, 0.87548828125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 5.0, 8.0, 15.0, 18.0, 31.0, 59.0, 203.0, 625.0, 3319.0, 48707.0, 942639.0, 48514.0, 3393.0, 640.0, 206.0, 80.0, 38.0, 18.0, 15.0, 3.0, 5.0, 5.0, 7.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.138671875, -1.1124954223632812, -1.0863189697265625, -1.0601425170898438, -1.033966064453125, -1.0077896118164062, -0.9816131591796875, -0.9554367065429688, -0.92926025390625, -0.9030838012695312, -0.8769073486328125, -0.8507308959960938, -0.824554443359375, -0.7983779907226562, -0.7722015380859375, -0.7460250854492188, -0.7198486328125, -0.6936721801757812, -0.6674957275390625, -0.6413192749023438, -0.615142822265625, -0.5889663696289062, -0.5627899169921875, -0.5366134643554688, -0.51043701171875, -0.48426055908203125, -0.4580841064453125, -0.43190765380859375, -0.405731201171875, -0.37955474853515625, -0.3533782958984375, -0.32720184326171875, -0.301025390625, -0.27484893798828125, -0.2486724853515625, -0.22249603271484375, -0.196319580078125, -0.17014312744140625, -0.1439666748046875, -0.11779022216796875, -0.09161376953125, -0.06543731689453125, -0.0392608642578125, -0.01308441162109375, 0.013092041015625, 0.03926849365234375, 0.0654449462890625, 0.09162139892578125, 0.1177978515625, 0.14397430419921875, 0.1701507568359375, 0.19632720947265625, 0.222503662109375, 0.24868011474609375, 0.2748565673828125, 0.30103302001953125, 0.32720947265625, 0.35338592529296875, 0.3795623779296875, 0.40573883056640625, 0.431915283203125, 0.45809173583984375, 0.4842681884765625, 0.5104446411132812, 0.53662109375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 8.0, 4.0, 6.0, 8.0, 5.0, 14.0, 15.0, 24.0, 46.0, 43.0, 55.0, 76.0, 106.0, 148.0, 107.0, 87.0, 73.0, 55.0, 37.0, 21.0, 17.0, 10.0, 8.0, 9.0, 7.0, 2.0, 0.0, 3.0, 4.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.00011521577835083008, -0.00011245440691709518, -0.00010969303548336029, -0.0001069316640496254, -0.0001041702926158905, -0.00010140892118215561, -9.864754974842072e-05, -9.588617831468582e-05, -9.312480688095093e-05, -9.036343544721603e-05, -8.760206401348114e-05, -8.484069257974625e-05, -8.207932114601135e-05, -7.931794971227646e-05, -7.655657827854156e-05, -7.379520684480667e-05, -7.103383541107178e-05, -6.827246397733688e-05, -6.551109254360199e-05, -6.27497211098671e-05, -5.99883496761322e-05, -5.722697824239731e-05, -5.4465606808662415e-05, -5.170423537492752e-05, -4.894286394119263e-05, -4.618149250745773e-05, -4.342012107372284e-05, -4.0658749639987946e-05, -3.789737820625305e-05, -3.513600677251816e-05, -3.2374635338783264e-05, -2.961326390504837e-05, -2.6851892471313477e-05, -2.4090521037578583e-05, -2.132914960384369e-05, -1.8567778170108795e-05, -1.58064067363739e-05, -1.3045035302639008e-05, -1.0283663868904114e-05, -7.52229243516922e-06, -4.760921001434326e-06, -1.9995495676994324e-06, 7.618218660354614e-07, 3.5231932997703552e-06, 6.284564733505249e-06, 9.045936167240143e-06, 1.1807307600975037e-05, 1.456867903470993e-05, 1.7330050468444824e-05, 2.0091421902179718e-05, 2.2852793335914612e-05, 2.5614164769649506e-05, 2.83755362033844e-05, 3.113690763711929e-05, 3.389827907085419e-05, 3.665965050458908e-05, 3.9421021938323975e-05, 4.218239337205887e-05, 4.494376480579376e-05, 4.7705136239528656e-05, 5.046650767326355e-05, 5.3227879106998444e-05, 5.598925054073334e-05, 5.875062197446823e-05, 6.151199340820312e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 10.0, 16.0, 29.0, 68.0, 136.0, 310.0, 892.0, 4120.0, 55132.0, 926837.0, 55316.0, 4161.0, 923.0, 319.0, 154.0, 64.0, 30.0, 13.0, 13.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.83056640625, -0.8084182739257812, -0.7862701416015625, -0.7641220092773438, -0.741973876953125, -0.7198257446289062, -0.6976776123046875, -0.6755294799804688, -0.65338134765625, -0.6312332153320312, -0.6090850830078125, -0.5869369506835938, -0.564788818359375, -0.5426406860351562, -0.5204925537109375, -0.49834442138671875, -0.4761962890625, -0.45404815673828125, -0.4319000244140625, -0.40975189208984375, -0.387603759765625, -0.36545562744140625, -0.3433074951171875, -0.32115936279296875, -0.29901123046875, -0.27686309814453125, -0.2547149658203125, -0.23256683349609375, -0.210418701171875, -0.18827056884765625, -0.1661224365234375, -0.14397430419921875, -0.121826171875, -0.09967803955078125, -0.0775299072265625, -0.05538177490234375, -0.033233642578125, -0.01108551025390625, 0.0110626220703125, 0.03321075439453125, 0.05535888671875, 0.07750701904296875, 0.0996551513671875, 0.12180328369140625, 0.143951416015625, 0.16609954833984375, 0.1882476806640625, 0.21039581298828125, 0.2325439453125, 0.25469207763671875, 0.2768402099609375, 0.29898834228515625, 0.321136474609375, 0.34328460693359375, 0.3654327392578125, 0.38758087158203125, 0.40972900390625, 0.43187713623046875, 0.4540252685546875, 0.47617340087890625, 0.498321533203125, 0.5204696655273438, 0.5426177978515625, 0.5647659301757812, 0.5869140625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 5.0, 11.0, 12.0, 11.0, 21.0, 26.0, 35.0, 40.0, 75.0, 72.0, 103.0, 111.0, 108.0, 76.0, 66.0, 59.0, 50.0, 29.0, 28.0, 12.0, 11.0, 16.0, 6.0, 6.0, 2.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.331298828125, -0.3193626403808594, -0.30742645263671875, -0.2954902648925781, -0.2835540771484375, -0.2716178894042969, -0.25968170166015625, -0.24774551391601562, -0.235809326171875, -0.22387313842773438, -0.21193695068359375, -0.20000076293945312, -0.1880645751953125, -0.17612838745117188, -0.16419219970703125, -0.15225601196289062, -0.14031982421875, -0.12838363647460938, -0.11644744873046875, -0.10451126098632812, -0.0925750732421875, -0.08063888549804688, -0.06870269775390625, -0.056766510009765625, -0.044830322265625, -0.032894134521484375, -0.02095794677734375, -0.009021759033203125, 0.0029144287109375, 0.014850616455078125, 0.02678680419921875, 0.038722991943359375, 0.0506591796875, 0.06259536743164062, 0.07453155517578125, 0.08646774291992188, 0.0984039306640625, 0.11034011840820312, 0.12227630615234375, 0.13421249389648438, 0.146148681640625, 0.15808486938476562, 0.17002105712890625, 0.18195724487304688, 0.1938934326171875, 0.20582962036132812, 0.21776580810546875, 0.22970199584960938, 0.24163818359375, 0.2535743713378906, 0.26551055908203125, 0.2774467468261719, 0.2893829345703125, 0.3013191223144531, 0.31325531005859375, 0.3251914978027344, 0.337127685546875, 0.3490638732910156, 0.36100006103515625, 0.3729362487792969, 0.3848724365234375, 0.3968086242675781, 0.40874481201171875, 0.4206809997558594, 0.4326171875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 9.0, 8.0, 44.0, 143.0, 327.0, 294.0, 113.0, 39.0, 15.0, 11.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.595186233520508, -13.225724220275879, -12.856261253356934, -12.486799240112305, -12.11733627319336, -11.74787425994873, -11.378412246704102, -11.008949279785156, -10.639486312866211, -10.270024299621582, -9.900561332702637, -9.531099319458008, -9.161636352539062, -8.792174339294434, -8.422712326049805, -8.05324935913086, -7.6837873458862305, -7.314324855804443, -6.944862365722656, -6.575400352478027, -6.205937385559082, -5.836475372314453, -5.467012882232666, -5.097550392150879, -4.728087902069092, -4.358625411987305, -3.9891629219055176, -3.6197006702423096, -3.2502381801605225, -2.8807756900787354, -2.5113134384155273, -2.1418509483337402, -1.7723884582519531, -1.402925968170166, -1.0334635972976685, -0.6640012264251709, -0.2945387363433838, 0.07492375373840332, 0.44438600540161133, 0.8138484954833984, 1.1833109855651855, 1.5527734756469727, 1.9222358465194702, 2.2916982173919678, 2.661160707473755, 3.030623197555542, 3.40008544921875, 3.769547939300537, 4.139010429382324, 4.508472919464111, 4.877935409545898, 5.247397422790527, 5.616860389709473, 5.986322402954102, 6.355784893035889, 6.725247383117676, 7.094709873199463, 7.46417236328125, 7.833634853363037, 8.203097343444824, 8.572559356689453, 8.942022323608398, 9.311484336853027, 9.680946350097656, 10.050409317016602]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 4.0, 9.0, 3.0, 9.0, 14.0, 15.0, 16.0, 23.0, 29.0, 19.0, 34.0, 25.0, 26.0, 47.0, 58.0, 58.0, 60.0, 74.0, 60.0, 54.0, 41.0, 39.0, 38.0, 47.0, 26.0, 28.0, 23.0, 22.0, 23.0, 11.0, 21.0, 12.0, 9.0, 9.0, 9.0, 4.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.173884868621826, -4.039281368255615, -3.9046778678894043, -3.7700746059417725, -3.6354711055755615, -3.5008676052093506, -3.3662643432617188, -3.231660842895508, -3.097057342529297, -2.962453842163086, -2.827850341796875, -2.693247079849243, -2.5586435794830322, -2.4240400791168213, -2.2894368171691895, -2.1548333168029785, -2.0202298164367676, -1.8856263160705566, -1.7510229349136353, -1.6164195537567139, -1.481816053390503, -1.347212553024292, -1.2126091718673706, -1.0780057907104492, -0.9434022903442383, -0.8087988495826721, -0.674195408821106, -0.5395919680595398, -0.40498852729797363, -0.27038508653640747, -0.1357816457748413, -0.0011782050132751465, 0.1334247589111328, 0.268028199672699, 0.40263164043426514, 0.5372350811958313, 0.6718385219573975, 0.8064419627189636, 0.9410454034805298, 1.0756487846374512, 1.210252285003662, 1.344855785369873, 1.4794591665267944, 1.6140625476837158, 1.7486660480499268, 1.8832695484161377, 2.0178728103637695, 2.1524763107299805, 2.2870798110961914, 2.4216833114624023, 2.5562868118286133, 2.690890073776245, 2.825493574142456, 2.960097074508667, 3.094700336456299, 3.2293038368225098, 3.3639073371887207, 3.4985108375549316, 3.6331143379211426, 3.7677175998687744, 3.9023211002349854, 4.036924362182617, 4.171527862548828, 4.306131362915039, 4.44073486328125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 8.0, 12.0, 17.0, 40.0, 50.0, 105.0, 143.0, 208.0, 344.0, 602.0, 1124.0, 2122.0, 4198.0, 8782.0, 19756.0, 51365.0, 170507.0, 854504.0, 2279647.0, 602980.0, 126518.0, 40069.0, 16222.0, 7144.0, 3471.0, 1870.0, 1003.0, 545.0, 316.0, 196.0, 131.0, 89.0, 60.0, 40.0, 23.0, 14.0, 13.0, 15.0, 3.0, 7.0, 7.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.2401123046875, -0.2316570281982422, -0.22320175170898438, -0.21474647521972656, -0.20629119873046875, -0.19783592224121094, -0.18938064575195312, -0.1809253692626953, -0.1724700927734375, -0.1640148162841797, -0.15555953979492188, -0.14710426330566406, -0.13864898681640625, -0.13019371032714844, -0.12173843383789062, -0.11328315734863281, -0.104827880859375, -0.09637260437011719, -0.08791732788085938, -0.07946205139160156, -0.07100677490234375, -0.06255149841308594, -0.054096221923828125, -0.04564094543457031, -0.0371856689453125, -0.028730392456054688, -0.020275115966796875, -0.011819839477539062, -0.00336456298828125, 0.0050907135009765625, 0.013545989990234375, 0.022001266479492188, 0.03045654296875, 0.03891181945800781, 0.047367095947265625, 0.05582237243652344, 0.06427764892578125, 0.07273292541503906, 0.08118820190429688, 0.08964347839355469, 0.0980987548828125, 0.10655403137207031, 0.11500930786132812, 0.12346458435058594, 0.13191986083984375, 0.14037513732910156, 0.14883041381835938, 0.1572856903076172, 0.165740966796875, 0.1741962432861328, 0.18265151977539062, 0.19110679626464844, 0.19956207275390625, 0.20801734924316406, 0.21647262573242188, 0.2249279022216797, 0.2333831787109375, 0.2418384552001953, 0.2502937316894531, 0.25874900817871094, 0.26720428466796875, 0.27565956115722656, 0.2841148376464844, 0.2925701141357422, 0.301025390625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 11.0, 19.0, 15.0, 20.0, 30.0, 39.0, 38.0, 61.0, 66.0, 71.0, 74.0, 91.0, 92.0, 80.0, 81.0, 58.0, 50.0, 34.0, 24.0, 17.0, 17.0, 6.0, 7.0, 6.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15771484375, -0.14758682250976562, -0.13745880126953125, -0.12733078002929688, -0.1172027587890625, -0.10707473754882812, -0.09694671630859375, -0.08681869506835938, -0.076690673828125, -0.06656265258789062, -0.05643463134765625, -0.046306610107421875, -0.0361785888671875, -0.026050567626953125, -0.01592254638671875, -0.005794525146484375, 0.00433349609375, 0.014461517333984375, 0.02458953857421875, 0.034717559814453125, 0.0448455810546875, 0.054973602294921875, 0.06510162353515625, 0.07522964477539062, 0.085357666015625, 0.09548568725585938, 0.10561370849609375, 0.11574172973632812, 0.1258697509765625, 0.13599777221679688, 0.14612579345703125, 0.15625381469726562, 0.1663818359375, 0.17650985717773438, 0.18663787841796875, 0.19676589965820312, 0.2068939208984375, 0.21702194213867188, 0.22714996337890625, 0.23727798461914062, 0.247406005859375, 0.2575340270996094, 0.26766204833984375, 0.2777900695800781, 0.2879180908203125, 0.2980461120605469, 0.30817413330078125, 0.3183021545410156, 0.32843017578125, 0.3385581970214844, 0.34868621826171875, 0.3588142395019531, 0.3689422607421875, 0.3790702819824219, 0.38919830322265625, 0.3993263244628906, 0.409454345703125, 0.4195823669433594, 0.42971038818359375, 0.4398384094238281, 0.4499664306640625, 0.4600944519042969, 0.47022247314453125, 0.4803504943847656, 0.490478515625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 2.0, 0.0, 10.0, 10.0, 9.0, 12.0, 15.0, 30.0, 31.0, 61.0, 93.0, 164.0, 235.0, 407.0, 675.0, 1338.0, 3037.0, 7986.0, 25472.0, 103899.0, 845978.0, 2868886.0, 260332.0, 51336.0, 14715.0, 5085.0, 2108.0, 1058.0, 491.0, 290.0, 138.0, 116.0, 72.0, 62.0, 33.0, 23.0, 13.0, 18.0, 9.0, 10.0, 5.0, 8.0, 5.0, 1.0, 2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44873046875, -0.43285369873046875, -0.4169769287109375, -0.40110015869140625, -0.385223388671875, -0.36934661865234375, -0.3534698486328125, -0.33759307861328125, -0.32171630859375, -0.30583953857421875, -0.2899627685546875, -0.27408599853515625, -0.258209228515625, -0.24233245849609375, -0.2264556884765625, -0.21057891845703125, -0.1947021484375, -0.17882537841796875, -0.1629486083984375, -0.14707183837890625, -0.131195068359375, -0.11531829833984375, -0.0994415283203125, -0.08356475830078125, -0.06768798828125, -0.05181121826171875, -0.0359344482421875, -0.02005767822265625, -0.004180908203125, 0.01169586181640625, 0.0275726318359375, 0.04344940185546875, 0.059326171875, 0.07520294189453125, 0.0910797119140625, 0.10695648193359375, 0.122833251953125, 0.13871002197265625, 0.1545867919921875, 0.17046356201171875, 0.18634033203125, 0.20221710205078125, 0.2180938720703125, 0.23397064208984375, 0.249847412109375, 0.26572418212890625, 0.2816009521484375, 0.29747772216796875, 0.3133544921875, 0.32923126220703125, 0.3451080322265625, 0.36098480224609375, 0.376861572265625, 0.39273834228515625, 0.4086151123046875, 0.42449188232421875, 0.44036865234375, 0.45624542236328125, 0.4721221923828125, 0.48799896240234375, 0.503875732421875, 0.5197525024414062, 0.5356292724609375, 0.5515060424804688, 0.5673828125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 6.0, 3.0, 6.0, 4.0, 7.0, 18.0, 15.0, 21.0, 26.0, 38.0, 36.0, 65.0, 103.0, 158.0, 208.0, 324.0, 542.0, 698.0, 623.0, 410.0, 246.0, 142.0, 108.0, 65.0, 48.0, 40.0, 28.0, 17.0, 22.0, 13.0, 15.0, 9.0, 7.0, 7.0, 5.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.607421875, -0.5882797241210938, -0.5691375732421875, -0.5499954223632812, -0.530853271484375, -0.5117111206054688, -0.4925689697265625, -0.47342681884765625, -0.45428466796875, -0.43514251708984375, -0.4160003662109375, -0.39685821533203125, -0.377716064453125, -0.35857391357421875, -0.3394317626953125, -0.32028961181640625, -0.3011474609375, -0.28200531005859375, -0.2628631591796875, -0.24372100830078125, -0.224578857421875, -0.20543670654296875, -0.1862945556640625, -0.16715240478515625, -0.14801025390625, -0.12886810302734375, -0.1097259521484375, -0.09058380126953125, -0.071441650390625, -0.05229949951171875, -0.0331573486328125, -0.01401519775390625, 0.005126953125, 0.02426910400390625, 0.0434112548828125, 0.06255340576171875, 0.081695556640625, 0.10083770751953125, 0.1199798583984375, 0.13912200927734375, 0.15826416015625, 0.17740631103515625, 0.1965484619140625, 0.21569061279296875, 0.234832763671875, 0.25397491455078125, 0.2731170654296875, 0.29225921630859375, 0.3114013671875, 0.33054351806640625, 0.3496856689453125, 0.36882781982421875, 0.387969970703125, 0.40711212158203125, 0.4262542724609375, 0.44539642333984375, 0.46453857421875, 0.48368072509765625, 0.5028228759765625, 0.5219650268554688, 0.541107177734375, 0.5602493286132812, 0.5793914794921875, 0.5985336303710938, 0.61767578125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 20.0, 90.0, 337.0, 393.0, 116.0, 30.0, 8.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.909759521484375, -5.4194464683532715, -4.929133892059326, -4.438820838928223, -3.9485080242156982, -3.458195209503174, -2.9678821563720703, -2.477569341659546, -1.9872565269470215, -1.496943712234497, -1.006630778312683, -0.5163178443908691, -0.026005029678344727, 0.4643077850341797, 0.9546208381652832, 1.4449336528778076, 1.935246467590332, 2.4255592823028564, 2.915872097015381, 3.4061851501464844, 3.896497964859009, 4.386810779571533, 4.877123832702637, 5.367436408996582, 5.8577494621276855, 6.348062515258789, 6.838375091552734, 7.328688144683838, 7.819001197814941, 8.309313774108887, 8.799627304077148, 9.289939880371094, 9.780252456665039, 10.270565032958984, 10.760878562927246, 11.251191139221191, 11.741503715515137, 12.231817245483398, 12.722129821777344, 13.212442398071289, 13.702754974365234, 14.19306755065918, 14.683381080627441, 15.173693656921387, 15.664006233215332, 16.154319763183594, 16.64463233947754, 17.134944915771484, 17.625259399414062, 18.115571975708008, 18.605884552001953, 19.09619903564453, 19.586511611938477, 20.076824188232422, 20.567136764526367, 21.057449340820312, 21.547761917114258, 22.038074493408203, 22.52838706970215, 23.018699645996094, 23.509014129638672, 23.999326705932617, 24.489639282226562, 24.979951858520508, 25.470264434814453]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 6.0, 11.0, 5.0, 17.0, 11.0, 24.0, 26.0, 47.0, 46.0, 45.0, 59.0, 70.0, 72.0, 76.0, 71.0, 58.0, 64.0, 64.0, 50.0, 32.0, 38.0, 27.0, 27.0, 12.0, 16.0, 6.0, 8.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.914650917053223, -5.772266387939453, -5.629881858825684, -5.487497329711914, -5.3451128005981445, -5.202728271484375, -5.0603437423706055, -4.917959213256836, -4.775574684143066, -4.633190155029297, -4.490805625915527, -4.348421096801758, -4.206036567687988, -4.063652038574219, -3.921267509460449, -3.7788829803466797, -3.63649845123291, -3.4941139221191406, -3.351729393005371, -3.2093448638916016, -3.066960334777832, -2.9245758056640625, -2.782191276550293, -2.6398067474365234, -2.497422218322754, -2.3550376892089844, -2.212653160095215, -2.0702686309814453, -1.9278841018676758, -1.7854995727539062, -1.6431150436401367, -1.5007305145263672, -1.3583455085754395, -1.21596097946167, -1.0735764503479004, -0.9311919212341309, -0.7888073921203613, -0.6464228630065918, -0.5040383338928223, -0.36165380477905273, -0.2192692756652832, -0.07688474655151367, 0.06549978256225586, 0.2078843116760254, 0.3502688407897949, 0.49265336990356445, 0.635037899017334, 0.7774224281311035, 0.919806957244873, 1.0621914863586426, 1.204576015472412, 1.3469605445861816, 1.4893450736999512, 1.6317296028137207, 1.7741141319274902, 1.9164986610412598, 2.0588831901550293, 2.201267719268799, 2.3436522483825684, 2.486036777496338, 2.6284213066101074, 2.770805835723877, 2.9131903648376465, 3.055574893951416, 3.1979594230651855]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 7.0, 2.0, 10.0, 12.0, 14.0, 25.0, 27.0, 67.0, 105.0, 139.0, 237.0, 399.0, 723.0, 1327.0, 2660.0, 5630.0, 12510.0, 30212.0, 74504.0, 200475.0, 398908.0, 195003.0, 73011.0, 29407.0, 12238.0, 5428.0, 2518.0, 1246.0, 684.0, 384.0, 248.0, 133.0, 96.0, 46.0, 37.0, 28.0, 22.0, 11.0, 12.0, 9.0, 7.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.493408203125, -0.4795036315917969, -0.46559906005859375, -0.4516944885253906, -0.4377899169921875, -0.4238853454589844, -0.40998077392578125, -0.3960762023925781, -0.382171630859375, -0.3682670593261719, -0.35436248779296875, -0.3404579162597656, -0.3265533447265625, -0.3126487731933594, -0.29874420166015625, -0.2848396301269531, -0.27093505859375, -0.2570304870605469, -0.24312591552734375, -0.22922134399414062, -0.2153167724609375, -0.20141220092773438, -0.18750762939453125, -0.17360305786132812, -0.159698486328125, -0.14579391479492188, -0.13188934326171875, -0.11798477172851562, -0.1040802001953125, -0.09017562866210938, -0.07627105712890625, -0.062366485595703125, -0.0484619140625, -0.034557342529296875, -0.02065277099609375, -0.006748199462890625, 0.0071563720703125, 0.021060943603515625, 0.03496551513671875, 0.048870086669921875, 0.062774658203125, 0.07667922973632812, 0.09058380126953125, 0.10448837280273438, 0.1183929443359375, 0.13229751586914062, 0.14620208740234375, 0.16010665893554688, 0.17401123046875, 0.18791580200195312, 0.20182037353515625, 0.21572494506835938, 0.2296295166015625, 0.24353408813476562, 0.25743865966796875, 0.2713432312011719, 0.285247802734375, 0.2991523742675781, 0.31305694580078125, 0.3269615173339844, 0.3408660888671875, 0.3547706604003906, 0.36867523193359375, 0.3825798034667969, 0.396484375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 6.0, 4.0, 5.0, 4.0, 15.0, 10.0, 14.0, 16.0, 19.0, 21.0, 21.0, 29.0, 18.0, 19.0, 49.0, 43.0, 42.0, 40.0, 32.0, 48.0, 36.0, 44.0, 42.0, 36.0, 39.0, 41.0, 41.0, 39.0, 28.0, 32.0, 17.0, 28.0, 23.0, 25.0, 13.0, 13.0, 9.0, 8.0, 6.0, 7.0, 4.0, 3.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.164794921875, -0.15927886962890625, -0.1537628173828125, -0.14824676513671875, -0.142730712890625, -0.13721466064453125, -0.1316986083984375, -0.12618255615234375, -0.12066650390625, -0.11515045166015625, -0.1096343994140625, -0.10411834716796875, -0.098602294921875, -0.09308624267578125, -0.0875701904296875, -0.08205413818359375, -0.0765380859375, -0.07102203369140625, -0.0655059814453125, -0.05998992919921875, -0.054473876953125, -0.04895782470703125, -0.0434417724609375, -0.03792572021484375, -0.03240966796875, -0.02689361572265625, -0.0213775634765625, -0.01586151123046875, -0.010345458984375, -0.00482940673828125, 0.0006866455078125, 0.00620269775390625, 0.01171875, 0.01723480224609375, 0.0227508544921875, 0.02826690673828125, 0.033782958984375, 0.03929901123046875, 0.0448150634765625, 0.05033111572265625, 0.05584716796875, 0.06136322021484375, 0.0668792724609375, 0.07239532470703125, 0.077911376953125, 0.08342742919921875, 0.0889434814453125, 0.09445953369140625, 0.0999755859375, 0.10549163818359375, 0.1110076904296875, 0.11652374267578125, 0.122039794921875, 0.12755584716796875, 0.1330718994140625, 0.13858795166015625, 0.14410400390625, 0.14962005615234375, 0.1551361083984375, 0.16065216064453125, 0.166168212890625, 0.17168426513671875, 0.1772003173828125, 0.18271636962890625, 0.188232421875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 8.0, 11.0, 11.0, 17.0, 18.0, 45.0, 68.0, 82.0, 152.0, 220.0, 425.0, 793.0, 1606.0, 3935.0, 15949.0, 191636.0, 781653.0, 40362.0, 6698.0, 2362.0, 1085.0, 537.0, 321.0, 207.0, 131.0, 58.0, 52.0, 32.0, 28.0, 14.0, 13.0, 13.0, 3.0, 5.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2744140625, -1.2335968017578125, -1.192779541015625, -1.1519622802734375, -1.11114501953125, -1.0703277587890625, -1.029510498046875, -0.9886932373046875, -0.9478759765625, -0.9070587158203125, -0.866241455078125, -0.8254241943359375, -0.78460693359375, -0.7437896728515625, -0.702972412109375, -0.6621551513671875, -0.621337890625, -0.5805206298828125, -0.539703369140625, -0.4988861083984375, -0.45806884765625, -0.4172515869140625, -0.376434326171875, -0.3356170654296875, -0.2947998046875, -0.2539825439453125, -0.213165283203125, -0.1723480224609375, -0.13153076171875, -0.0907135009765625, -0.049896240234375, -0.0090789794921875, 0.03173828125, 0.0725555419921875, 0.113372802734375, 0.1541900634765625, 0.19500732421875, 0.2358245849609375, 0.276641845703125, 0.3174591064453125, 0.3582763671875, 0.3990936279296875, 0.439910888671875, 0.4807281494140625, 0.52154541015625, 0.5623626708984375, 0.603179931640625, 0.6439971923828125, 0.684814453125, 0.7256317138671875, 0.766448974609375, 0.8072662353515625, 0.84808349609375, 0.8889007568359375, 0.929718017578125, 0.9705352783203125, 1.0113525390625, 1.0521697998046875, 1.092987060546875, 1.1338043212890625, 1.17462158203125, 1.2154388427734375, 1.256256103515625, 1.2970733642578125, 1.337890625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 4.0, 5.0, 15.0, 10.0, 13.0, 19.0, 22.0, 32.0, 37.0, 35.0, 40.0, 48.0, 56.0, 71.0, 72.0, 50.0, 54.0, 56.0, 40.0, 48.0, 37.0, 35.0, 48.0, 34.0, 33.0, 19.0, 15.0, 14.0, 18.0, 7.0, 1.0, 5.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.81689453125, -0.7822494506835938, -0.7476043701171875, -0.7129592895507812, -0.678314208984375, -0.6436691284179688, -0.6090240478515625, -0.5743789672851562, -0.53973388671875, -0.5050888061523438, -0.4704437255859375, -0.43579864501953125, -0.401153564453125, -0.36650848388671875, -0.3318634033203125, -0.29721832275390625, -0.2625732421875, -0.22792816162109375, -0.1932830810546875, -0.15863800048828125, -0.123992919921875, -0.08934783935546875, -0.0547027587890625, -0.02005767822265625, 0.01458740234375, 0.04923248291015625, 0.0838775634765625, 0.11852264404296875, 0.153167724609375, 0.18781280517578125, 0.2224578857421875, 0.25710296630859375, 0.291748046875, 0.32639312744140625, 0.3610382080078125, 0.39568328857421875, 0.430328369140625, 0.46497344970703125, 0.4996185302734375, 0.5342636108398438, 0.56890869140625, 0.6035537719726562, 0.6381988525390625, 0.6728439331054688, 0.707489013671875, 0.7421340942382812, 0.7767791748046875, 0.8114242553710938, 0.8460693359375, 0.8807144165039062, 0.9153594970703125, 0.9500045776367188, 0.984649658203125, 1.0192947387695312, 1.0539398193359375, 1.0885848999023438, 1.12322998046875, 1.1578750610351562, 1.1925201416015625, 1.2271652221679688, 1.261810302734375, 1.2964553833007812, 1.3311004638671875, 1.3657455444335938, 1.400390625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 2.0, 2.0, 6.0, 4.0, 8.0, 9.0, 9.0, 16.0, 20.0, 34.0, 35.0, 57.0, 75.0, 109.0, 187.0, 273.0, 447.0, 828.0, 1495.0, 3184.0, 7266.0, 20138.0, 63827.0, 247404.0, 546713.0, 105754.0, 31241.0, 10491.0, 4227.0, 2038.0, 1034.0, 576.0, 363.0, 210.0, 149.0, 91.0, 60.0, 47.0, 32.0, 24.0, 23.0, 14.0, 10.0, 5.0, 5.0, 2.0, 5.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0], "bins": [-0.226806640625, -0.21997451782226562, -0.21314239501953125, -0.20631027221679688, -0.1994781494140625, -0.19264602661132812, -0.18581390380859375, -0.17898178100585938, -0.172149658203125, -0.16531753540039062, -0.15848541259765625, -0.15165328979492188, -0.1448211669921875, -0.13798904418945312, -0.13115692138671875, -0.12432479858398438, -0.11749267578125, -0.11066055297851562, -0.10382843017578125, -0.09699630737304688, -0.0901641845703125, -0.08333206176757812, -0.07649993896484375, -0.06966781616210938, -0.062835693359375, -0.056003570556640625, -0.04917144775390625, -0.042339324951171875, -0.0355072021484375, -0.028675079345703125, -0.02184295654296875, -0.015010833740234375, -0.0081787109375, -0.001346588134765625, 0.00548553466796875, 0.012317657470703125, 0.0191497802734375, 0.025981903076171875, 0.03281402587890625, 0.039646148681640625, 0.046478271484375, 0.053310394287109375, 0.06014251708984375, 0.06697463989257812, 0.0738067626953125, 0.08063888549804688, 0.08747100830078125, 0.09430313110351562, 0.10113525390625, 0.10796737670898438, 0.11479949951171875, 0.12163162231445312, 0.1284637451171875, 0.13529586791992188, 0.14212799072265625, 0.14896011352539062, 0.155792236328125, 0.16262435913085938, 0.16945648193359375, 0.17628860473632812, 0.1831207275390625, 0.18995285034179688, 0.19678497314453125, 0.20361709594726562, 0.21044921875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 1.0, 2.0, 2.0, 9.0, 9.0, 13.0, 7.0, 9.0, 16.0, 22.0, 25.0, 18.0, 30.0, 39.0, 49.0, 68.0, 101.0, 124.0, 97.0, 75.0, 67.0, 36.0, 42.0, 26.0, 24.0, 18.0, 16.0, 13.0, 15.0, 12.0, 3.0, 5.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.808208465576172e-05, -7.543433457612991e-05, -7.278658449649811e-05, -7.01388344168663e-05, -6.74910843372345e-05, -6.484333425760269e-05, -6.219558417797089e-05, -5.954783409833908e-05, -5.6900084018707275e-05, -5.425233393907547e-05, -5.1604583859443665e-05, -4.895683377981186e-05, -4.6309083700180054e-05, -4.366133362054825e-05, -4.101358354091644e-05, -3.836583346128464e-05, -3.571808338165283e-05, -3.3070333302021027e-05, -3.042258322238922e-05, -2.7774833142757416e-05, -2.512708306312561e-05, -2.2479332983493805e-05, -1.9831582903862e-05, -1.7183832824230194e-05, -1.4536082744598389e-05, -1.1888332664966583e-05, -9.240582585334778e-06, -6.592832505702972e-06, -3.945082426071167e-06, -1.2973323464393616e-06, 1.3504177331924438e-06, 3.998167812824249e-06, 6.645917892456055e-06, 9.29366797208786e-06, 1.1941418051719666e-05, 1.4589168131351471e-05, 1.7236918210983276e-05, 1.9884668290615082e-05, 2.2532418370246887e-05, 2.5180168449878693e-05, 2.7827918529510498e-05, 3.0475668609142303e-05, 3.312341868877411e-05, 3.5771168768405914e-05, 3.841891884803772e-05, 4.1066668927669525e-05, 4.371441900730133e-05, 4.6362169086933136e-05, 4.900991916656494e-05, 5.165766924619675e-05, 5.430541932582855e-05, 5.695316940546036e-05, 5.960091948509216e-05, 6.224866956472397e-05, 6.489641964435577e-05, 6.754416972398758e-05, 7.019191980361938e-05, 7.283966988325119e-05, 7.5487419962883e-05, 7.81351700425148e-05, 8.07829201221466e-05, 8.343067020177841e-05, 8.607842028141022e-05, 8.872617036104202e-05, 9.137392044067383e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 7.0, 2.0, 7.0, 12.0, 9.0, 28.0, 23.0, 56.0, 53.0, 124.0, 202.0, 368.0, 547.0, 1120.0, 2506.0, 7279.0, 38860.0, 528763.0, 419353.0, 37340.0, 6986.0, 2471.0, 1076.0, 564.0, 317.0, 181.0, 121.0, 70.0, 35.0, 34.0, 17.0, 9.0, 12.0, 6.0, 3.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29638671875, -0.2854042053222656, -0.27442169189453125, -0.2634391784667969, -0.2524566650390625, -0.24147415161132812, -0.23049163818359375, -0.21950912475585938, -0.208526611328125, -0.19754409790039062, -0.18656158447265625, -0.17557907104492188, -0.1645965576171875, -0.15361404418945312, -0.14263153076171875, -0.13164901733398438, -0.12066650390625, -0.10968399047851562, -0.09870147705078125, -0.08771896362304688, -0.0767364501953125, -0.06575393676757812, -0.05477142333984375, -0.043788909912109375, -0.032806396484375, -0.021823883056640625, -0.01084136962890625, 0.000141143798828125, 0.0111236572265625, 0.022106170654296875, 0.03308868408203125, 0.044071197509765625, 0.0550537109375, 0.06603622436523438, 0.07701873779296875, 0.08800125122070312, 0.0989837646484375, 0.10996627807617188, 0.12094879150390625, 0.13193130493164062, 0.142913818359375, 0.15389633178710938, 0.16487884521484375, 0.17586135864257812, 0.1868438720703125, 0.19782638549804688, 0.20880889892578125, 0.21979141235351562, 0.23077392578125, 0.24175643920898438, 0.25273895263671875, 0.2637214660644531, 0.2747039794921875, 0.2856864929199219, 0.29666900634765625, 0.3076515197753906, 0.318634033203125, 0.3296165466308594, 0.34059906005859375, 0.3515815734863281, 0.3625640869140625, 0.3735466003417969, 0.38452911376953125, 0.3955116271972656, 0.406494140625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 7.0, 2.0, 6.0, 8.0, 2.0, 10.0, 13.0, 16.0, 16.0, 19.0, 27.0, 24.0, 24.0, 37.0, 46.0, 55.0, 52.0, 75.0, 57.0, 74.0, 67.0, 64.0, 51.0, 40.0, 35.0, 25.0, 35.0, 23.0, 20.0, 8.0, 15.0, 11.0, 6.0, 8.0, 12.0, 3.0, 1.0, 4.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.232666015625, -0.22510147094726562, -0.21753692626953125, -0.20997238159179688, -0.2024078369140625, -0.19484329223632812, -0.18727874755859375, -0.17971420288085938, -0.172149658203125, -0.16458511352539062, -0.15702056884765625, -0.14945602416992188, -0.1418914794921875, -0.13432693481445312, -0.12676239013671875, -0.11919784545898438, -0.11163330078125, -0.10406875610351562, -0.09650421142578125, -0.08893966674804688, -0.0813751220703125, -0.07381057739257812, -0.06624603271484375, -0.058681488037109375, -0.051116943359375, -0.043552398681640625, -0.03598785400390625, -0.028423309326171875, -0.0208587646484375, -0.013294219970703125, -0.00572967529296875, 0.001834869384765625, 0.0093994140625, 0.016963958740234375, 0.02452850341796875, 0.032093048095703125, 0.0396575927734375, 0.047222137451171875, 0.05478668212890625, 0.062351226806640625, 0.069915771484375, 0.07748031616210938, 0.08504486083984375, 0.09260940551757812, 0.1001739501953125, 0.10773849487304688, 0.11530303955078125, 0.12286758422851562, 0.13043212890625, 0.13799667358398438, 0.14556121826171875, 0.15312576293945312, 0.1606903076171875, 0.16825485229492188, 0.17581939697265625, 0.18338394165039062, 0.190948486328125, 0.19851303100585938, 0.20607757568359375, 0.21364212036132812, 0.2212066650390625, 0.22877120971679688, 0.23633575439453125, 0.24390029907226562, 0.25146484375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 11.0, 25.0, 44.0, 119.0, 189.0, 286.0, 170.0, 75.0, 36.0, 17.0, 11.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.636467933654785, -9.363018035888672, -9.089569091796875, -8.816119194030762, -8.542670249938965, -8.269220352172852, -7.9957709312438965, -7.722321510314941, -7.448872089385986, -7.175422668457031, -6.901973247528076, -6.628523826599121, -6.355073928833008, -6.081624984741211, -5.808175086975098, -5.534725666046143, -5.2612762451171875, -4.987826824188232, -4.714377403259277, -4.440927982330322, -4.167478561401367, -3.894028902053833, -3.620579242706299, -3.3471298217773438, -3.0736804008483887, -2.8002309799194336, -2.5267815589904785, -2.2533318996429443, -1.9798824787139893, -1.7064330577850342, -1.4329835176467896, -1.159533977508545, -0.886085033416748, -0.6126355528831482, -0.33918607234954834, -0.06573659181594849, 0.20771288871765137, 0.48116230964660645, 0.7546118497848511, 1.0280613899230957, 1.3015108108520508, 1.5749602317810059, 1.8484097719192505, 2.121859312057495, 2.39530873298645, 2.6687581539154053, 2.9422078132629395, 3.2156572341918945, 3.4891066551208496, 3.7625560760498047, 4.03600549697876, 4.309454917907715, 4.582904815673828, 4.856353759765625, 5.129803657531738, 5.403253078460693, 5.676702499389648, 5.9501519203186035, 6.223601341247559, 6.497050762176514, 6.770500183105469, 7.043950080871582, 7.317399501800537, 7.590848922729492, 7.864298343658447]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 2.0, 9.0, 10.0, 7.0, 13.0, 16.0, 12.0, 14.0, 14.0, 33.0, 20.0, 23.0, 25.0, 39.0, 28.0, 28.0, 41.0, 50.0, 56.0, 61.0, 61.0, 49.0, 51.0, 34.0, 30.0, 40.0, 32.0, 26.0, 28.0, 25.0, 22.0, 17.0, 15.0, 9.0, 12.0, 5.0, 11.0, 11.0, 4.0, 2.0, 4.0, 5.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.4706637859344482, -3.365431785583496, -3.260199546813965, -3.1549675464630127, -3.0497355461120605, -2.9445033073425293, -2.839271306991577, -2.734039306640625, -2.628807306289673, -2.5235753059387207, -2.4183430671691895, -2.3131110668182373, -2.207879066467285, -2.102646827697754, -1.9974148273468018, -1.8921828269958496, -1.786950707435608, -1.6817185878753662, -1.576486587524414, -1.4712544679641724, -1.3660224676132202, -1.2607903480529785, -1.1555583477020264, -1.0503262281417847, -0.9450941681861877, -0.8398621082305908, -0.7346300482749939, -0.629397988319397, -0.5241658687591553, -0.41893380880355835, -0.3137017488479614, -0.2084696888923645, -0.10323762893676758, 0.0019944384694099426, 0.10722650587558746, 0.21245858073234558, 0.3176906406879425, 0.4229227304458618, 0.5281547904014587, 0.6333868503570557, 0.7386189103126526, 0.8438509702682495, 0.9490830302238464, 1.0543150901794434, 1.159547209739685, 1.2647793292999268, 1.370011329650879, 1.475243330001831, 1.5804754495620728, 1.6857075691223145, 1.7909395694732666, 1.8961716890335083, 2.00140380859375, 2.106635808944702, 2.2118678092956543, 2.3171000480651855, 2.4223320484161377, 2.52756404876709, 2.632796287536621, 2.7380282878875732, 2.8432602882385254, 2.9484925270080566, 3.053724527359009, 3.158956527709961, 3.264188528060913]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 7.0, 9.0, 15.0, 16.0, 27.0, 30.0, 57.0, 83.0, 127.0, 205.0, 350.0, 750.0, 1256.0, 2286.0, 4524.0, 9601.0, 21822.0, 56463.0, 198282.0, 1026061.0, 2146598.0, 537878.0, 119089.0, 38364.0, 15695.0, 6954.0, 3544.0, 1804.0, 981.0, 528.0, 325.0, 194.0, 122.0, 73.0, 52.0, 32.0, 27.0, 16.0, 10.0, 12.0, 7.0, 7.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2354736328125, -0.2277050018310547, -0.21993637084960938, -0.21216773986816406, -0.20439910888671875, -0.19663047790527344, -0.18886184692382812, -0.1810932159423828, -0.1733245849609375, -0.1655559539794922, -0.15778732299804688, -0.15001869201660156, -0.14225006103515625, -0.13448143005371094, -0.12671279907226562, -0.11894416809082031, -0.111175537109375, -0.10340690612792969, -0.09563827514648438, -0.08786964416503906, -0.08010101318359375, -0.07233238220214844, -0.06456375122070312, -0.05679512023925781, -0.0490264892578125, -0.04125785827636719, -0.033489227294921875, -0.025720596313476562, -0.01795196533203125, -0.010183334350585938, -0.002414703369140625, 0.0053539276123046875, 0.01312255859375, 0.020891189575195312, 0.028659820556640625, 0.03642845153808594, 0.04419708251953125, 0.05196571350097656, 0.059734344482421875, 0.06750297546386719, 0.0752716064453125, 0.08304023742675781, 0.09080886840820312, 0.09857749938964844, 0.10634613037109375, 0.11411476135253906, 0.12188339233398438, 0.1296520233154297, 0.137420654296875, 0.1451892852783203, 0.15295791625976562, 0.16072654724121094, 0.16849517822265625, 0.17626380920410156, 0.18403244018554688, 0.1918010711669922, 0.1995697021484375, 0.2073383331298828, 0.21510696411132812, 0.22287559509277344, 0.23064422607421875, 0.23841285705566406, 0.24618148803710938, 0.2539501190185547, 0.26171875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 6.0, 4.0, 10.0, 12.0, 9.0, 6.0, 15.0, 13.0, 20.0, 30.0, 23.0, 24.0, 29.0, 25.0, 20.0, 37.0, 37.0, 29.0, 45.0, 46.0, 38.0, 42.0, 37.0, 38.0, 35.0, 48.0, 39.0, 37.0, 31.0, 29.0, 22.0, 19.0, 24.0, 18.0, 22.0, 21.0, 9.0, 10.0, 11.0, 10.0, 8.0, 3.0, 0.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.16357421875, -0.15834617614746094, -0.15311813354492188, -0.1478900909423828, -0.14266204833984375, -0.1374340057373047, -0.13220596313476562, -0.12697792053222656, -0.1217498779296875, -0.11652183532714844, -0.11129379272460938, -0.10606575012207031, -0.10083770751953125, -0.09560966491699219, -0.09038162231445312, -0.08515357971191406, -0.079925537109375, -0.07469749450683594, -0.06946945190429688, -0.06424140930175781, -0.05901336669921875, -0.05378532409667969, -0.048557281494140625, -0.04332923889160156, -0.0381011962890625, -0.03287315368652344, -0.027645111083984375, -0.022417068481445312, -0.01718902587890625, -0.011960983276367188, -0.006732940673828125, -0.0015048980712890625, 0.00372314453125, 0.008951187133789062, 0.014179229736328125, 0.019407272338867188, 0.02463531494140625, 0.029863357543945312, 0.035091400146484375, 0.04031944274902344, 0.0455474853515625, 0.05077552795410156, 0.056003570556640625, 0.06123161315917969, 0.06645965576171875, 0.07168769836425781, 0.07691574096679688, 0.08214378356933594, 0.087371826171875, 0.09259986877441406, 0.09782791137695312, 0.10305595397949219, 0.10828399658203125, 0.11351203918457031, 0.11874008178710938, 0.12396812438964844, 0.1291961669921875, 0.13442420959472656, 0.13965225219726562, 0.1448802947998047, 0.15010833740234375, 0.1553363800048828, 0.16056442260742188, 0.16579246520996094, 0.1710205078125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 2.0, 1.0, 4.0, 8.0, 10.0, 17.0, 29.0, 28.0, 59.0, 110.0, 219.0, 468.0, 1076.0, 3079.0, 11437.0, 60609.0, 929045.0, 3037698.0, 125540.0, 17772.0, 4363.0, 1470.0, 606.0, 256.0, 146.0, 81.0, 52.0, 27.0, 23.0, 11.0, 16.0, 10.0, 3.0, 5.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.77197265625, -0.750030517578125, -0.72808837890625, -0.706146240234375, -0.6842041015625, -0.662261962890625, -0.64031982421875, -0.618377685546875, -0.596435546875, -0.574493408203125, -0.55255126953125, -0.530609130859375, -0.5086669921875, -0.486724853515625, -0.46478271484375, -0.442840576171875, -0.4208984375, -0.398956298828125, -0.37701416015625, -0.355072021484375, -0.3331298828125, -0.311187744140625, -0.28924560546875, -0.267303466796875, -0.245361328125, -0.223419189453125, -0.20147705078125, -0.179534912109375, -0.1575927734375, -0.135650634765625, -0.11370849609375, -0.091766357421875, -0.06982421875, -0.047882080078125, -0.02593994140625, -0.003997802734375, 0.0179443359375, 0.039886474609375, 0.06182861328125, 0.083770751953125, 0.105712890625, 0.127655029296875, 0.14959716796875, 0.171539306640625, 0.1934814453125, 0.215423583984375, 0.23736572265625, 0.259307861328125, 0.28125, 0.303192138671875, 0.32513427734375, 0.347076416015625, 0.3690185546875, 0.390960693359375, 0.41290283203125, 0.434844970703125, 0.456787109375, 0.478729248046875, 0.50067138671875, 0.522613525390625, 0.5445556640625, 0.566497802734375, 0.58843994140625, 0.610382080078125, 0.63232421875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 7.0, 4.0, 7.0, 7.0, 12.0, 19.0, 24.0, 26.0, 32.0, 35.0, 75.0, 90.0, 115.0, 228.0, 444.0, 648.0, 786.0, 569.0, 344.0, 190.0, 121.0, 85.0, 53.0, 47.0, 34.0, 25.0, 7.0, 13.0, 10.0, 5.0, 4.0, 2.0, 3.0, 1.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.525390625, -0.5054855346679688, -0.4855804443359375, -0.46567535400390625, -0.445770263671875, -0.42586517333984375, -0.4059600830078125, -0.38605499267578125, -0.36614990234375, -0.34624481201171875, -0.3263397216796875, -0.30643463134765625, -0.286529541015625, -0.26662445068359375, -0.2467193603515625, -0.22681427001953125, -0.2069091796875, -0.18700408935546875, -0.1670989990234375, -0.14719390869140625, -0.127288818359375, -0.10738372802734375, -0.0874786376953125, -0.06757354736328125, -0.04766845703125, -0.02776336669921875, -0.0078582763671875, 0.01204681396484375, 0.031951904296875, 0.05185699462890625, 0.0717620849609375, 0.09166717529296875, 0.111572265625, 0.13147735595703125, 0.1513824462890625, 0.17128753662109375, 0.191192626953125, 0.21109771728515625, 0.2310028076171875, 0.25090789794921875, 0.27081298828125, 0.29071807861328125, 0.3106231689453125, 0.33052825927734375, 0.350433349609375, 0.37033843994140625, 0.3902435302734375, 0.41014862060546875, 0.4300537109375, 0.44995880126953125, 0.4698638916015625, 0.48976898193359375, 0.509674072265625, 0.5295791625976562, 0.5494842529296875, 0.5693893432617188, 0.58929443359375, 0.6091995239257812, 0.6291046142578125, 0.6490097045898438, 0.668914794921875, 0.6888198852539062, 0.7087249755859375, 0.7286300659179688, 0.74853515625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 7.0, 14.0, 18.0, 48.0, 73.0, 161.0, 188.0, 205.0, 141.0, 59.0, 31.0, 15.0, 7.0, 7.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-8.089385032653809, -7.897246837615967, -7.705108642578125, -7.512970447540283, -7.320832252502441, -7.128694534301758, -6.936555862426758, -6.744418144226074, -6.552279949188232, -6.360141754150391, -6.168003559112549, -5.975865364074707, -5.783727169036865, -5.591588973999023, -5.39945125579834, -5.207313060760498, -5.015174865722656, -4.8230366706848145, -4.630898475646973, -4.438760280609131, -4.246622085571289, -4.0544843673706055, -3.8623459339141846, -3.670207977294922, -3.478069305419922, -3.28593111038208, -3.0937929153442383, -2.9016547203063965, -2.709516763687134, -2.517378568649292, -2.32524037361145, -2.1331024169921875, -1.9409642219543457, -1.748826026916504, -1.5566879510879517, -1.3645497560501099, -1.1724116802215576, -0.9802734851837158, -0.788135290145874, -0.5959972143173218, -0.40385901927948, -0.21172086894512177, -0.01958271861076355, 0.17255544662475586, 0.3646935820579529, 0.5568317174911499, 0.7489699125289917, 0.941107988357544, 1.1332461833953857, 1.3253843784332275, 1.5175224542617798, 1.7096606492996216, 1.9017987251281738, 2.0939369201660156, 2.2860751152038574, 2.478213310241699, 2.670351505279541, 2.862489700317383, 3.0546278953552246, 3.2467660903930664, 3.438904047012329, 3.631042242050171, 3.8231804370880127, 4.015318393707275, 4.207456588745117]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 5.0, 2.0, 6.0, 5.0, 12.0, 7.0, 16.0, 9.0, 20.0, 22.0, 28.0, 36.0, 37.0, 48.0, 47.0, 38.0, 60.0, 53.0, 71.0, 53.0, 56.0, 45.0, 58.0, 45.0, 44.0, 35.0, 32.0, 27.0, 11.0, 15.0, 14.0, 9.0, 8.0, 12.0, 3.0, 5.0, 6.0, 3.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.811023712158203, -2.7054712772369385, -2.5999186038970947, -2.49436616897583, -2.3888137340545654, -2.283261299133301, -2.177708625793457, -2.0721561908721924, -1.9666036367416382, -1.861051082611084, -1.7554986476898193, -1.6499460935592651, -1.544393539428711, -1.4388411045074463, -1.333288550376892, -1.227735996246338, -1.1221835613250732, -1.016631007194519, -0.9110785722732544, -0.8055260181427002, -0.6999735236167908, -0.5944210290908813, -0.48886847496032715, -0.3833159804344177, -0.2777634859085083, -0.17221097648143768, -0.06665846705436707, 0.038894057273864746, 0.14444655179977417, 0.2499990463256836, 0.3555516004562378, 0.4611040949821472, 0.5666563510894775, 0.672208845615387, 0.7777613401412964, 0.8833138942718506, 0.98886638879776, 1.0944188833236694, 1.1999714374542236, 1.3055238723754883, 1.4110764265060425, 1.5166289806365967, 1.6221814155578613, 1.7277339696884155, 1.8332865238189697, 1.9388389587402344, 2.044391632080078, 2.1499440670013428, 2.2554965019226074, 2.361048936843872, 2.466601610183716, 2.5721540451049805, 2.677706480026245, 2.7832589149475098, 2.8888115882873535, 2.994364023208618, 3.099916458129883, 3.2054688930511475, 3.311021566390991, 3.416574001312256, 3.5221264362335205, 3.627678871154785, 3.733231544494629, 3.8387839794158936, 3.9443366527557373]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 3.0, 7.0, 13.0, 16.0, 22.0, 21.0, 46.0, 67.0, 98.0, 156.0, 240.0, 330.0, 533.0, 809.0, 1398.0, 2214.0, 3913.0, 7064.0, 13934.0, 28905.0, 67016.0, 175969.0, 376958.0, 217251.0, 81846.0, 34557.0, 16136.0, 8149.0, 4374.0, 2401.0, 1501.0, 872.0, 562.0, 358.0, 266.0, 175.0, 119.0, 78.0, 63.0, 28.0, 32.0, 27.0, 9.0, 5.0, 5.0, 5.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.329833984375, -0.3190574645996094, -0.30828094482421875, -0.2975044250488281, -0.2867279052734375, -0.2759513854980469, -0.26517486572265625, -0.2543983459472656, -0.243621826171875, -0.23284530639648438, -0.22206878662109375, -0.21129226684570312, -0.2005157470703125, -0.18973922729492188, -0.17896270751953125, -0.16818618774414062, -0.15740966796875, -0.14663314819335938, -0.13585662841796875, -0.12508010864257812, -0.1143035888671875, -0.10352706909179688, -0.09275054931640625, -0.08197402954101562, -0.071197509765625, -0.060420989990234375, -0.04964447021484375, -0.038867950439453125, -0.0280914306640625, -0.017314910888671875, -0.00653839111328125, 0.004238128662109375, 0.0150146484375, 0.025791168212890625, 0.03656768798828125, 0.047344207763671875, 0.0581207275390625, 0.06889724731445312, 0.07967376708984375, 0.09045028686523438, 0.101226806640625, 0.11200332641601562, 0.12277984619140625, 0.13355636596679688, 0.1443328857421875, 0.15510940551757812, 0.16588592529296875, 0.17666244506835938, 0.18743896484375, 0.19821548461914062, 0.20899200439453125, 0.21976852416992188, 0.2305450439453125, 0.24132156372070312, 0.25209808349609375, 0.2628746032714844, 0.273651123046875, 0.2844276428222656, 0.29520416259765625, 0.3059806823730469, 0.3167572021484375, 0.3275337219238281, 0.33831024169921875, 0.3490867614746094, 0.35986328125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 8.0, 4.0, 6.0, 6.0, 4.0, 4.0, 13.0, 10.0, 20.0, 23.0, 19.0, 26.0, 20.0, 28.0, 28.0, 34.0, 28.0, 41.0, 34.0, 40.0, 38.0, 40.0, 37.0, 36.0, 39.0, 40.0, 40.0, 41.0, 41.0, 37.0, 26.0, 28.0, 22.0, 29.0, 19.0, 12.0, 14.0, 9.0, 14.0, 8.0, 4.0, 6.0, 5.0, 7.0, 3.0, 5.0, 1.0, 4.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1807861328125, -0.17522621154785156, -0.16966629028320312, -0.1641063690185547, -0.15854644775390625, -0.1529865264892578, -0.14742660522460938, -0.14186668395996094, -0.1363067626953125, -0.13074684143066406, -0.12518692016601562, -0.11962699890136719, -0.11406707763671875, -0.10850715637207031, -0.10294723510742188, -0.09738731384277344, -0.091827392578125, -0.08626747131347656, -0.08070755004882812, -0.07514762878417969, -0.06958770751953125, -0.06402778625488281, -0.058467864990234375, -0.05290794372558594, -0.0473480224609375, -0.04178810119628906, -0.036228179931640625, -0.030668258666992188, -0.02510833740234375, -0.019548416137695312, -0.013988494873046875, -0.008428573608398438, -0.00286865234375, 0.0026912689208984375, 0.008251190185546875, 0.013811111450195312, 0.01937103271484375, 0.024930953979492188, 0.030490875244140625, 0.03605079650878906, 0.0416107177734375, 0.04717063903808594, 0.052730560302734375, 0.05829048156738281, 0.06385040283203125, 0.06941032409667969, 0.07497024536132812, 0.08053016662597656, 0.086090087890625, 0.09165000915527344, 0.09720993041992188, 0.10276985168457031, 0.10832977294921875, 0.11388969421386719, 0.11944961547851562, 0.12500953674316406, 0.1305694580078125, 0.13612937927246094, 0.14168930053710938, 0.1472492218017578, 0.15280914306640625, 0.1583690643310547, 0.16392898559570312, 0.16948890686035156, 0.175048828125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 0.0, 4.0, 5.0, 5.0, 2.0, 5.0, 9.0, 17.0, 22.0, 40.0, 48.0, 45.0, 70.0, 116.0, 202.0, 313.0, 528.0, 1003.0, 2219.0, 6539.0, 33606.0, 633257.0, 334903.0, 25942.0, 5377.0, 1930.0, 969.0, 519.0, 282.0, 190.0, 134.0, 72.0, 52.0, 36.0, 26.0, 19.0, 17.0, 13.0, 7.0, 8.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.84765625, -0.814971923828125, -0.78228759765625, -0.749603271484375, -0.7169189453125, -0.684234619140625, -0.65155029296875, -0.618865966796875, -0.586181640625, -0.553497314453125, -0.52081298828125, -0.488128662109375, -0.4554443359375, -0.422760009765625, -0.39007568359375, -0.357391357421875, -0.32470703125, -0.292022705078125, -0.25933837890625, -0.226654052734375, -0.1939697265625, -0.161285400390625, -0.12860107421875, -0.095916748046875, -0.063232421875, -0.030548095703125, 0.00213623046875, 0.034820556640625, 0.0675048828125, 0.100189208984375, 0.13287353515625, 0.165557861328125, 0.1982421875, 0.230926513671875, 0.26361083984375, 0.296295166015625, 0.3289794921875, 0.361663818359375, 0.39434814453125, 0.427032470703125, 0.459716796875, 0.492401123046875, 0.52508544921875, 0.557769775390625, 0.5904541015625, 0.623138427734375, 0.65582275390625, 0.688507080078125, 0.72119140625, 0.753875732421875, 0.78656005859375, 0.819244384765625, 0.8519287109375, 0.884613037109375, 0.91729736328125, 0.949981689453125, 0.982666015625, 1.015350341796875, 1.04803466796875, 1.080718994140625, 1.1134033203125, 1.146087646484375, 1.17877197265625, 1.211456298828125, 1.244140625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 7.0, 1.0, 6.0, 7.0, 2.0, 12.0, 15.0, 24.0, 25.0, 27.0, 29.0, 39.0, 47.0, 58.0, 56.0, 69.0, 71.0, 79.0, 62.0, 54.0, 47.0, 60.0, 42.0, 43.0, 37.0, 24.0, 10.0, 15.0, 16.0, 6.0, 9.0, 4.0, 8.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1806640625, -1.14300537109375, -1.1053466796875, -1.06768798828125, -1.030029296875, -0.99237060546875, -0.9547119140625, -0.91705322265625, -0.87939453125, -0.84173583984375, -0.8040771484375, -0.76641845703125, -0.728759765625, -0.69110107421875, -0.6534423828125, -0.61578369140625, -0.578125, -0.54046630859375, -0.5028076171875, -0.46514892578125, -0.427490234375, -0.38983154296875, -0.3521728515625, -0.31451416015625, -0.27685546875, -0.23919677734375, -0.2015380859375, -0.16387939453125, -0.126220703125, -0.08856201171875, -0.0509033203125, -0.01324462890625, 0.0244140625, 0.06207275390625, 0.0997314453125, 0.13739013671875, 0.175048828125, 0.21270751953125, 0.2503662109375, 0.28802490234375, 0.32568359375, 0.36334228515625, 0.4010009765625, 0.43865966796875, 0.476318359375, 0.51397705078125, 0.5516357421875, 0.58929443359375, 0.626953125, 0.66461181640625, 0.7022705078125, 0.73992919921875, 0.777587890625, 0.81524658203125, 0.8529052734375, 0.89056396484375, 0.92822265625, 0.96588134765625, 1.0035400390625, 1.04119873046875, 1.078857421875, 1.11651611328125, 1.1541748046875, 1.19183349609375, 1.2294921875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 6.0, 8.0, 6.0, 9.0, 24.0, 28.0, 26.0, 52.0, 85.0, 149.0, 256.0, 432.0, 679.0, 1390.0, 3154.0, 8714.0, 30127.0, 147238.0, 674794.0, 138682.0, 28288.0, 8222.0, 3127.0, 1391.0, 650.0, 414.0, 190.0, 132.0, 81.0, 48.0, 47.0, 29.0, 24.0, 17.0, 5.0, 6.0, 6.0, 4.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.261962890625, -0.2541389465332031, -0.24631500244140625, -0.23849105834960938, -0.2306671142578125, -0.22284317016601562, -0.21501922607421875, -0.20719528198242188, -0.199371337890625, -0.19154739379882812, -0.18372344970703125, -0.17589950561523438, -0.1680755615234375, -0.16025161743164062, -0.15242767333984375, -0.14460372924804688, -0.13677978515625, -0.12895584106445312, -0.12113189697265625, -0.11330795288085938, -0.1054840087890625, -0.09766006469726562, -0.08983612060546875, -0.08201217651367188, -0.074188232421875, -0.06636428833007812, -0.05854034423828125, -0.050716400146484375, -0.0428924560546875, -0.035068511962890625, -0.02724456787109375, -0.019420623779296875, -0.0115966796875, -0.003772735595703125, 0.00405120849609375, 0.011875152587890625, 0.0196990966796875, 0.027523040771484375, 0.03534698486328125, 0.043170928955078125, 0.050994873046875, 0.058818817138671875, 0.06664276123046875, 0.07446670532226562, 0.0822906494140625, 0.09011459350585938, 0.09793853759765625, 0.10576248168945312, 0.11358642578125, 0.12141036987304688, 0.12923431396484375, 0.13705825805664062, 0.1448822021484375, 0.15270614624023438, 0.16053009033203125, 0.16835403442382812, 0.176177978515625, 0.18400192260742188, 0.19182586669921875, 0.19964981079101562, 0.2074737548828125, 0.21529769897460938, 0.22312164306640625, 0.23094558715820312, 0.23876953125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 0.0, 4.0, 5.0, 9.0, 9.0, 13.0, 13.0, 18.0, 18.0, 29.0, 38.0, 46.0, 74.0, 98.0, 121.0, 116.0, 108.0, 74.0, 51.0, 39.0, 35.0, 21.0, 18.0, 12.0, 11.0, 9.0, 3.0, 4.0, 5.0, 0.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.0001061558723449707, -0.00010344944894313812, -0.00010074302554130554, -9.803660213947296e-05, -9.533017873764038e-05, -9.26237553358078e-05, -8.991733193397522e-05, -8.721090853214264e-05, -8.450448513031006e-05, -8.179806172847748e-05, -7.90916383266449e-05, -7.638521492481232e-05, -7.367879152297974e-05, -7.097236812114716e-05, -6.826594471931458e-05, -6.5559521317482e-05, -6.285309791564941e-05, -6.0146674513816833e-05, -5.744025111198425e-05, -5.473382771015167e-05, -5.202740430831909e-05, -4.932098090648651e-05, -4.661455750465393e-05, -4.390813410282135e-05, -4.120171070098877e-05, -3.849528729915619e-05, -3.578886389732361e-05, -3.308244049549103e-05, -3.0376017093658447e-05, -2.7669593691825867e-05, -2.4963170289993286e-05, -2.2256746888160706e-05, -1.9550323486328125e-05, -1.6843900084495544e-05, -1.4137476682662964e-05, -1.1431053280830383e-05, -8.724629878997803e-06, -6.018206477165222e-06, -3.3117830753326416e-06, -6.05359673500061e-07, 2.1010637283325195e-06, 4.8074871301651e-06, 7.513910531997681e-06, 1.0220333933830261e-05, 1.2926757335662842e-05, 1.5633180737495422e-05, 1.8339604139328003e-05, 2.1046027541160583e-05, 2.3752450942993164e-05, 2.6458874344825745e-05, 2.9165297746658325e-05, 3.1871721148490906e-05, 3.4578144550323486e-05, 3.728456795215607e-05, 3.999099135398865e-05, 4.269741475582123e-05, 4.540383815765381e-05, 4.811026155948639e-05, 5.081668496131897e-05, 5.352310836315155e-05, 5.622953176498413e-05, 5.893595516681671e-05, 6.164237856864929e-05, 6.434880197048187e-05, 6.705522537231445e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 4.0, 5.0, 0.0, 4.0, 5.0, 5.0, 4.0, 15.0, 13.0, 20.0, 35.0, 33.0, 44.0, 71.0, 134.0, 204.0, 330.0, 515.0, 974.0, 1879.0, 4443.0, 13318.0, 58731.0, 506193.0, 384495.0, 55569.0, 12782.0, 4418.0, 1902.0, 949.0, 558.0, 289.0, 215.0, 146.0, 65.0, 46.0, 46.0, 32.0, 19.0, 15.0, 8.0, 11.0, 4.0, 3.0, 4.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.2410888671875, -0.2337799072265625, -0.226470947265625, -0.2191619873046875, -0.21185302734375, -0.2045440673828125, -0.197235107421875, -0.1899261474609375, -0.1826171875, -0.1753082275390625, -0.167999267578125, -0.1606903076171875, -0.15338134765625, -0.1460723876953125, -0.138763427734375, -0.1314544677734375, -0.1241455078125, -0.1168365478515625, -0.109527587890625, -0.1022186279296875, -0.09490966796875, -0.0876007080078125, -0.080291748046875, -0.0729827880859375, -0.065673828125, -0.0583648681640625, -0.051055908203125, -0.0437469482421875, -0.03643798828125, -0.0291290283203125, -0.021820068359375, -0.0145111083984375, -0.0072021484375, 0.0001068115234375, 0.007415771484375, 0.0147247314453125, 0.02203369140625, 0.0293426513671875, 0.036651611328125, 0.0439605712890625, 0.05126953125, 0.0585784912109375, 0.065887451171875, 0.0731964111328125, 0.08050537109375, 0.0878143310546875, 0.095123291015625, 0.1024322509765625, 0.1097412109375, 0.1170501708984375, 0.124359130859375, 0.1316680908203125, 0.13897705078125, 0.1462860107421875, 0.153594970703125, 0.1609039306640625, 0.168212890625, 0.1755218505859375, 0.182830810546875, 0.1901397705078125, 0.19744873046875, 0.2047576904296875, 0.212066650390625, 0.2193756103515625, 0.2266845703125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 5.0, 6.0, 4.0, 12.0, 16.0, 13.0, 20.0, 34.0, 41.0, 56.0, 75.0, 101.0, 108.0, 91.0, 109.0, 93.0, 58.0, 44.0, 29.0, 25.0, 20.0, 7.0, 8.0, 7.0, 10.0, 9.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.219970703125, -0.21078109741210938, -0.20159149169921875, -0.19240188598632812, -0.1832122802734375, -0.17402267456054688, -0.16483306884765625, -0.15564346313476562, -0.146453857421875, -0.13726425170898438, -0.12807464599609375, -0.11888504028320312, -0.1096954345703125, -0.10050582885742188, -0.09131622314453125, -0.08212661743164062, -0.07293701171875, -0.06374740600585938, -0.05455780029296875, -0.045368194580078125, -0.0361785888671875, -0.026988983154296875, -0.01779937744140625, -0.008609771728515625, 0.000579833984375, 0.009769439697265625, 0.01895904541015625, 0.028148651123046875, 0.0373382568359375, 0.046527862548828125, 0.05571746826171875, 0.06490707397460938, 0.0740966796875, 0.08328628540039062, 0.09247589111328125, 0.10166549682617188, 0.1108551025390625, 0.12004470825195312, 0.12923431396484375, 0.13842391967773438, 0.147613525390625, 0.15680313110351562, 0.16599273681640625, 0.17518234252929688, 0.1843719482421875, 0.19356155395507812, 0.20275115966796875, 0.21194076538085938, 0.22113037109375, 0.23031997680664062, 0.23950958251953125, 0.24869918823242188, 0.2578887939453125, 0.2670783996582031, 0.27626800537109375, 0.2854576110839844, 0.294647216796875, 0.3038368225097656, 0.31302642822265625, 0.3222160339355469, 0.3314056396484375, 0.3405952453613281, 0.34978485107421875, 0.3589744567871094, 0.3681640625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 7.0, 2.0, 1.0, 3.0, 1.0, 2.0, 5.0, 9.0, 16.0, 31.0, 46.0, 80.0, 104.0, 175.0, 184.0, 126.0, 82.0, 49.0, 29.0, 22.0, 8.0, 5.0, 2.0, 6.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-5.8701324462890625, -5.723775386810303, -5.577418327331543, -5.431060791015625, -5.284703731536865, -5.1383466720581055, -4.9919891357421875, -4.845632076263428, -4.699275016784668, -4.552917957305908, -4.406560897827148, -4.2602033615112305, -4.113846302032471, -3.967489242553711, -3.821131944656372, -3.674774646759033, -3.5284175872802734, -3.3820605278015137, -3.235703229904175, -3.089345932006836, -2.942988872528076, -2.7966318130493164, -2.6502745151519775, -2.5039172172546387, -2.357560157775879, -2.211203098297119, -2.0648458003997803, -1.918488621711731, -1.7721314430236816, -1.6257742643356323, -1.479417085647583, -1.3330599069595337, -1.1867024898529053, -1.040345311164856, -0.8939881324768066, -0.7476309537887573, -0.601273775100708, -0.4549165964126587, -0.3085594177246094, -0.16220223903656006, -0.015845060348510742, 0.13051211833953857, 0.2768692970275879, 0.4232264757156372, 0.5695836544036865, 0.7159408330917358, 0.8622980117797852, 1.0086551904678345, 1.1550123691558838, 1.301369547843933, 1.4477267265319824, 1.5940839052200317, 1.740441083908081, 1.8867982625961304, 2.0331554412841797, 2.1795125007629395, 2.3258697986602783, 2.472227096557617, 2.618584156036377, 2.7649412155151367, 2.9112985134124756, 3.0576558113098145, 3.204012870788574, 3.350369930267334, 3.496727228164673]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 5.0, 4.0, 9.0, 7.0, 10.0, 11.0, 14.0, 19.0, 11.0, 20.0, 23.0, 23.0, 22.0, 30.0, 38.0, 30.0, 38.0, 32.0, 63.0, 72.0, 84.0, 80.0, 48.0, 48.0, 36.0, 23.0, 26.0, 22.0, 28.0, 20.0, 7.0, 22.0, 11.0, 16.0, 21.0, 6.0, 10.0, 8.0, 2.0, 7.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.274181365966797, -4.14931058883667, -4.024440288543701, -3.899569511413574, -3.7746989727020264, -3.6498284339904785, -3.5249578952789307, -3.400087356567383, -3.275216579437256, -3.150346040725708, -3.02547550201416, -2.900604724884033, -2.7757341861724854, -2.6508636474609375, -2.5259931087493896, -2.401122570037842, -2.276252031326294, -2.151381492614746, -2.0265109539031982, -1.9016402959823608, -1.7767696380615234, -1.6518990993499756, -1.5270285606384277, -1.4021580219268799, -1.2772873640060425, -1.1524168252944946, -1.0275461673736572, -0.9026756286621094, -0.7778050303459167, -0.6529344320297241, -0.5280638933181763, -0.40319329500198364, -0.278322696685791, -0.15345211327075958, -0.02858152985572815, 0.09628903865814209, 0.22115963697433472, 0.34603023529052734, 0.4709007740020752, 0.5957713723182678, 0.7206419706344604, 0.8455125689506531, 0.9703831672668457, 1.0952537059783936, 1.2201242446899414, 1.3449949026107788, 1.4698654413223267, 1.594736099243164, 1.719606637954712, 1.8444771766662598, 1.9693478345870972, 2.0942182540893555, 2.2190890312194824, 2.3439595699310303, 2.468830108642578, 2.593700647354126, 2.718571186065674, 2.8434417247772217, 2.9683122634887695, 3.0931830406188965, 3.2180535793304443, 3.342924118041992, 3.46779465675354, 3.592665195465088, 3.717535972595215]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 5.0, 9.0, 15.0, 19.0, 30.0, 49.0, 61.0, 96.0, 163.0, 250.0, 422.0, 701.0, 1246.0, 2461.0, 5230.0, 12887.0, 38719.0, 181671.0, 1643660.0, 2003345.0, 232041.0, 44923.0, 14368.0, 5787.0, 2743.0, 1391.0, 743.0, 420.0, 276.0, 170.0, 122.0, 78.0, 50.0, 38.0, 20.0, 18.0, 14.0, 9.0, 13.0, 7.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2666015625, -0.2574272155761719, -0.24825286865234375, -0.23907852172851562, -0.2299041748046875, -0.22072982788085938, -0.21155548095703125, -0.20238113403320312, -0.193206787109375, -0.18403244018554688, -0.17485809326171875, -0.16568374633789062, -0.1565093994140625, -0.14733505249023438, -0.13816070556640625, -0.12898635864257812, -0.11981201171875, -0.11063766479492188, -0.10146331787109375, -0.09228897094726562, -0.0831146240234375, -0.07394027709960938, -0.06476593017578125, -0.055591583251953125, -0.046417236328125, -0.037242889404296875, -0.02806854248046875, -0.018894195556640625, -0.0097198486328125, -0.000545501708984375, 0.00862884521484375, 0.017803192138671875, 0.0269775390625, 0.036151885986328125, 0.04532623291015625, 0.054500579833984375, 0.0636749267578125, 0.07284927368164062, 0.08202362060546875, 0.09119796752929688, 0.100372314453125, 0.10954666137695312, 0.11872100830078125, 0.12789535522460938, 0.1370697021484375, 0.14624404907226562, 0.15541839599609375, 0.16459274291992188, 0.17376708984375, 0.18294143676757812, 0.19211578369140625, 0.20129013061523438, 0.2104644775390625, 0.21963882446289062, 0.22881317138671875, 0.23798751831054688, 0.247161865234375, 0.2563362121582031, 0.26551055908203125, 0.2746849060058594, 0.2838592529296875, 0.2930335998535156, 0.30220794677734375, 0.3113822937011719, 0.320556640625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 3.0, 5.0, 6.0, 5.0, 6.0, 14.0, 12.0, 11.0, 12.0, 10.0, 10.0, 25.0, 26.0, 36.0, 41.0, 40.0, 29.0, 33.0, 39.0, 38.0, 48.0, 29.0, 58.0, 46.0, 45.0, 43.0, 36.0, 34.0, 39.0, 35.0, 39.0, 22.0, 19.0, 23.0, 13.0, 21.0, 11.0, 10.0, 11.0, 6.0, 7.0, 3.0, 2.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1861572265625, -0.18033218383789062, -0.17450714111328125, -0.16868209838867188, -0.1628570556640625, -0.15703201293945312, -0.15120697021484375, -0.14538192749023438, -0.139556884765625, -0.13373184204101562, -0.12790679931640625, -0.12208175659179688, -0.1162567138671875, -0.11043167114257812, -0.10460662841796875, -0.09878158569335938, -0.09295654296875, -0.08713150024414062, -0.08130645751953125, -0.07548141479492188, -0.0696563720703125, -0.06383132934570312, -0.05800628662109375, -0.052181243896484375, -0.046356201171875, -0.040531158447265625, -0.03470611572265625, -0.028881072998046875, -0.0230560302734375, -0.017230987548828125, -0.01140594482421875, -0.005580902099609375, 0.000244140625, 0.006069183349609375, 0.01189422607421875, 0.017719268798828125, 0.0235443115234375, 0.029369354248046875, 0.03519439697265625, 0.041019439697265625, 0.046844482421875, 0.052669525146484375, 0.05849456787109375, 0.06431961059570312, 0.0701446533203125, 0.07596969604492188, 0.08179473876953125, 0.08761978149414062, 0.09344482421875, 0.09926986694335938, 0.10509490966796875, 0.11091995239257812, 0.1167449951171875, 0.12257003784179688, 0.12839508056640625, 0.13422012329101562, 0.140045166015625, 0.14587020874023438, 0.15169525146484375, 0.15752029418945312, 0.1633453369140625, 0.16917037963867188, 0.17499542236328125, 0.18082046508789062, 0.1866455078125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 6.0, 9.0, 5.0, 15.0, 33.0, 59.0, 198.0, 649.0, 4825.0, 154960.0, 3994572.0, 36118.0, 2225.0, 407.0, 113.0, 48.0, 23.0, 12.0, 6.0, 6.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.95703125, -0.9121551513671875, -0.867279052734375, -0.8224029541015625, -0.77752685546875, -0.7326507568359375, -0.687774658203125, -0.6428985595703125, -0.5980224609375, -0.5531463623046875, -0.508270263671875, -0.4633941650390625, -0.41851806640625, -0.3736419677734375, -0.328765869140625, -0.2838897705078125, -0.239013671875, -0.1941375732421875, -0.149261474609375, -0.1043853759765625, -0.05950927734375, -0.0146331787109375, 0.030242919921875, 0.0751190185546875, 0.1199951171875, 0.1648712158203125, 0.209747314453125, 0.2546234130859375, 0.29949951171875, 0.3443756103515625, 0.389251708984375, 0.4341278076171875, 0.47900390625, 0.5238800048828125, 0.568756103515625, 0.6136322021484375, 0.65850830078125, 0.7033843994140625, 0.748260498046875, 0.7931365966796875, 0.8380126953125, 0.8828887939453125, 0.927764892578125, 0.9726409912109375, 1.01751708984375, 1.0623931884765625, 1.107269287109375, 1.1521453857421875, 1.197021484375, 1.2418975830078125, 1.286773681640625, 1.3316497802734375, 1.37652587890625, 1.4214019775390625, 1.466278076171875, 1.5111541748046875, 1.5560302734375, 1.6009063720703125, 1.645782470703125, 1.6906585693359375, 1.73553466796875, 1.7804107666015625, 1.825286865234375, 1.8701629638671875, 1.9150390625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 5.0, 5.0, 5.0, 13.0, 18.0, 17.0, 33.0, 43.0, 70.0, 120.0, 194.0, 450.0, 785.0, 1005.0, 591.0, 279.0, 154.0, 94.0, 61.0, 36.0, 29.0, 26.0, 12.0, 3.0, 8.0, 4.0, 6.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7568359375, -0.7365188598632812, -0.7162017822265625, -0.6958847045898438, -0.675567626953125, -0.6552505493164062, -0.6349334716796875, -0.6146163940429688, -0.59429931640625, -0.5739822387695312, -0.5536651611328125, -0.5333480834960938, -0.513031005859375, -0.49271392822265625, -0.4723968505859375, -0.45207977294921875, -0.4317626953125, -0.41144561767578125, -0.3911285400390625, -0.37081146240234375, -0.350494384765625, -0.33017730712890625, -0.3098602294921875, -0.28954315185546875, -0.26922607421875, -0.24890899658203125, -0.2285919189453125, -0.20827484130859375, -0.187957763671875, -0.16764068603515625, -0.1473236083984375, -0.12700653076171875, -0.106689453125, -0.08637237548828125, -0.0660552978515625, -0.04573822021484375, -0.025421142578125, -0.00510406494140625, 0.0152130126953125, 0.03553009033203125, 0.05584716796875, 0.07616424560546875, 0.0964813232421875, 0.11679840087890625, 0.137115478515625, 0.15743255615234375, 0.1777496337890625, 0.19806671142578125, 0.2183837890625, 0.23870086669921875, 0.2590179443359375, 0.27933502197265625, 0.299652099609375, 0.31996917724609375, 0.3402862548828125, 0.36060333251953125, 0.38092041015625, 0.40123748779296875, 0.4215545654296875, 0.44187164306640625, 0.462188720703125, 0.48250579833984375, 0.5028228759765625, 0.5231399536132812, 0.54345703125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 6.0, 11.0, 44.0, 120.0, 192.0, 230.0, 189.0, 102.0, 47.0, 15.0, 10.0, 9.0, 3.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.550397872924805, -6.359920978546143, -6.169444561004639, -5.978967666625977, -5.788491249084473, -5.5980143547058105, -5.407537937164307, -5.2170610427856445, -5.026584625244141, -4.8361077308654785, -4.645631313323975, -4.4551544189453125, -4.264678001403809, -4.0742011070251465, -3.8837246894836426, -3.6932477951049805, -3.5027711391448975, -3.3122944831848145, -3.1218178272247314, -2.9313411712646484, -2.7408645153045654, -2.5503878593444824, -2.3599109649658203, -2.1694345474243164, -1.9789577722549438, -1.7884811162948608, -1.5980044603347778, -1.4075276851654053, -1.2170510292053223, -1.0265743732452393, -0.8360977172851562, -0.6456210613250732, -0.45514440536499023, -0.2646677494049072, -0.07419106364250183, 0.11628562211990356, 0.3067622780799866, 0.4972389340400696, 0.6877156496047974, 0.8781923055648804, 1.0686689615249634, 1.2591456174850464, 1.4496222734451294, 1.640099048614502, 1.830575704574585, 2.021052360534668, 2.211529016494751, 2.402005672454834, 2.592482328414917, 2.782958984375, 2.973435640335083, 3.163912296295166, 3.354388952255249, 3.544865608215332, 3.735342502593994, 3.925818920135498, 4.11629581451416, 4.306772708892822, 4.497249126434326, 4.687726020812988, 4.878202438354492, 5.068679332733154, 5.259155750274658, 5.44963264465332, 5.640109062194824]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 8.0, 7.0, 8.0, 4.0, 10.0, 10.0, 11.0, 10.0, 12.0, 10.0, 15.0, 26.0, 23.0, 31.0, 35.0, 34.0, 41.0, 37.0, 30.0, 50.0, 59.0, 38.0, 52.0, 59.0, 32.0, 44.0, 31.0, 32.0, 32.0, 25.0, 35.0, 28.0, 19.0, 12.0, 9.0, 14.0, 16.0, 9.0, 14.0, 13.0, 9.0, 7.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8522539138793945, -1.790534496307373, -1.7288150787353516, -1.66709566116333, -1.6053762435913086, -1.543656826019287, -1.4819374084472656, -1.4202179908752441, -1.3584985733032227, -1.2967791557312012, -1.2350597381591797, -1.1733403205871582, -1.1116209030151367, -1.0499014854431152, -0.9881820678710938, -0.9264626502990723, -0.864743173122406, -0.8030237555503845, -0.741304337978363, -0.6795849204063416, -0.6178655028343201, -0.5561460256576538, -0.4944266378879547, -0.4327072203159332, -0.37098780274391174, -0.30926838517189026, -0.24754896759986877, -0.1858295351266861, -0.12411011755466461, -0.062390685081481934, -0.0006712675094604492, 0.061048150062561035, 0.12276756763458252, 0.184486985206604, 0.2462064027786255, 0.307925820350647, 0.36964523792266846, 0.43136468529701233, 0.4930841028690338, 0.5548034906387329, 0.6165229082107544, 0.6782423257827759, 0.7399617433547974, 0.8016811609268188, 0.8634005784988403, 0.9251199960708618, 0.9868394136428833, 1.0485588312149048, 1.1102783679962158, 1.1719977855682373, 1.2337172031402588, 1.2954366207122803, 1.3571560382843018, 1.4188754558563232, 1.4805948734283447, 1.5423142910003662, 1.6040337085723877, 1.6657531261444092, 1.7274725437164307, 1.7891919612884521, 1.8509113788604736, 1.9126307964324951, 1.9743502140045166, 2.036069631576538, 2.0977890491485596]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 6.0, 5.0, 3.0, 10.0, 16.0, 23.0, 37.0, 52.0, 76.0, 118.0, 206.0, 300.0, 503.0, 966.0, 1734.0, 3367.0, 6964.0, 15491.0, 41145.0, 121494.0, 328344.0, 331524.0, 123616.0, 42001.0, 15986.0, 7148.0, 3396.0, 1738.0, 940.0, 506.0, 322.0, 187.0, 112.0, 77.0, 56.0, 24.0, 22.0, 11.0, 11.0, 8.0, 5.0, 3.0, 4.0, 0.0, 5.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.306884765625, -0.29811859130859375, -0.2893524169921875, -0.28058624267578125, -0.271820068359375, -0.26305389404296875, -0.2542877197265625, -0.24552154541015625, -0.23675537109375, -0.22798919677734375, -0.2192230224609375, -0.21045684814453125, -0.201690673828125, -0.19292449951171875, -0.1841583251953125, -0.17539215087890625, -0.1666259765625, -0.15785980224609375, -0.1490936279296875, -0.14032745361328125, -0.131561279296875, -0.12279510498046875, -0.1140289306640625, -0.10526275634765625, -0.09649658203125, -0.08773040771484375, -0.0789642333984375, -0.07019805908203125, -0.061431884765625, -0.05266571044921875, -0.0438995361328125, -0.03513336181640625, -0.0263671875, -0.01760101318359375, -0.0088348388671875, -6.866455078125e-05, 0.008697509765625, 0.01746368408203125, 0.0262298583984375, 0.03499603271484375, 0.04376220703125, 0.05252838134765625, 0.0612945556640625, 0.07006072998046875, 0.078826904296875, 0.08759307861328125, 0.0963592529296875, 0.10512542724609375, 0.1138916015625, 0.12265777587890625, 0.1314239501953125, 0.14019012451171875, 0.148956298828125, 0.15772247314453125, 0.1664886474609375, 0.17525482177734375, 0.18402099609375, 0.19278717041015625, 0.2015533447265625, 0.21031951904296875, 0.219085693359375, 0.22785186767578125, 0.2366180419921875, 0.24538421630859375, 0.254150390625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 6.0, 8.0, 13.0, 5.0, 14.0, 20.0, 20.0, 24.0, 20.0, 26.0, 34.0, 34.0, 38.0, 34.0, 28.0, 45.0, 35.0, 39.0, 38.0, 43.0, 49.0, 43.0, 52.0, 34.0, 36.0, 32.0, 31.0, 29.0, 22.0, 23.0, 18.0, 17.0, 19.0, 12.0, 6.0, 13.0, 7.0, 6.0, 6.0, 4.0, 6.0, 5.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.20849609375, -0.2026805877685547, -0.19686508178710938, -0.19104957580566406, -0.18523406982421875, -0.17941856384277344, -0.17360305786132812, -0.1677875518798828, -0.1619720458984375, -0.1561565399169922, -0.15034103393554688, -0.14452552795410156, -0.13871002197265625, -0.13289451599121094, -0.12707901000976562, -0.12126350402832031, -0.115447998046875, -0.10963249206542969, -0.10381698608398438, -0.09800148010253906, -0.09218597412109375, -0.08637046813964844, -0.08055496215820312, -0.07473945617675781, -0.0689239501953125, -0.06310844421386719, -0.057292938232421875, -0.05147743225097656, -0.04566192626953125, -0.03984642028808594, -0.034030914306640625, -0.028215408325195312, -0.02239990234375, -0.016584396362304688, -0.010768890380859375, -0.0049533843994140625, 0.00086212158203125, 0.0066776275634765625, 0.012493133544921875, 0.018308639526367188, 0.0241241455078125, 0.029939651489257812, 0.035755157470703125, 0.04157066345214844, 0.04738616943359375, 0.05320167541503906, 0.059017181396484375, 0.06483268737792969, 0.070648193359375, 0.07646369934082031, 0.08227920532226562, 0.08809471130371094, 0.09391021728515625, 0.09972572326660156, 0.10554122924804688, 0.11135673522949219, 0.1171722412109375, 0.12298774719238281, 0.12880325317382812, 0.13461875915527344, 0.14043426513671875, 0.14624977111816406, 0.15206527709960938, 0.1578807830810547, 0.1636962890625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 5.0, 8.0, 9.0, 14.0, 20.0, 18.0, 27.0, 45.0, 65.0, 108.0, 188.0, 366.0, 892.0, 2355.0, 8555.0, 55067.0, 707147.0, 242614.0, 23429.0, 4809.0, 1477.0, 655.0, 261.0, 165.0, 80.0, 48.0, 33.0, 29.0, 22.0, 10.0, 11.0, 5.0, 4.0, 3.0, 2.0, 6.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57470703125, -0.555419921875, -0.5361328125, -0.516845703125, -0.49755859375, -0.478271484375, -0.458984375, -0.439697265625, -0.42041015625, -0.401123046875, -0.3818359375, -0.362548828125, -0.34326171875, -0.323974609375, -0.3046875, -0.285400390625, -0.26611328125, -0.246826171875, -0.2275390625, -0.208251953125, -0.18896484375, -0.169677734375, -0.150390625, -0.131103515625, -0.11181640625, -0.092529296875, -0.0732421875, -0.053955078125, -0.03466796875, -0.015380859375, 0.00390625, 0.023193359375, 0.04248046875, 0.061767578125, 0.0810546875, 0.100341796875, 0.11962890625, 0.138916015625, 0.158203125, 0.177490234375, 0.19677734375, 0.216064453125, 0.2353515625, 0.254638671875, 0.27392578125, 0.293212890625, 0.3125, 0.331787109375, 0.35107421875, 0.370361328125, 0.3896484375, 0.408935546875, 0.42822265625, 0.447509765625, 0.466796875, 0.486083984375, 0.50537109375, 0.524658203125, 0.5439453125, 0.563232421875, 0.58251953125, 0.601806640625, 0.62109375, 0.640380859375, 0.65966796875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 7.0, 3.0, 7.0, 13.0, 12.0, 18.0, 20.0, 24.0, 23.0, 34.0, 39.0, 50.0, 62.0, 78.0, 72.0, 72.0, 69.0, 83.0, 81.0, 58.0, 48.0, 35.0, 26.0, 14.0, 19.0, 15.0, 11.0, 9.0, 2.0, 6.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.26953125, -1.234832763671875, -1.20013427734375, -1.165435791015625, -1.1307373046875, -1.096038818359375, -1.06134033203125, -1.026641845703125, -0.991943359375, -0.957244873046875, -0.92254638671875, -0.887847900390625, -0.8531494140625, -0.818450927734375, -0.78375244140625, -0.749053955078125, -0.71435546875, -0.679656982421875, -0.64495849609375, -0.610260009765625, -0.5755615234375, -0.540863037109375, -0.50616455078125, -0.471466064453125, -0.436767578125, -0.402069091796875, -0.36737060546875, -0.332672119140625, -0.2979736328125, -0.263275146484375, -0.22857666015625, -0.193878173828125, -0.1591796875, -0.124481201171875, -0.08978271484375, -0.055084228515625, -0.0203857421875, 0.014312744140625, 0.04901123046875, 0.083709716796875, 0.118408203125, 0.153106689453125, 0.18780517578125, 0.222503662109375, 0.2572021484375, 0.291900634765625, 0.32659912109375, 0.361297607421875, 0.39599609375, 0.430694580078125, 0.46539306640625, 0.500091552734375, 0.5347900390625, 0.569488525390625, 0.60418701171875, 0.638885498046875, 0.673583984375, 0.708282470703125, 0.74298095703125, 0.777679443359375, 0.8123779296875, 0.847076416015625, 0.88177490234375, 0.916473388671875, 0.951171875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 4.0, 4.0, 4.0, 8.0, 8.0, 20.0, 16.0, 13.0, 32.0, 40.0, 106.0, 116.0, 194.0, 383.0, 922.0, 2554.0, 9414.0, 71371.0, 852835.0, 94550.0, 11164.0, 2796.0, 991.0, 441.0, 245.0, 108.0, 67.0, 48.0, 38.0, 18.0, 16.0, 9.0, 8.0, 3.0, 5.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.306884765625, -0.29613494873046875, -0.2853851318359375, -0.27463531494140625, -0.263885498046875, -0.25313568115234375, -0.2423858642578125, -0.23163604736328125, -0.22088623046875, -0.21013641357421875, -0.1993865966796875, -0.18863677978515625, -0.177886962890625, -0.16713714599609375, -0.1563873291015625, -0.14563751220703125, -0.1348876953125, -0.12413787841796875, -0.1133880615234375, -0.10263824462890625, -0.091888427734375, -0.08113861083984375, -0.0703887939453125, -0.05963897705078125, -0.04888916015625, -0.03813934326171875, -0.0273895263671875, -0.01663970947265625, -0.005889892578125, 0.00485992431640625, 0.0156097412109375, 0.02635955810546875, 0.037109375, 0.04785919189453125, 0.0586090087890625, 0.06935882568359375, 0.080108642578125, 0.09085845947265625, 0.1016082763671875, 0.11235809326171875, 0.12310791015625, 0.13385772705078125, 0.1446075439453125, 0.15535736083984375, 0.166107177734375, 0.17685699462890625, 0.1876068115234375, 0.19835662841796875, 0.2091064453125, 0.21985626220703125, 0.2306060791015625, 0.24135589599609375, 0.252105712890625, 0.26285552978515625, 0.2736053466796875, 0.28435516357421875, 0.29510498046875, 0.30585479736328125, 0.3166046142578125, 0.32735443115234375, 0.338104248046875, 0.34885406494140625, 0.3596038818359375, 0.37035369873046875, 0.381103515625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 4.0, 0.0, 5.0, 10.0, 9.0, 8.0, 26.0, 130.0, 362.0, 312.0, 89.0, 22.0, 6.0, 7.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002465248107910156, -0.00024002045392990112, -0.00023351609706878662, -0.00022701174020767212, -0.00022050738334655762, -0.00021400302648544312, -0.0002074986696243286, -0.0002009943127632141, -0.0001944899559020996, -0.0001879855990409851, -0.0001814812421798706, -0.0001749768853187561, -0.0001684725284576416, -0.0001619681715965271, -0.0001554638147354126, -0.0001489594578742981, -0.0001424551010131836, -0.0001359507441520691, -0.0001294463872909546, -0.0001229420304298401, -0.00011643767356872559, -0.00010993331670761108, -0.00010342895984649658, -9.692460298538208e-05, -9.042024612426758e-05, -8.391588926315308e-05, -7.741153240203857e-05, -7.090717554092407e-05, -6.440281867980957e-05, -5.789846181869507e-05, -5.1394104957580566e-05, -4.4889748096466064e-05, -3.838539123535156e-05, -3.188103437423706e-05, -2.537667751312256e-05, -1.8872320652008057e-05, -1.2367963790893555e-05, -5.863606929779053e-06, 6.407499313354492e-07, 7.145106792449951e-06, 1.3649463653564453e-05, 2.0153820514678955e-05, 2.6658177375793457e-05, 3.316253423690796e-05, 3.966689109802246e-05, 4.617124795913696e-05, 5.2675604820251465e-05, 5.917996168136597e-05, 6.568431854248047e-05, 7.218867540359497e-05, 7.869303226470947e-05, 8.519738912582397e-05, 9.170174598693848e-05, 9.820610284805298e-05, 0.00010471045970916748, 0.00011121481657028198, 0.00011771917343139648, 0.00012422353029251099, 0.0001307278871536255, 0.00013723224401474, 0.0001437366008758545, 0.000150240957736969, 0.0001567453145980835, 0.000163249671459198, 0.0001697540283203125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 1.0, 4.0, 7.0, 10.0, 21.0, 21.0, 49.0, 54.0, 91.0, 144.0, 277.0, 528.0, 1245.0, 3312.0, 12206.0, 95870.0, 819944.0, 96386.0, 12570.0, 3375.0, 1201.0, 574.0, 272.0, 149.0, 91.0, 53.0, 32.0, 23.0, 15.0, 10.0, 7.0, 1.0, 1.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.3056640625, -0.2956428527832031, -0.28562164306640625, -0.2756004333496094, -0.2655792236328125, -0.2555580139160156, -0.24553680419921875, -0.23551559448242188, -0.225494384765625, -0.21547317504882812, -0.20545196533203125, -0.19543075561523438, -0.1854095458984375, -0.17538833618164062, -0.16536712646484375, -0.15534591674804688, -0.14532470703125, -0.13530349731445312, -0.12528228759765625, -0.11526107788085938, -0.1052398681640625, -0.09521865844726562, -0.08519744873046875, -0.07517623901367188, -0.065155029296875, -0.055133819580078125, -0.04511260986328125, -0.035091400146484375, -0.0250701904296875, -0.015048980712890625, -0.00502777099609375, 0.004993438720703125, 0.0150146484375, 0.025035858154296875, 0.03505706787109375, 0.045078277587890625, 0.0550994873046875, 0.06512069702148438, 0.07514190673828125, 0.08516311645507812, 0.095184326171875, 0.10520553588867188, 0.11522674560546875, 0.12524795532226562, 0.1352691650390625, 0.14529037475585938, 0.15531158447265625, 0.16533279418945312, 0.17535400390625, 0.18537521362304688, 0.19539642333984375, 0.20541763305664062, 0.2154388427734375, 0.22546005249023438, 0.23548126220703125, 0.24550247192382812, 0.255523681640625, 0.2655448913574219, 0.27556610107421875, 0.2855873107910156, 0.2956085205078125, 0.3056297302246094, 0.31565093994140625, 0.3256721496582031, 0.335693359375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 1.0, 5.0, 2.0, 1.0, 5.0, 13.0, 10.0, 11.0, 19.0, 23.0, 44.0, 67.0, 106.0, 110.0, 127.0, 125.0, 97.0, 78.0, 44.0, 34.0, 23.0, 18.0, 7.0, 8.0, 8.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.252197265625, -0.24393463134765625, -0.2356719970703125, -0.22740936279296875, -0.219146728515625, -0.21088409423828125, -0.2026214599609375, -0.19435882568359375, -0.18609619140625, -0.17783355712890625, -0.1695709228515625, -0.16130828857421875, -0.153045654296875, -0.14478302001953125, -0.1365203857421875, -0.12825775146484375, -0.1199951171875, -0.11173248291015625, -0.1034698486328125, -0.09520721435546875, -0.086944580078125, -0.07868194580078125, -0.0704193115234375, -0.06215667724609375, -0.05389404296875, -0.04563140869140625, -0.0373687744140625, -0.02910614013671875, -0.020843505859375, -0.01258087158203125, -0.0043182373046875, 0.00394439697265625, 0.01220703125, 0.02046966552734375, 0.0287322998046875, 0.03699493408203125, 0.045257568359375, 0.05352020263671875, 0.0617828369140625, 0.07004547119140625, 0.07830810546875, 0.08657073974609375, 0.0948333740234375, 0.10309600830078125, 0.111358642578125, 0.11962127685546875, 0.1278839111328125, 0.13614654541015625, 0.1444091796875, 0.15267181396484375, 0.1609344482421875, 0.16919708251953125, 0.177459716796875, 0.18572235107421875, 0.1939849853515625, 0.20224761962890625, 0.21051025390625, 0.21877288818359375, 0.2270355224609375, 0.23529815673828125, 0.243560791015625, 0.25182342529296875, 0.2600860595703125, 0.26834869384765625, 0.276611328125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 11.0, 17.0, 101.0, 475.0, 303.0, 71.0, 22.0, 2.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0348992347717285, -3.6630659103393555, -3.2912325859069824, -2.9193992614746094, -2.5475659370422363, -2.1757326126098633, -1.8038995265960693, -1.4320662021636963, -1.0602328777313232, -0.6883995532989502, -0.3165662884712219, 0.05526697635650635, 0.4271003007888794, 0.7989336252212524, 1.170766830444336, 1.542600154876709, 1.914433479309082, 2.286266803741455, 2.658100128173828, 3.029933452606201, 3.401766777038574, 3.7736001014709473, 4.14543342590332, 4.517266273498535, 4.889100074768066, 5.2609333992004395, 5.6327667236328125, 6.0046000480651855, 6.376433372497559, 6.748266696929932, 7.120100021362305, 7.4919328689575195, 7.863766670227051, 8.235599517822266, 8.607433319091797, 8.979266166687012, 9.351099967956543, 9.722932815551758, 10.094766616821289, 10.466599464416504, 10.838433265686035, 11.21026611328125, 11.582099914550781, 11.953932762145996, 12.325766563415527, 12.697599411010742, 13.069433212280273, 13.441266059875488, 13.813098907470703, 14.184931755065918, 14.55676555633545, 14.928598403930664, 15.300432205200195, 15.67226505279541, 16.044097900390625, 16.415931701660156, 16.787765502929688, 17.15959930419922, 17.531431198120117, 17.90326499938965, 18.27509880065918, 18.64693260192871, 19.01876449584961, 19.39059829711914, 19.762432098388672]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 1.0, 2.0, 7.0, 6.0, 5.0, 12.0, 16.0, 16.0, 10.0, 11.0, 22.0, 21.0, 23.0, 25.0, 44.0, 34.0, 36.0, 49.0, 58.0, 79.0, 73.0, 66.0, 43.0, 42.0, 33.0, 37.0, 36.0, 23.0, 22.0, 24.0, 14.0, 21.0, 15.0, 11.0, 7.0, 14.0, 11.0, 5.0, 6.0, 3.0, 6.0, 4.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.664245843887329, -2.5767669677734375, -2.489287853240967, -2.401808977127075, -2.3143301010131836, -2.226851224899292, -2.1393723487854004, -2.0518932342529297, -1.964414358139038, -1.8769354820251465, -1.7894564867019653, -1.7019774913787842, -1.6144986152648926, -1.527019739151001, -1.4395407438278198, -1.3520617485046387, -1.264582872390747, -1.1771039962768555, -1.0896250009536743, -1.0021460056304932, -0.9146671295166016, -0.8271881937980652, -0.7397092580795288, -0.6522303223609924, -0.564751386642456, -0.4772724509239197, -0.3897935152053833, -0.3023145794868469, -0.21483564376831055, -0.12735670804977417, -0.03987777233123779, 0.047601163387298584, 0.13508033752441406, 0.22255927324295044, 0.3100382089614868, 0.3975171446800232, 0.48499608039855957, 0.572475016117096, 0.6599539518356323, 0.7474328875541687, 0.8349118232727051, 0.9223907589912415, 1.0098696947097778, 1.097348690032959, 1.1848275661468506, 1.2723064422607422, 1.3597854375839233, 1.4472644329071045, 1.534743309020996, 1.6222221851348877, 1.7097011804580688, 1.79718017578125, 1.8846590518951416, 1.9721379280090332, 2.059617042541504, 2.1470959186553955, 2.234574794769287, 2.3220536708831787, 2.4095325469970703, 2.497011661529541, 2.5844905376434326, 2.671969413757324, 2.759448528289795, 2.8469274044036865, 2.934406280517578]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 5.0, 11.0, 5.0, 26.0, 34.0, 47.0, 72.0, 155.0, 245.0, 442.0, 781.0, 1533.0, 2988.0, 6471.0, 16255.0, 58563.0, 374553.0, 2556402.0, 1002037.0, 126980.0, 28393.0, 9835.0, 4151.0, 2009.0, 1026.0, 533.0, 315.0, 187.0, 91.0, 51.0, 26.0, 22.0, 16.0, 10.0, 6.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.25146484375, -0.24271011352539062, -0.23395538330078125, -0.22520065307617188, -0.2164459228515625, -0.20769119262695312, -0.19893646240234375, -0.19018173217773438, -0.181427001953125, -0.17267227172851562, -0.16391754150390625, -0.15516281127929688, -0.1464080810546875, -0.13765335083007812, -0.12889862060546875, -0.12014389038085938, -0.11138916015625, -0.10263442993164062, -0.09387969970703125, -0.08512496948242188, -0.0763702392578125, -0.06761550903320312, -0.05886077880859375, -0.050106048583984375, -0.041351318359375, -0.032596588134765625, -0.02384185791015625, -0.015087127685546875, -0.0063323974609375, 0.002422332763671875, 0.01117706298828125, 0.019931793212890625, 0.0286865234375, 0.037441253662109375, 0.04619598388671875, 0.054950714111328125, 0.0637054443359375, 0.07246017456054688, 0.08121490478515625, 0.08996963500976562, 0.098724365234375, 0.10747909545898438, 0.11623382568359375, 0.12498855590820312, 0.1337432861328125, 0.14249801635742188, 0.15125274658203125, 0.16000747680664062, 0.16876220703125, 0.17751693725585938, 0.18627166748046875, 0.19502639770507812, 0.2037811279296875, 0.21253585815429688, 0.22129058837890625, 0.23004531860351562, 0.238800048828125, 0.24755477905273438, 0.25630950927734375, 0.2650642395019531, 0.2738189697265625, 0.2825736999511719, 0.29132843017578125, 0.3000831604003906, 0.308837890625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 4.0, 6.0, 2.0, 1.0, 4.0, 4.0, 4.0, 8.0, 12.0, 9.0, 12.0, 13.0, 13.0, 18.0, 18.0, 31.0, 28.0, 36.0, 41.0, 37.0, 40.0, 36.0, 39.0, 36.0, 34.0, 43.0, 41.0, 40.0, 40.0, 44.0, 28.0, 30.0, 41.0, 35.0, 26.0, 26.0, 19.0, 20.0, 14.0, 12.0, 16.0, 7.0, 9.0, 10.0, 5.0, 1.0, 7.0, 5.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.190185546875, -0.18480491638183594, -0.17942428588867188, -0.1740436553955078, -0.16866302490234375, -0.1632823944091797, -0.15790176391601562, -0.15252113342285156, -0.1471405029296875, -0.14175987243652344, -0.13637924194335938, -0.1309986114501953, -0.12561798095703125, -0.12023735046386719, -0.11485671997070312, -0.10947608947753906, -0.104095458984375, -0.09871482849121094, -0.09333419799804688, -0.08795356750488281, -0.08257293701171875, -0.07719230651855469, -0.07181167602539062, -0.06643104553222656, -0.0610504150390625, -0.05566978454589844, -0.050289154052734375, -0.04490852355957031, -0.03952789306640625, -0.03414726257324219, -0.028766632080078125, -0.023386001586914062, -0.01800537109375, -0.012624740600585938, -0.007244110107421875, -0.0018634796142578125, 0.00351715087890625, 0.008897781372070312, 0.014278411865234375, 0.019659042358398438, 0.0250396728515625, 0.030420303344726562, 0.035800933837890625, 0.04118156433105469, 0.04656219482421875, 0.05194282531738281, 0.057323455810546875, 0.06270408630371094, 0.068084716796875, 0.07346534729003906, 0.07884597778320312, 0.08422660827636719, 0.08960723876953125, 0.09498786926269531, 0.10036849975585938, 0.10574913024902344, 0.1111297607421875, 0.11651039123535156, 0.12189102172851562, 0.1272716522216797, 0.13265228271484375, 0.1380329132080078, 0.14341354370117188, 0.14879417419433594, 0.1541748046875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 10.0, 13.0, 17.0, 22.0, 45.0, 136.0, 428.0, 2143.0, 43832.0, 4103546.0, 41382.0, 2050.0, 392.0, 136.0, 61.0, 34.0, 19.0, 9.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6181640625, -1.568359375, -1.5185546875, -1.46875, -1.4189453125, -1.369140625, -1.3193359375, -1.26953125, -1.2197265625, -1.169921875, -1.1201171875, -1.0703125, -1.0205078125, -0.970703125, -0.9208984375, -0.87109375, -0.8212890625, -0.771484375, -0.7216796875, -0.671875, -0.6220703125, -0.572265625, -0.5224609375, -0.47265625, -0.4228515625, -0.373046875, -0.3232421875, -0.2734375, -0.2236328125, -0.173828125, -0.1240234375, -0.07421875, -0.0244140625, 0.025390625, 0.0751953125, 0.125, 0.1748046875, 0.224609375, 0.2744140625, 0.32421875, 0.3740234375, 0.423828125, 0.4736328125, 0.5234375, 0.5732421875, 0.623046875, 0.6728515625, 0.72265625, 0.7724609375, 0.822265625, 0.8720703125, 0.921875, 0.9716796875, 1.021484375, 1.0712890625, 1.12109375, 1.1708984375, 1.220703125, 1.2705078125, 1.3203125, 1.3701171875, 1.419921875, 1.4697265625, 1.51953125, 1.5693359375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 5.0, 8.0, 2.0, 9.0, 11.0, 12.0, 21.0, 18.0, 42.0, 89.0, 207.0, 381.0, 814.0, 1168.0, 605.0, 292.0, 150.0, 87.0, 60.0, 32.0, 17.0, 16.0, 10.0, 5.0, 3.0, 7.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5244140625, -0.5037384033203125, -0.483062744140625, -0.4623870849609375, -0.44171142578125, -0.4210357666015625, -0.400360107421875, -0.3796844482421875, -0.3590087890625, -0.3383331298828125, -0.317657470703125, -0.2969818115234375, -0.27630615234375, -0.2556304931640625, -0.234954833984375, -0.2142791748046875, -0.193603515625, -0.1729278564453125, -0.152252197265625, -0.1315765380859375, -0.11090087890625, -0.0902252197265625, -0.069549560546875, -0.0488739013671875, -0.0281982421875, -0.0075225830078125, 0.013153076171875, 0.0338287353515625, 0.05450439453125, 0.0751800537109375, 0.095855712890625, 0.1165313720703125, 0.13720703125, 0.1578826904296875, 0.178558349609375, 0.1992340087890625, 0.21990966796875, 0.2405853271484375, 0.261260986328125, 0.2819366455078125, 0.3026123046875, 0.3232879638671875, 0.343963623046875, 0.3646392822265625, 0.38531494140625, 0.4059906005859375, 0.426666259765625, 0.4473419189453125, 0.468017578125, 0.4886932373046875, 0.509368896484375, 0.5300445556640625, 0.55072021484375, 0.5713958740234375, 0.592071533203125, 0.6127471923828125, 0.6334228515625, 0.6540985107421875, 0.674774169921875, 0.6954498291015625, 0.71612548828125, 0.7368011474609375, 0.757476806640625, 0.7781524658203125, 0.798828125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 6.0, 7.0, 11.0, 25.0, 62.0, 159.0, 249.0, 249.0, 148.0, 53.0, 19.0, 9.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.129081726074219, -3.9313509464263916, -3.7336199283599854, -3.535889148712158, -3.338158369064331, -3.140427589416504, -2.9426965713500977, -2.7449657917022705, -2.5472350120544434, -2.349504232406616, -2.15177321434021, -1.9540424346923828, -1.7563116550445557, -1.558580756187439, -1.3608498573303223, -1.1631190776824951, -0.9653880596160889, -0.7676572203636169, -0.569926381111145, -0.3721954822540283, -0.1744646430015564, 0.023266196250915527, 0.22099709510803223, 0.4187278747558594, 0.6164587736129761, 0.814189612865448, 1.01192045211792, 1.2096513509750366, 1.4073822498321533, 1.6051130294799805, 1.8028439283370972, 2.0005745887756348, 2.198305606842041, 2.396036386489868, 2.5937674045562744, 2.7914981842041016, 2.9892289638519287, 3.186959743499756, 3.384690761566162, 3.5824215412139893, 3.7801523208618164, 3.9778831005096436, 4.175613880157471, 4.373344898223877, 4.571075916290283, 4.768806457519531, 4.9665374755859375, 5.164268493652344, 5.36199951171875, 5.559730529785156, 5.757461071014404, 5.9551920890808105, 6.152923107147217, 6.350653648376465, 6.548384666442871, 6.746115684509277, 6.943846225738525, 7.141577243804932, 7.33930778503418, 7.537038803100586, 7.734769821166992, 7.93250036239624, 8.130231857299805, 8.327961921691895, 8.5256929397583]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 6.0, 1.0, 5.0, 5.0, 3.0, 4.0, 7.0, 16.0, 14.0, 14.0, 9.0, 17.0, 23.0, 28.0, 24.0, 35.0, 35.0, 41.0, 33.0, 41.0, 48.0, 41.0, 37.0, 44.0, 40.0, 38.0, 42.0, 41.0, 31.0, 37.0, 34.0, 32.0, 25.0, 22.0, 21.0, 26.0, 10.0, 16.0, 14.0, 6.0, 9.0, 10.0, 7.0, 2.0, 2.0, 4.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.006152391433716, -1.9449986219406128, -1.8838447332382202, -1.8226909637451172, -1.7615370750427246, -1.7003833055496216, -1.6392295360565186, -1.578075647354126, -1.5169217586517334, -1.4557679891586304, -1.3946141004562378, -1.3334603309631348, -1.2723064422607422, -1.2111526727676392, -1.1499989032745361, -1.0888450145721436, -1.0276912450790405, -0.9665374159812927, -0.9053835868835449, -0.8442298173904419, -0.7830759286880493, -0.7219221591949463, -0.6607683300971985, -0.5996145009994507, -0.5384606719017029, -0.4773068428039551, -0.4161530137062073, -0.35499921441078186, -0.29384538531303406, -0.23269155621528625, -0.17153775691986084, -0.11038392782211304, -0.049230098724365234, 0.011923722922801971, 0.07307754456996918, 0.1342313587665558, 0.1953851878643036, 0.2565390169620514, 0.3176928162574768, 0.3788466453552246, 0.4400004744529724, 0.5011543035507202, 0.562308132648468, 0.6234619617462158, 0.6846157312393188, 0.7457696199417114, 0.8069233894348145, 0.8680772185325623, 0.9292310476303101, 0.9903848767280579, 1.0515387058258057, 1.1126924753189087, 1.1738463640213013, 1.2350001335144043, 1.2961540222167969, 1.3573077917099, 1.418461561203003, 1.479615330696106, 1.5407692193984985, 1.6019229888916016, 1.6630768775939941, 1.7242306470870972, 1.7853844165802002, 1.8465383052825928, 1.9076921939849854]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 4.0, 5.0, 8.0, 5.0, 13.0, 23.0, 30.0, 37.0, 61.0, 64.0, 112.0, 139.0, 218.0, 331.0, 489.0, 721.0, 1132.0, 1857.0, 3113.0, 5342.0, 9656.0, 18495.0, 38947.0, 88148.0, 214720.0, 335047.0, 182651.0, 75474.0, 33646.0, 16700.0, 8685.0, 5004.0, 2901.0, 1737.0, 1051.0, 677.0, 415.0, 275.0, 189.0, 122.0, 97.0, 62.0, 44.0, 41.0, 27.0, 16.0, 15.0, 3.0, 4.0, 6.0, 3.0, 2.0, 2.0, 1.0], "bins": [-0.2459716796875, -0.23902511596679688, -0.23207855224609375, -0.22513198852539062, -0.2181854248046875, -0.21123886108398438, -0.20429229736328125, -0.19734573364257812, -0.190399169921875, -0.18345260620117188, -0.17650604248046875, -0.16955947875976562, -0.1626129150390625, -0.15566635131835938, -0.14871978759765625, -0.14177322387695312, -0.13482666015625, -0.12788009643554688, -0.12093353271484375, -0.11398696899414062, -0.1070404052734375, -0.10009384155273438, -0.09314727783203125, -0.08620071411132812, -0.079254150390625, -0.07230758666992188, -0.06536102294921875, -0.058414459228515625, -0.0514678955078125, -0.044521331787109375, -0.03757476806640625, -0.030628204345703125, -0.023681640625, -0.016735076904296875, -0.00978851318359375, -0.002841949462890625, 0.0041046142578125, 0.011051177978515625, 0.01799774169921875, 0.024944305419921875, 0.031890869140625, 0.038837432861328125, 0.04578399658203125, 0.052730560302734375, 0.0596771240234375, 0.06662368774414062, 0.07357025146484375, 0.08051681518554688, 0.08746337890625, 0.09440994262695312, 0.10135650634765625, 0.10830307006835938, 0.1152496337890625, 0.12219619750976562, 0.12914276123046875, 0.13608932495117188, 0.143035888671875, 0.14998245239257812, 0.15692901611328125, 0.16387557983398438, 0.1708221435546875, 0.17776870727539062, 0.18471527099609375, 0.19166183471679688, 0.1986083984375]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 3.0, 2.0, 5.0, 2.0, 5.0, 12.0, 7.0, 13.0, 12.0, 28.0, 29.0, 20.0, 34.0, 24.0, 30.0, 36.0, 46.0, 25.0, 48.0, 44.0, 45.0, 41.0, 38.0, 39.0, 56.0, 40.0, 30.0, 35.0, 35.0, 33.0, 24.0, 32.0, 25.0, 16.0, 18.0, 22.0, 13.0, 5.0, 6.0, 4.0, 4.0, 6.0, 2.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.208251953125, -0.2019062042236328, -0.19556045532226562, -0.18921470642089844, -0.18286895751953125, -0.17652320861816406, -0.17017745971679688, -0.1638317108154297, -0.1574859619140625, -0.1511402130126953, -0.14479446411132812, -0.13844871520996094, -0.13210296630859375, -0.12575721740722656, -0.11941146850585938, -0.11306571960449219, -0.106719970703125, -0.10037422180175781, -0.09402847290039062, -0.08768272399902344, -0.08133697509765625, -0.07499122619628906, -0.06864547729492188, -0.06229972839355469, -0.0559539794921875, -0.04960823059082031, -0.043262481689453125, -0.03691673278808594, -0.03057098388671875, -0.024225234985351562, -0.017879486083984375, -0.011533737182617188, -0.00518798828125, 0.0011577606201171875, 0.007503509521484375, 0.013849258422851562, 0.02019500732421875, 0.026540756225585938, 0.032886505126953125, 0.03923225402832031, 0.0455780029296875, 0.05192375183105469, 0.058269500732421875, 0.06461524963378906, 0.07096099853515625, 0.07730674743652344, 0.08365249633789062, 0.08999824523925781, 0.096343994140625, 0.10268974304199219, 0.10903549194335938, 0.11538124084472656, 0.12172698974609375, 0.12807273864746094, 0.13441848754882812, 0.1407642364501953, 0.1471099853515625, 0.1534557342529297, 0.15980148315429688, 0.16614723205566406, 0.17249298095703125, 0.17883872985839844, 0.18518447875976562, 0.1915302276611328, 0.1978759765625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 8.0, 9.0, 7.0, 15.0, 21.0, 26.0, 31.0, 50.0, 83.0, 90.0, 171.0, 234.0, 398.0, 758.0, 1594.0, 4329.0, 16587.0, 116836.0, 779117.0, 105186.0, 15563.0, 4155.0, 1497.0, 708.0, 373.0, 245.0, 130.0, 93.0, 77.0, 43.0, 21.0, 22.0, 17.0, 16.0, 6.0, 11.0, 3.0, 5.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.51904296875, -0.5008163452148438, -0.4825897216796875, -0.46436309814453125, -0.446136474609375, -0.42790985107421875, -0.4096832275390625, -0.39145660400390625, -0.37322998046875, -0.35500335693359375, -0.3367767333984375, -0.31855010986328125, -0.300323486328125, -0.28209686279296875, -0.2638702392578125, -0.24564361572265625, -0.2274169921875, -0.20919036865234375, -0.1909637451171875, -0.17273712158203125, -0.154510498046875, -0.13628387451171875, -0.1180572509765625, -0.09983062744140625, -0.08160400390625, -0.06337738037109375, -0.0451507568359375, -0.02692413330078125, -0.008697509765625, 0.00952911376953125, 0.0277557373046875, 0.04598236083984375, 0.064208984375, 0.08243560791015625, 0.1006622314453125, 0.11888885498046875, 0.137115478515625, 0.15534210205078125, 0.1735687255859375, 0.19179534912109375, 0.21002197265625, 0.22824859619140625, 0.2464752197265625, 0.26470184326171875, 0.282928466796875, 0.30115509033203125, 0.3193817138671875, 0.33760833740234375, 0.3558349609375, 0.37406158447265625, 0.3922882080078125, 0.41051483154296875, 0.428741455078125, 0.44696807861328125, 0.4651947021484375, 0.48342132568359375, 0.50164794921875, 0.5198745727539062, 0.5381011962890625, 0.5563278198242188, 0.574554443359375, 0.5927810668945312, 0.6110076904296875, 0.6292343139648438, 0.6474609375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 6.0, 4.0, 4.0, 11.0, 14.0, 11.0, 13.0, 19.0, 25.0, 25.0, 31.0, 47.0, 58.0, 69.0, 62.0, 68.0, 73.0, 65.0, 60.0, 56.0, 53.0, 37.0, 37.0, 21.0, 24.0, 26.0, 22.0, 19.0, 12.0, 10.0, 8.0, 11.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2578125, -1.22528076171875, -1.1927490234375, -1.16021728515625, -1.127685546875, -1.09515380859375, -1.0626220703125, -1.03009033203125, -0.99755859375, -0.96502685546875, -0.9324951171875, -0.89996337890625, -0.867431640625, -0.83489990234375, -0.8023681640625, -0.76983642578125, -0.7373046875, -0.70477294921875, -0.6722412109375, -0.63970947265625, -0.607177734375, -0.57464599609375, -0.5421142578125, -0.50958251953125, -0.47705078125, -0.44451904296875, -0.4119873046875, -0.37945556640625, -0.346923828125, -0.31439208984375, -0.2818603515625, -0.24932861328125, -0.216796875, -0.18426513671875, -0.1517333984375, -0.11920166015625, -0.086669921875, -0.05413818359375, -0.0216064453125, 0.01092529296875, 0.04345703125, 0.07598876953125, 0.1085205078125, 0.14105224609375, 0.173583984375, 0.20611572265625, 0.2386474609375, 0.27117919921875, 0.3037109375, 0.33624267578125, 0.3687744140625, 0.40130615234375, 0.433837890625, 0.46636962890625, 0.4989013671875, 0.53143310546875, 0.56396484375, 0.59649658203125, 0.6290283203125, 0.66156005859375, 0.694091796875, 0.72662353515625, 0.7591552734375, 0.79168701171875, 0.82421875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 6.0, 6.0, 11.0, 10.0, 17.0, 24.0, 46.0, 64.0, 105.0, 200.0, 353.0, 681.0, 1566.0, 4437.0, 17104.0, 157211.0, 809686.0, 44132.0, 8268.0, 2474.0, 1051.0, 496.0, 242.0, 126.0, 80.0, 50.0, 29.0, 19.0, 15.0, 13.0, 14.0, 5.0, 6.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.272705078125, -0.26305389404296875, -0.2534027099609375, -0.24375152587890625, -0.234100341796875, -0.22444915771484375, -0.2147979736328125, -0.20514678955078125, -0.19549560546875, -0.18584442138671875, -0.1761932373046875, -0.16654205322265625, -0.156890869140625, -0.14723968505859375, -0.1375885009765625, -0.12793731689453125, -0.1182861328125, -0.10863494873046875, -0.0989837646484375, -0.08933258056640625, -0.079681396484375, -0.07003021240234375, -0.0603790283203125, -0.05072784423828125, -0.04107666015625, -0.03142547607421875, -0.0217742919921875, -0.01212310791015625, -0.002471923828125, 0.00717926025390625, 0.0168304443359375, 0.02648162841796875, 0.0361328125, 0.04578399658203125, 0.0554351806640625, 0.06508636474609375, 0.074737548828125, 0.08438873291015625, 0.0940399169921875, 0.10369110107421875, 0.11334228515625, 0.12299346923828125, 0.1326446533203125, 0.14229583740234375, 0.151947021484375, 0.16159820556640625, 0.1712493896484375, 0.18090057373046875, 0.1905517578125, 0.20020294189453125, 0.2098541259765625, 0.21950531005859375, 0.229156494140625, 0.23880767822265625, 0.2484588623046875, 0.25811004638671875, 0.26776123046875, 0.27741241455078125, 0.2870635986328125, 0.29671478271484375, 0.306365966796875, 0.31601715087890625, 0.3256683349609375, 0.33531951904296875, 0.344970703125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 6.0, 4.0, 1.0, 4.0, 5.0, 12.0, 9.0, 15.0, 22.0, 35.0, 54.0, 88.0, 153.0, 209.0, 155.0, 73.0, 55.0, 41.0, 15.0, 10.0, 9.0, 3.0, 5.0, 3.0, 3.0, 2.0, 4.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.594989776611328e-05, -8.311867713928223e-05, -8.028745651245117e-05, -7.745623588562012e-05, -7.462501525878906e-05, -7.179379463195801e-05, -6.896257400512695e-05, -6.61313533782959e-05, -6.330013275146484e-05, -6.046891212463379e-05, -5.7637691497802734e-05, -5.480647087097168e-05, -5.1975250244140625e-05, -4.914402961730957e-05, -4.6312808990478516e-05, -4.348158836364746e-05, -4.0650367736816406e-05, -3.781914710998535e-05, -3.49879264831543e-05, -3.215670585632324e-05, -2.9325485229492188e-05, -2.6494264602661133e-05, -2.3663043975830078e-05, -2.0831823348999023e-05, -1.800060272216797e-05, -1.5169382095336914e-05, -1.233816146850586e-05, -9.506940841674805e-06, -6.67572021484375e-06, -3.844499588012695e-06, -1.0132789611816406e-06, 1.817941665649414e-06, 4.649162292480469e-06, 7.4803829193115234e-06, 1.0311603546142578e-05, 1.3142824172973633e-05, 1.5974044799804688e-05, 1.8805265426635742e-05, 2.1636486053466797e-05, 2.446770668029785e-05, 2.7298927307128906e-05, 3.013014793395996e-05, 3.2961368560791016e-05, 3.579258918762207e-05, 3.8623809814453125e-05, 4.145503044128418e-05, 4.4286251068115234e-05, 4.711747169494629e-05, 4.9948692321777344e-05, 5.27799129486084e-05, 5.561113357543945e-05, 5.844235420227051e-05, 6.127357482910156e-05, 6.410479545593262e-05, 6.693601608276367e-05, 6.976723670959473e-05, 7.259845733642578e-05, 7.542967796325684e-05, 7.826089859008789e-05, 8.109211921691895e-05, 8.392333984375e-05, 8.675456047058105e-05, 8.958578109741211e-05, 9.241700172424316e-05, 9.524822235107422e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 5.0, 2.0, 0.0, 1.0, 3.0, 7.0, 8.0, 2.0, 9.0, 16.0, 18.0, 33.0, 53.0, 96.0, 147.0, 315.0, 643.0, 1332.0, 3891.0, 14781.0, 125403.0, 831099.0, 56443.0, 9341.0, 2743.0, 1057.0, 491.0, 251.0, 153.0, 79.0, 39.0, 27.0, 26.0, 23.0, 7.0, 6.0, 4.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2442626953125, -0.23462486267089844, -0.22498703002929688, -0.2153491973876953, -0.20571136474609375, -0.1960735321044922, -0.18643569946289062, -0.17679786682128906, -0.1671600341796875, -0.15752220153808594, -0.14788436889648438, -0.1382465362548828, -0.12860870361328125, -0.11897087097167969, -0.10933303833007812, -0.09969520568847656, -0.090057373046875, -0.08041954040527344, -0.07078170776367188, -0.06114387512207031, -0.05150604248046875, -0.04186820983886719, -0.032230377197265625, -0.022592544555664062, -0.0129547119140625, -0.0033168792724609375, 0.006320953369140625, 0.015958786010742188, 0.02559661865234375, 0.03523445129394531, 0.044872283935546875, 0.05451011657714844, 0.06414794921875, 0.07378578186035156, 0.08342361450195312, 0.09306144714355469, 0.10269927978515625, 0.11233711242675781, 0.12197494506835938, 0.13161277770996094, 0.1412506103515625, 0.15088844299316406, 0.16052627563476562, 0.1701641082763672, 0.17980194091796875, 0.1894397735595703, 0.19907760620117188, 0.20871543884277344, 0.218353271484375, 0.22799110412597656, 0.23762893676757812, 0.2472667694091797, 0.25690460205078125, 0.2665424346923828, 0.2761802673339844, 0.28581809997558594, 0.2954559326171875, 0.30509376525878906, 0.3147315979003906, 0.3243694305419922, 0.33400726318359375, 0.3436450958251953, 0.3532829284667969, 0.36292076110839844, 0.37255859375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 9.0, 6.0, 3.0, 8.0, 11.0, 7.0, 18.0, 21.0, 34.0, 53.0, 65.0, 93.0, 124.0, 135.0, 104.0, 88.0, 64.0, 41.0, 35.0, 23.0, 9.0, 4.0, 6.0, 12.0, 11.0, 8.0, 5.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.283203125, -0.27541351318359375, -0.2676239013671875, -0.25983428955078125, -0.252044677734375, -0.24425506591796875, -0.2364654541015625, -0.22867584228515625, -0.22088623046875, -0.21309661865234375, -0.2053070068359375, -0.19751739501953125, -0.189727783203125, -0.18193817138671875, -0.1741485595703125, -0.16635894775390625, -0.1585693359375, -0.15077972412109375, -0.1429901123046875, -0.13520050048828125, -0.127410888671875, -0.11962127685546875, -0.1118316650390625, -0.10404205322265625, -0.09625244140625, -0.08846282958984375, -0.0806732177734375, -0.07288360595703125, -0.065093994140625, -0.05730438232421875, -0.0495147705078125, -0.04172515869140625, -0.033935546875, -0.02614593505859375, -0.0183563232421875, -0.01056671142578125, -0.002777099609375, 0.00501251220703125, 0.0128021240234375, 0.02059173583984375, 0.02838134765625, 0.03617095947265625, 0.0439605712890625, 0.05175018310546875, 0.059539794921875, 0.06732940673828125, 0.0751190185546875, 0.08290863037109375, 0.0906982421875, 0.09848785400390625, 0.1062774658203125, 0.11406707763671875, 0.121856689453125, 0.12964630126953125, 0.1374359130859375, 0.14522552490234375, 0.15301513671875, 0.16080474853515625, 0.1685943603515625, 0.17638397216796875, 0.184173583984375, 0.19196319580078125, 0.1997528076171875, 0.20754241943359375, 0.21533203125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 12.0, 37.0, 133.0, 423.0, 250.0, 76.0, 38.0, 18.0, 7.0, 6.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4286065101623535, -5.153811454772949, -4.879016399383545, -4.604221343994141, -4.329425811767578, -4.054630756378174, -3.7798357009887695, -3.5050406455993652, -3.230245351791382, -2.9554502964019775, -2.680655002593994, -2.40585994720459, -2.1310648918151855, -1.8562695980072021, -1.5814745426177979, -1.306679368019104, -1.0318841934204102, -0.7570890188217163, -0.48229390382766724, -0.20749878883361816, 0.06729638576507568, 0.34209156036376953, 0.6168866157531738, 0.8916817903518677, 1.1664769649505615, 1.4412721395492554, 1.7160673141479492, 1.9908623695373535, 2.265657424926758, 2.540452718734741, 2.8152477741241455, 3.090043067932129, 3.364837646484375, 3.6396327018737793, 3.9144279956817627, 4.189223289489746, 4.46401834487915, 4.738813400268555, 5.013608455657959, 5.288403511047363, 5.563199043273926, 5.83799409866333, 6.112789154052734, 6.387584686279297, 6.662379741668701, 6.9371747970581055, 7.21196985244751, 7.486764907836914, 7.761559963226318, 8.036355018615723, 8.311150550842285, 8.585945129394531, 8.860740661621094, 9.135536193847656, 9.410330772399902, 9.685126304626465, 9.959920883178711, 10.234716415405273, 10.50951099395752, 10.784306526184082, 11.059101104736328, 11.33389663696289, 11.608692169189453, 11.8834867477417, 12.158282279968262]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 2.0, 6.0, 2.0, 4.0, 1.0, 3.0, 3.0, 6.0, 9.0, 11.0, 9.0, 17.0, 15.0, 15.0, 22.0, 24.0, 20.0, 19.0, 24.0, 27.0, 34.0, 47.0, 54.0, 65.0, 93.0, 77.0, 68.0, 44.0, 37.0, 41.0, 22.0, 32.0, 20.0, 21.0, 15.0, 20.0, 13.0, 14.0, 12.0, 6.0, 5.0, 7.0, 6.0, 2.0, 4.0, 5.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0460667610168457, -2.946803569793701, -2.8475406169891357, -2.748277425765991, -2.649014472961426, -2.5497512817382812, -2.450488328933716, -2.3512251377105713, -2.251962184906006, -2.1526989936828613, -2.053436040878296, -1.954172968864441, -1.854909896850586, -1.755646824836731, -1.656383752822876, -1.5571205615997314, -1.4578574895858765, -1.3585944175720215, -1.2593313455581665, -1.1600682735443115, -1.0608052015304565, -0.9615421295166016, -0.8622789978981018, -0.7630159258842468, -0.6637528538703918, -0.5644897818565369, -0.4652267098426819, -0.3659636080265045, -0.26670053601264954, -0.16743746399879456, -0.06817436218261719, 0.031088709831237793, 0.13035178184509277, 0.22961485385894775, 0.32887792587280273, 0.4281410276889801, 0.5274040699005127, 0.6266671419143677, 0.7259302735328674, 0.8251933455467224, 0.9244564175605774, 1.0237195491790771, 1.1229826211929321, 1.222245693206787, 1.321508765220642, 1.420771837234497, 1.520034909248352, 1.619297981262207, 1.718561053276062, 1.817824125289917, 1.917087197303772, 2.016350269317627, 2.1156134605407715, 2.214876413345337, 2.3141396045684814, 2.413402557373047, 2.5126657485961914, 2.611928939819336, 2.7111918926239014, 2.810455083847046, 2.9097180366516113, 3.008981227874756, 3.1082441806793213, 3.207507371902466, 3.3067703247070312]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 3.0, 5.0, 2.0, 4.0, 8.0, 5.0, 5.0, 7.0, 13.0, 18.0, 27.0, 27.0, 39.0, 47.0, 74.0, 141.0, 220.0, 448.0, 1120.0, 3309.0, 13377.0, 106019.0, 2637079.0, 1357452.0, 61609.0, 9032.0, 2395.0, 864.0, 365.0, 199.0, 99.0, 81.0, 62.0, 25.0, 23.0, 24.0, 16.0, 11.0, 13.0, 5.0, 11.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.423828125, -0.4080657958984375, -0.392303466796875, -0.3765411376953125, -0.36077880859375, -0.3450164794921875, -0.329254150390625, -0.3134918212890625, -0.2977294921875, -0.2819671630859375, -0.266204833984375, -0.2504425048828125, -0.23468017578125, -0.2189178466796875, -0.203155517578125, -0.1873931884765625, -0.171630859375, -0.1558685302734375, -0.140106201171875, -0.1243438720703125, -0.10858154296875, -0.0928192138671875, -0.077056884765625, -0.0612945556640625, -0.0455322265625, -0.0297698974609375, -0.014007568359375, 0.0017547607421875, 0.01751708984375, 0.0332794189453125, 0.049041748046875, 0.0648040771484375, 0.08056640625, 0.0963287353515625, 0.112091064453125, 0.1278533935546875, 0.14361572265625, 0.1593780517578125, 0.175140380859375, 0.1909027099609375, 0.2066650390625, 0.2224273681640625, 0.238189697265625, 0.2539520263671875, 0.26971435546875, 0.2854766845703125, 0.301239013671875, 0.3170013427734375, 0.332763671875, 0.3485260009765625, 0.364288330078125, 0.3800506591796875, 0.39581298828125, 0.4115753173828125, 0.427337646484375, 0.4430999755859375, 0.4588623046875, 0.4746246337890625, 0.490386962890625, 0.5061492919921875, 0.52191162109375, 0.5376739501953125, 0.553436279296875, 0.5691986083984375, 0.5849609375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 3.0, 5.0, 0.0, 1.0, 6.0, 3.0, 7.0, 5.0, 5.0, 9.0, 6.0, 13.0, 9.0, 6.0, 10.0, 15.0, 26.0, 22.0, 21.0, 26.0, 25.0, 34.0, 38.0, 40.0, 35.0, 43.0, 38.0, 47.0, 42.0, 42.0, 48.0, 43.0, 42.0, 35.0, 34.0, 26.0, 24.0, 22.0, 28.0, 13.0, 28.0, 16.0, 11.0, 10.0, 4.0, 13.0, 8.0, 9.0, 4.0, 4.0, 5.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.171875, -0.1660003662109375, -0.160125732421875, -0.1542510986328125, -0.14837646484375, -0.1425018310546875, -0.136627197265625, -0.1307525634765625, -0.1248779296875, -0.1190032958984375, -0.113128662109375, -0.1072540283203125, -0.10137939453125, -0.0955047607421875, -0.089630126953125, -0.0837554931640625, -0.077880859375, -0.0720062255859375, -0.066131591796875, -0.0602569580078125, -0.05438232421875, -0.0485076904296875, -0.042633056640625, -0.0367584228515625, -0.0308837890625, -0.0250091552734375, -0.019134521484375, -0.0132598876953125, -0.00738525390625, -0.0015106201171875, 0.004364013671875, 0.0102386474609375, 0.01611328125, 0.0219879150390625, 0.027862548828125, 0.0337371826171875, 0.03961181640625, 0.0454864501953125, 0.051361083984375, 0.0572357177734375, 0.0631103515625, 0.0689849853515625, 0.074859619140625, 0.0807342529296875, 0.08660888671875, 0.0924835205078125, 0.098358154296875, 0.1042327880859375, 0.110107421875, 0.1159820556640625, 0.121856689453125, 0.1277313232421875, 0.13360595703125, 0.1394805908203125, 0.145355224609375, 0.1512298583984375, 0.1571044921875, 0.1629791259765625, 0.168853759765625, 0.1747283935546875, 0.18060302734375, 0.1864776611328125, 0.192352294921875, 0.1982269287109375, 0.2041015625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 6.0, 8.0, 10.0, 25.0, 33.0, 83.0, 164.0, 514.0, 3489.0, 98485.0, 4058333.0, 30444.0, 2037.0, 379.0, 151.0, 48.0, 23.0, 21.0, 10.0, 12.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6884765625, -1.64447021484375, -1.6004638671875, -1.55645751953125, -1.512451171875, -1.46844482421875, -1.4244384765625, -1.38043212890625, -1.33642578125, -1.29241943359375, -1.2484130859375, -1.20440673828125, -1.160400390625, -1.11639404296875, -1.0723876953125, -1.02838134765625, -0.984375, -0.94036865234375, -0.8963623046875, -0.85235595703125, -0.808349609375, -0.76434326171875, -0.7203369140625, -0.67633056640625, -0.63232421875, -0.58831787109375, -0.5443115234375, -0.50030517578125, -0.456298828125, -0.41229248046875, -0.3682861328125, -0.32427978515625, -0.2802734375, -0.23626708984375, -0.1922607421875, -0.14825439453125, -0.104248046875, -0.06024169921875, -0.0162353515625, 0.02777099609375, 0.07177734375, 0.11578369140625, 0.1597900390625, 0.20379638671875, 0.247802734375, 0.29180908203125, 0.3358154296875, 0.37982177734375, 0.423828125, 0.46783447265625, 0.5118408203125, 0.55584716796875, 0.599853515625, 0.64385986328125, 0.6878662109375, 0.73187255859375, 0.77587890625, 0.81988525390625, 0.8638916015625, 0.90789794921875, 0.951904296875, 0.99591064453125, 1.0399169921875, 1.08392333984375, 1.1279296875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 4.0, 8.0, 11.0, 7.0, 17.0, 18.0, 27.0, 30.0, 52.0, 87.0, 119.0, 209.0, 300.0, 570.0, 806.0, 673.0, 431.0, 249.0, 146.0, 78.0, 51.0, 43.0, 36.0, 29.0, 12.0, 12.0, 12.0, 5.0, 6.0, 4.0, 2.0, 2.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.4501953125, -0.43506622314453125, -0.4199371337890625, -0.40480804443359375, -0.389678955078125, -0.37454986572265625, -0.3594207763671875, -0.34429168701171875, -0.32916259765625, -0.31403350830078125, -0.2989044189453125, -0.28377532958984375, -0.268646240234375, -0.25351715087890625, -0.2383880615234375, -0.22325897216796875, -0.2081298828125, -0.19300079345703125, -0.1778717041015625, -0.16274261474609375, -0.147613525390625, -0.13248443603515625, -0.1173553466796875, -0.10222625732421875, -0.08709716796875, -0.07196807861328125, -0.0568389892578125, -0.04170989990234375, -0.026580810546875, -0.01145172119140625, 0.0036773681640625, 0.01880645751953125, 0.033935546875, 0.04906463623046875, 0.0641937255859375, 0.07932281494140625, 0.094451904296875, 0.10958099365234375, 0.1247100830078125, 0.13983917236328125, 0.15496826171875, 0.17009735107421875, 0.1852264404296875, 0.20035552978515625, 0.215484619140625, 0.23061370849609375, 0.2457427978515625, 0.26087188720703125, 0.2760009765625, 0.29113006591796875, 0.3062591552734375, 0.32138824462890625, 0.336517333984375, 0.35164642333984375, 0.3667755126953125, 0.38190460205078125, 0.39703369140625, 0.41216278076171875, 0.4272918701171875, 0.44242095947265625, 0.457550048828125, 0.47267913818359375, 0.4878082275390625, 0.5029373168945312, 0.51806640625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 8.0, 14.0, 15.0, 50.0, 64.0, 129.0, 157.0, 187.0, 143.0, 96.0, 53.0, 28.0, 14.0, 12.0, 11.0, 6.0, 4.0, 5.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.864886283874512, -4.737573623657227, -4.610260486602783, -4.482947826385498, -4.355634689331055, -4.2283220291137695, -4.101008892059326, -3.973696231842041, -3.8463833332061768, -3.7190704345703125, -3.5917575359344482, -3.464444637298584, -3.337131977081299, -3.2098188400268555, -3.0825061798095703, -2.955193281173706, -2.827880382537842, -2.7005674839019775, -2.5732545852661133, -2.445941686630249, -2.3186287879943848, -2.1913161277770996, -2.0640032291412354, -1.936690330505371, -1.8093774318695068, -1.6820645332336426, -1.5547516345977783, -1.4274388551712036, -1.3001259565353394, -1.172813057899475, -1.0455002784729004, -0.9181873798370361, -0.7908740043640137, -0.6635611057281494, -0.5362482666969299, -0.40893539786338806, -0.2816225290298462, -0.15430963039398193, -0.02699679136276245, 0.10031604766845703, 0.2276289463043213, 0.35494181513786316, 0.48225468397140503, 0.6095675230026245, 0.7368804216384888, 0.864193320274353, 0.9915061593055725, 1.118818998336792, 1.2461318969726562, 1.3734447956085205, 1.5007576942443848, 1.6280704736709595, 1.7553833723068237, 1.882696270942688, 2.0100090503692627, 2.137321949005127, 2.264634847640991, 2.3919477462768555, 2.5192606449127197, 2.646573543548584, 2.773886203765869, 2.9011993408203125, 3.0285120010375977, 3.155824899673462, 3.283137798309326]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 6.0, 6.0, 11.0, 10.0, 10.0, 16.0, 18.0, 14.0, 25.0, 26.0, 21.0, 32.0, 35.0, 44.0, 54.0, 65.0, 49.0, 61.0, 48.0, 62.0, 46.0, 49.0, 42.0, 34.0, 34.0, 33.0, 29.0, 28.0, 27.0, 12.0, 9.0, 9.0, 8.0, 8.0, 7.0, 3.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9927042722702026, -1.9288220405578613, -1.86493980884552, -1.8010575771331787, -1.7371753454208374, -1.673293113708496, -1.6094107627868652, -1.5455286502838135, -1.4816462993621826, -1.4177640676498413, -1.3538818359375, -1.2899996042251587, -1.2261173725128174, -1.162235140800476, -1.0983529090881348, -1.034470558166504, -0.9705884456634521, -0.9067062139511108, -0.8428239822387695, -0.7789417505264282, -0.7150595188140869, -0.6511772871017456, -0.5872949957847595, -0.5234127640724182, -0.4595305323600769, -0.3956483006477356, -0.3317660689353943, -0.2678838074207306, -0.20400157570838928, -0.14011934399604797, -0.07623708248138428, -0.012354850769042969, 0.05152726173400879, 0.1154095008969307, 0.1792917400598526, 0.2431739866733551, 0.3070562183856964, 0.3709384500980377, 0.4348207116127014, 0.4987029433250427, 0.562585175037384, 0.6264674067497253, 0.6903496384620667, 0.7542319297790527, 0.818114161491394, 0.8819963932037354, 0.9458786249160767, 1.009760856628418, 1.0736430883407593, 1.1375253200531006, 1.201407551765442, 1.2652897834777832, 1.3291720151901245, 1.3930542469024658, 1.4569365978240967, 1.5208187103271484, 1.5847010612487793, 1.6485832929611206, 1.712465524673462, 1.7763477563858032, 1.8402299880981445, 1.9041122198104858, 1.9679944515228271, 2.031876802444458, 2.0957589149475098]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 6.0, 6.0, 2.0, 7.0, 9.0, 19.0, 34.0, 51.0, 93.0, 125.0, 213.0, 432.0, 841.0, 1647.0, 3894.0, 9977.0, 28955.0, 112683.0, 532098.0, 274157.0, 55371.0, 16685.0, 6159.0, 2529.0, 1244.0, 604.0, 296.0, 162.0, 94.0, 66.0, 39.0, 18.0, 9.0, 12.0, 8.0, 3.0, 8.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.52587890625, -0.5123100280761719, -0.49874114990234375, -0.4851722717285156, -0.4716033935546875, -0.4580345153808594, -0.44446563720703125, -0.4308967590332031, -0.417327880859375, -0.4037590026855469, -0.39019012451171875, -0.3766212463378906, -0.3630523681640625, -0.3494834899902344, -0.33591461181640625, -0.3223457336425781, -0.30877685546875, -0.2952079772949219, -0.28163909912109375, -0.2680702209472656, -0.2545013427734375, -0.24093246459960938, -0.22736358642578125, -0.21379470825195312, -0.200225830078125, -0.18665695190429688, -0.17308807373046875, -0.15951919555664062, -0.1459503173828125, -0.13238143920898438, -0.11881256103515625, -0.10524368286132812, -0.0916748046875, -0.07810592651367188, -0.06453704833984375, -0.050968170166015625, -0.0373992919921875, -0.023830413818359375, -0.01026153564453125, 0.003307342529296875, 0.016876220703125, 0.030445098876953125, 0.04401397705078125, 0.057582855224609375, 0.0711517333984375, 0.08472061157226562, 0.09828948974609375, 0.11185836791992188, 0.12542724609375, 0.13899612426757812, 0.15256500244140625, 0.16613388061523438, 0.1797027587890625, 0.19327163696289062, 0.20684051513671875, 0.22040939331054688, 0.233978271484375, 0.24754714965820312, 0.26111602783203125, 0.2746849060058594, 0.2882537841796875, 0.3018226623535156, 0.31539154052734375, 0.3289604187011719, 0.342529296875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 5.0, 5.0, 2.0, 7.0, 6.0, 7.0, 13.0, 16.0, 17.0, 18.0, 15.0, 31.0, 37.0, 34.0, 27.0, 30.0, 37.0, 30.0, 32.0, 58.0, 58.0, 51.0, 40.0, 44.0, 36.0, 47.0, 43.0, 35.0, 33.0, 31.0, 16.0, 20.0, 24.0, 19.0, 15.0, 12.0, 8.0, 7.0, 6.0, 6.0, 6.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.2117919921875, -0.20538902282714844, -0.19898605346679688, -0.1925830841064453, -0.18618011474609375, -0.1797771453857422, -0.17337417602539062, -0.16697120666503906, -0.1605682373046875, -0.15416526794433594, -0.14776229858398438, -0.1413593292236328, -0.13495635986328125, -0.1285533905029297, -0.12215042114257812, -0.11574745178222656, -0.109344482421875, -0.10294151306152344, -0.09653854370117188, -0.09013557434082031, -0.08373260498046875, -0.07732963562011719, -0.07092666625976562, -0.06452369689941406, -0.0581207275390625, -0.05171775817871094, -0.045314788818359375, -0.03891181945800781, -0.03250885009765625, -0.026105880737304688, -0.019702911376953125, -0.013299942016601562, -0.00689697265625, -0.0004940032958984375, 0.005908966064453125, 0.012311935424804688, 0.01871490478515625, 0.025117874145507812, 0.031520843505859375, 0.03792381286621094, 0.0443267822265625, 0.05072975158691406, 0.057132720947265625, 0.06353569030761719, 0.06993865966796875, 0.07634162902832031, 0.08274459838867188, 0.08914756774902344, 0.095550537109375, 0.10195350646972656, 0.10835647583007812, 0.11475944519042969, 0.12116241455078125, 0.1275653839111328, 0.13396835327148438, 0.14037132263183594, 0.1467742919921875, 0.15317726135253906, 0.15958023071289062, 0.1659832000732422, 0.17238616943359375, 0.1787891387939453, 0.18519210815429688, 0.19159507751464844, 0.197998046875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 6.0, 8.0, 11.0, 8.0, 12.0, 25.0, 31.0, 55.0, 68.0, 102.0, 209.0, 335.0, 695.0, 1574.0, 4411.0, 19488.0, 222266.0, 753335.0, 35421.0, 6561.0, 2026.0, 852.0, 429.0, 214.0, 135.0, 75.0, 62.0, 35.0, 31.0, 13.0, 16.0, 13.0, 6.0, 7.0, 5.0, 3.0, 3.0, 1.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.83740234375, -0.814239501953125, -0.79107666015625, -0.767913818359375, -0.7447509765625, -0.721588134765625, -0.69842529296875, -0.675262451171875, -0.652099609375, -0.628936767578125, -0.60577392578125, -0.582611083984375, -0.5594482421875, -0.536285400390625, -0.51312255859375, -0.489959716796875, -0.466796875, -0.443634033203125, -0.42047119140625, -0.397308349609375, -0.3741455078125, -0.350982666015625, -0.32781982421875, -0.304656982421875, -0.281494140625, -0.258331298828125, -0.23516845703125, -0.212005615234375, -0.1888427734375, -0.165679931640625, -0.14251708984375, -0.119354248046875, -0.09619140625, -0.073028564453125, -0.04986572265625, -0.026702880859375, -0.0035400390625, 0.019622802734375, 0.04278564453125, 0.065948486328125, 0.089111328125, 0.112274169921875, 0.13543701171875, 0.158599853515625, 0.1817626953125, 0.204925537109375, 0.22808837890625, 0.251251220703125, 0.2744140625, 0.297576904296875, 0.32073974609375, 0.343902587890625, 0.3670654296875, 0.390228271484375, 0.41339111328125, 0.436553955078125, 0.459716796875, 0.482879638671875, 0.50604248046875, 0.529205322265625, 0.5523681640625, 0.575531005859375, 0.59869384765625, 0.621856689453125, 0.64501953125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 11.0, 13.0, 10.0, 6.0, 18.0, 13.0, 23.0, 23.0, 16.0, 31.0, 37.0, 39.0, 42.0, 59.0, 40.0, 65.0, 47.0, 57.0, 41.0, 55.0, 50.0, 54.0, 38.0, 38.0, 36.0, 26.0, 21.0, 17.0, 10.0, 9.0, 8.0, 7.0, 13.0, 2.0, 8.0, 6.0, 4.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.82373046875, -0.7971115112304688, -0.7704925537109375, -0.7438735961914062, -0.717254638671875, -0.6906356811523438, -0.6640167236328125, -0.6373977661132812, -0.61077880859375, -0.5841598510742188, -0.5575408935546875, -0.5309219360351562, -0.504302978515625, -0.47768402099609375, -0.4510650634765625, -0.42444610595703125, -0.3978271484375, -0.37120819091796875, -0.3445892333984375, -0.31797027587890625, -0.291351318359375, -0.26473236083984375, -0.2381134033203125, -0.21149444580078125, -0.18487548828125, -0.15825653076171875, -0.1316375732421875, -0.10501861572265625, -0.078399658203125, -0.05178070068359375, -0.0251617431640625, 0.00145721435546875, 0.028076171875, 0.05469512939453125, 0.0813140869140625, 0.10793304443359375, 0.134552001953125, 0.16117095947265625, 0.1877899169921875, 0.21440887451171875, 0.24102783203125, 0.26764678955078125, 0.2942657470703125, 0.32088470458984375, 0.347503662109375, 0.37412261962890625, 0.4007415771484375, 0.42736053466796875, 0.4539794921875, 0.48059844970703125, 0.5072174072265625, 0.5338363647460938, 0.560455322265625, 0.5870742797851562, 0.6136932373046875, 0.6403121948242188, 0.66693115234375, 0.6935501098632812, 0.7201690673828125, 0.7467880249023438, 0.773406982421875, 0.8000259399414062, 0.8266448974609375, 0.8532638549804688, 0.8798828125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 6.0, 2.0, 4.0, 9.0, 10.0, 18.0, 22.0, 27.0, 51.0, 88.0, 183.0, 326.0, 868.0, 2487.0, 13069.0, 768339.0, 249877.0, 9566.0, 2157.0, 758.0, 333.0, 161.0, 89.0, 44.0, 21.0, 13.0, 11.0, 5.0, 4.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.341552734375, -0.3288688659667969, -0.31618499755859375, -0.3035011291503906, -0.2908172607421875, -0.2781333923339844, -0.26544952392578125, -0.2527656555175781, -0.240081787109375, -0.22739791870117188, -0.21471405029296875, -0.20203018188476562, -0.1893463134765625, -0.17666244506835938, -0.16397857666015625, -0.15129470825195312, -0.13861083984375, -0.12592697143554688, -0.11324310302734375, -0.10055923461914062, -0.0878753662109375, -0.07519149780273438, -0.06250762939453125, -0.049823760986328125, -0.037139892578125, -0.024456024169921875, -0.01177215576171875, 0.000911712646484375, 0.0135955810546875, 0.026279449462890625, 0.03896331787109375, 0.051647186279296875, 0.0643310546875, 0.07701492309570312, 0.08969879150390625, 0.10238265991210938, 0.1150665283203125, 0.12775039672851562, 0.14043426513671875, 0.15311813354492188, 0.165802001953125, 0.17848587036132812, 0.19116973876953125, 0.20385360717773438, 0.2165374755859375, 0.22922134399414062, 0.24190521240234375, 0.2545890808105469, 0.26727294921875, 0.2799568176269531, 0.29264068603515625, 0.3053245544433594, 0.3180084228515625, 0.3306922912597656, 0.34337615966796875, 0.3560600280761719, 0.368743896484375, 0.3814277648925781, 0.39411163330078125, 0.4067955017089844, 0.4194793701171875, 0.4321632385253906, 0.44484710693359375, 0.4575309753417969, 0.47021484375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 2.0, 5.0, 9.0, 13.0, 31.0, 89.0, 333.0, 362.0, 79.0, 30.0, 17.0, 8.0, 10.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.00032520294189453125, -0.0003184322267770767, -0.0003116615116596222, -0.00030489079654216766, -0.00029812008142471313, -0.0002913493663072586, -0.0002845786511898041, -0.00027780793607234955, -0.000271037220954895, -0.0002642665058374405, -0.00025749579071998596, -0.00025072507560253143, -0.0002439543604850769, -0.00023718364536762238, -0.00023041293025016785, -0.00022364221513271332, -0.0002168715000152588, -0.00021010078489780426, -0.00020333006978034973, -0.0001965593546628952, -0.00018978863954544067, -0.00018301792442798615, -0.00017624720931053162, -0.0001694764941930771, -0.00016270577907562256, -0.00015593506395816803, -0.0001491643488407135, -0.00014239363372325897, -0.00013562291860580444, -0.00012885220348834991, -0.00012208148837089539, -0.00011531077325344086, -0.00010854005813598633, -0.0001017693430185318, -9.499862790107727e-05, -8.822791278362274e-05, -8.145719766616821e-05, -7.468648254871368e-05, -6.791576743125916e-05, -6.114505231380463e-05, -5.43743371963501e-05, -4.760362207889557e-05, -4.083290696144104e-05, -3.406219184398651e-05, -2.7291476726531982e-05, -2.0520761609077454e-05, -1.3750046491622925e-05, -6.979331374168396e-06, -2.086162567138672e-07, 6.562098860740662e-06, 1.333281397819519e-05, 2.010352909564972e-05, 2.6874244213104248e-05, 3.364495933055878e-05, 4.0415674448013306e-05, 4.7186389565467834e-05, 5.395710468292236e-05, 6.072781980037689e-05, 6.749853491783142e-05, 7.426925003528595e-05, 8.103996515274048e-05, 8.781068027019501e-05, 9.458139538764954e-05, 0.00010135211050510406, 0.0001081228256225586]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 3.0, 3.0, 8.0, 10.0, 15.0, 18.0, 31.0, 54.0, 52.0, 102.0, 160.0, 307.0, 614.0, 1741.0, 6154.0, 79463.0, 926386.0, 27272.0, 3801.0, 1181.0, 500.0, 251.0, 145.0, 100.0, 63.0, 32.0, 21.0, 19.0, 17.0, 6.0, 8.0, 2.0, 9.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.34375, -0.3311767578125, -0.318603515625, -0.3060302734375, -0.29345703125, -0.2808837890625, -0.268310546875, -0.2557373046875, -0.2431640625, -0.2305908203125, -0.218017578125, -0.2054443359375, -0.19287109375, -0.1802978515625, -0.167724609375, -0.1551513671875, -0.142578125, -0.1300048828125, -0.117431640625, -0.1048583984375, -0.09228515625, -0.0797119140625, -0.067138671875, -0.0545654296875, -0.0419921875, -0.0294189453125, -0.016845703125, -0.0042724609375, 0.00830078125, 0.0208740234375, 0.033447265625, 0.0460205078125, 0.05859375, 0.0711669921875, 0.083740234375, 0.0963134765625, 0.10888671875, 0.1214599609375, 0.134033203125, 0.1466064453125, 0.1591796875, 0.1717529296875, 0.184326171875, 0.1968994140625, 0.20947265625, 0.2220458984375, 0.234619140625, 0.2471923828125, 0.259765625, 0.2723388671875, 0.284912109375, 0.2974853515625, 0.31005859375, 0.3226318359375, 0.335205078125, 0.3477783203125, 0.3603515625, 0.3729248046875, 0.385498046875, 0.3980712890625, 0.41064453125, 0.4232177734375, 0.435791015625, 0.4483642578125, 0.4609375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 6.0, 3.0, 5.0, 5.0, 13.0, 24.0, 41.0, 45.0, 114.0, 157.0, 195.0, 156.0, 83.0, 55.0, 34.0, 18.0, 14.0, 10.0, 5.0, 3.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.369140625, -0.35950279235839844, -0.3498649597167969, -0.3402271270751953, -0.33058929443359375, -0.3209514617919922, -0.3113136291503906, -0.30167579650878906, -0.2920379638671875, -0.28240013122558594, -0.2727622985839844, -0.2631244659423828, -0.25348663330078125, -0.2438488006591797, -0.23421096801757812, -0.22457313537597656, -0.214935302734375, -0.20529747009277344, -0.19565963745117188, -0.1860218048095703, -0.17638397216796875, -0.1667461395263672, -0.15710830688476562, -0.14747047424316406, -0.1378326416015625, -0.12819480895996094, -0.11855697631835938, -0.10891914367675781, -0.09928131103515625, -0.08964347839355469, -0.08000564575195312, -0.07036781311035156, -0.06072998046875, -0.05109214782714844, -0.041454315185546875, -0.03181648254394531, -0.02217864990234375, -0.012540817260742188, -0.002902984619140625, 0.0067348480224609375, 0.0163726806640625, 0.026010513305664062, 0.035648345947265625, 0.04528617858886719, 0.05492401123046875, 0.06456184387207031, 0.07419967651367188, 0.08383750915527344, 0.093475341796875, 0.10311317443847656, 0.11275100708007812, 0.12238883972167969, 0.13202667236328125, 0.1416645050048828, 0.15130233764648438, 0.16094017028808594, 0.1705780029296875, 0.18021583557128906, 0.18985366821289062, 0.1994915008544922, 0.20912933349609375, 0.2187671661376953, 0.22840499877929688, 0.23804283142089844, 0.2476806640625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 8.0, 15.0, 58.0, 157.0, 498.0, 190.0, 45.0, 19.0, 8.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.972320556640625, -10.694829940795898, -10.417340278625488, -10.139849662780762, -9.862359046936035, -9.584869384765625, -9.307378768920898, -9.029888153076172, -8.752397537231445, -8.474906921386719, -8.197417259216309, -7.919926643371582, -7.6424360275268555, -7.364945888519287, -7.087455749511719, -6.809965133666992, -6.532475471496582, -6.254985332489014, -5.977494716644287, -5.700004577636719, -5.422513961791992, -5.145023822784424, -4.8675336837768555, -4.590043067932129, -4.3125529289245605, -4.035062789916992, -3.7575721740722656, -3.4800820350646973, -3.20259165763855, -2.9251012802124023, -2.647611141204834, -2.3701207637786865, -2.0926294326782227, -1.8151390552520752, -1.5376487970352173, -1.2601585388183594, -0.9826681613922119, -0.7051777839660645, -0.42768752574920654, -0.15019726753234863, 0.12729310989379883, 0.4047834277153015, 0.6822737455368042, 0.9597640633583069, 1.2372543811798096, 1.514744758605957, 1.792235016822815, 2.069725275039673, 2.3472156524658203, 2.6247060298919678, 2.9021964073181152, 3.1796865463256836, 3.457176923751831, 3.7346673011779785, 4.012157440185547, 4.289648056030273, 4.567138195037842, 4.84462833404541, 5.122118949890137, 5.399609088897705, 5.677099227905273, 5.95458984375, 6.232079982757568, 6.509570121765137, 6.787060737609863]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 4.0, 3.0, 6.0, 7.0, 11.0, 2.0, 8.0, 14.0, 10.0, 18.0, 23.0, 16.0, 19.0, 18.0, 26.0, 30.0, 21.0, 27.0, 54.0, 64.0, 74.0, 86.0, 94.0, 55.0, 49.0, 27.0, 27.0, 22.0, 25.0, 16.0, 16.0, 19.0, 19.0, 11.0, 21.0, 10.0, 8.0, 6.0, 6.0, 5.0, 4.0, 6.0, 5.0, 4.0, 2.0, 0.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-2.8594861030578613, -2.7713756561279297, -2.683264970779419, -2.5951545238494873, -2.5070438385009766, -2.418933391571045, -2.3308229446411133, -2.2427124977111816, -2.154601812362671, -2.0664913654327393, -1.9783806800842285, -1.8902702331542969, -1.8021596670150757, -1.7140491008758545, -1.6259386539459229, -1.5378280878067017, -1.4497175216674805, -1.3616069555282593, -1.273496389389038, -1.1853859424591064, -1.0972753763198853, -1.009164810180664, -0.9210543036460876, -0.8329437971115112, -0.74483323097229, -0.6567226648330688, -0.5686121582984924, -0.48050162196159363, -0.3923910856246948, -0.304280549287796, -0.21617001295089722, -0.1280595064163208, -0.03994917869567871, 0.04816135764122009, 0.1362718939781189, 0.2243824303150177, 0.3124929666519165, 0.4006035029888153, 0.4887140393257141, 0.5768245458602905, 0.6649351119995117, 0.7530456781387329, 0.8411561846733093, 0.9292666912078857, 1.017377257347107, 1.1054878234863281, 1.1935982704162598, 1.281708836555481, 1.3698194026947021, 1.4579299688339233, 1.5460405349731445, 1.6341509819030762, 1.7222615480422974, 1.8103721141815186, 1.8984825611114502, 1.9865931272506714, 2.0747036933898926, 2.162814140319824, 2.250924825668335, 2.3390352725982666, 2.4271459579467773, 2.515256404876709, 2.6033668518066406, 2.6914772987365723, 2.779587984085083]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 3.0, 13.0, 8.0, 20.0, 22.0, 39.0, 51.0, 110.0, 126.0, 263.0, 462.0, 788.0, 1591.0, 3555.0, 9040.0, 28942.0, 136104.0, 1023603.0, 2419042.0, 469788.0, 71384.0, 18017.0, 5977.0, 2575.0, 1242.0, 623.0, 317.0, 235.0, 119.0, 72.0, 42.0, 37.0, 17.0, 23.0, 10.0, 9.0, 7.0, 3.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48486328125, -0.4693756103515625, -0.453887939453125, -0.4384002685546875, -0.42291259765625, -0.4074249267578125, -0.391937255859375, -0.3764495849609375, -0.3609619140625, -0.3454742431640625, -0.329986572265625, -0.3144989013671875, -0.29901123046875, -0.2835235595703125, -0.268035888671875, -0.2525482177734375, -0.237060546875, -0.2215728759765625, -0.206085205078125, -0.1905975341796875, -0.17510986328125, -0.1596221923828125, -0.144134521484375, -0.1286468505859375, -0.1131591796875, -0.0976715087890625, -0.082183837890625, -0.0666961669921875, -0.05120849609375, -0.0357208251953125, -0.020233154296875, -0.0047454833984375, 0.0107421875, 0.0262298583984375, 0.041717529296875, 0.0572052001953125, 0.07269287109375, 0.0881805419921875, 0.103668212890625, 0.1191558837890625, 0.1346435546875, 0.1501312255859375, 0.165618896484375, 0.1811065673828125, 0.19659423828125, 0.2120819091796875, 0.227569580078125, 0.2430572509765625, 0.258544921875, 0.2740325927734375, 0.289520263671875, 0.3050079345703125, 0.32049560546875, 0.3359832763671875, 0.351470947265625, 0.3669586181640625, 0.3824462890625, 0.3979339599609375, 0.413421630859375, 0.4289093017578125, 0.44439697265625, 0.4598846435546875, 0.475372314453125, 0.4908599853515625, 0.50634765625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 6.0, 7.0, 6.0, 16.0, 9.0, 11.0, 20.0, 19.0, 15.0, 43.0, 33.0, 35.0, 41.0, 37.0, 51.0, 59.0, 48.0, 60.0, 60.0, 62.0, 53.0, 44.0, 49.0, 38.0, 29.0, 25.0, 24.0, 28.0, 21.0, 16.0, 10.0, 10.0, 3.0, 6.0, 1.0, 5.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.281494140625, -0.2739696502685547, -0.2664451599121094, -0.25892066955566406, -0.25139617919921875, -0.24387168884277344, -0.23634719848632812, -0.2288227081298828, -0.2212982177734375, -0.2137737274169922, -0.20624923706054688, -0.19872474670410156, -0.19120025634765625, -0.18367576599121094, -0.17615127563476562, -0.1686267852783203, -0.161102294921875, -0.1535778045654297, -0.14605331420898438, -0.13852882385253906, -0.13100433349609375, -0.12347984313964844, -0.11595535278320312, -0.10843086242675781, -0.1009063720703125, -0.09338188171386719, -0.08585739135742188, -0.07833290100097656, -0.07080841064453125, -0.06328392028808594, -0.055759429931640625, -0.04823493957519531, -0.04071044921875, -0.03318595886230469, -0.025661468505859375, -0.018136978149414062, -0.01061248779296875, -0.0030879974365234375, 0.004436492919921875, 0.011960983276367188, 0.0194854736328125, 0.027009963989257812, 0.034534454345703125, 0.04205894470214844, 0.04958343505859375, 0.05710792541503906, 0.06463241577148438, 0.07215690612792969, 0.079681396484375, 0.08720588684082031, 0.09473037719726562, 0.10225486755371094, 0.10977935791015625, 0.11730384826660156, 0.12482833862304688, 0.1323528289794922, 0.1398773193359375, 0.1474018096923828, 0.15492630004882812, 0.16245079040527344, 0.16997528076171875, 0.17749977111816406, 0.18502426147460938, 0.1925487518310547, 0.2000732421875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 6.0, 4.0, 11.0, 15.0, 27.0, 59.0, 111.0, 325.0, 1256.0, 23576.0, 4160329.0, 7361.0, 791.0, 223.0, 100.0, 38.0, 26.0, 11.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.37890625, -5.24566650390625, -5.1124267578125, -4.97918701171875, -4.845947265625, -4.71270751953125, -4.5794677734375, -4.44622802734375, -4.31298828125, -4.17974853515625, -4.0465087890625, -3.91326904296875, -3.780029296875, -3.64678955078125, -3.5135498046875, -3.38031005859375, -3.2470703125, -3.11383056640625, -2.9805908203125, -2.84735107421875, -2.714111328125, -2.58087158203125, -2.4476318359375, -2.31439208984375, -2.18115234375, -2.04791259765625, -1.9146728515625, -1.78143310546875, -1.648193359375, -1.51495361328125, -1.3817138671875, -1.24847412109375, -1.115234375, -0.98199462890625, -0.8487548828125, -0.71551513671875, -0.582275390625, -0.44903564453125, -0.3157958984375, -0.18255615234375, -0.04931640625, 0.08392333984375, 0.2171630859375, 0.35040283203125, 0.483642578125, 0.61688232421875, 0.7501220703125, 0.88336181640625, 1.0166015625, 1.14984130859375, 1.2830810546875, 1.41632080078125, 1.549560546875, 1.68280029296875, 1.8160400390625, 1.94927978515625, 2.08251953125, 2.21575927734375, 2.3489990234375, 2.48223876953125, 2.615478515625, 2.74871826171875, 2.8819580078125, 3.01519775390625, 3.1484375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 1.0, 4.0, 6.0, 5.0, 16.0, 31.0, 45.0, 92.0, 155.0, 259.0, 503.0, 954.0, 968.0, 497.0, 224.0, 148.0, 59.0, 45.0, 26.0, 11.0, 11.0, 10.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.154296875, -1.1131134033203125, -1.071929931640625, -1.0307464599609375, -0.98956298828125, -0.9483795166015625, -0.907196044921875, -0.8660125732421875, -0.8248291015625, -0.7836456298828125, -0.742462158203125, -0.7012786865234375, -0.66009521484375, -0.6189117431640625, -0.577728271484375, -0.5365447998046875, -0.495361328125, -0.4541778564453125, -0.412994384765625, -0.3718109130859375, -0.33062744140625, -0.2894439697265625, -0.248260498046875, -0.2070770263671875, -0.1658935546875, -0.1247100830078125, -0.083526611328125, -0.0423431396484375, -0.00115966796875, 0.0400238037109375, 0.081207275390625, 0.1223907470703125, 0.16357421875, 0.2047576904296875, 0.245941162109375, 0.2871246337890625, 0.32830810546875, 0.3694915771484375, 0.410675048828125, 0.4518585205078125, 0.4930419921875, 0.5342254638671875, 0.575408935546875, 0.6165924072265625, 0.65777587890625, 0.6989593505859375, 0.740142822265625, 0.7813262939453125, 0.822509765625, 0.8636932373046875, 0.904876708984375, 0.9460601806640625, 0.98724365234375, 1.0284271240234375, 1.069610595703125, 1.1107940673828125, 1.1519775390625, 1.1931610107421875, 1.234344482421875, 1.2755279541015625, 1.31671142578125, 1.3578948974609375, 1.399078369140625, 1.4402618408203125, 1.4814453125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 2.0, 15.0, 50.0, 236.0, 466.0, 171.0, 41.0, 14.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.747618675231934, -11.972113609313965, -11.196608543395996, -10.421104431152344, -9.645599365234375, -8.870094299316406, -8.094589233398438, -7.319084167480469, -6.5435791015625, -5.768074035644531, -4.9925689697265625, -4.217064380645752, -3.441559314727783, -2.6660542488098145, -1.890549659729004, -1.1150445938110352, -0.3395395278930664, 0.4359654188156128, 1.211470365524292, 1.9869751930236816, 2.7624802589416504, 3.537985324859619, 4.31348991394043, 5.088994979858398, 5.864500045776367, 6.640005111694336, 7.415510177612305, 8.191015243530273, 8.966520309448242, 9.742025375366211, 10.517529487609863, 11.293034553527832, 12.068538665771484, 12.844043731689453, 13.619548797607422, 14.39505386352539, 15.17055892944336, 15.946063995361328, 16.721569061279297, 17.497074127197266, 18.272579193115234, 19.048084259033203, 19.823589324951172, 20.59909439086914, 21.37459945678711, 22.150104522705078, 22.925609588623047, 23.701114654541016, 24.47661781311035, 25.25212287902832, 26.02762794494629, 26.803133010864258, 27.578638076782227, 28.354143142700195, 29.12964630126953, 29.9051513671875, 30.68065643310547, 31.456161499023438, 32.231666564941406, 33.007171630859375, 33.782676696777344, 34.55818176269531, 35.33368682861328, 36.10919189453125, 36.88469696044922]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 1.0, 6.0, 9.0, 10.0, 9.0, 15.0, 13.0, 14.0, 17.0, 21.0, 38.0, 36.0, 41.0, 38.0, 43.0, 42.0, 61.0, 76.0, 59.0, 50.0, 47.0, 48.0, 49.0, 40.0, 33.0, 31.0, 33.0, 22.0, 20.0, 18.0, 9.0, 13.0, 11.0, 10.0, 6.0, 6.0, 6.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.924989700317383, -3.778637170791626, -3.632284641265869, -3.485931873321533, -3.3395793437957764, -3.1932268142700195, -3.0468740463256836, -2.9005215167999268, -2.75416898727417, -2.607816457748413, -2.4614639282226562, -2.3151111602783203, -2.1687586307525635, -2.0224061012268066, -1.8760534524917603, -1.7297008037567139, -1.583348274230957, -1.4369957447052002, -1.2906430959701538, -1.1442904472351074, -0.9979379177093506, -0.851585328578949, -0.7052327394485474, -0.558880090713501, -0.41252756118774414, -0.26617497205734253, -0.11982238292694092, 0.026530206203460693, 0.1728827953338623, 0.3192353844642639, 0.4655879735946655, 0.6119406223297119, 0.7582931518554688, 0.9046457409858704, 1.050998330116272, 1.1973509788513184, 1.3437035083770752, 1.490056037902832, 1.6364086866378784, 1.7827613353729248, 1.9291138648986816, 2.0754663944244385, 2.2218189239501953, 2.3681716918945312, 2.514524221420288, 2.660876750946045, 2.807229518890381, 2.9535820484161377, 3.0999345779418945, 3.2462871074676514, 3.392639636993408, 3.538992404937744, 3.685344934463501, 3.831697463989258, 3.9780502319335938, 4.12440299987793, 4.270755290985107, 4.417108058929443, 4.563460350036621, 4.709813117980957, 4.856165885925293, 5.002518177032471, 5.148870944976807, 5.295223236083984, 5.44157600402832]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 11.0, 8.0, 8.0, 7.0, 16.0, 16.0, 19.0, 34.0, 45.0, 104.0, 305.0, 1134.0, 5583.0, 46435.0, 811663.0, 166800.0, 13263.0, 2161.0, 538.0, 180.0, 73.0, 48.0, 22.0, 13.0, 16.0, 8.0, 9.0, 5.0, 9.0, 9.0, 2.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.068359375, -1.0400390625, -1.01171875, -0.9833984375, -0.955078125, -0.9267578125, -0.8984375, -0.8701171875, -0.841796875, -0.8134765625, -0.78515625, -0.7568359375, -0.728515625, -0.7001953125, -0.671875, -0.6435546875, -0.615234375, -0.5869140625, -0.55859375, -0.5302734375, -0.501953125, -0.4736328125, -0.4453125, -0.4169921875, -0.388671875, -0.3603515625, -0.33203125, -0.3037109375, -0.275390625, -0.2470703125, -0.21875, -0.1904296875, -0.162109375, -0.1337890625, -0.10546875, -0.0771484375, -0.048828125, -0.0205078125, 0.0078125, 0.0361328125, 0.064453125, 0.0927734375, 0.12109375, 0.1494140625, 0.177734375, 0.2060546875, 0.234375, 0.2626953125, 0.291015625, 0.3193359375, 0.34765625, 0.3759765625, 0.404296875, 0.4326171875, 0.4609375, 0.4892578125, 0.517578125, 0.5458984375, 0.57421875, 0.6025390625, 0.630859375, 0.6591796875, 0.6875, 0.7158203125, 0.744140625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 10.0, 12.0, 29.0, 40.0, 77.0, 96.0, 151.0, 156.0, 144.0, 122.0, 75.0, 47.0, 27.0, 11.0, 11.0, 3.0, 1.0, 7.0], "bins": [-1.677734375, -1.6464385986328125, -1.615142822265625, -1.5838470458984375, -1.55255126953125, -1.5212554931640625, -1.489959716796875, -1.4586639404296875, -1.4273681640625, -1.3960723876953125, -1.364776611328125, -1.3334808349609375, -1.30218505859375, -1.2708892822265625, -1.239593505859375, -1.2082977294921875, -1.177001953125, -1.1457061767578125, -1.114410400390625, -1.0831146240234375, -1.05181884765625, -1.0205230712890625, -0.989227294921875, -0.9579315185546875, -0.9266357421875, -0.8953399658203125, -0.864044189453125, -0.8327484130859375, -0.80145263671875, -0.7701568603515625, -0.738861083984375, -0.7075653076171875, -0.67626953125, -0.6449737548828125, -0.613677978515625, -0.5823822021484375, -0.55108642578125, -0.5197906494140625, -0.488494873046875, -0.4571990966796875, -0.4259033203125, -0.3946075439453125, -0.363311767578125, -0.3320159912109375, -0.30072021484375, -0.2694244384765625, -0.238128662109375, -0.2068328857421875, -0.175537109375, -0.1442413330078125, -0.112945556640625, -0.0816497802734375, -0.05035400390625, -0.0190582275390625, 0.012237548828125, 0.0435333251953125, 0.0748291015625, 0.1061248779296875, 0.137420654296875, 0.1687164306640625, 0.20001220703125, 0.2313079833984375, 0.262603759765625, 0.2938995361328125, 0.3251953125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 9.0, 10.0, 16.0, 25.0, 35.0, 59.0, 79.0, 178.0, 316.0, 761.0, 2056.0, 7994.0, 61268.0, 908799.0, 55750.0, 7774.0, 1943.0, 723.0, 297.0, 184.0, 105.0, 63.0, 41.0, 19.0, 18.0, 7.0, 5.0, 7.0, 6.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58544921875, -0.5624771118164062, -0.5395050048828125, -0.5165328979492188, -0.493560791015625, -0.47058868408203125, -0.4476165771484375, -0.42464447021484375, -0.40167236328125, -0.37870025634765625, -0.3557281494140625, -0.33275604248046875, -0.309783935546875, -0.28681182861328125, -0.2638397216796875, -0.24086761474609375, -0.2178955078125, -0.19492340087890625, -0.1719512939453125, -0.14897918701171875, -0.126007080078125, -0.10303497314453125, -0.0800628662109375, -0.05709075927734375, -0.03411865234375, -0.01114654541015625, 0.0118255615234375, 0.03479766845703125, 0.057769775390625, 0.08074188232421875, 0.1037139892578125, 0.12668609619140625, 0.149658203125, 0.17263031005859375, 0.1956024169921875, 0.21857452392578125, 0.241546630859375, 0.26451873779296875, 0.2874908447265625, 0.31046295166015625, 0.33343505859375, 0.35640716552734375, 0.3793792724609375, 0.40235137939453125, 0.425323486328125, 0.44829559326171875, 0.4712677001953125, 0.49423980712890625, 0.5172119140625, 0.5401840209960938, 0.5631561279296875, 0.5861282348632812, 0.609100341796875, 0.6320724487304688, 0.6550445556640625, 0.6780166625976562, 0.70098876953125, 0.7239608764648438, 0.7469329833984375, 0.7699050903320312, 0.792877197265625, 0.8158493041992188, 0.8388214111328125, 0.8617935180664062, 0.884765625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 5.0, 7.0, 6.0, 9.0, 12.0, 6.0, 11.0, 18.0, 13.0, 10.0, 27.0, 23.0, 21.0, 29.0, 44.0, 37.0, 49.0, 64.0, 65.0, 86.0, 72.0, 73.0, 52.0, 54.0, 33.0, 25.0, 27.0, 21.0, 20.0, 12.0, 9.0, 17.0, 10.0, 7.0, 5.0, 5.0, 4.0, 5.0, 1.0, 4.0, 4.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.423828125, -1.3787384033203125, -1.333648681640625, -1.2885589599609375, -1.24346923828125, -1.1983795166015625, -1.153289794921875, -1.1082000732421875, -1.0631103515625, -1.0180206298828125, -0.972930908203125, -0.9278411865234375, -0.88275146484375, -0.8376617431640625, -0.792572021484375, -0.7474822998046875, -0.702392578125, -0.6573028564453125, -0.612213134765625, -0.5671234130859375, -0.52203369140625, -0.4769439697265625, -0.431854248046875, -0.3867645263671875, -0.3416748046875, -0.2965850830078125, -0.251495361328125, -0.2064056396484375, -0.16131591796875, -0.1162261962890625, -0.071136474609375, -0.0260467529296875, 0.01904296875, 0.0641326904296875, 0.109222412109375, 0.1543121337890625, 0.19940185546875, 0.2444915771484375, 0.289581298828125, 0.3346710205078125, 0.3797607421875, 0.4248504638671875, 0.469940185546875, 0.5150299072265625, 0.56011962890625, 0.6052093505859375, 0.650299072265625, 0.6953887939453125, 0.740478515625, 0.7855682373046875, 0.830657958984375, 0.8757476806640625, 0.92083740234375, 0.9659271240234375, 1.011016845703125, 1.0561065673828125, 1.1011962890625, 1.1462860107421875, 1.191375732421875, 1.2364654541015625, 1.28155517578125, 1.3266448974609375, 1.371734619140625, 1.4168243408203125, 1.4619140625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 5.0, 8.0, 9.0, 5.0, 9.0, 16.0, 22.0, 37.0, 46.0, 89.0, 162.0, 294.0, 657.0, 1486.0, 4189.0, 16307.0, 113123.0, 854329.0, 44253.0, 8934.0, 2565.0, 1004.0, 462.0, 214.0, 120.0, 68.0, 46.0, 25.0, 17.0, 22.0, 13.0, 4.0, 3.0, 3.0, 4.0, 1.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1439208984375, -0.13916969299316406, -0.13441848754882812, -0.1296672821044922, -0.12491607666015625, -0.12016487121582031, -0.11541366577148438, -0.11066246032714844, -0.1059112548828125, -0.10116004943847656, -0.09640884399414062, -0.09165763854980469, -0.08690643310546875, -0.08215522766113281, -0.07740402221679688, -0.07265281677246094, -0.067901611328125, -0.06315040588378906, -0.058399200439453125, -0.05364799499511719, -0.04889678955078125, -0.04414558410644531, -0.039394378662109375, -0.03464317321777344, -0.0298919677734375, -0.025140762329101562, -0.020389556884765625, -0.015638351440429688, -0.01088714599609375, -0.0061359405517578125, -0.001384735107421875, 0.0033664703369140625, 0.00811767578125, 0.012868881225585938, 0.017620086669921875, 0.022371292114257812, 0.02712249755859375, 0.03187370300292969, 0.036624908447265625, 0.04137611389160156, 0.0461273193359375, 0.05087852478027344, 0.055629730224609375, 0.06038093566894531, 0.06513214111328125, 0.06988334655761719, 0.07463455200195312, 0.07938575744628906, 0.084136962890625, 0.08888816833496094, 0.09363937377929688, 0.09839057922363281, 0.10314178466796875, 0.10789299011230469, 0.11264419555664062, 0.11739540100097656, 0.1221466064453125, 0.12689781188964844, 0.13164901733398438, 0.1364002227783203, 0.14115142822265625, 0.1459026336669922, 0.15065383911132812, 0.15540504455566406, 0.16015625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 5.0, 10.0, 3.0, 10.0, 7.0, 7.0, 6.0, 13.0, 21.0, 20.0, 35.0, 30.0, 49.0, 59.0, 80.0, 115.0, 103.0, 91.0, 79.0, 63.0, 45.0, 26.0, 23.0, 15.0, 12.0, 20.0, 10.0, 6.0, 6.0, 10.0, 4.0, 6.0, 5.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.9981136322021484e-05, -2.895388752222061e-05, -2.792663872241974e-05, -2.6899389922618866e-05, -2.5872141122817993e-05, -2.484489232301712e-05, -2.3817643523216248e-05, -2.2790394723415375e-05, -2.1763145923614502e-05, -2.073589712381363e-05, -1.9708648324012756e-05, -1.8681399524211884e-05, -1.765415072441101e-05, -1.6626901924610138e-05, -1.5599653124809265e-05, -1.4572404325008392e-05, -1.354515552520752e-05, -1.2517906725406647e-05, -1.1490657925605774e-05, -1.0463409125804901e-05, -9.436160326004028e-06, -8.408911526203156e-06, -7.381662726402283e-06, -6.35441392660141e-06, -5.327165126800537e-06, -4.299916326999664e-06, -3.2726675271987915e-06, -2.2454187273979187e-06, -1.218169927597046e-06, -1.909211277961731e-07, 8.363276720046997e-07, 1.8635764718055725e-06, 2.8908252716064453e-06, 3.918074071407318e-06, 4.945322871208191e-06, 5.972571671009064e-06, 6.9998204708099365e-06, 8.02706927061081e-06, 9.054318070411682e-06, 1.0081566870212555e-05, 1.1108815670013428e-05, 1.21360644698143e-05, 1.3163313269615173e-05, 1.4190562069416046e-05, 1.5217810869216919e-05, 1.6245059669017792e-05, 1.7272308468818665e-05, 1.8299557268619537e-05, 1.932680606842041e-05, 2.0354054868221283e-05, 2.1381303668022156e-05, 2.240855246782303e-05, 2.34358012676239e-05, 2.4463050067424774e-05, 2.5490298867225647e-05, 2.651754766702652e-05, 2.7544796466827393e-05, 2.8572045266628265e-05, 2.9599294066429138e-05, 3.062654286623001e-05, 3.1653791666030884e-05, 3.2681040465831757e-05, 3.370828926563263e-05, 3.47355380654335e-05, 3.5762786865234375e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 6.0, 3.0, 13.0, 11.0, 18.0, 20.0, 41.0, 96.0, 184.0, 451.0, 1779.0, 9885.0, 168127.0, 848172.0, 16293.0, 2450.0, 614.0, 192.0, 75.0, 49.0, 27.0, 15.0, 9.0, 11.0, 6.0, 3.0, 0.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.259521484375, -0.2509040832519531, -0.24228668212890625, -0.23366928100585938, -0.2250518798828125, -0.21643447875976562, -0.20781707763671875, -0.19919967651367188, -0.190582275390625, -0.18196487426757812, -0.17334747314453125, -0.16473007202148438, -0.1561126708984375, -0.14749526977539062, -0.13887786865234375, -0.13026046752929688, -0.12164306640625, -0.11302566528320312, -0.10440826416015625, -0.09579086303710938, -0.0871734619140625, -0.07855606079101562, -0.06993865966796875, -0.061321258544921875, -0.052703857421875, -0.044086456298828125, -0.03546905517578125, -0.026851654052734375, -0.0182342529296875, -0.009616851806640625, -0.00099945068359375, 0.007617950439453125, 0.0162353515625, 0.024852752685546875, 0.03347015380859375, 0.042087554931640625, 0.0507049560546875, 0.059322357177734375, 0.06793975830078125, 0.07655715942382812, 0.085174560546875, 0.09379196166992188, 0.10240936279296875, 0.11102676391601562, 0.1196441650390625, 0.12826156616210938, 0.13687896728515625, 0.14549636840820312, 0.15411376953125, 0.16273117065429688, 0.17134857177734375, 0.17996597290039062, 0.1885833740234375, 0.19720077514648438, 0.20581817626953125, 0.21443557739257812, 0.223052978515625, 0.23167037963867188, 0.24028778076171875, 0.24890518188476562, 0.2575225830078125, 0.2661399841308594, 0.27475738525390625, 0.2833747863769531, 0.2919921875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 4.0, 4.0, 6.0, 5.0, 3.0, 5.0, 4.0, 9.0, 9.0, 25.0, 25.0, 20.0, 37.0, 41.0, 43.0, 52.0, 64.0, 83.0, 81.0, 88.0, 85.0, 60.0, 60.0, 33.0, 36.0, 34.0, 19.0, 16.0, 12.0, 7.0, 14.0, 5.0, 8.0, 4.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1654052734375, -0.16049575805664062, -0.15558624267578125, -0.15067672729492188, -0.1457672119140625, -0.14085769653320312, -0.13594818115234375, -0.13103866577148438, -0.126129150390625, -0.12121963500976562, -0.11631011962890625, -0.11140060424804688, -0.1064910888671875, -0.10158157348632812, -0.09667205810546875, -0.09176254272460938, -0.08685302734375, -0.08194351196289062, -0.07703399658203125, -0.07212448120117188, -0.0672149658203125, -0.062305450439453125, -0.05739593505859375, -0.052486419677734375, -0.047576904296875, -0.042667388916015625, -0.03775787353515625, -0.032848358154296875, -0.0279388427734375, -0.023029327392578125, -0.01811981201171875, -0.013210296630859375, -0.00830078125, -0.003391265869140625, 0.00151824951171875, 0.006427764892578125, 0.0113372802734375, 0.016246795654296875, 0.02115631103515625, 0.026065826416015625, 0.030975341796875, 0.035884857177734375, 0.04079437255859375, 0.045703887939453125, 0.0506134033203125, 0.055522918701171875, 0.06043243408203125, 0.06534194946289062, 0.07025146484375, 0.07516098022460938, 0.08007049560546875, 0.08498001098632812, 0.0898895263671875, 0.09479904174804688, 0.09970855712890625, 0.10461807250976562, 0.109527587890625, 0.11443710327148438, 0.11934661865234375, 0.12425613403320312, 0.1291656494140625, 0.13407516479492188, 0.13898468017578125, 0.14389419555664062, 0.1488037109375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 2.0, 1.0, 2.0, 4.0, 5.0, 10.0, 4.0, 18.0, 35.0, 51.0, 82.0, 327.0, 262.0, 76.0, 51.0, 30.0, 16.0, 12.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.079756736755371, -3.922390937805176, -3.7650251388549805, -3.607659339904785, -3.45029354095459, -3.2929277420043945, -3.135561943054199, -2.978196144104004, -2.8208303451538086, -2.6634645462036133, -2.506098747253418, -2.3487329483032227, -2.1913671493530273, -2.034001350402832, -1.8766355514526367, -1.7192697525024414, -1.561903953552246, -1.4045381546020508, -1.2471723556518555, -1.0898065567016602, -0.9324407577514648, -0.7750749588012695, -0.6177091598510742, -0.4603433609008789, -0.3029775619506836, -0.14561176300048828, 0.011754035949707031, 0.16911983489990234, 0.32648563385009766, 0.48385143280029297, 0.6412172317504883, 0.7985830307006836, 0.9559488296508789, 1.1133146286010742, 1.2706804275512695, 1.4280462265014648, 1.5854120254516602, 1.7427778244018555, 1.9001436233520508, 2.057509422302246, 2.2148752212524414, 2.3722410202026367, 2.529606819152832, 2.6869726181030273, 2.8443384170532227, 3.001704216003418, 3.1590700149536133, 3.3164358139038086, 3.473801612854004, 3.631167411804199, 3.7885332107543945, 3.94589900970459, 4.103264808654785, 4.2606306076049805, 4.417996406555176, 4.575362205505371, 4.732728004455566, 4.890093803405762, 5.047459602355957, 5.204825401306152, 5.362191200256348, 5.519556999206543, 5.676922798156738, 5.834288597106934, 5.991654396057129]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 7.0, 6.0, 5.0, 12.0, 6.0, 9.0, 9.0, 16.0, 12.0, 14.0, 22.0, 13.0, 21.0, 22.0, 27.0, 65.0, 95.0, 114.0, 109.0, 90.0, 84.0, 47.0, 18.0, 20.0, 23.0, 18.0, 20.0, 13.0, 12.0, 7.0, 7.0, 13.0, 5.0, 6.0, 4.0, 4.0, 1.0, 5.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-3.4178333282470703, -3.3118650913238525, -3.205897092819214, -3.099928855895996, -2.9939608573913574, -2.8879926204681396, -2.782024383544922, -2.676056385040283, -2.5700881481170654, -2.4641199111938477, -2.358151912689209, -2.252183675765991, -2.1462154388427734, -2.0402474403381348, -1.934279203414917, -1.8283110857009888, -1.7223429679870605, -1.6163748502731323, -1.510406732559204, -1.4044384956359863, -1.298470377922058, -1.1925022602081299, -1.086534023284912, -0.9805659055709839, -0.8745977878570557, -0.7686296701431274, -0.6626614928245544, -0.5566933155059814, -0.4507251977920532, -0.344757080078125, -0.238788902759552, -0.132820725440979, -0.026852846145629883, 0.07911530137062073, 0.18508344888687134, 0.29105159640312195, 0.39701974391937256, 0.5029878616333008, 0.6089560389518738, 0.7149242162704468, 0.820892333984375, 0.9268604516983032, 1.0328285694122314, 1.1387968063354492, 1.2447649240493774, 1.3507330417633057, 1.4567012786865234, 1.5626693964004517, 1.6686375141143799, 1.774605631828308, 1.8805737495422363, 1.986541986465454, 2.092510223388672, 2.1984782218933105, 2.3044464588165283, 2.410414695739746, 2.5163826942443848, 2.6223509311676025, 2.728318929672241, 2.834287166595459, 2.9402551651000977, 3.0462234020233154, 3.152191638946533, 3.258159637451172, 3.3641278743743896]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 6.0, 9.0, 6.0, 4.0, 9.0, 17.0, 11.0, 18.0, 19.0, 37.0, 35.0, 43.0, 40.0, 65.0, 139.0, 196.0, 84.0, 41.0, 39.0, 38.0, 36.0, 25.0, 13.0, 17.0, 18.0, 14.0, 7.0, 4.0, 3.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.49169921875, -0.477691650390625, -0.46368408203125, -0.449676513671875, -0.4356689453125, -0.421661376953125, -0.40765380859375, -0.393646240234375, -0.379638671875, -0.365631103515625, -0.35162353515625, -0.337615966796875, -0.3236083984375, -0.309600830078125, -0.29559326171875, -0.281585693359375, -0.267578125, -0.253570556640625, -0.23956298828125, -0.225555419921875, -0.2115478515625, -0.197540283203125, -0.18353271484375, -0.169525146484375, -0.155517578125, -0.141510009765625, -0.12750244140625, -0.113494873046875, -0.0994873046875, -0.085479736328125, -0.07147216796875, -0.057464599609375, -0.04345703125, -0.029449462890625, -0.01544189453125, -0.001434326171875, 0.0125732421875, 0.026580810546875, 0.04058837890625, 0.054595947265625, 0.068603515625, 0.082611083984375, 0.09661865234375, 0.110626220703125, 0.1246337890625, 0.138641357421875, 0.15264892578125, 0.166656494140625, 0.1806640625, 0.194671630859375, 0.20867919921875, 0.222686767578125, 0.2366943359375, 0.250701904296875, 0.26470947265625, 0.278717041015625, 0.292724609375, 0.306732177734375, 0.32073974609375, 0.334747314453125, 0.3487548828125, 0.362762451171875, 0.37677001953125, 0.390777587890625, 0.40478515625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 7.0, 4.0, 5.0, 3.0, 5.0, 1.0, 6.0, 5.0, 8.0, 6.0, 9.0, 7.0, 11.0, 26.0, 45.0, 57.0, 88.0, 162.0, 277.0, 567.0, 1209.0, 3033.0, 11080.0, 801048.0, 7553075.0, 11709.0, 3495.0, 1338.0, 585.0, 259.0, 135.0, 86.0, 60.0, 50.0, 37.0, 27.0, 19.0, 9.0, 2.0, 5.0, 12.0, 5.0, 8.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0], "bins": [-1.5678791999816895, -1.51895010471344, -1.4700210094451904, -1.4210920333862305, -1.372162938117981, -1.3232338428497314, -1.274304747581482, -1.2253756523132324, -1.1764466762542725, -1.127517580986023, -1.0785884857177734, -1.0296595096588135, -0.980730414390564, -0.9318013191223145, -0.8828722238540649, -0.8339431285858154, -0.7850140333175659, -0.7360849380493164, -0.6871559023857117, -0.6382268071174622, -0.5892977714538574, -0.5403686761856079, -0.4914395809173584, -0.4425105154514313, -0.39358144998550415, -0.344652384519577, -0.2957233190536499, -0.2467942237854004, -0.19786515831947327, -0.14893609285354614, -0.10000699758529663, -0.05107793211936951, -0.002148747444152832, 0.04678032547235489, 0.09570939838886261, 0.14463847875595093, 0.19356754422187805, 0.24249660968780518, 0.2914257049560547, 0.3403547704219818, 0.38928383588790894, 0.43821290135383606, 0.4871419668197632, 0.5360710620880127, 0.5850001573562622, 0.6339291930198669, 0.6828582882881165, 0.7317873239517212, 0.7807164192199707, 0.8296455144882202, 0.878574550151825, 0.9275036454200745, 0.9764326810836792, 1.0253617763519287, 1.0742908716201782, 1.1232199668884277, 1.1721489429473877, 1.2210780382156372, 1.2700071334838867, 1.3189361095428467, 1.3678652048110962, 1.4167943000793457, 1.4657233953475952, 1.5146524906158447, 1.5635815858840942]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 4.0, 6.0, 3.0, 13.0, 4.0, 6.0, 7.0, 5.0, 9.0, 5.0, 11.0, 7.0, 10.0, 4.0, 3.0, 1.0, 5.0, 3.0, 2.0, 1.0, 1.0], "bins": [-10.238897323608398, -10.036127090454102, -9.833356857299805, -9.630587577819824, -9.427817344665527, -9.22504711151123, -9.022276878356934, -8.819507598876953, -8.616737365722656, -8.41396713256836, -8.211196899414062, -8.008427619934082, -7.805657386779785, -7.602887153625488, -7.400116920471191, -7.197347164154053, -6.994576930999756, -6.791806697845459, -6.58903694152832, -6.386266708374023, -6.183496952056885, -5.980726718902588, -5.777956962585449, -5.575186729431152, -5.3724164962768555, -5.169646263122559, -4.96687650680542, -4.764106273651123, -4.561336517333984, -4.3585662841796875, -4.155796051025391, -3.953026294708252, -3.7502570152282715, -3.5474870204925537, -3.344717025756836, -3.141946792602539, -2.9391770362854004, -2.7364068031311035, -2.5336368083953857, -2.330866813659668, -2.12809681892395, -1.9253268241882324, -1.7225568294525146, -1.5197867155075073, -1.3170167207717896, -1.1142467260360718, -0.9114766120910645, -0.7087066173553467, -0.5059366226196289, -0.30316659808158875, -0.10039657354354858, 0.10237348079681396, 0.30514347553253174, 0.5079134702682495, 0.7106835842132568, 0.9134535789489746, 1.1162235736846924, 1.3189935684204102, 1.521763563156128, 1.7245336771011353, 1.927303671836853, 2.1300735473632812, 2.332843780517578, 2.535613775253296, 2.7383837699890137]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 4.0, 3.0, 1.0, 4.0, 6.0, 5.0, 9.0, 5.0, 24.0, 12.0, 30.0, 35.0, 44.0, 43.0, 70.0, 78.0, 64.0, 60.0, 69.0, 71.0, 73.0, 58.0, 49.0, 49.0, 34.0, 26.0, 13.0, 18.0, 10.0, 11.0, 8.0, 6.0, 6.0, 4.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3134765625, -0.3018646240234375, -0.290252685546875, -0.2786407470703125, -0.26702880859375, -0.2554168701171875, -0.243804931640625, -0.2321929931640625, -0.2205810546875, -0.2089691162109375, -0.197357177734375, -0.1857452392578125, -0.17413330078125, -0.1625213623046875, -0.150909423828125, -0.1392974853515625, -0.127685546875, -0.1160736083984375, -0.104461669921875, -0.0928497314453125, -0.08123779296875, -0.0696258544921875, -0.058013916015625, -0.0464019775390625, -0.0347900390625, -0.0231781005859375, -0.011566162109375, 4.57763671875e-05, 0.01165771484375, 0.0232696533203125, 0.034881591796875, 0.0464935302734375, 0.05810546875, 0.0697174072265625, 0.081329345703125, 0.0929412841796875, 0.10455322265625, 0.1161651611328125, 0.127777099609375, 0.1393890380859375, 0.1510009765625, 0.1626129150390625, 0.174224853515625, 0.1858367919921875, 0.19744873046875, 0.2090606689453125, 0.220672607421875, 0.2322845458984375, 0.243896484375, 0.2555084228515625, 0.267120361328125, 0.2787322998046875, 0.29034423828125, 0.3019561767578125, 0.313568115234375, 0.3251800537109375, 0.3367919921875, 0.3484039306640625, 0.360015869140625, 0.3716278076171875, 0.38323974609375, 0.3948516845703125, 0.406463623046875, 0.4180755615234375, 0.4296875]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 6.0, 10.0, 16.0, 20.0, 29.0, 39.0, 69.0, 112.0, 159.0, 238.0, 419.0, 719.0, 1420.0, 2874.0, 6284.0, 15060.0, 39028.0, 102712.0, 182009.0, 105552.0, 39658.0, 15596.0, 6461.0, 2862.0, 1368.0, 700.0, 320.0, 194.0, 113.0, 80.0, 50.0, 21.0, 22.0, 16.0, 3.0, 5.0, 4.0, 4.0, 6.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.59765625, -1.551361083984375, -1.50506591796875, -1.458770751953125, -1.4124755859375, -1.366180419921875, -1.31988525390625, -1.273590087890625, -1.227294921875, -1.180999755859375, -1.13470458984375, -1.088409423828125, -1.0421142578125, -0.995819091796875, -0.94952392578125, -0.903228759765625, -0.85693359375, -0.810638427734375, -0.76434326171875, -0.718048095703125, -0.6717529296875, -0.625457763671875, -0.57916259765625, -0.532867431640625, -0.486572265625, -0.440277099609375, -0.39398193359375, -0.347686767578125, -0.3013916015625, -0.255096435546875, -0.20880126953125, -0.162506103515625, -0.1162109375, -0.069915771484375, -0.02362060546875, 0.022674560546875, 0.0689697265625, 0.115264892578125, 0.16156005859375, 0.207855224609375, 0.254150390625, 0.300445556640625, 0.34674072265625, 0.393035888671875, 0.4393310546875, 0.485626220703125, 0.53192138671875, 0.578216552734375, 0.62451171875, 0.670806884765625, 0.71710205078125, 0.763397216796875, 0.8096923828125, 0.855987548828125, 0.90228271484375, 0.948577880859375, 0.994873046875, 1.041168212890625, 1.08746337890625, 1.133758544921875, 1.1800537109375, 1.226348876953125, 1.27264404296875, 1.318939208984375, 1.365234375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 3.0, 5.0, 8.0, 4.0, 6.0, 10.0, 6.0, 8.0, 11.0, 17.0, 16.0, 20.0, 25.0, 25.0, 45.0, 35.0, 31.0, 52.0, 50.0, 59.0, 52.0, 55.0, 60.0, 45.0, 54.0, 49.0, 34.0, 33.0, 38.0, 32.0, 23.0, 19.0, 10.0, 8.0, 12.0, 11.0, 4.0, 6.0, 3.0, 3.0, 5.0, 2.0, 3.0, 3.0, 2.0, 0.0, 3.0], "bins": [-0.27734375, -0.2700366973876953, -0.2627296447753906, -0.25542259216308594, -0.24811553955078125, -0.24080848693847656, -0.23350143432617188, -0.2261943817138672, -0.2188873291015625, -0.2115802764892578, -0.20427322387695312, -0.19696617126464844, -0.18965911865234375, -0.18235206604003906, -0.17504501342773438, -0.1677379608154297, -0.160430908203125, -0.1531238555908203, -0.14581680297851562, -0.13850975036621094, -0.13120269775390625, -0.12389564514160156, -0.11658859252929688, -0.10928153991699219, -0.1019744873046875, -0.09466743469238281, -0.08736038208007812, -0.08005332946777344, -0.07274627685546875, -0.06543922424316406, -0.058132171630859375, -0.05082511901855469, -0.04351806640625, -0.03621101379394531, -0.028903961181640625, -0.021596908569335938, -0.01428985595703125, -0.0069828033447265625, 0.000324249267578125, 0.0076313018798828125, 0.0149383544921875, 0.022245407104492188, 0.029552459716796875, 0.03685951232910156, 0.04416656494140625, 0.05147361755371094, 0.058780670166015625, 0.06608772277832031, 0.073394775390625, 0.08070182800292969, 0.08800888061523438, 0.09531593322753906, 0.10262298583984375, 0.10993003845214844, 0.11723709106445312, 0.12454414367675781, 0.1318511962890625, 0.1391582489013672, 0.14646530151367188, 0.15377235412597656, 0.16107940673828125, 0.16838645935058594, 0.17569351196289062, 0.1830005645751953, 0.1903076171875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 5.0, 8.0, 4.0, 8.0, 11.0, 12.0, 11.0, 31.0, 44.0, 76.0, 100.0, 82.0, 44.0, 23.0, 10.0, 3.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5849573612213135, -2.513430595397949, -2.441904067993164, -2.3703773021698, -2.2988505363464355, -2.2273240089416504, -2.155797243118286, -2.084270477294922, -2.0127439498901367, -1.941217303276062, -1.8696905374526978, -1.798163890838623, -1.7266372442245483, -1.6551105976104736, -1.5835838317871094, -1.5120571851730347, -1.4405304193496704, -1.3690037727355957, -1.2974770069122314, -1.2259503602981567, -1.154423713684082, -1.0828969478607178, -1.011370301246643, -0.9398436546325684, -0.8683169484138489, -0.7967902421951294, -0.7252635955810547, -0.6537368893623352, -0.5822101831436157, -0.510683536529541, -0.43915683031082153, -0.3676301836967468, -0.2961033582687378, -0.2245766818523407, -0.1530499905347824, -0.08152329921722412, -0.009996622800827026, 0.06153005361557007, 0.13305675983428955, 0.20458340644836426, 0.27611011266708374, 0.34763678908348083, 0.41916346549987793, 0.4906901717185974, 0.5622168779373169, 0.6337435245513916, 0.7052702307701111, 0.7767968773841858, 0.8483235836029053, 0.9198502898216248, 0.9913769364356995, 1.062903642654419, 1.1344302892684937, 1.2059569358825684, 1.2774837017059326, 1.3490103483200073, 1.420536994934082, 1.4920636415481567, 1.563590407371521, 1.6351170539855957, 1.7066437005996704, 1.7781703472137451, 1.8496971130371094, 1.921223759651184, 1.9927505254745483]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 5.0, 4.0, 1.0, 5.0, 6.0, 4.0, 4.0, 4.0, 4.0, 3.0, 8.0, 19.0, 28.0, 50.0, 77.0, 65.0, 59.0, 44.0, 16.0, 17.0, 15.0, 6.0, 7.0, 9.0, 5.0, 1.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0], "bins": [-1.6058992147445679, -1.5647358894348145, -1.5235724449157715, -1.482409119606018, -1.4412457942962646, -1.4000824689865112, -1.3589191436767578, -1.3177556991577148, -1.2765923738479614, -1.235429048538208, -1.194265604019165, -1.1531022787094116, -1.1119389533996582, -1.0707756280899048, -1.0296123027801514, -0.9884488582611084, -0.947285532951355, -0.9061222076416016, -0.8649588227272034, -0.8237954378128052, -0.7826321125030518, -0.7414687871932983, -0.7003054022789001, -0.659142017364502, -0.6179786920547485, -0.5768153667449951, -0.5356519818305969, -0.4944886267185211, -0.4533252716064453, -0.4121619164943695, -0.3709985613822937, -0.3298352062702179, -0.28867197036743164, -0.24750861525535583, -0.20634526014328003, -0.16518190503120422, -0.12401854991912842, -0.08285519480705261, -0.04169183969497681, -0.000528484582901001, 0.040634870529174805, 0.08179822564125061, 0.12296158075332642, 0.16412493586540222, 0.20528829097747803, 0.24645164608955383, 0.28761500120162964, 0.32877835631370544, 0.36994171142578125, 0.41110506653785706, 0.45226842164993286, 0.49343177676200867, 0.5345951318740845, 0.5757584571838379, 0.6169218420982361, 0.6580852270126343, 0.6992485523223877, 0.7404118776321411, 0.7815752625465393, 0.8227386474609375, 0.8639019727706909, 0.9050652980804443, 0.9462286829948425, 0.9873920679092407, 1.0285553932189941]}, "eval/loss": 0.32257843017578125, "eval/wer": 0.09236414121380404, "eval/runtime": 558.1846, "eval/samples_per_second": 4.733, "eval/steps_per_second": 0.593, "train/train_runtime": 26664.6603, "train/train_samples_per_second": 5.351, "train/train_steps_per_second": 0.084, "train/total_flos": 0.0, "train/train_loss": 1.6266609489166015} \ No newline at end of file +{"train/loss": 0.0607, "train/learning_rate": 6.936416184971098e-07, "train/epoch": 5.0, "train/global_step": 2230, "_runtime": 27450, "_timestamp": 1648082204, "_step": 2235, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 9.0, 68.0, 378.0, 461.0, 73.0, 23.0, 5.0], "bins": [-18.02739143371582, -17.72731590270996, -17.4272403717041, -17.127166748046875, -16.827091217041016, -16.527015686035156, -16.226940155029297, -15.926865577697754, -15.626791000366211, -15.326715469360352, -15.026640892028809, -14.72656536102295, -14.426490783691406, -14.126415252685547, -13.826340675354004, -13.526265144348145, -13.226189613342285, -12.926114082336426, -12.626039505004883, -12.325963973999023, -12.02588939666748, -11.725813865661621, -11.425739288330078, -11.125663757324219, -10.82558822631836, -10.5255126953125, -10.225438117980957, -9.925362586975098, -9.625288009643555, -9.325212478637695, -9.025137901306152, -8.725062370300293, -8.42498779296875, -8.12491226196289, -7.824837684631348, -7.5247626304626465, -7.224687576293945, -6.924612045288086, -6.624536991119385, -6.324461936950684, -6.024386882781982, -5.724311828613281, -5.42423677444458, -5.124161720275879, -4.8240861892700195, -4.524011611938477, -4.223936080932617, -3.923861026763916, -3.623785972595215, -3.3237109184265137, -3.0236358642578125, -2.7235605716705322, -2.423485517501831, -2.12341046333313, -1.8233352899551392, -1.5232601165771484, -1.2231850624084473, -0.9231099486351013, -0.6230348348617554, -0.3229597210884094, -0.022884607315063477, 0.2771904468536377, 0.5772656202316284, 0.8773407936096191, 1.1774158477783203]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 5.0, 5.0, 4.0, 11.0, 14.0, 14.0, 20.0, 26.0, 20.0, 29.0, 30.0, 47.0, 41.0, 36.0, 27.0, 36.0, 39.0, 42.0, 64.0, 43.0, 57.0, 43.0, 37.0, 54.0, 40.0, 31.0, 31.0, 27.0, 24.0, 22.0, 22.0, 21.0, 7.0, 10.0, 10.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.5585064888000488, -1.5144308805465698, -1.4703552722930908, -1.4262796640396118, -1.3822040557861328, -1.3381283283233643, -1.2940528392791748, -1.2499771118164062, -1.2059015035629272, -1.1618258953094482, -1.1177502870559692, -1.0736746788024902, -1.0295990705490112, -0.9855234026908875, -0.9414477944374084, -0.8973721265792847, -0.8532965779304504, -0.8092209696769714, -0.7651453614234924, -0.7210696935653687, -0.6769940853118896, -0.6329184770584106, -0.5888428688049316, -0.5447672605514526, -0.5006916522979736, -0.45661604404449463, -0.41254040598869324, -0.36846479773521423, -0.32438915967941284, -0.28031355142593384, -0.23623794317245483, -0.19216230511665344, -0.14808666706085205, -0.10401104390621185, -0.05993542820215225, -0.01585981249809265, 0.028215810656547546, 0.07229143381118774, 0.11636704206466675, 0.16044268012046814, 0.20451828837394714, 0.24859391152858734, 0.29266953468322754, 0.33674514293670654, 0.38082075119018555, 0.42489638924598694, 0.46897199749946594, 0.5130476355552673, 0.5571232438087463, 0.6011988520622253, 0.6452744603157043, 0.6893501281738281, 0.7334257364273071, 0.7775013446807861, 0.8215769529342651, 0.8656525611877441, 0.9097281694412231, 0.9538037776947021, 0.9978793859481812, 1.0419549942016602, 1.0860306024551392, 1.1301062107086182, 1.1741819381713867, 1.2182575464248657, 1.2623331546783447]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 3.0, 2.0, 5.0, 3.0, 5.0, 15.0, 18.0, 25.0, 39.0, 64.0, 77.0, 122.0, 168.0, 265.0, 409.0, 597.0, 977.0, 1516.0, 2377.0, 3912.0, 7508.0, 26892.0, 350221.0, 3272449.0, 467680.0, 39875.0, 8556.0, 4066.0, 2386.0, 1466.0, 911.0, 571.0, 376.0, 238.0, 168.0, 115.0, 81.0, 39.0, 27.0, 22.0, 20.0, 7.0, 7.0, 2.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.64453125, -4.497314453125, -4.35009765625, -4.202880859375, -4.0556640625, -3.908447265625, -3.76123046875, -3.614013671875, -3.466796875, -3.319580078125, -3.17236328125, -3.025146484375, -2.8779296875, -2.730712890625, -2.58349609375, -2.436279296875, -2.2890625, -2.141845703125, -1.99462890625, -1.847412109375, -1.7001953125, -1.552978515625, -1.40576171875, -1.258544921875, -1.111328125, -0.964111328125, -0.81689453125, -0.669677734375, -0.5224609375, -0.375244140625, -0.22802734375, -0.080810546875, 0.06640625, 0.213623046875, 0.36083984375, 0.508056640625, 0.6552734375, 0.802490234375, 0.94970703125, 1.096923828125, 1.244140625, 1.391357421875, 1.53857421875, 1.685791015625, 1.8330078125, 1.980224609375, 2.12744140625, 2.274658203125, 2.421875, 2.569091796875, 2.71630859375, 2.863525390625, 3.0107421875, 3.157958984375, 3.30517578125, 3.452392578125, 3.599609375, 3.746826171875, 3.89404296875, 4.041259765625, 4.1884765625, 4.335693359375, 4.48291015625, 4.630126953125, 4.77734375]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 5.0, 6.0, 4.0, 8.0, 8.0, 12.0, 9.0, 15.0, 17.0, 23.0, 21.0, 27.0, 31.0, 29.0, 33.0, 34.0, 27.0, 40.0, 35.0, 35.0, 55.0, 54.0, 52.0, 42.0, 45.0, 38.0, 34.0, 50.0, 24.0, 26.0, 26.0, 29.0, 12.0, 17.0, 22.0, 13.0, 6.0, 10.0, 7.0, 10.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0], "bins": [-2.458984375, -2.390777587890625, -2.32257080078125, -2.254364013671875, -2.1861572265625, -2.117950439453125, -2.04974365234375, -1.981536865234375, -1.913330078125, -1.845123291015625, -1.77691650390625, -1.708709716796875, -1.6405029296875, -1.572296142578125, -1.50408935546875, -1.435882568359375, -1.36767578125, -1.299468994140625, -1.23126220703125, -1.163055419921875, -1.0948486328125, -1.026641845703125, -0.95843505859375, -0.890228271484375, -0.822021484375, -0.753814697265625, -0.68560791015625, -0.617401123046875, -0.5491943359375, -0.480987548828125, -0.41278076171875, -0.344573974609375, -0.2763671875, -0.208160400390625, -0.13995361328125, -0.071746826171875, -0.0035400390625, 0.064666748046875, 0.13287353515625, 0.201080322265625, 0.269287109375, 0.337493896484375, 0.40570068359375, 0.473907470703125, 0.5421142578125, 0.610321044921875, 0.67852783203125, 0.746734619140625, 0.81494140625, 0.883148193359375, 0.95135498046875, 1.019561767578125, 1.0877685546875, 1.155975341796875, 1.22418212890625, 1.292388916015625, 1.360595703125, 1.428802490234375, 1.49700927734375, 1.565216064453125, 1.6334228515625, 1.701629638671875, 1.76983642578125, 1.838043212890625, 1.90625]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 5.0, 7.0, 10.0, 21.0, 21.0, 29.0, 86.0, 312.0, 6910.0, 4183939.0, 2593.0, 203.0, 59.0, 28.0, 21.0, 15.0, 9.0, 3.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-51.5, -50.001953125, -48.50390625, -47.005859375, -45.5078125, -44.009765625, -42.51171875, -41.013671875, -39.515625, -38.017578125, -36.51953125, -35.021484375, -33.5234375, -32.025390625, -30.52734375, -29.029296875, -27.53125, -26.033203125, -24.53515625, -23.037109375, -21.5390625, -20.041015625, -18.54296875, -17.044921875, -15.546875, -14.048828125, -12.55078125, -11.052734375, -9.5546875, -8.056640625, -6.55859375, -5.060546875, -3.5625, -2.064453125, -0.56640625, 0.931640625, 2.4296875, 3.927734375, 5.42578125, 6.923828125, 8.421875, 9.919921875, 11.41796875, 12.916015625, 14.4140625, 15.912109375, 17.41015625, 18.908203125, 20.40625, 21.904296875, 23.40234375, 24.900390625, 26.3984375, 27.896484375, 29.39453125, 30.892578125, 32.390625, 33.888671875, 35.38671875, 36.884765625, 38.3828125, 39.880859375, 41.37890625, 42.876953125, 44.375]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 8.0, 9.0, 20.0, 16.0, 29.0, 66.0, 144.0, 864.0, 2344.0, 370.0, 80.0, 45.0, 16.0, 23.0, 14.0, 7.0, 5.0, 4.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.607421875, -2.533538818359375, -2.45965576171875, -2.385772705078125, -2.3118896484375, -2.238006591796875, -2.16412353515625, -2.090240478515625, -2.016357421875, -1.942474365234375, -1.86859130859375, -1.794708251953125, -1.7208251953125, -1.646942138671875, -1.57305908203125, -1.499176025390625, -1.42529296875, -1.351409912109375, -1.27752685546875, -1.203643798828125, -1.1297607421875, -1.055877685546875, -0.98199462890625, -0.908111572265625, -0.834228515625, -0.760345458984375, -0.68646240234375, -0.612579345703125, -0.5386962890625, -0.464813232421875, -0.39093017578125, -0.317047119140625, -0.2431640625, -0.169281005859375, -0.09539794921875, -0.021514892578125, 0.0523681640625, 0.126251220703125, 0.20013427734375, 0.274017333984375, 0.347900390625, 0.421783447265625, 0.49566650390625, 0.569549560546875, 0.6434326171875, 0.717315673828125, 0.79119873046875, 0.865081787109375, 0.93896484375, 1.012847900390625, 1.08673095703125, 1.160614013671875, 1.2344970703125, 1.308380126953125, 1.38226318359375, 1.456146240234375, 1.530029296875, 1.603912353515625, 1.67779541015625, 1.751678466796875, 1.8255615234375, 1.899444580078125, 1.97332763671875, 2.047210693359375, 2.12109375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 5.0, 7.0, 6.0, 2.0, 4.0, 8.0, 13.0, 14.0, 20.0, 23.0, 24.0, 29.0, 54.0, 62.0, 87.0, 85.0, 102.0, 96.0, 86.0, 60.0, 49.0, 35.0, 28.0, 20.0, 25.0, 10.0, 12.0, 6.0, 5.0, 8.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.95149827003479, -2.8608500957489014, -2.7702019214630127, -2.679553985595703, -2.5889058113098145, -2.498257637023926, -2.407609462738037, -2.3169612884521484, -2.2263131141662598, -2.135664939880371, -2.0450167655944824, -1.9543687105178833, -1.8637206554412842, -1.7730724811553955, -1.6824243068695068, -1.5917761325836182, -1.5011281967163086, -1.41048002243042, -1.3198319673538208, -1.2291837930679321, -1.138535737991333, -1.0478875637054443, -0.9572393894195557, -0.8665912747383118, -0.7759431600570679, -0.685295045375824, -0.5946469306945801, -0.5039987564086914, -0.4133506417274475, -0.3227025270462036, -0.23205435276031494, -0.14140623807907104, -0.05075812339782715, 0.03989000618457794, 0.13053813576698303, 0.22118628025054932, 0.3118343949317932, 0.4024825096130371, 0.4931306838989258, 0.5837787985801697, 0.6744269132614136, 0.7650750279426575, 0.8557231426239014, 0.94637131690979, 1.0370194911956787, 1.1276675462722778, 1.2183157205581665, 1.3089637756347656, 1.3996119499206543, 1.490260124206543, 1.580908179283142, 1.6715563535690308, 1.7622044086456299, 1.8528525829315186, 1.9435007572174072, 2.034148931503296, 2.1247968673706055, 2.215445041656494, 2.306093215942383, 2.3967413902282715, 2.487389326095581, 2.5780375003814697, 2.6686856746673584, 2.759333848953247, 2.8499820232391357]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 5.0, 4.0, 4.0, 1.0, 5.0, 9.0, 6.0, 12.0, 13.0, 15.0, 19.0, 20.0, 22.0, 32.0, 32.0, 28.0, 35.0, 31.0, 33.0, 36.0, 44.0, 40.0, 29.0, 58.0, 43.0, 46.0, 36.0, 34.0, 40.0, 33.0, 30.0, 26.0, 21.0, 26.0, 20.0, 18.0, 20.0, 18.0, 9.0, 15.0, 8.0, 10.0, 7.0, 3.0, 5.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.039533853530884, -1.9769076108932495, -1.9142814874649048, -1.8516552448272705, -1.7890291213989258, -1.7264028787612915, -1.6637766361236572, -1.6011505126953125, -1.5385242700576782, -1.475898027420044, -1.4132719039916992, -1.350645661354065, -1.2880194187164307, -1.225393295288086, -1.1627670526504517, -1.1001408100128174, -1.0375146865844727, -0.9748885035514832, -0.9122623205184937, -0.8496360778808594, -0.7870098948478699, -0.7243837118148804, -0.6617574691772461, -0.5991312861442566, -0.5365051031112671, -0.4738789200782776, -0.4112527072429657, -0.3486264944076538, -0.2860003113746643, -0.2233741283416748, -0.16074791550636292, -0.09812170267105103, -0.03549528121948242, 0.027130916714668274, 0.08975711464881897, 0.15238331258296967, 0.21500951051712036, 0.27763569355010986, 0.34026190638542175, 0.40288811922073364, 0.46551430225372314, 0.5281404852867126, 0.5907666683197021, 0.6533929109573364, 0.7160190939903259, 0.7786452770233154, 0.8412715196609497, 0.9038977026939392, 0.9665238857269287, 1.029150128364563, 1.0917762517929077, 1.154402494430542, 1.2170286178588867, 1.279654860496521, 1.3422811031341553, 1.4049072265625, 1.4675334692001343, 1.5301597118377686, 1.5927858352661133, 1.6554120779037476, 1.7180383205413818, 1.7806644439697266, 1.8432906866073608, 1.9059169292449951, 1.9685430526733398]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 8.0, 8.0, 13.0, 12.0, 19.0, 36.0, 41.0, 56.0, 86.0, 116.0, 169.0, 263.0, 363.0, 556.0, 840.0, 1318.0, 2252.0, 3521.0, 6272.0, 11190.0, 21637.0, 44246.0, 99651.0, 244308.0, 335984.0, 148025.0, 63239.0, 29368.0, 14888.0, 8000.0, 4501.0, 2753.0, 1727.0, 1051.0, 682.0, 442.0, 298.0, 176.0, 135.0, 94.0, 63.0, 46.0, 39.0, 23.0, 16.0, 11.0, 11.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.708984375, -0.6876449584960938, -0.6663055419921875, -0.6449661254882812, -0.623626708984375, -0.6022872924804688, -0.5809478759765625, -0.5596084594726562, -0.53826904296875, -0.5169296264648438, -0.4955902099609375, -0.47425079345703125, -0.452911376953125, -0.43157196044921875, -0.4102325439453125, -0.38889312744140625, -0.3675537109375, -0.34621429443359375, -0.3248748779296875, -0.30353546142578125, -0.282196044921875, -0.26085662841796875, -0.2395172119140625, -0.21817779541015625, -0.19683837890625, -0.17549896240234375, -0.1541595458984375, -0.13282012939453125, -0.111480712890625, -0.09014129638671875, -0.0688018798828125, -0.04746246337890625, -0.026123046875, -0.00478363037109375, 0.0165557861328125, 0.03789520263671875, 0.059234619140625, 0.08057403564453125, 0.1019134521484375, 0.12325286865234375, 0.14459228515625, 0.16593170166015625, 0.1872711181640625, 0.20861053466796875, 0.229949951171875, 0.25128936767578125, 0.2726287841796875, 0.29396820068359375, 0.3153076171875, 0.33664703369140625, 0.3579864501953125, 0.37932586669921875, 0.400665283203125, 0.42200469970703125, 0.4433441162109375, 0.46468353271484375, 0.48602294921875, 0.5073623657226562, 0.5287017822265625, 0.5500411987304688, 0.571380615234375, 0.5927200317382812, 0.6140594482421875, 0.6353988647460938, 0.65673828125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 3.0, 2.0, 4.0, 6.0, 7.0, 22.0, 9.0, 18.0, 14.0, 19.0, 39.0, 32.0, 31.0, 30.0, 41.0, 42.0, 52.0, 53.0, 45.0, 48.0, 65.0, 56.0, 41.0, 54.0, 32.0, 40.0, 24.0, 37.0, 10.0, 19.0, 18.0, 17.0, 16.0, 18.0, 12.0, 5.0, 9.0, 4.0, 1.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8525390625, -1.7936248779296875, -1.734710693359375, -1.6757965087890625, -1.61688232421875, -1.5579681396484375, -1.499053955078125, -1.4401397705078125, -1.3812255859375, -1.3223114013671875, -1.263397216796875, -1.2044830322265625, -1.14556884765625, -1.0866546630859375, -1.027740478515625, -0.9688262939453125, -0.909912109375, -0.8509979248046875, -0.792083740234375, -0.7331695556640625, -0.67425537109375, -0.6153411865234375, -0.556427001953125, -0.4975128173828125, -0.4385986328125, -0.3796844482421875, -0.320770263671875, -0.2618560791015625, -0.20294189453125, -0.1440277099609375, -0.085113525390625, -0.0261993408203125, 0.03271484375, 0.0916290283203125, 0.150543212890625, 0.2094573974609375, 0.26837158203125, 0.3272857666015625, 0.386199951171875, 0.4451141357421875, 0.5040283203125, 0.5629425048828125, 0.621856689453125, 0.6807708740234375, 0.73968505859375, 0.7985992431640625, 0.857513427734375, 0.9164276123046875, 0.975341796875, 1.0342559814453125, 1.093170166015625, 1.1520843505859375, 1.21099853515625, 1.2699127197265625, 1.328826904296875, 1.3877410888671875, 1.4466552734375, 1.5055694580078125, 1.564483642578125, 1.6233978271484375, 1.68231201171875, 1.7412261962890625, 1.800140380859375, 1.8590545654296875, 1.91796875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 2.0, 7.0, 5.0, 6.0, 5.0, 8.0, 14.0, 16.0, 34.0, 42.0, 48.0, 80.0, 104.0, 115.0, 207.0, 283.0, 366.0, 585.0, 890.0, 1314.0, 2122.0, 3317.0, 5547.0, 10256.0, 21772.0, 56196.0, 187567.0, 465487.0, 187973.0, 56884.0, 21818.0, 10281.0, 5666.0, 3281.0, 2050.0, 1350.0, 884.0, 591.0, 455.0, 271.0, 169.0, 132.0, 92.0, 66.0, 57.0, 36.0, 26.0, 27.0, 22.0, 8.0, 7.0, 8.0, 6.0, 6.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.70849609375, -0.6852645874023438, -0.6620330810546875, -0.6388015747070312, -0.615570068359375, -0.5923385620117188, -0.5691070556640625, -0.5458755493164062, -0.52264404296875, -0.49941253662109375, -0.4761810302734375, -0.45294952392578125, -0.429718017578125, -0.40648651123046875, -0.3832550048828125, -0.36002349853515625, -0.3367919921875, -0.31356048583984375, -0.2903289794921875, -0.26709747314453125, -0.243865966796875, -0.22063446044921875, -0.1974029541015625, -0.17417144775390625, -0.15093994140625, -0.12770843505859375, -0.1044769287109375, -0.08124542236328125, -0.058013916015625, -0.03478240966796875, -0.0115509033203125, 0.01168060302734375, 0.034912109375, 0.05814361572265625, 0.0813751220703125, 0.10460662841796875, 0.127838134765625, 0.15106964111328125, 0.1743011474609375, 0.19753265380859375, 0.22076416015625, 0.24399566650390625, 0.2672271728515625, 0.29045867919921875, 0.313690185546875, 0.33692169189453125, 0.3601531982421875, 0.38338470458984375, 0.4066162109375, 0.42984771728515625, 0.4530792236328125, 0.47631072998046875, 0.499542236328125, 0.5227737426757812, 0.5460052490234375, 0.5692367553710938, 0.59246826171875, 0.6156997680664062, 0.6389312744140625, 0.6621627807617188, 0.685394287109375, 0.7086257934570312, 0.7318572998046875, 0.7550888061523438, 0.7783203125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 1.0, 4.0, 6.0, 5.0, 7.0, 7.0, 6.0, 12.0, 12.0, 20.0, 16.0, 7.0, 22.0, 28.0, 39.0, 35.0, 30.0, 56.0, 34.0, 43.0, 49.0, 45.0, 39.0, 41.0, 43.0, 51.0, 32.0, 50.0, 40.0, 23.0, 25.0, 24.0, 27.0, 18.0, 9.0, 19.0, 11.0, 14.0, 12.0, 12.0, 4.0, 5.0, 7.0, 6.0, 6.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.44921875, -3.3392333984375, -3.229248046875, -3.1192626953125, -3.00927734375, -2.8992919921875, -2.789306640625, -2.6793212890625, -2.5693359375, -2.4593505859375, -2.349365234375, -2.2393798828125, -2.12939453125, -2.0194091796875, -1.909423828125, -1.7994384765625, -1.689453125, -1.5794677734375, -1.469482421875, -1.3594970703125, -1.24951171875, -1.1395263671875, -1.029541015625, -0.9195556640625, -0.8095703125, -0.6995849609375, -0.589599609375, -0.4796142578125, -0.36962890625, -0.2596435546875, -0.149658203125, -0.0396728515625, 0.0703125, 0.1802978515625, 0.290283203125, 0.4002685546875, 0.51025390625, 0.6202392578125, 0.730224609375, 0.8402099609375, 0.9501953125, 1.0601806640625, 1.170166015625, 1.2801513671875, 1.39013671875, 1.5001220703125, 1.610107421875, 1.7200927734375, 1.830078125, 1.9400634765625, 2.050048828125, 2.1600341796875, 2.27001953125, 2.3800048828125, 2.489990234375, 2.5999755859375, 2.7099609375, 2.8199462890625, 2.929931640625, 3.0399169921875, 3.14990234375, 3.2598876953125, 3.369873046875, 3.4798583984375, 3.58984375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 9.0, 5.0, 14.0, 18.0, 23.0, 37.0, 57.0, 74.0, 125.0, 217.0, 385.0, 715.0, 1460.0, 3476.0, 10271.0, 44002.0, 572482.0, 365937.0, 34546.0, 8662.0, 3029.0, 1363.0, 666.0, 366.0, 205.0, 133.0, 82.0, 61.0, 39.0, 29.0, 21.0, 17.0, 8.0, 6.0, 4.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.338134765625, -0.326446533203125, -0.31475830078125, -0.303070068359375, -0.2913818359375, -0.279693603515625, -0.26800537109375, -0.256317138671875, -0.24462890625, -0.232940673828125, -0.22125244140625, -0.209564208984375, -0.1978759765625, -0.186187744140625, -0.17449951171875, -0.162811279296875, -0.151123046875, -0.139434814453125, -0.12774658203125, -0.116058349609375, -0.1043701171875, -0.092681884765625, -0.08099365234375, -0.069305419921875, -0.0576171875, -0.045928955078125, -0.03424072265625, -0.022552490234375, -0.0108642578125, 0.000823974609375, 0.01251220703125, 0.024200439453125, 0.035888671875, 0.047576904296875, 0.05926513671875, 0.070953369140625, 0.0826416015625, 0.094329833984375, 0.10601806640625, 0.117706298828125, 0.12939453125, 0.141082763671875, 0.15277099609375, 0.164459228515625, 0.1761474609375, 0.187835693359375, 0.19952392578125, 0.211212158203125, 0.222900390625, 0.234588623046875, 0.24627685546875, 0.257965087890625, 0.2696533203125, 0.281341552734375, 0.29302978515625, 0.304718017578125, 0.31640625, 0.328094482421875, 0.33978271484375, 0.351470947265625, 0.3631591796875, 0.374847412109375, 0.38653564453125, 0.398223876953125, 0.409912109375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 3.0, 9.0, 3.0, 6.0, 10.0, 17.0, 14.0, 41.0, 69.0, 100.0, 209.0, 223.0, 124.0, 60.0, 39.0, 24.0, 12.0, 10.0, 10.0, 4.0, 6.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002739429473876953, -0.0002659037709236145, -0.0002578645944595337, -0.0002498254179954529, -0.00024178624153137207, -0.00023374706506729126, -0.00022570788860321045, -0.00021766871213912964, -0.00020962953567504883, -0.00020159035921096802, -0.0001935511827468872, -0.0001855120062828064, -0.00017747282981872559, -0.00016943365335464478, -0.00016139447689056396, -0.00015335530042648315, -0.00014531612396240234, -0.00013727694749832153, -0.00012923777103424072, -0.00012119859457015991, -0.0001131594181060791, -0.00010512024164199829, -9.708106517791748e-05, -8.904188871383667e-05, -8.100271224975586e-05, -7.296353578567505e-05, -6.492435932159424e-05, -5.688518285751343e-05, -4.884600639343262e-05, -4.080682992935181e-05, -3.2767653465270996e-05, -2.4728477001190186e-05, -1.6689300537109375e-05, -8.650124073028564e-06, -6.109476089477539e-07, 7.428228855133057e-06, 1.5467405319213867e-05, 2.3506581783294678e-05, 3.154575824737549e-05, 3.95849347114563e-05, 4.762411117553711e-05, 5.566328763961792e-05, 6.370246410369873e-05, 7.174164056777954e-05, 7.978081703186035e-05, 8.781999349594116e-05, 9.585916996002197e-05, 0.00010389834642410278, 0.0001119375228881836, 0.0001199766993522644, 0.00012801587581634521, 0.00013605505228042603, 0.00014409422874450684, 0.00015213340520858765, 0.00016017258167266846, 0.00016821175813674927, 0.00017625093460083008, 0.0001842901110649109, 0.0001923292875289917, 0.0002003684639930725, 0.00020840764045715332, 0.00021644681692123413, 0.00022448599338531494, 0.00023252516984939575, 0.00024056434631347656]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 5.0, 10.0, 6.0, 12.0, 27.0, 44.0, 101.0, 160.0, 367.0, 973.0, 2628.0, 9675.0, 47184.0, 656701.0, 291334.0, 29329.0, 6594.0, 2026.0, 759.0, 324.0, 131.0, 66.0, 35.0, 11.0, 12.0, 12.0, 10.0, 3.0, 6.0, 1.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.67333984375, -0.6534576416015625, -0.633575439453125, -0.6136932373046875, -0.59381103515625, -0.5739288330078125, -0.554046630859375, -0.5341644287109375, -0.5142822265625, -0.4944000244140625, -0.474517822265625, -0.4546356201171875, -0.43475341796875, -0.4148712158203125, -0.394989013671875, -0.3751068115234375, -0.355224609375, -0.3353424072265625, -0.315460205078125, -0.2955780029296875, -0.27569580078125, -0.2558135986328125, -0.235931396484375, -0.2160491943359375, -0.1961669921875, -0.1762847900390625, -0.156402587890625, -0.1365203857421875, -0.11663818359375, -0.0967559814453125, -0.076873779296875, -0.0569915771484375, -0.037109375, -0.0172271728515625, 0.002655029296875, 0.0225372314453125, 0.04241943359375, 0.0623016357421875, 0.082183837890625, 0.1020660400390625, 0.1219482421875, 0.1418304443359375, 0.161712646484375, 0.1815948486328125, 0.20147705078125, 0.2213592529296875, 0.241241455078125, 0.2611236572265625, 0.281005859375, 0.3008880615234375, 0.320770263671875, 0.3406524658203125, 0.36053466796875, 0.3804168701171875, 0.400299072265625, 0.4201812744140625, 0.4400634765625, 0.4599456787109375, 0.479827880859375, 0.4997100830078125, 0.51959228515625, 0.5394744873046875, 0.559356689453125, 0.5792388916015625, 0.59912109375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 1.0, 7.0, 5.0, 2.0, 4.0, 13.0, 18.0, 20.0, 29.0, 28.0, 34.0, 47.0, 67.0, 99.0, 104.0, 140.0, 93.0, 73.0, 52.0, 45.0, 26.0, 28.0, 10.0, 13.0, 8.0, 6.0, 7.0, 8.0, 3.0, 3.0, 2.0, 3.0, 1.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.137939453125, -0.13399505615234375, -0.1300506591796875, -0.12610626220703125, -0.122161865234375, -0.11821746826171875, -0.1142730712890625, -0.11032867431640625, -0.10638427734375, -0.10243988037109375, -0.0984954833984375, -0.09455108642578125, -0.090606689453125, -0.08666229248046875, -0.0827178955078125, -0.07877349853515625, -0.0748291015625, -0.07088470458984375, -0.0669403076171875, -0.06299591064453125, -0.059051513671875, -0.05510711669921875, -0.0511627197265625, -0.04721832275390625, -0.04327392578125, -0.03932952880859375, -0.0353851318359375, -0.03144073486328125, -0.027496337890625, -0.02355194091796875, -0.0196075439453125, -0.01566314697265625, -0.01171875, -0.00777435302734375, -0.0038299560546875, 0.00011444091796875, 0.004058837890625, 0.00800323486328125, 0.0119476318359375, 0.01589202880859375, 0.01983642578125, 0.02378082275390625, 0.0277252197265625, 0.03166961669921875, 0.035614013671875, 0.03955841064453125, 0.0435028076171875, 0.04744720458984375, 0.0513916015625, 0.05533599853515625, 0.0592803955078125, 0.06322479248046875, 0.067169189453125, 0.07111358642578125, 0.0750579833984375, 0.07900238037109375, 0.08294677734375, 0.08689117431640625, 0.0908355712890625, 0.09477996826171875, 0.098724365234375, 0.10266876220703125, 0.1066131591796875, 0.11055755615234375, 0.114501953125]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 9.0, 11.0, 11.0, 9.0, 12.0, 26.0, 34.0, 40.0, 72.0, 86.0, 120.0, 145.0, 113.0, 87.0, 56.0, 42.0, 36.0, 20.0, 17.0, 12.0, 7.0, 8.0, 7.0, 3.0, 3.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.930957317352295, -2.8432822227478027, -2.7556071281433105, -2.6679320335388184, -2.580256938934326, -2.492581844329834, -2.404906749725342, -2.3172316551208496, -2.2295565605163574, -2.1418814659118652, -2.054206371307373, -1.9665312767028809, -1.8788561820983887, -1.7911810874938965, -1.7035058736801147, -1.6158307790756226, -1.5281555652618408, -1.4404804706573486, -1.3528053760528564, -1.2651302814483643, -1.177455186843872, -1.0897800922393799, -1.0021048784255981, -0.914429783821106, -0.8267546892166138, -0.7390795946121216, -0.6514045000076294, -0.5637293457984924, -0.47605425119400024, -0.38837915658950806, -0.3007040023803711, -0.2130289077758789, -0.12535405158996582, -0.03767894208431244, 0.04999616742134094, 0.13767129182815552, 0.2253463864326477, 0.3130214810371399, 0.40069663524627686, 0.48837172985076904, 0.5760468244552612, 0.6637219190597534, 0.7513970136642456, 0.8390721678733826, 0.9267472624778748, 1.0144224166870117, 1.102097511291504, 1.189772605895996, 1.2774477005004883, 1.3651227951049805, 1.4527978897094727, 1.5404729843139648, 1.628148078918457, 1.7158231735229492, 1.803498387336731, 1.8911734819412231, 1.9788485765457153, 2.066523790359497, 2.1541988849639893, 2.2418739795684814, 2.3295490741729736, 2.417224168777466, 2.504899263381958, 2.59257435798645, 2.6802494525909424]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 5.0, 0.0, 1.0, 10.0, 3.0, 7.0, 14.0, 15.0, 20.0, 16.0, 24.0, 33.0, 26.0, 43.0, 31.0, 44.0, 41.0, 38.0, 47.0, 45.0, 64.0, 50.0, 49.0, 47.0, 42.0, 40.0, 38.0, 23.0, 31.0, 19.0, 18.0, 27.0, 22.0, 23.0, 13.0, 8.0, 5.0, 10.0, 1.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.7804385423660278, -1.7255982160568237, -1.67075777053833, -1.615917444229126, -1.5610769987106323, -1.5062366724014282, -1.4513962268829346, -1.3965559005737305, -1.3417155742645264, -1.2868752479553223, -1.2320348024368286, -1.1771944761276245, -1.1223540306091309, -1.0675137042999268, -1.0126733779907227, -0.957832932472229, -0.9029924869537354, -0.8481521010398865, -0.7933117151260376, -0.7384713888168335, -0.6836309432983398, -0.6287906169891357, -0.5739502310752869, -0.519109845161438, -0.4642694592475891, -0.40942907333374023, -0.35458868741989136, -0.29974833130836487, -0.244907945394516, -0.19006755948066711, -0.13522720336914062, -0.08038681745529175, -0.02554631233215332, 0.02929406613111496, 0.08413444459438324, 0.13897481560707092, 0.1938152015209198, 0.24865558743476868, 0.30349594354629517, 0.35833632946014404, 0.4131767153739929, 0.4680171012878418, 0.5228574872016907, 0.5776978731155396, 0.6325381994247437, 0.6873786449432373, 0.7422189712524414, 0.7970593571662903, 0.8518997430801392, 0.906740128993988, 0.9615805149078369, 1.016420841217041, 1.0712612867355347, 1.1261016130447388, 1.1809420585632324, 1.2357823848724365, 1.2906227111816406, 1.3454630374908447, 1.4003034830093384, 1.4551438093185425, 1.5099842548370361, 1.5648245811462402, 1.6196649074554443, 1.674505352973938, 1.7293457984924316]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 3.0, 5.0, 6.0, 9.0, 10.0, 17.0, 20.0, 28.0, 56.0, 58.0, 104.0, 147.0, 251.0, 434.0, 601.0, 1047.0, 1671.0, 2732.0, 4621.0, 7970.0, 15159.0, 34077.0, 167967.0, 690710.0, 69267.0, 24022.0, 11784.0, 6347.0, 3722.0, 2156.0, 1356.0, 808.0, 493.0, 323.0, 174.0, 141.0, 101.0, 47.0, 30.0, 22.0, 12.0, 14.0, 10.0, 9.0, 6.0, 3.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.21875, -2.152099609375, -2.08544921875, -2.018798828125, -1.9521484375, -1.885498046875, -1.81884765625, -1.752197265625, -1.685546875, -1.618896484375, -1.55224609375, -1.485595703125, -1.4189453125, -1.352294921875, -1.28564453125, -1.218994140625, -1.15234375, -1.085693359375, -1.01904296875, -0.952392578125, -0.8857421875, -0.819091796875, -0.75244140625, -0.685791015625, -0.619140625, -0.552490234375, -0.48583984375, -0.419189453125, -0.3525390625, -0.285888671875, -0.21923828125, -0.152587890625, -0.0859375, -0.019287109375, 0.04736328125, 0.114013671875, 0.1806640625, 0.247314453125, 0.31396484375, 0.380615234375, 0.447265625, 0.513916015625, 0.58056640625, 0.647216796875, 0.7138671875, 0.780517578125, 0.84716796875, 0.913818359375, 0.98046875, 1.047119140625, 1.11376953125, 1.180419921875, 1.2470703125, 1.313720703125, 1.38037109375, 1.447021484375, 1.513671875, 1.580322265625, 1.64697265625, 1.713623046875, 1.7802734375, 1.846923828125, 1.91357421875, 1.980224609375, 2.046875]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 5.0, 4.0, 2.0, 7.0, 7.0, 5.0, 9.0, 10.0, 12.0, 16.0, 15.0, 23.0, 23.0, 24.0, 17.0, 33.0, 40.0, 25.0, 27.0, 31.0, 54.0, 42.0, 51.0, 41.0, 51.0, 45.0, 37.0, 39.0, 40.0, 28.0, 26.0, 25.0, 24.0, 21.0, 22.0, 13.0, 28.0, 18.0, 16.0, 15.0, 6.0, 11.0, 2.0, 6.0, 5.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0], "bins": [-3.05859375, -2.9703369140625, -2.882080078125, -2.7938232421875, -2.70556640625, -2.6173095703125, -2.529052734375, -2.4407958984375, -2.3525390625, -2.2642822265625, -2.176025390625, -2.0877685546875, -1.99951171875, -1.9112548828125, -1.822998046875, -1.7347412109375, -1.646484375, -1.5582275390625, -1.469970703125, -1.3817138671875, -1.29345703125, -1.2052001953125, -1.116943359375, -1.0286865234375, -0.9404296875, -0.8521728515625, -0.763916015625, -0.6756591796875, -0.58740234375, -0.4991455078125, -0.410888671875, -0.3226318359375, -0.234375, -0.1461181640625, -0.057861328125, 0.0303955078125, 0.11865234375, 0.2069091796875, 0.295166015625, 0.3834228515625, 0.4716796875, 0.5599365234375, 0.648193359375, 0.7364501953125, 0.82470703125, 0.9129638671875, 1.001220703125, 1.0894775390625, 1.177734375, 1.2659912109375, 1.354248046875, 1.4425048828125, 1.53076171875, 1.6190185546875, 1.707275390625, 1.7955322265625, 1.8837890625, 1.9720458984375, 2.060302734375, 2.1485595703125, 2.23681640625, 2.3250732421875, 2.413330078125, 2.5015869140625, 2.58984375]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 7.0, 11.0, 20.0, 16.0, 17.0, 25.0, 38.0, 56.0, 72.0, 100.0, 123.0, 210.0, 323.0, 536.0, 907.0, 1728.0, 3448.0, 7046.0, 16164.0, 47933.0, 506600.0, 390783.0, 43192.0, 15279.0, 6607.0, 3126.0, 1684.0, 955.0, 544.0, 324.0, 219.0, 114.0, 88.0, 68.0, 49.0, 41.0, 23.0, 19.0, 13.0, 11.0, 11.0, 7.0, 3.0, 3.0, 1.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.21875, -2.1470947265625, -2.075439453125, -2.0037841796875, -1.93212890625, -1.8604736328125, -1.788818359375, -1.7171630859375, -1.6455078125, -1.5738525390625, -1.502197265625, -1.4305419921875, -1.35888671875, -1.2872314453125, -1.215576171875, -1.1439208984375, -1.072265625, -1.0006103515625, -0.928955078125, -0.8572998046875, -0.78564453125, -0.7139892578125, -0.642333984375, -0.5706787109375, -0.4990234375, -0.4273681640625, -0.355712890625, -0.2840576171875, -0.21240234375, -0.1407470703125, -0.069091796875, 0.0025634765625, 0.07421875, 0.1458740234375, 0.217529296875, 0.2891845703125, 0.36083984375, 0.4324951171875, 0.504150390625, 0.5758056640625, 0.6474609375, 0.7191162109375, 0.790771484375, 0.8624267578125, 0.93408203125, 1.0057373046875, 1.077392578125, 1.1490478515625, 1.220703125, 1.2923583984375, 1.364013671875, 1.4356689453125, 1.50732421875, 1.5789794921875, 1.650634765625, 1.7222900390625, 1.7939453125, 1.8656005859375, 1.937255859375, 2.0089111328125, 2.08056640625, 2.1522216796875, 2.223876953125, 2.2955322265625, 2.3671875]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 4.0, 6.0, 4.0, 5.0, 7.0, 12.0, 8.0, 13.0, 19.0, 9.0, 20.0, 15.0, 25.0, 37.0, 32.0, 30.0, 30.0, 45.0, 51.0, 35.0, 43.0, 42.0, 41.0, 53.0, 30.0, 36.0, 45.0, 33.0, 32.0, 25.0, 33.0, 22.0, 28.0, 25.0, 24.0, 16.0, 9.0, 7.0, 11.0, 15.0, 5.0, 6.0, 3.0, 4.0, 6.0, 3.0, 4.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.12890625, -3.03497314453125, -2.9410400390625, -2.84710693359375, -2.753173828125, -2.65924072265625, -2.5653076171875, -2.47137451171875, -2.37744140625, -2.28350830078125, -2.1895751953125, -2.09564208984375, -2.001708984375, -1.90777587890625, -1.8138427734375, -1.71990966796875, -1.6259765625, -1.53204345703125, -1.4381103515625, -1.34417724609375, -1.250244140625, -1.15631103515625, -1.0623779296875, -0.96844482421875, -0.87451171875, -0.78057861328125, -0.6866455078125, -0.59271240234375, -0.498779296875, -0.40484619140625, -0.3109130859375, -0.21697998046875, -0.123046875, -0.02911376953125, 0.0648193359375, 0.15875244140625, 0.252685546875, 0.34661865234375, 0.4405517578125, 0.53448486328125, 0.62841796875, 0.72235107421875, 0.8162841796875, 0.91021728515625, 1.004150390625, 1.09808349609375, 1.1920166015625, 1.28594970703125, 1.3798828125, 1.47381591796875, 1.5677490234375, 1.66168212890625, 1.755615234375, 1.84954833984375, 1.9434814453125, 2.03741455078125, 2.13134765625, 2.22528076171875, 2.3192138671875, 2.41314697265625, 2.507080078125, 2.60101318359375, 2.6949462890625, 2.78887939453125, 2.8828125]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 6.0, 5.0, 15.0, 18.0, 14.0, 24.0, 38.0, 58.0, 59.0, 97.0, 151.0, 253.0, 451.0, 800.0, 1596.0, 2942.0, 6542.0, 21353.0, 933773.0, 60981.0, 10562.0, 4107.0, 2112.0, 1085.0, 590.0, 333.0, 187.0, 114.0, 76.0, 54.0, 50.0, 36.0, 23.0, 15.0, 7.0, 7.0, 7.0, 4.0, 2.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.130859375, -2.065765380859375, -2.00067138671875, -1.935577392578125, -1.8704833984375, -1.805389404296875, -1.74029541015625, -1.675201416015625, -1.610107421875, -1.545013427734375, -1.47991943359375, -1.414825439453125, -1.3497314453125, -1.284637451171875, -1.21954345703125, -1.154449462890625, -1.08935546875, -1.024261474609375, -0.95916748046875, -0.894073486328125, -0.8289794921875, -0.763885498046875, -0.69879150390625, -0.633697509765625, -0.568603515625, -0.503509521484375, -0.43841552734375, -0.373321533203125, -0.3082275390625, -0.243133544921875, -0.17803955078125, -0.112945556640625, -0.0478515625, 0.017242431640625, 0.08233642578125, 0.147430419921875, 0.2125244140625, 0.277618408203125, 0.34271240234375, 0.407806396484375, 0.472900390625, 0.537994384765625, 0.60308837890625, 0.668182373046875, 0.7332763671875, 0.798370361328125, 0.86346435546875, 0.928558349609375, 0.99365234375, 1.058746337890625, 1.12384033203125, 1.188934326171875, 1.2540283203125, 1.319122314453125, 1.38421630859375, 1.449310302734375, 1.514404296875, 1.579498291015625, 1.64459228515625, 1.709686279296875, 1.7747802734375, 1.839874267578125, 1.90496826171875, 1.970062255859375, 2.03515625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 8.0, 3.0, 2.0, 8.0, 12.0, 46.0, 333.0, 500.0, 33.0, 16.0, 11.0, 7.0, 7.0, 2.0, 7.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000331878662109375, -0.00031444430351257324, -0.0002970099449157715, -0.0002795755863189697, -0.00026214122772216797, -0.0002447068691253662, -0.00022727251052856445, -0.0002098381519317627, -0.00019240379333496094, -0.00017496943473815918, -0.00015753507614135742, -0.00014010071754455566, -0.0001226663589477539, -0.00010523200035095215, -8.779764175415039e-05, -7.036328315734863e-05, -5.2928924560546875e-05, -3.549456596374512e-05, -1.806020736694336e-05, -6.258487701416016e-07, 1.6808509826660156e-05, 3.4242868423461914e-05, 5.167722702026367e-05, 6.911158561706543e-05, 8.654594421386719e-05, 0.00010398030281066895, 0.0001214146614074707, 0.00013884902000427246, 0.00015628337860107422, 0.00017371773719787598, 0.00019115209579467773, 0.0002085864543914795, 0.00022602081298828125, 0.000243455171585083, 0.00026088953018188477, 0.0002783238887786865, 0.0002957582473754883, 0.00031319260597229004, 0.0003306269645690918, 0.00034806132316589355, 0.0003654956817626953, 0.00038293004035949707, 0.00040036439895629883, 0.0004177987575531006, 0.00043523311614990234, 0.0004526674747467041, 0.00047010183334350586, 0.0004875361919403076, 0.0005049705505371094, 0.0005224049091339111, 0.0005398392677307129, 0.0005572736263275146, 0.0005747079849243164, 0.0005921423435211182, 0.0006095767021179199, 0.0006270110607147217, 0.0006444454193115234, 0.0006618797779083252, 0.000679314136505127, 0.0006967484951019287, 0.0007141828536987305, 0.0007316172122955322, 0.000749051570892334, 0.0007664859294891357, 0.0007839202880859375]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 4.0, 13.0, 12.0, 21.0, 28.0, 47.0, 70.0, 81.0, 141.0, 182.0, 267.0, 414.0, 679.0, 1077.0, 1869.0, 3831.0, 10748.0, 126518.0, 876760.0, 15522.0, 4696.0, 2179.0, 1199.0, 746.0, 488.0, 293.0, 199.0, 145.0, 103.0, 62.0, 55.0, 34.0, 25.0, 20.0, 10.0, 6.0, 4.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.857421875, -1.79364013671875, -1.7298583984375, -1.66607666015625, -1.602294921875, -1.53851318359375, -1.4747314453125, -1.41094970703125, -1.34716796875, -1.28338623046875, -1.2196044921875, -1.15582275390625, -1.092041015625, -1.02825927734375, -0.9644775390625, -0.90069580078125, -0.8369140625, -0.77313232421875, -0.7093505859375, -0.64556884765625, -0.581787109375, -0.51800537109375, -0.4542236328125, -0.39044189453125, -0.32666015625, -0.26287841796875, -0.1990966796875, -0.13531494140625, -0.071533203125, -0.00775146484375, 0.0560302734375, 0.11981201171875, 0.18359375, 0.24737548828125, 0.3111572265625, 0.37493896484375, 0.438720703125, 0.50250244140625, 0.5662841796875, 0.63006591796875, 0.69384765625, 0.75762939453125, 0.8214111328125, 0.88519287109375, 0.948974609375, 1.01275634765625, 1.0765380859375, 1.14031982421875, 1.2041015625, 1.26788330078125, 1.3316650390625, 1.39544677734375, 1.459228515625, 1.52301025390625, 1.5867919921875, 1.65057373046875, 1.71435546875, 1.77813720703125, 1.8419189453125, 1.90570068359375, 1.969482421875, 2.03326416015625, 2.0970458984375, 2.16082763671875, 2.224609375]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 2.0, 3.0, 3.0, 5.0, 5.0, 7.0, 14.0, 24.0, 41.0, 286.0, 473.0, 72.0, 25.0, 16.0, 7.0, 8.0, 6.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.974609375, -0.941131591796875, -0.90765380859375, -0.874176025390625, -0.8406982421875, -0.807220458984375, -0.77374267578125, -0.740264892578125, -0.706787109375, -0.673309326171875, -0.63983154296875, -0.606353759765625, -0.5728759765625, -0.539398193359375, -0.50592041015625, -0.472442626953125, -0.43896484375, -0.405487060546875, -0.37200927734375, -0.338531494140625, -0.3050537109375, -0.271575927734375, -0.23809814453125, -0.204620361328125, -0.171142578125, -0.137664794921875, -0.10418701171875, -0.070709228515625, -0.0372314453125, -0.003753662109375, 0.02972412109375, 0.063201904296875, 0.0966796875, 0.130157470703125, 0.16363525390625, 0.197113037109375, 0.2305908203125, 0.264068603515625, 0.29754638671875, 0.331024169921875, 0.364501953125, 0.397979736328125, 0.43145751953125, 0.464935302734375, 0.4984130859375, 0.531890869140625, 0.56536865234375, 0.598846435546875, 0.63232421875, 0.665802001953125, 0.69927978515625, 0.732757568359375, 0.7662353515625, 0.799713134765625, 0.83319091796875, 0.866668701171875, 0.900146484375, 0.933624267578125, 0.96710205078125, 1.000579833984375, 1.0340576171875, 1.067535400390625, 1.10101318359375, 1.134490966796875, 1.16796875]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 31.0, 811.0, 173.0, 7.0], "bins": [-150.4115753173828, -147.9746856689453, -145.5377960205078, -143.1009063720703, -140.6640167236328, -138.2271270751953, -135.7902374267578, -133.3533477783203, -130.9164581298828, -128.4795684814453, -126.04267883300781, -123.60578918457031, -121.16889953613281, -118.73200988769531, -116.29512023925781, -113.85823059082031, -111.42134094238281, -108.98445129394531, -106.54756164550781, -104.11067199707031, -101.67378234863281, -99.23689270019531, -96.80000305175781, -94.36311340332031, -91.92621612548828, -89.48932647705078, -87.05243682861328, -84.61554718017578, -82.17865753173828, -79.74176788330078, -77.30487823486328, -74.86798858642578, -72.43109130859375, -69.99420166015625, -67.55731201171875, -65.12042236328125, -62.68353271484375, -60.24664306640625, -57.80975341796875, -55.37286376953125, -52.93597412109375, -50.49908447265625, -48.06219482421875, -45.62530517578125, -43.18841552734375, -40.75152587890625, -38.31463623046875, -35.87774658203125, -33.440853118896484, -31.003963470458984, -28.567073822021484, -26.130184173583984, -23.693294525146484, -21.256404876708984, -18.81951332092285, -16.38262367248535, -13.945734977722168, -11.508845329284668, -9.071954727172852, -6.635065078735352, -4.198175430297852, -1.7612857818603516, 0.6756048202514648, 3.112494468688965, 5.549384117126465]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 4.0, 5.0, 0.0, 8.0, 7.0, 12.0, 16.0, 15.0, 20.0, 23.0, 21.0, 25.0, 31.0, 30.0, 33.0, 21.0, 29.0, 40.0, 35.0, 39.0, 46.0, 34.0, 39.0, 51.0, 37.0, 33.0, 34.0, 35.0, 29.0, 39.0, 34.0, 22.0, 25.0, 18.0, 21.0, 15.0, 19.0, 9.0, 18.0, 10.0, 5.0, 6.0, 3.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.3116960525512695, -5.159384727478027, -5.007073402404785, -4.854762554168701, -4.702451229095459, -4.550139904022217, -4.397828578948975, -4.245517253875732, -4.093206405639648, -3.9408950805664062, -3.788583993911743, -3.636272668838501, -3.483961582183838, -3.3316502571105957, -3.1793389320373535, -3.0270276069641113, -2.874716281890869, -2.722404956817627, -2.570093870162964, -2.4177825450897217, -2.2654714584350586, -2.1131601333618164, -1.9608488082885742, -1.8085376024246216, -1.656226396560669, -1.5039151906967163, -1.3516039848327637, -1.1992926597595215, -1.0469814538955688, -0.8946702480316162, -0.7423589825630188, -0.5900477170944214, -0.43773651123046875, -0.2854252755641937, -0.1331140398979187, 0.019197195768356323, 0.17150843143463135, 0.323819637298584, 0.4761309027671814, 0.6284421682357788, 0.7807533740997314, 0.9330645799636841, 1.0853757858276367, 1.237687110900879, 1.3899983167648315, 1.5423095226287842, 1.6946208477020264, 1.846932053565979, 1.9992432594299316, 2.151554584503174, 2.303865671157837, 2.456176996231079, 2.608488082885742, 2.7607994079589844, 2.9131107330322266, 3.0654220581054688, 3.217733144760132, 3.370044469833374, 3.522355556488037, 3.6746668815612793, 3.8269782066345215, 3.9792892932891846, 4.131600379943848, 4.28391170501709, 4.436223030090332]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 3.0, 9.0, 3.0, 14.0, 31.0, 27.0, 37.0, 66.0, 118.0, 232.0, 558.0, 2089.0, 10890.0, 3698554.0, 472496.0, 6517.0, 1563.0, 561.0, 205.0, 119.0, 65.0, 32.0, 29.0, 23.0, 9.0, 15.0, 8.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.4609375, -13.02490234375, -12.5888671875, -12.15283203125, -11.716796875, -11.28076171875, -10.8447265625, -10.40869140625, -9.97265625, -9.53662109375, -9.1005859375, -8.66455078125, -8.228515625, -7.79248046875, -7.3564453125, -6.92041015625, -6.484375, -6.04833984375, -5.6123046875, -5.17626953125, -4.740234375, -4.30419921875, -3.8681640625, -3.43212890625, -2.99609375, -2.56005859375, -2.1240234375, -1.68798828125, -1.251953125, -0.81591796875, -0.3798828125, 0.05615234375, 0.4921875, 0.92822265625, 1.3642578125, 1.80029296875, 2.236328125, 2.67236328125, 3.1083984375, 3.54443359375, 3.98046875, 4.41650390625, 4.8525390625, 5.28857421875, 5.724609375, 6.16064453125, 6.5966796875, 7.03271484375, 7.46875, 7.90478515625, 8.3408203125, 8.77685546875, 9.212890625, 9.64892578125, 10.0849609375, 10.52099609375, 10.95703125, 11.39306640625, 11.8291015625, 12.26513671875, 12.701171875, 13.13720703125, 13.5732421875, 14.00927734375, 14.4453125]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 3.0, 3.0, 5.0, 14.0, 18.0, 13.0, 25.0, 44.0, 47.0, 44.0, 69.0, 57.0, 58.0, 66.0, 83.0, 83.0, 55.0, 66.0, 45.0, 38.0, 37.0, 46.0, 16.0, 16.0, 19.0, 14.0, 8.0, 3.0, 6.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.658203125, -2.57354736328125, -2.4888916015625, -2.40423583984375, -2.319580078125, -2.23492431640625, -2.1502685546875, -2.06561279296875, -1.98095703125, -1.89630126953125, -1.8116455078125, -1.72698974609375, -1.642333984375, -1.55767822265625, -1.4730224609375, -1.38836669921875, -1.3037109375, -1.21905517578125, -1.1343994140625, -1.04974365234375, -0.965087890625, -0.88043212890625, -0.7957763671875, -0.71112060546875, -0.62646484375, -0.54180908203125, -0.4571533203125, -0.37249755859375, -0.287841796875, -0.20318603515625, -0.1185302734375, -0.03387451171875, 0.05078125, 0.13543701171875, 0.2200927734375, 0.30474853515625, 0.389404296875, 0.47406005859375, 0.5587158203125, 0.64337158203125, 0.72802734375, 0.81268310546875, 0.8973388671875, 0.98199462890625, 1.066650390625, 1.15130615234375, 1.2359619140625, 1.32061767578125, 1.4052734375, 1.48992919921875, 1.5745849609375, 1.65924072265625, 1.743896484375, 1.82855224609375, 1.9132080078125, 1.99786376953125, 2.08251953125, 2.16717529296875, 2.2518310546875, 2.33648681640625, 2.421142578125, 2.50579833984375, 2.5904541015625, 2.67510986328125, 2.759765625]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 6.0, 9.0, 10.0, 11.0, 19.0, 28.0, 52.0, 115.0, 481.0, 7503.0, 4175189.0, 10101.0, 490.0, 128.0, 46.0, 32.0, 18.0, 13.0, 10.0, 9.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.578125, -19.7724609375, -18.966796875, -18.1611328125, -17.35546875, -16.5498046875, -15.744140625, -14.9384765625, -14.1328125, -13.3271484375, -12.521484375, -11.7158203125, -10.91015625, -10.1044921875, -9.298828125, -8.4931640625, -7.6875, -6.8818359375, -6.076171875, -5.2705078125, -4.46484375, -3.6591796875, -2.853515625, -2.0478515625, -1.2421875, -0.4365234375, 0.369140625, 1.1748046875, 1.98046875, 2.7861328125, 3.591796875, 4.3974609375, 5.203125, 6.0087890625, 6.814453125, 7.6201171875, 8.42578125, 9.2314453125, 10.037109375, 10.8427734375, 11.6484375, 12.4541015625, 13.259765625, 14.0654296875, 14.87109375, 15.6767578125, 16.482421875, 17.2880859375, 18.09375, 18.8994140625, 19.705078125, 20.5107421875, 21.31640625, 22.1220703125, 22.927734375, 23.7333984375, 24.5390625, 25.3447265625, 26.150390625, 26.9560546875, 27.76171875, 28.5673828125, 29.373046875, 30.1787109375, 30.984375]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 9.0, 9.0, 11.0, 15.0, 32.0, 46.0, 82.0, 292.0, 1887.0, 1341.0, 195.0, 61.0, 28.0, 19.0, 19.0, 5.0, 9.0, 6.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8271484375, -1.7616729736328125, -1.696197509765625, -1.6307220458984375, -1.56524658203125, -1.4997711181640625, -1.434295654296875, -1.3688201904296875, -1.3033447265625, -1.2378692626953125, -1.172393798828125, -1.1069183349609375, -1.04144287109375, -0.9759674072265625, -0.910491943359375, -0.8450164794921875, -0.779541015625, -0.7140655517578125, -0.648590087890625, -0.5831146240234375, -0.51763916015625, -0.4521636962890625, -0.386688232421875, -0.3212127685546875, -0.2557373046875, -0.1902618408203125, -0.124786376953125, -0.0593109130859375, 0.00616455078125, 0.0716400146484375, 0.137115478515625, 0.2025909423828125, 0.26806640625, 0.3335418701171875, 0.399017333984375, 0.4644927978515625, 0.52996826171875, 0.5954437255859375, 0.660919189453125, 0.7263946533203125, 0.7918701171875, 0.8573455810546875, 0.922821044921875, 0.9882965087890625, 1.05377197265625, 1.1192474365234375, 1.184722900390625, 1.2501983642578125, 1.315673828125, 1.3811492919921875, 1.446624755859375, 1.5121002197265625, 1.57757568359375, 1.6430511474609375, 1.708526611328125, 1.7740020751953125, 1.8394775390625, 1.9049530029296875, 1.970428466796875, 2.0359039306640625, 2.10137939453125, 2.1668548583984375, 2.232330322265625, 2.2978057861328125, 2.36328125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 6.0, 5.0, 3.0, 14.0, 19.0, 17.0, 15.0, 34.0, 49.0, 62.0, 73.0, 86.0, 102.0, 92.0, 96.0, 89.0, 53.0, 34.0, 30.0, 29.0, 20.0, 17.0, 13.0, 6.0, 10.0, 9.0, 3.0, 4.0, 3.0, 1.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7544424533843994, -2.671036958694458, -2.5876314640045166, -2.504225969314575, -2.420820713043213, -2.3374152183532715, -2.25400972366333, -2.1706042289733887, -2.0871987342834473, -2.003793239593506, -1.9203877449035645, -1.8369823694229126, -1.7535768747329712, -1.6701713800430298, -1.586766004562378, -1.5033605098724365, -1.4199550151824951, -1.3365495204925537, -1.2531440258026123, -1.1697386503219604, -1.086333155632019, -1.0029276609420776, -0.919522225856781, -0.8361167907714844, -0.752711296081543, -0.6693058013916016, -0.5859003663063049, -0.5024949312210083, -0.4190894365310669, -0.3356839716434479, -0.25227850675582886, -0.16887307167053223, -0.08546781539916992, -0.0020623505115509033, 0.08134311437606812, 0.16474857926368713, 0.24815404415130615, 0.33155950903892517, 0.4149649739265442, 0.4983704090118408, 0.5817759037017822, 0.6651813983917236, 0.7485868334770203, 0.8319922685623169, 0.9153977632522583, 0.9988032579421997, 1.0822086334228516, 1.165614128112793, 1.2490196228027344, 1.3324251174926758, 1.4158306121826172, 1.499235987663269, 1.5826414823532104, 1.6660469770431519, 1.7494523525238037, 1.8328578472137451, 1.9162633419036865, 1.999668836593628, 2.0830743312835693, 2.1664798259735107, 2.249885082244873, 2.3332905769348145, 2.416696071624756, 2.5001015663146973, 2.5835070610046387]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 9.0, 8.0, 11.0, 7.0, 10.0, 11.0, 21.0, 19.0, 16.0, 27.0, 24.0, 32.0, 32.0, 36.0, 32.0, 42.0, 40.0, 56.0, 36.0, 52.0, 44.0, 47.0, 49.0, 35.0, 27.0, 35.0, 32.0, 36.0, 25.0, 29.0, 15.0, 23.0, 13.0, 21.0, 10.0, 6.0, 6.0, 10.0, 5.0, 7.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.1681621074676514, -2.1113107204437256, -2.054459571838379, -1.9976081848144531, -1.9407567977905273, -1.8839055299758911, -1.8270541429519653, -1.770202875137329, -1.7133514881134033, -1.656500220298767, -1.5996488332748413, -1.542797565460205, -1.4859461784362793, -1.429094910621643, -1.3722435235977173, -1.315392255783081, -1.2585408687591553, -1.201689600944519, -1.1448382139205933, -1.087986946105957, -1.0311355590820312, -0.974284291267395, -0.9174329042434692, -0.860581636428833, -0.8037303686141968, -0.7468790411949158, -0.6900277137756348, -0.6331763863563538, -0.5763250589370728, -0.5194737911224365, -0.46262243390083313, -0.4057711064815521, -0.34891974925994873, -0.2920684218406677, -0.23521709442138672, -0.1783657819032669, -0.1215144544839859, -0.06466314196586609, -0.007811814546585083, 0.04903951287269592, 0.10589084029197693, 0.16274216771125793, 0.21959349513053894, 0.27644479274749756, 0.33329612016677856, 0.39014744758605957, 0.4469987750053406, 0.5038501024246216, 0.5607014298439026, 0.6175527572631836, 0.6744040846824646, 0.7312554121017456, 0.7881067395210266, 0.8449580669403076, 0.9018093347549438, 0.9586607217788696, 1.0155119895935059, 1.072363257408142, 1.1292146444320679, 1.186065912246704, 1.2429172992706299, 1.2997685670852661, 1.356619954109192, 1.4134712219238281, 1.470322608947754]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 0.0, 4.0, 4.0, 3.0, 4.0, 8.0, 10.0, 19.0, 28.0, 39.0, 61.0, 153.0, 363.0, 977.0, 2735.0, 9230.0, 40653.0, 384261.0, 541903.0, 51936.0, 11016.0, 3297.0, 1079.0, 405.0, 177.0, 69.0, 37.0, 19.0, 19.0, 10.0, 10.0, 5.0, 8.0, 4.0, 5.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3603515625, -1.3151092529296875, -1.269866943359375, -1.2246246337890625, -1.17938232421875, -1.1341400146484375, -1.088897705078125, -1.0436553955078125, -0.9984130859375, -0.9531707763671875, -0.907928466796875, -0.8626861572265625, -0.81744384765625, -0.7722015380859375, -0.726959228515625, -0.6817169189453125, -0.636474609375, -0.5912322998046875, -0.545989990234375, -0.5007476806640625, -0.45550537109375, -0.4102630615234375, -0.365020751953125, -0.3197784423828125, -0.2745361328125, -0.2292938232421875, -0.184051513671875, -0.1388092041015625, -0.09356689453125, -0.0483245849609375, -0.003082275390625, 0.0421600341796875, 0.08740234375, 0.1326446533203125, 0.177886962890625, 0.2231292724609375, 0.26837158203125, 0.3136138916015625, 0.358856201171875, 0.4040985107421875, 0.4493408203125, 0.4945831298828125, 0.539825439453125, 0.5850677490234375, 0.63031005859375, 0.6755523681640625, 0.720794677734375, 0.7660369873046875, 0.811279296875, 0.8565216064453125, 0.901763916015625, 0.9470062255859375, 0.99224853515625, 1.0374908447265625, 1.082733154296875, 1.1279754638671875, 1.1732177734375, 1.2184600830078125, 1.263702392578125, 1.3089447021484375, 1.35418701171875, 1.3994293212890625, 1.444671630859375, 1.4899139404296875, 1.53515625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 17.0, 14.0, 19.0, 50.0, 29.0, 62.0, 71.0, 92.0, 97.0, 106.0, 102.0, 73.0, 81.0, 61.0, 36.0, 30.0, 26.0, 11.0, 15.0, 10.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6767578125, -1.5949554443359375, -1.513153076171875, -1.4313507080078125, -1.34954833984375, -1.2677459716796875, -1.185943603515625, -1.1041412353515625, -1.0223388671875, -0.9405364990234375, -0.858734130859375, -0.7769317626953125, -0.69512939453125, -0.6133270263671875, -0.531524658203125, -0.4497222900390625, -0.367919921875, -0.2861175537109375, -0.204315185546875, -0.1225128173828125, -0.04071044921875, 0.0410919189453125, 0.122894287109375, 0.2046966552734375, 0.2864990234375, 0.3683013916015625, 0.450103759765625, 0.5319061279296875, 0.61370849609375, 0.6955108642578125, 0.777313232421875, 0.8591156005859375, 0.94091796875, 1.0227203369140625, 1.104522705078125, 1.1863250732421875, 1.26812744140625, 1.3499298095703125, 1.431732177734375, 1.5135345458984375, 1.5953369140625, 1.6771392822265625, 1.758941650390625, 1.8407440185546875, 1.92254638671875, 2.0043487548828125, 2.086151123046875, 2.1679534912109375, 2.249755859375, 2.3315582275390625, 2.413360595703125, 2.4951629638671875, 2.57696533203125, 2.6587677001953125, 2.740570068359375, 2.8223724365234375, 2.9041748046875, 2.9859771728515625, 3.067779541015625, 3.1495819091796875, 3.23138427734375, 3.3131866455078125, 3.394989013671875, 3.4767913818359375, 3.55859375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 7.0, 4.0, 10.0, 10.0, 21.0, 25.0, 32.0, 43.0, 74.0, 105.0, 176.0, 224.0, 399.0, 642.0, 1000.0, 1943.0, 3658.0, 7585.0, 17788.0, 50204.0, 198266.0, 542977.0, 152395.0, 41458.0, 15293.0, 6662.0, 3343.0, 1669.0, 951.0, 568.0, 336.0, 236.0, 145.0, 95.0, 67.0, 41.0, 29.0, 17.0, 13.0, 19.0, 6.0, 5.0, 1.0, 7.0, 5.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.6484375, -0.6284332275390625, -0.608428955078125, -0.5884246826171875, -0.56842041015625, -0.5484161376953125, -0.528411865234375, -0.5084075927734375, -0.4884033203125, -0.4683990478515625, -0.448394775390625, -0.4283905029296875, -0.40838623046875, -0.3883819580078125, -0.368377685546875, -0.3483734130859375, -0.328369140625, -0.3083648681640625, -0.288360595703125, -0.2683563232421875, -0.24835205078125, -0.2283477783203125, -0.208343505859375, -0.1883392333984375, -0.1683349609375, -0.1483306884765625, -0.128326416015625, -0.1083221435546875, -0.08831787109375, -0.0683135986328125, -0.048309326171875, -0.0283050537109375, -0.00830078125, 0.0117034912109375, 0.031707763671875, 0.0517120361328125, 0.07171630859375, 0.0917205810546875, 0.111724853515625, 0.1317291259765625, 0.1517333984375, 0.1717376708984375, 0.191741943359375, 0.2117462158203125, 0.23175048828125, 0.2517547607421875, 0.271759033203125, 0.2917633056640625, 0.311767578125, 0.3317718505859375, 0.351776123046875, 0.3717803955078125, 0.39178466796875, 0.4117889404296875, 0.431793212890625, 0.4517974853515625, 0.4718017578125, 0.4918060302734375, 0.511810302734375, 0.5318145751953125, 0.55181884765625, 0.5718231201171875, 0.591827392578125, 0.6118316650390625, 0.6318359375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 4.0, 3.0, 7.0, 6.0, 20.0, 10.0, 12.0, 11.0, 15.0, 19.0, 20.0, 21.0, 27.0, 35.0, 45.0, 36.0, 44.0, 46.0, 55.0, 48.0, 56.0, 45.0, 42.0, 58.0, 47.0, 45.0, 32.0, 26.0, 27.0, 21.0, 28.0, 22.0, 12.0, 9.0, 8.0, 8.0, 12.0, 5.0, 6.0, 0.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.4453125, -2.367218017578125, -2.28912353515625, -2.211029052734375, -2.1329345703125, -2.054840087890625, -1.97674560546875, -1.898651123046875, -1.820556640625, -1.742462158203125, -1.66436767578125, -1.586273193359375, -1.5081787109375, -1.430084228515625, -1.35198974609375, -1.273895263671875, -1.19580078125, -1.117706298828125, -1.03961181640625, -0.961517333984375, -0.8834228515625, -0.805328369140625, -0.72723388671875, -0.649139404296875, -0.571044921875, -0.492950439453125, -0.41485595703125, -0.336761474609375, -0.2586669921875, -0.180572509765625, -0.10247802734375, -0.024383544921875, 0.0537109375, 0.131805419921875, 0.20989990234375, 0.287994384765625, 0.3660888671875, 0.444183349609375, 0.52227783203125, 0.600372314453125, 0.678466796875, 0.756561279296875, 0.83465576171875, 0.912750244140625, 0.9908447265625, 1.068939208984375, 1.14703369140625, 1.225128173828125, 1.30322265625, 1.381317138671875, 1.45941162109375, 1.537506103515625, 1.6156005859375, 1.693695068359375, 1.77178955078125, 1.849884033203125, 1.927978515625, 2.006072998046875, 2.08416748046875, 2.162261962890625, 2.2403564453125, 2.318450927734375, 2.39654541015625, 2.474639892578125, 2.552734375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 3.0, 2.0, 4.0, 5.0, 7.0, 8.0, 13.0, 23.0, 18.0, 38.0, 53.0, 121.0, 167.0, 276.0, 484.0, 1047.0, 2168.0, 4957.0, 13092.0, 46912.0, 423910.0, 480812.0, 50976.0, 13783.0, 5216.0, 2168.0, 1028.0, 544.0, 298.0, 157.0, 105.0, 58.0, 39.0, 27.0, 13.0, 9.0, 2.0, 4.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1619873046875, -0.1552448272705078, -0.14850234985351562, -0.14175987243652344, -0.13501739501953125, -0.12827491760253906, -0.12153244018554688, -0.11478996276855469, -0.1080474853515625, -0.10130500793457031, -0.09456253051757812, -0.08782005310058594, -0.08107757568359375, -0.07433509826660156, -0.06759262084960938, -0.06085014343261719, -0.054107666015625, -0.04736518859863281, -0.040622711181640625, -0.03388023376464844, -0.02713775634765625, -0.020395278930664062, -0.013652801513671875, -0.0069103240966796875, -0.0001678466796875, 0.0065746307373046875, 0.013317108154296875, 0.020059585571289062, 0.02680206298828125, 0.03354454040527344, 0.040287017822265625, 0.04702949523925781, 0.05377197265625, 0.06051445007324219, 0.06725692749023438, 0.07399940490722656, 0.08074188232421875, 0.08748435974121094, 0.09422683715820312, 0.10096931457519531, 0.1077117919921875, 0.11445426940917969, 0.12119674682617188, 0.12793922424316406, 0.13468170166015625, 0.14142417907714844, 0.14816665649414062, 0.1549091339111328, 0.161651611328125, 0.1683940887451172, 0.17513656616210938, 0.18187904357910156, 0.18862152099609375, 0.19536399841308594, 0.20210647583007812, 0.2088489532470703, 0.2155914306640625, 0.2223339080810547, 0.22907638549804688, 0.23581886291503906, 0.24256134033203125, 0.24930381774902344, 0.2560462951660156, 0.2627887725830078, 0.26953125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 6.0, 2.0, 5.0, 5.0, 6.0, 15.0, 19.0, 13.0, 16.0, 35.0, 54.0, 66.0, 115.0, 160.0, 156.0, 116.0, 64.0, 37.0, 39.0, 22.0, 11.0, 7.0, 7.0, 9.0, 6.0, 4.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00017189979553222656, -0.0001672450453042984, -0.00016259029507637024, -0.00015793554484844208, -0.00015328079462051392, -0.00014862604439258575, -0.0001439712941646576, -0.00013931654393672943, -0.00013466179370880127, -0.0001300070434808731, -0.00012535229325294495, -0.00012069754302501678, -0.00011604279279708862, -0.00011138804256916046, -0.0001067332923412323, -0.00010207854211330414, -9.742379188537598e-05, -9.276904165744781e-05, -8.811429142951965e-05, -8.345954120159149e-05, -7.880479097366333e-05, -7.415004074573517e-05, -6.949529051780701e-05, -6.484054028987885e-05, -6.0185790061950684e-05, -5.553103983402252e-05, -5.087628960609436e-05, -4.62215393781662e-05, -4.156678915023804e-05, -3.6912038922309875e-05, -3.2257288694381714e-05, -2.7602538466453552e-05, -2.294778823852539e-05, -1.829303801059723e-05, -1.3638287782669067e-05, -8.983537554740906e-06, -4.328787326812744e-06, 3.259629011154175e-07, 4.980713129043579e-06, 9.63546335697174e-06, 1.4290213584899902e-05, 1.8944963812828064e-05, 2.3599714040756226e-05, 2.8254464268684387e-05, 3.290921449661255e-05, 3.756396472454071e-05, 4.221871495246887e-05, 4.6873465180397034e-05, 5.1528215408325195e-05, 5.618296563625336e-05, 6.083771586418152e-05, 6.549246609210968e-05, 7.014721632003784e-05, 7.4801966547966e-05, 7.945671677589417e-05, 8.411146700382233e-05, 8.876621723175049e-05, 9.342096745967865e-05, 9.807571768760681e-05, 0.00010273046791553497, 0.00010738521814346313, 0.0001120399683713913, 0.00011669471859931946, 0.00012134946882724762, 0.00012600421905517578]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 5.0, 7.0, 5.0, 17.0, 33.0, 120.0, 533.0, 4067.0, 129270.0, 901820.0, 11190.0, 1136.0, 222.0, 67.0, 27.0, 14.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.65576171875, -0.6297378540039062, -0.6037139892578125, -0.5776901245117188, -0.551666259765625, -0.5256423950195312, -0.4996185302734375, -0.47359466552734375, -0.44757080078125, -0.42154693603515625, -0.3955230712890625, -0.36949920654296875, -0.343475341796875, -0.31745147705078125, -0.2914276123046875, -0.26540374755859375, -0.2393798828125, -0.21335601806640625, -0.1873321533203125, -0.16130828857421875, -0.135284423828125, -0.10926055908203125, -0.0832366943359375, -0.05721282958984375, -0.03118896484375, -0.00516510009765625, 0.0208587646484375, 0.04688262939453125, 0.072906494140625, 0.09893035888671875, 0.1249542236328125, 0.15097808837890625, 0.177001953125, 0.20302581787109375, 0.2290496826171875, 0.25507354736328125, 0.281097412109375, 0.30712127685546875, 0.3331451416015625, 0.35916900634765625, 0.38519287109375, 0.41121673583984375, 0.4372406005859375, 0.46326446533203125, 0.489288330078125, 0.5153121948242188, 0.5413360595703125, 0.5673599243164062, 0.5933837890625, 0.6194076538085938, 0.6454315185546875, 0.6714553833007812, 0.697479248046875, 0.7235031127929688, 0.7495269775390625, 0.7755508422851562, 0.80157470703125, 0.8275985717773438, 0.8536224365234375, 0.8796463012695312, 0.905670166015625, 0.9316940307617188, 0.9577178955078125, 0.9837417602539062, 1.009765625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 6.0, 6.0, 6.0, 5.0, 10.0, 19.0, 17.0, 24.0, 37.0, 41.0, 52.0, 78.0, 85.0, 114.0, 114.0, 78.0, 74.0, 53.0, 41.0, 35.0, 24.0, 21.0, 9.0, 12.0, 11.0, 7.0, 8.0, 6.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.06536865234375, -0.06344318389892578, -0.06151771545410156, -0.059592247009277344, -0.057666778564453125, -0.055741310119628906, -0.05381584167480469, -0.05189037322998047, -0.04996490478515625, -0.04803943634033203, -0.04611396789550781, -0.044188499450683594, -0.042263031005859375, -0.040337562561035156, -0.03841209411621094, -0.03648662567138672, -0.0345611572265625, -0.03263568878173828, -0.030710220336914062, -0.028784751892089844, -0.026859283447265625, -0.024933815002441406, -0.023008346557617188, -0.02108287811279297, -0.01915740966796875, -0.01723194122314453, -0.015306472778320312, -0.013381004333496094, -0.011455535888671875, -0.009530067443847656, -0.0076045989990234375, -0.005679130554199219, -0.003753662109375, -0.0018281936645507812, 9.72747802734375e-05, 0.0020227432250976562, 0.003948211669921875, 0.005873680114746094, 0.0077991485595703125, 0.009724617004394531, 0.01165008544921875, 0.013575553894042969, 0.015501022338867188, 0.017426490783691406, 0.019351959228515625, 0.021277427673339844, 0.023202896118164062, 0.02512836456298828, 0.0270538330078125, 0.02897930145263672, 0.030904769897460938, 0.032830238342285156, 0.034755706787109375, 0.036681175231933594, 0.03860664367675781, 0.04053211212158203, 0.04245758056640625, 0.04438304901123047, 0.04630851745605469, 0.048233985900878906, 0.050159454345703125, 0.052084922790527344, 0.05401039123535156, 0.05593585968017578, 0.057861328125]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 6.0, 14.0, 17.0, 24.0, 60.0, 95.0, 237.0, 215.0, 154.0, 82.0, 47.0, 22.0, 14.0, 10.0, 4.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4313602447509766, -2.3174726963043213, -2.203585147857666, -2.0896973609924316, -1.975809931755066, -1.861922264099121, -1.7480347156524658, -1.6341471672058105, -1.5202596187591553, -1.4063720703125, -1.2924844026565552, -1.1785968542099, -1.0647093057632446, -0.9508216977119446, -0.8369340896606445, -0.7230465412139893, -0.6091588735580444, -0.4952712953090668, -0.3813837170600891, -0.26749610900878906, -0.1536085307598114, -0.03972095251083374, 0.07416665554046631, 0.18805420398712158, 0.30194181203842163, 0.4158293902873993, 0.529716968536377, 0.643604576587677, 0.757492184638977, 0.8713797330856323, 0.9852673411369324, 1.0991549491882324, 1.2130424976348877, 1.326930046081543, 1.4408177137374878, 1.554705262184143, 1.6685928106307983, 1.7824804782867432, 1.8963680267333984, 2.0102555751800537, 2.124143123626709, 2.2380306720733643, 2.3519182205200195, 2.465806007385254, 2.579693555831909, 2.6935811042785645, 2.8074686527252197, 2.921356201171875, 3.0352439880371094, 3.1491315364837646, 3.26301908493042, 3.3769068717956543, 3.4907944202423096, 3.604681968688965, 3.71856951713562, 3.8324570655822754, 3.9463446140289307, 4.060232162475586, 4.17411994934082, 4.2880072593688965, 4.401895046234131, 4.515782356262207, 4.629670143127441, 4.743557929992676, 4.857445240020752]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 14.0, 22.0, 18.0, 35.0, 42.0, 54.0, 61.0, 75.0, 83.0, 106.0, 115.0, 71.0, 77.0, 60.0, 52.0, 40.0, 26.0, 28.0, 12.0, 7.0, 7.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.684027075767517, -1.607417106628418, -1.5308072566986084, -1.4541972875595093, -1.3775873184204102, -1.3009774684906006, -1.2243674993515015, -1.1477575302124023, -1.0711476802825928, -0.9945377707481384, -0.9179278016090393, -0.841317892074585, -0.7647079229354858, -0.6880980134010315, -0.6114881038665771, -0.534878134727478, -0.4582681655883789, -0.3816582262516022, -0.30504828691482544, -0.2284383773803711, -0.15182843804359436, -0.07521849870681763, 0.0013914108276367188, 0.07800137996673584, 0.15461128950119019, 0.23122122883796692, 0.30783116817474365, 0.384441077709198, 0.46105101704597473, 0.5376609563827515, 0.6142708659172058, 0.6908808350563049, 0.7674908638000488, 0.8441007733345032, 0.9207107424736023, 0.9973206520080566, 1.0739306211471558, 1.1505405902862549, 1.2271504402160645, 1.3037604093551636, 1.3803703784942627, 1.4569803476333618, 1.5335901975631714, 1.6102001667022705, 1.6868101358413696, 1.7634201049804688, 1.8400299549102783, 1.9166399240493774, 1.993249773979187, 2.069859743118286, 2.1464695930480957, 2.2230796813964844, 2.299689531326294, 2.3762993812561035, 2.452909469604492, 2.5295193195343018, 2.6061291694641113, 2.682739019393921, 2.7593491077423096, 2.835958957672119, 2.9125688076019287, 2.9891788959503174, 3.065788745880127, 3.1423988342285156, 3.219008684158325]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 8.0, 6.0, 15.0, 32.0, 85.0, 270.0, 739.0, 2174.0, 14801.0, 1011544.0, 15497.0, 2189.0, 765.0, 263.0, 97.0, 41.0, 14.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.2578125, -8.9970703125, -8.736328125, -8.4755859375, -8.21484375, -7.9541015625, -7.693359375, -7.4326171875, -7.171875, -6.9111328125, -6.650390625, -6.3896484375, -6.12890625, -5.8681640625, -5.607421875, -5.3466796875, -5.0859375, -4.8251953125, -4.564453125, -4.3037109375, -4.04296875, -3.7822265625, -3.521484375, -3.2607421875, -3.0, -2.7392578125, -2.478515625, -2.2177734375, -1.95703125, -1.6962890625, -1.435546875, -1.1748046875, -0.9140625, -0.6533203125, -0.392578125, -0.1318359375, 0.12890625, 0.3896484375, 0.650390625, 0.9111328125, 1.171875, 1.4326171875, 1.693359375, 1.9541015625, 2.21484375, 2.4755859375, 2.736328125, 2.9970703125, 3.2578125, 3.5185546875, 3.779296875, 4.0400390625, 4.30078125, 4.5615234375, 4.822265625, 5.0830078125, 5.34375, 5.6044921875, 5.865234375, 6.1259765625, 6.38671875, 6.6474609375, 6.908203125, 7.1689453125, 7.4296875]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 4.0, 3.0, 8.0, 17.0, 26.0, 35.0, 35.0, 55.0, 76.0, 108.0, 117.0, 104.0, 101.0, 94.0, 69.0, 55.0, 27.0, 37.0, 25.0, 8.0, 7.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.70703125, -2.53021240234375, -2.3533935546875, -2.17657470703125, -1.999755859375, -1.82293701171875, -1.6461181640625, -1.46929931640625, -1.29248046875, -1.11566162109375, -0.9388427734375, -0.76202392578125, -0.585205078125, -0.40838623046875, -0.2315673828125, -0.05474853515625, 0.1220703125, 0.29888916015625, 0.4757080078125, 0.65252685546875, 0.829345703125, 1.00616455078125, 1.1829833984375, 1.35980224609375, 1.53662109375, 1.71343994140625, 1.8902587890625, 2.06707763671875, 2.243896484375, 2.42071533203125, 2.5975341796875, 2.77435302734375, 2.951171875, 3.12799072265625, 3.3048095703125, 3.48162841796875, 3.658447265625, 3.83526611328125, 4.0120849609375, 4.18890380859375, 4.36572265625, 4.54254150390625, 4.7193603515625, 4.89617919921875, 5.072998046875, 5.24981689453125, 5.4266357421875, 5.60345458984375, 5.7802734375, 5.95709228515625, 6.1339111328125, 6.31072998046875, 6.487548828125, 6.66436767578125, 6.8411865234375, 7.01800537109375, 7.19482421875, 7.37164306640625, 7.5484619140625, 7.72528076171875, 7.902099609375, 8.07891845703125, 8.2557373046875, 8.43255615234375, 8.609375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 6.0, 0.0, 1.0, 5.0, 3.0, 10.0, 7.0, 11.0, 12.0, 14.0, 31.0, 51.0, 51.0, 92.0, 182.0, 423.0, 1178.0, 4959.0, 971537.0, 65308.0, 3168.0, 821.0, 304.0, 119.0, 70.0, 45.0, 34.0, 24.0, 25.0, 11.0, 14.0, 9.0, 12.0, 3.0, 5.0, 3.0, 2.0, 2.0, 0.0, 5.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.1796875, -7.8861083984375, -7.592529296875, -7.2989501953125, -7.00537109375, -6.7117919921875, -6.418212890625, -6.1246337890625, -5.8310546875, -5.5374755859375, -5.243896484375, -4.9503173828125, -4.65673828125, -4.3631591796875, -4.069580078125, -3.7760009765625, -3.482421875, -3.1888427734375, -2.895263671875, -2.6016845703125, -2.30810546875, -2.0145263671875, -1.720947265625, -1.4273681640625, -1.1337890625, -0.8402099609375, -0.546630859375, -0.2530517578125, 0.04052734375, 0.3341064453125, 0.627685546875, 0.9212646484375, 1.21484375, 1.5084228515625, 1.802001953125, 2.0955810546875, 2.38916015625, 2.6827392578125, 2.976318359375, 3.2698974609375, 3.5634765625, 3.8570556640625, 4.150634765625, 4.4442138671875, 4.73779296875, 5.0313720703125, 5.324951171875, 5.6185302734375, 5.912109375, 6.2056884765625, 6.499267578125, 6.7928466796875, 7.08642578125, 7.3800048828125, 7.673583984375, 7.9671630859375, 8.2607421875, 8.5543212890625, 8.847900390625, 9.1414794921875, 9.43505859375, 9.7286376953125, 10.022216796875, 10.3157958984375, 10.609375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 5.0, 3.0, 4.0, 9.0, 6.0, 9.0, 9.0, 12.0, 15.0, 31.0, 23.0, 36.0, 44.0, 46.0, 53.0, 62.0, 54.0, 66.0, 53.0, 57.0, 58.0, 48.0, 53.0, 55.0, 34.0, 28.0, 25.0, 21.0, 13.0, 21.0, 7.0, 14.0, 8.0, 7.0, 1.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.763671875, -2.658416748046875, -2.55316162109375, -2.447906494140625, -2.3426513671875, -2.237396240234375, -2.13214111328125, -2.026885986328125, -1.921630859375, -1.816375732421875, -1.71112060546875, -1.605865478515625, -1.5006103515625, -1.395355224609375, -1.29010009765625, -1.184844970703125, -1.07958984375, -0.974334716796875, -0.86907958984375, -0.763824462890625, -0.6585693359375, -0.553314208984375, -0.44805908203125, -0.342803955078125, -0.237548828125, -0.132293701171875, -0.02703857421875, 0.078216552734375, 0.1834716796875, 0.288726806640625, 0.39398193359375, 0.499237060546875, 0.6044921875, 0.709747314453125, 0.81500244140625, 0.920257568359375, 1.0255126953125, 1.130767822265625, 1.23602294921875, 1.341278076171875, 1.446533203125, 1.551788330078125, 1.65704345703125, 1.762298583984375, 1.8675537109375, 1.972808837890625, 2.07806396484375, 2.183319091796875, 2.28857421875, 2.393829345703125, 2.49908447265625, 2.604339599609375, 2.7095947265625, 2.814849853515625, 2.92010498046875, 3.025360107421875, 3.130615234375, 3.235870361328125, 3.34112548828125, 3.446380615234375, 3.5516357421875, 3.656890869140625, 3.76214599609375, 3.867401123046875, 3.97265625]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 2.0, 4.0, 7.0, 8.0, 5.0, 12.0, 7.0, 15.0, 20.0, 40.0, 74.0, 244.0, 1425.0, 13914.0, 981718.0, 47442.0, 2943.0, 429.0, 99.0, 47.0, 21.0, 20.0, 8.0, 13.0, 4.0, 5.0, 6.0, 6.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.9833984375, -1.9278106689453125, -1.872222900390625, -1.8166351318359375, -1.76104736328125, -1.7054595947265625, -1.649871826171875, -1.5942840576171875, -1.5386962890625, -1.4831085205078125, -1.427520751953125, -1.3719329833984375, -1.31634521484375, -1.2607574462890625, -1.205169677734375, -1.1495819091796875, -1.093994140625, -1.0384063720703125, -0.982818603515625, -0.9272308349609375, -0.87164306640625, -0.8160552978515625, -0.760467529296875, -0.7048797607421875, -0.6492919921875, -0.5937042236328125, -0.538116455078125, -0.4825286865234375, -0.42694091796875, -0.3713531494140625, -0.315765380859375, -0.2601776123046875, -0.20458984375, -0.1490020751953125, -0.093414306640625, -0.0378265380859375, 0.01776123046875, 0.0733489990234375, 0.128936767578125, 0.1845245361328125, 0.2401123046875, 0.2957000732421875, 0.351287841796875, 0.4068756103515625, 0.46246337890625, 0.5180511474609375, 0.573638916015625, 0.6292266845703125, 0.684814453125, 0.7404022216796875, 0.795989990234375, 0.8515777587890625, 0.90716552734375, 0.9627532958984375, 1.018341064453125, 1.0739288330078125, 1.1295166015625, 1.1851043701171875, 1.240692138671875, 1.2962799072265625, 1.35186767578125, 1.4074554443359375, 1.463043212890625, 1.5186309814453125, 1.57421875]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 1.0, 9.0, 12.0, 10.0, 12.0, 16.0, 23.0, 40.0, 66.0, 210.0, 321.0, 121.0, 57.0, 31.0, 18.0, 14.0, 8.0, 7.0, 4.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.465217590332031e-05, -9.140651673078537e-05, -8.816085755825043e-05, -8.491519838571548e-05, -8.166953921318054e-05, -7.84238800406456e-05, -7.517822086811066e-05, -7.193256169557571e-05, -6.868690252304077e-05, -6.544124335050583e-05, -6.219558417797089e-05, -5.8949925005435944e-05, -5.5704265832901e-05, -5.245860666036606e-05, -4.9212947487831116e-05, -4.596728831529617e-05, -4.272162914276123e-05, -3.947596997022629e-05, -3.6230310797691345e-05, -3.29846516251564e-05, -2.973899245262146e-05, -2.6493333280086517e-05, -2.3247674107551575e-05, -2.0002014935016632e-05, -1.675635576248169e-05, -1.3510696589946747e-05, -1.0265037417411804e-05, -7.0193782448768616e-06, -3.773719072341919e-06, -5.280598998069763e-07, 2.7175992727279663e-06, 5.963258445262909e-06, 9.208917617797852e-06, 1.2454576790332794e-05, 1.5700235962867737e-05, 1.894589513540268e-05, 2.2191554307937622e-05, 2.5437213480472565e-05, 2.8682872653007507e-05, 3.192853182554245e-05, 3.517419099807739e-05, 3.8419850170612335e-05, 4.166550934314728e-05, 4.491116851568222e-05, 4.815682768821716e-05, 5.1402486860752106e-05, 5.464814603328705e-05, 5.789380520582199e-05, 6.113946437835693e-05, 6.438512355089188e-05, 6.763078272342682e-05, 7.087644189596176e-05, 7.41221010684967e-05, 7.736776024103165e-05, 8.061341941356659e-05, 8.385907858610153e-05, 8.710473775863647e-05, 9.035039693117142e-05, 9.359605610370636e-05, 9.68417152762413e-05, 0.00010008737444877625, 0.00010333303362131119, 0.00010657869279384613, 0.00010982435196638107, 0.00011307001113891602]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 2.0, 6.0, 4.0, 12.0, 8.0, 15.0, 20.0, 32.0, 65.0, 150.0, 404.0, 1385.0, 8625.0, 258555.0, 765219.0, 11493.0, 1784.0, 454.0, 137.0, 60.0, 39.0, 23.0, 19.0, 8.0, 6.0, 3.0, 9.0, 2.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0302734375, -0.989166259765625, -0.94805908203125, -0.906951904296875, -0.8658447265625, -0.824737548828125, -0.78363037109375, -0.742523193359375, -0.701416015625, -0.660308837890625, -0.61920166015625, -0.578094482421875, -0.5369873046875, -0.495880126953125, -0.45477294921875, -0.413665771484375, -0.37255859375, -0.331451416015625, -0.29034423828125, -0.249237060546875, -0.2081298828125, -0.167022705078125, -0.12591552734375, -0.084808349609375, -0.043701171875, -0.002593994140625, 0.03851318359375, 0.079620361328125, 0.1207275390625, 0.161834716796875, 0.20294189453125, 0.244049072265625, 0.28515625, 0.326263427734375, 0.36737060546875, 0.408477783203125, 0.4495849609375, 0.490692138671875, 0.53179931640625, 0.572906494140625, 0.614013671875, 0.655120849609375, 0.69622802734375, 0.737335205078125, 0.7784423828125, 0.819549560546875, 0.86065673828125, 0.901763916015625, 0.94287109375, 0.983978271484375, 1.02508544921875, 1.066192626953125, 1.1072998046875, 1.148406982421875, 1.18951416015625, 1.230621337890625, 1.271728515625, 1.312835693359375, 1.35394287109375, 1.395050048828125, 1.4361572265625, 1.477264404296875, 1.51837158203125, 1.559478759765625, 1.6005859375]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 6.0, 5.0, 6.0, 10.0, 12.0, 18.0, 19.0, 22.0, 31.0, 32.0, 53.0, 95.0, 179.0, 201.0, 97.0, 54.0, 31.0, 34.0, 20.0, 18.0, 9.0, 13.0, 7.0, 11.0, 2.0, 5.0, 4.0, 1.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.267822265625, -0.2609672546386719, -0.25411224365234375, -0.24725723266601562, -0.2404022216796875, -0.23354721069335938, -0.22669219970703125, -0.21983718872070312, -0.212982177734375, -0.20612716674804688, -0.19927215576171875, -0.19241714477539062, -0.1855621337890625, -0.17870712280273438, -0.17185211181640625, -0.16499710083007812, -0.15814208984375, -0.15128707885742188, -0.14443206787109375, -0.13757705688476562, -0.1307220458984375, -0.12386703491210938, -0.11701202392578125, -0.11015701293945312, -0.103302001953125, -0.09644699096679688, -0.08959197998046875, -0.08273696899414062, -0.0758819580078125, -0.06902694702148438, -0.06217193603515625, -0.055316925048828125, -0.0484619140625, -0.041606903076171875, -0.03475189208984375, -0.027896881103515625, -0.0210418701171875, -0.014186859130859375, -0.00733184814453125, -0.000476837158203125, 0.006378173828125, 0.013233184814453125, 0.02008819580078125, 0.026943206787109375, 0.0337982177734375, 0.040653228759765625, 0.04750823974609375, 0.054363250732421875, 0.06121826171875, 0.06807327270507812, 0.07492828369140625, 0.08178329467773438, 0.0886383056640625, 0.09549331665039062, 0.10234832763671875, 0.10920333862304688, 0.116058349609375, 0.12291336059570312, 0.12976837158203125, 0.13662338256835938, 0.1434783935546875, 0.15033340454101562, 0.15718841552734375, 0.16404342651367188, 0.1708984375]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [5.0, 34.0, 186.0, 633.0, 135.0, 22.0, 8.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.469989061355591, -1.7525253295898438, -1.0350614786148071, -0.3175976276397705, 0.39986610412597656, 1.1173298358917236, 1.8347938060760498, 2.5522572994232178, 3.269721269607544, 3.987185001373291, 4.704648971557617, 5.422112464904785, 6.139576435089111, 6.8570404052734375, 7.5745038986206055, 8.291967391967773, 9.009431838989258, 9.726895332336426, 10.44435977935791, 11.161823272705078, 11.879286766052246, 12.596750259399414, 13.314214706420898, 14.031678199768066, 14.749141693115234, 15.466605186462402, 16.18406867980957, 16.901533126831055, 17.61899757385254, 18.33646011352539, 19.053924560546875, 19.77138900756836, 20.48885154724121, 21.206315994262695, 21.923778533935547, 22.64124298095703, 23.358707427978516, 24.076169967651367, 24.79363441467285, 25.511096954345703, 26.228561401367188, 26.946025848388672, 27.663488388061523, 28.380952835083008, 29.098417282104492, 29.815879821777344, 30.533344268798828, 31.250808715820312, 31.968273162841797, 32.68573760986328, 33.403202056884766, 34.12066650390625, 34.83812713623047, 35.55559158325195, 36.27305603027344, 36.99052047729492, 37.70798110961914, 38.425445556640625, 39.14291000366211, 39.860374450683594, 40.57783508300781, 41.2952995300293, 42.01276397705078, 42.730228424072266, 43.44769287109375]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 8.0, 13.0, 13.0, 17.0, 16.0, 27.0, 39.0, 42.0, 50.0, 56.0, 41.0, 78.0, 65.0, 58.0, 49.0, 49.0, 56.0, 48.0, 43.0, 46.0, 31.0, 36.0, 43.0, 23.0, 19.0, 14.0, 12.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7473456859588623, -3.5792205333709717, -3.411095142364502, -3.2429699897766113, -3.0748448371887207, -2.90671968460083, -2.7385945320129395, -2.5704691410064697, -2.402343988418579, -2.2342188358306885, -2.0660934448242188, -1.8979682922363281, -1.7298431396484375, -1.5617179870605469, -1.3935927152633667, -1.2254674434661865, -1.057342290878296, -0.8892170786857605, -0.7210918664932251, -0.5529666543006897, -0.3848414421081543, -0.2167162299156189, -0.048591017723083496, 0.11953425407409668, 0.2876594066619873, 0.4557846188545227, 0.6239098310470581, 0.7920350432395935, 0.9601602554321289, 1.1282854080200195, 1.2964106798171997, 1.4645359516143799, 1.6326613426208496, 1.8007864952087402, 1.9689117670059204, 2.1370370388031006, 2.305162191390991, 2.473287343978882, 2.6414127349853516, 2.809537887573242, 2.977663040161133, 3.1457881927490234, 3.313913345336914, 3.482038736343384, 3.6501638889312744, 3.818289041519165, 3.9864144325256348, 4.154539585113525, 4.322664737701416, 4.490789890289307, 4.658915042877197, 4.827040195465088, 4.995165824890137, 5.163290977478027, 5.331416130065918, 5.499541282653809, 5.667666435241699, 5.83579158782959, 6.0039167404174805, 6.172041893005371, 6.340167045593262, 6.5082926750183105, 6.676417827606201, 6.844542980194092, 7.012668132781982]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 7.0, 3.0, 5.0, 8.0, 11.0, 20.0, 31.0, 46.0, 56.0, 83.0, 84.0, 143.0, 220.0, 369.0, 588.0, 1142.0, 3074.0, 12078.0, 847305.0, 3294529.0, 26550.0, 4348.0, 1555.0, 774.0, 394.0, 253.0, 173.0, 129.0, 83.0, 63.0, 41.0, 26.0, 17.0, 18.0, 15.0, 13.0, 6.0, 11.0, 4.0, 2.0, 5.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.48046875, -6.29608154296875, -6.1116943359375, -5.92730712890625, -5.742919921875, -5.55853271484375, -5.3741455078125, -5.18975830078125, -5.00537109375, -4.82098388671875, -4.6365966796875, -4.45220947265625, -4.267822265625, -4.08343505859375, -3.8990478515625, -3.71466064453125, -3.5302734375, -3.34588623046875, -3.1614990234375, -2.97711181640625, -2.792724609375, -2.60833740234375, -2.4239501953125, -2.23956298828125, -2.05517578125, -1.87078857421875, -1.6864013671875, -1.50201416015625, -1.317626953125, -1.13323974609375, -0.9488525390625, -0.76446533203125, -0.580078125, -0.39569091796875, -0.2113037109375, -0.02691650390625, 0.157470703125, 0.34185791015625, 0.5262451171875, 0.71063232421875, 0.89501953125, 1.07940673828125, 1.2637939453125, 1.44818115234375, 1.632568359375, 1.81695556640625, 2.0013427734375, 2.18572998046875, 2.3701171875, 2.55450439453125, 2.7388916015625, 2.92327880859375, 3.107666015625, 3.29205322265625, 3.4764404296875, 3.66082763671875, 3.84521484375, 4.02960205078125, 4.2139892578125, 4.39837646484375, 4.582763671875, 4.76715087890625, 4.9515380859375, 5.13592529296875, 5.3203125]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 4.0, 6.0, 6.0, 12.0, 10.0, 10.0, 30.0, 13.0, 27.0, 31.0, 34.0, 26.0, 40.0, 55.0, 58.0, 55.0, 60.0, 62.0, 67.0, 43.0, 54.0, 47.0, 47.0, 33.0, 25.0, 31.0, 22.0, 28.0, 11.0, 8.0, 12.0, 10.0, 7.0, 7.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.9716796875, -1.9201812744140625, -1.868682861328125, -1.8171844482421875, -1.76568603515625, -1.7141876220703125, -1.662689208984375, -1.6111907958984375, -1.5596923828125, -1.5081939697265625, -1.456695556640625, -1.4051971435546875, -1.35369873046875, -1.3022003173828125, -1.250701904296875, -1.1992034912109375, -1.147705078125, -1.0962066650390625, -1.044708251953125, -0.9932098388671875, -0.94171142578125, -0.8902130126953125, -0.838714599609375, -0.7872161865234375, -0.7357177734375, -0.6842193603515625, -0.632720947265625, -0.5812225341796875, -0.52972412109375, -0.4782257080078125, -0.426727294921875, -0.3752288818359375, -0.32373046875, -0.2722320556640625, -0.220733642578125, -0.1692352294921875, -0.11773681640625, -0.0662384033203125, -0.014739990234375, 0.0367584228515625, 0.0882568359375, 0.1397552490234375, 0.191253662109375, 0.2427520751953125, 0.29425048828125, 0.3457489013671875, 0.397247314453125, 0.4487457275390625, 0.500244140625, 0.5517425537109375, 0.603240966796875, 0.6547393798828125, 0.70623779296875, 0.7577362060546875, 0.809234619140625, 0.8607330322265625, 0.9122314453125, 0.9637298583984375, 1.015228271484375, 1.0667266845703125, 1.11822509765625, 1.1697235107421875, 1.221221923828125, 1.2727203369140625, 1.32421875]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 3.0, 4.0, 1.0, 3.0, 3.0, 2.0, 10.0, 6.0, 15.0, 9.0, 22.0, 28.0, 43.0, 77.0, 162.0, 302.0, 941.0, 3852.0, 35359.0, 4094043.0, 52897.0, 4643.0, 1094.0, 339.0, 158.0, 93.0, 36.0, 34.0, 24.0, 19.0, 15.0, 6.0, 8.0, 9.0, 4.0, 4.0, 3.0, 1.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-7.96484375, -7.7408447265625, -7.516845703125, -7.2928466796875, -7.06884765625, -6.8448486328125, -6.620849609375, -6.3968505859375, -6.1728515625, -5.9488525390625, -5.724853515625, -5.5008544921875, -5.27685546875, -5.0528564453125, -4.828857421875, -4.6048583984375, -4.380859375, -4.1568603515625, -3.932861328125, -3.7088623046875, -3.48486328125, -3.2608642578125, -3.036865234375, -2.8128662109375, -2.5888671875, -2.3648681640625, -2.140869140625, -1.9168701171875, -1.69287109375, -1.4688720703125, -1.244873046875, -1.0208740234375, -0.796875, -0.5728759765625, -0.348876953125, -0.1248779296875, 0.09912109375, 0.3231201171875, 0.547119140625, 0.7711181640625, 0.9951171875, 1.2191162109375, 1.443115234375, 1.6671142578125, 1.89111328125, 2.1151123046875, 2.339111328125, 2.5631103515625, 2.787109375, 3.0111083984375, 3.235107421875, 3.4591064453125, 3.68310546875, 3.9071044921875, 4.131103515625, 4.3551025390625, 4.5791015625, 4.8031005859375, 5.027099609375, 5.2510986328125, 5.47509765625, 5.6990966796875, 5.923095703125, 6.1470947265625, 6.37109375]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 2.0, 6.0, 4.0, 10.0, 13.0, 15.0, 16.0, 33.0, 51.0, 91.0, 182.0, 491.0, 1129.0, 1121.0, 487.0, 174.0, 87.0, 37.0, 33.0, 21.0, 13.0, 8.0, 14.0, 4.0, 4.0, 2.0, 4.0, 2.0, 1.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9853515625, -0.9563369750976562, -0.9273223876953125, -0.8983078002929688, -0.869293212890625, -0.8402786254882812, -0.8112640380859375, -0.7822494506835938, -0.75323486328125, -0.7242202758789062, -0.6952056884765625, -0.6661911010742188, -0.637176513671875, -0.6081619262695312, -0.5791473388671875, -0.5501327514648438, -0.5211181640625, -0.49210357666015625, -0.4630889892578125, -0.43407440185546875, -0.405059814453125, -0.37604522705078125, -0.3470306396484375, -0.31801605224609375, -0.28900146484375, -0.25998687744140625, -0.2309722900390625, -0.20195770263671875, -0.172943115234375, -0.14392852783203125, -0.1149139404296875, -0.08589935302734375, -0.056884765625, -0.02787017822265625, 0.0011444091796875, 0.03015899658203125, 0.059173583984375, 0.08818817138671875, 0.1172027587890625, 0.14621734619140625, 0.17523193359375, 0.20424652099609375, 0.2332611083984375, 0.26227569580078125, 0.291290283203125, 0.32030487060546875, 0.3493194580078125, 0.37833404541015625, 0.4073486328125, 0.43636322021484375, 0.4653778076171875, 0.49439239501953125, 0.523406982421875, 0.5524215698242188, 0.5814361572265625, 0.6104507446289062, 0.63946533203125, 0.6684799194335938, 0.6974945068359375, 0.7265090942382812, 0.755523681640625, 0.7845382690429688, 0.8135528564453125, 0.8425674438476562, 0.87158203125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 3.0, 4.0, 5.0, 7.0, 8.0, 7.0, 22.0, 29.0, 52.0, 91.0, 107.0, 120.0, 165.0, 132.0, 77.0, 62.0, 39.0, 24.0, 18.0, 7.0, 8.0, 3.0, 7.0, 2.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.905581474304199, -3.803659677505493, -3.701737880706787, -3.59981632232666, -3.497894525527954, -3.395972728729248, -3.294050931930542, -3.192129135131836, -3.090207576751709, -2.988285779953003, -2.886363983154297, -2.78444242477417, -2.682520627975464, -2.580598831176758, -2.4786770343780518, -2.3767552375793457, -2.2748334407806396, -2.1729116439819336, -2.0709898471832275, -1.969068169593811, -1.8671464920043945, -1.7652246952056885, -1.6633028984069824, -1.5613811016082764, -1.4594594240188599, -1.3575376272201538, -1.2556159496307373, -1.1536941528320312, -1.0517723560333252, -0.9498506784439087, -0.8479288816452026, -0.7460071444511414, -0.6440856456756592, -0.5421639084815979, -0.44024214148521423, -0.33832037448883057, -0.2363986372947693, -0.134476900100708, -0.03255510330200195, 0.06936663389205933, 0.1712883710861206, 0.2732101082801819, 0.37513187527656555, 0.4770536422729492, 0.5789753794670105, 0.6808971166610718, 0.7828189134597778, 0.8847406506538391, 0.9866623878479004, 1.0885841846466064, 1.190505862236023, 1.292427659034729, 1.3943493366241455, 1.4962711334228516, 1.5981929302215576, 1.7001147270202637, 1.8020364046096802, 1.9039582014083862, 2.0058798789978027, 2.107801675796509, 2.209723472595215, 2.311645030975342, 2.413567066192627, 2.515488624572754, 2.61741042137146]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 4.0, 1.0, 6.0, 14.0, 23.0, 18.0, 22.0, 28.0, 30.0, 38.0, 45.0, 41.0, 51.0, 57.0, 51.0, 62.0, 59.0, 53.0, 61.0, 51.0, 59.0, 42.0, 31.0, 26.0, 28.0, 26.0, 13.0, 9.0, 14.0, 9.0, 8.0, 8.0, 5.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.178774833679199, -2.117802858352661, -2.056831121444702, -1.9958592653274536, -1.934887409210205, -1.873915433883667, -1.8129435777664185, -1.75197172164917, -1.6909998655319214, -1.6300280094146729, -1.5690561532974243, -1.5080842971801758, -1.4471123218536377, -1.3861405849456787, -1.3251686096191406, -1.264196753501892, -1.2032248973846436, -1.142253041267395, -1.0812811851501465, -1.020309329032898, -0.9593374133110046, -0.8983655571937561, -0.8373936414718628, -0.7764217853546143, -0.7154499292373657, -0.6544780731201172, -0.5935062170028687, -0.5325343012809753, -0.4715624451637268, -0.41059058904647827, -0.34961870312690735, -0.2886468172073364, -0.22767508029937744, -0.1667032092809677, -0.10573133826255798, -0.044759467244148254, 0.016212403774261475, 0.07718425989151001, 0.13815614581108093, 0.19912803173065186, 0.2600998878479004, 0.3210717439651489, 0.38204362988471985, 0.44301551580429077, 0.5039873719215393, 0.5649592280387878, 0.6259311437606812, 0.6869029998779297, 0.7478748559951782, 0.8088467121124268, 0.8698185682296753, 0.9307904839515686, 0.9917623400688171, 1.052734136581421, 1.113706111907959, 1.1746779680252075, 1.235649824142456, 1.2966216802597046, 1.3575935363769531, 1.4185653924942017, 1.4795372486114502, 1.5405092239379883, 1.6014810800552368, 1.6624529361724854, 1.7234247922897339]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 0.0, 2.0, 3.0, 1.0, 2.0, 5.0, 7.0, 13.0, 8.0, 7.0, 12.0, 9.0, 14.0, 22.0, 27.0, 61.0, 150.0, 373.0, 1375.0, 6529.0, 45116.0, 869081.0, 110698.0, 11702.0, 2314.0, 575.0, 206.0, 81.0, 34.0, 27.0, 19.0, 19.0, 9.0, 5.0, 13.0, 4.0, 6.0, 4.0, 5.0, 0.0, 1.0, 7.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.169921875, -2.10546875, -2.041015625, -1.9765625, -1.912109375, -1.84765625, -1.783203125, -1.71875, -1.654296875, -1.58984375, -1.525390625, -1.4609375, -1.396484375, -1.33203125, -1.267578125, -1.203125, -1.138671875, -1.07421875, -1.009765625, -0.9453125, -0.880859375, -0.81640625, -0.751953125, -0.6875, -0.623046875, -0.55859375, -0.494140625, -0.4296875, -0.365234375, -0.30078125, -0.236328125, -0.171875, -0.107421875, -0.04296875, 0.021484375, 0.0859375, 0.150390625, 0.21484375, 0.279296875, 0.34375, 0.408203125, 0.47265625, 0.537109375, 0.6015625, 0.666015625, 0.73046875, 0.794921875, 0.859375, 0.923828125, 0.98828125, 1.052734375, 1.1171875, 1.181640625, 1.24609375, 1.310546875, 1.375, 1.439453125, 1.50390625, 1.568359375, 1.6328125, 1.697265625, 1.76171875, 1.826171875, 1.890625, 1.955078125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 5.0, 10.0, 21.0, 50.0, 69.0, 83.0, 109.0, 147.0, 121.0, 139.0, 106.0, 67.0, 32.0, 20.0, 13.0, 11.0, 0.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6845703125, -1.6005096435546875, -1.516448974609375, -1.4323883056640625, -1.34832763671875, -1.2642669677734375, -1.180206298828125, -1.0961456298828125, -1.0120849609375, -0.9280242919921875, -0.843963623046875, -0.7599029541015625, -0.67584228515625, -0.5917816162109375, -0.507720947265625, -0.4236602783203125, -0.339599609375, -0.2555389404296875, -0.171478271484375, -0.0874176025390625, -0.00335693359375, 0.0807037353515625, 0.164764404296875, 0.2488250732421875, 0.3328857421875, 0.4169464111328125, 0.501007080078125, 0.5850677490234375, 0.66912841796875, 0.7531890869140625, 0.837249755859375, 0.9213104248046875, 1.00537109375, 1.0894317626953125, 1.173492431640625, 1.2575531005859375, 1.34161376953125, 1.4256744384765625, 1.509735107421875, 1.5937957763671875, 1.6778564453125, 1.7619171142578125, 1.845977783203125, 1.9300384521484375, 2.01409912109375, 2.0981597900390625, 2.182220458984375, 2.2662811279296875, 2.350341796875, 2.4344024658203125, 2.518463134765625, 2.6025238037109375, 2.68658447265625, 2.7706451416015625, 2.854705810546875, 2.9387664794921875, 3.0228271484375, 3.1068878173828125, 3.190948486328125, 3.2750091552734375, 3.35906982421875, 3.4431304931640625, 3.527191162109375, 3.6112518310546875, 3.6953125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 6.0, 4.0, 8.0, 6.0, 13.0, 26.0, 33.0, 55.0, 108.0, 194.0, 283.0, 467.0, 888.0, 1692.0, 3450.0, 7705.0, 18884.0, 57623.0, 342602.0, 499653.0, 74893.0, 22619.0, 8974.0, 4054.0, 1952.0, 1006.0, 555.0, 311.0, 178.0, 123.0, 76.0, 48.0, 30.0, 14.0, 12.0, 6.0, 5.0, 5.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51318359375, -0.49554443359375, -0.4779052734375, -0.46026611328125, -0.442626953125, -0.42498779296875, -0.4073486328125, -0.38970947265625, -0.3720703125, -0.35443115234375, -0.3367919921875, -0.31915283203125, -0.301513671875, -0.28387451171875, -0.2662353515625, -0.24859619140625, -0.23095703125, -0.21331787109375, -0.1956787109375, -0.17803955078125, -0.160400390625, -0.14276123046875, -0.1251220703125, -0.10748291015625, -0.08984375, -0.07220458984375, -0.0545654296875, -0.03692626953125, -0.019287109375, -0.00164794921875, 0.0159912109375, 0.03363037109375, 0.05126953125, 0.06890869140625, 0.0865478515625, 0.10418701171875, 0.121826171875, 0.13946533203125, 0.1571044921875, 0.17474365234375, 0.1923828125, 0.21002197265625, 0.2276611328125, 0.24530029296875, 0.262939453125, 0.28057861328125, 0.2982177734375, 0.31585693359375, 0.33349609375, 0.35113525390625, 0.3687744140625, 0.38641357421875, 0.404052734375, 0.42169189453125, 0.4393310546875, 0.45697021484375, 0.474609375, 0.49224853515625, 0.5098876953125, 0.52752685546875, 0.545166015625, 0.56280517578125, 0.5804443359375, 0.59808349609375, 0.61572265625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 5.0, 5.0, 3.0, 14.0, 6.0, 8.0, 17.0, 17.0, 20.0, 15.0, 32.0, 40.0, 28.0, 38.0, 41.0, 46.0, 56.0, 48.0, 59.0, 53.0, 63.0, 52.0, 50.0, 44.0, 32.0, 49.0, 35.0, 20.0, 14.0, 19.0, 16.0, 9.0, 13.0, 12.0, 6.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.8896484375, -1.8306121826171875, -1.771575927734375, -1.7125396728515625, -1.65350341796875, -1.5944671630859375, -1.535430908203125, -1.4763946533203125, -1.4173583984375, -1.3583221435546875, -1.299285888671875, -1.2402496337890625, -1.18121337890625, -1.1221771240234375, -1.063140869140625, -1.0041046142578125, -0.945068359375, -0.8860321044921875, -0.826995849609375, -0.7679595947265625, -0.70892333984375, -0.6498870849609375, -0.590850830078125, -0.5318145751953125, -0.4727783203125, -0.4137420654296875, -0.354705810546875, -0.2956695556640625, -0.23663330078125, -0.1775970458984375, -0.118560791015625, -0.0595245361328125, -0.00048828125, 0.0585479736328125, 0.117584228515625, 0.1766204833984375, 0.23565673828125, 0.2946929931640625, 0.353729248046875, 0.4127655029296875, 0.4718017578125, 0.5308380126953125, 0.589874267578125, 0.6489105224609375, 0.70794677734375, 0.7669830322265625, 0.826019287109375, 0.8850555419921875, 0.944091796875, 1.0031280517578125, 1.062164306640625, 1.1212005615234375, 1.18023681640625, 1.2392730712890625, 1.298309326171875, 1.3573455810546875, 1.4163818359375, 1.4754180908203125, 1.534454345703125, 1.5934906005859375, 1.65252685546875, 1.7115631103515625, 1.770599365234375, 1.8296356201171875, 1.888671875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 3.0, 4.0, 8.0, 8.0, 16.0, 31.0, 37.0, 63.0, 106.0, 156.0, 286.0, 596.0, 1201.0, 2601.0, 7436.0, 25906.0, 168115.0, 743987.0, 73165.0, 15769.0, 5096.0, 1961.0, 868.0, 465.0, 243.0, 163.0, 83.0, 53.0, 39.0, 23.0, 23.0, 15.0, 12.0, 5.0, 4.0, 4.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15478515625, -0.149505615234375, -0.14422607421875, -0.138946533203125, -0.1336669921875, -0.128387451171875, -0.12310791015625, -0.117828369140625, -0.112548828125, -0.107269287109375, -0.10198974609375, -0.096710205078125, -0.0914306640625, -0.086151123046875, -0.08087158203125, -0.075592041015625, -0.0703125, -0.065032958984375, -0.05975341796875, -0.054473876953125, -0.0491943359375, -0.043914794921875, -0.03863525390625, -0.033355712890625, -0.028076171875, -0.022796630859375, -0.01751708984375, -0.012237548828125, -0.0069580078125, -0.001678466796875, 0.00360107421875, 0.008880615234375, 0.01416015625, 0.019439697265625, 0.02471923828125, 0.029998779296875, 0.0352783203125, 0.040557861328125, 0.04583740234375, 0.051116943359375, 0.056396484375, 0.061676025390625, 0.06695556640625, 0.072235107421875, 0.0775146484375, 0.082794189453125, 0.08807373046875, 0.093353271484375, 0.0986328125, 0.103912353515625, 0.10919189453125, 0.114471435546875, 0.1197509765625, 0.125030517578125, 0.13031005859375, 0.135589599609375, 0.140869140625, 0.146148681640625, 0.15142822265625, 0.156707763671875, 0.1619873046875, 0.167266845703125, 0.17254638671875, 0.177825927734375, 0.18310546875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 2.0, 5.0, 6.0, 8.0, 8.0, 9.0, 24.0, 36.0, 54.0, 91.0, 203.0, 250.0, 110.0, 73.0, 39.0, 22.0, 17.0, 13.0, 11.0, 4.0, 4.0, 7.0, 3.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001537799835205078, -0.00014941394329071045, -0.00014504790306091309, -0.00014068186283111572, -0.00013631582260131836, -0.000131949782371521, -0.00012758374214172363, -0.00012321770191192627, -0.0001188516616821289, -0.00011448562145233154, -0.00011011958122253418, -0.00010575354099273682, -0.00010138750076293945, -9.702146053314209e-05, -9.265542030334473e-05, -8.828938007354736e-05, -8.392333984375e-05, -7.955729961395264e-05, -7.519125938415527e-05, -7.082521915435791e-05, -6.645917892456055e-05, -6.209313869476318e-05, -5.772709846496582e-05, -5.336105823516846e-05, -4.8995018005371094e-05, -4.462897777557373e-05, -4.026293754577637e-05, -3.5896897315979004e-05, -3.153085708618164e-05, -2.7164816856384277e-05, -2.2798776626586914e-05, -1.843273639678955e-05, -1.4066696166992188e-05, -9.700655937194824e-06, -5.334615707397461e-06, -9.685754776000977e-07, 3.3974647521972656e-06, 7.763504981994629e-06, 1.2129545211791992e-05, 1.6495585441589355e-05, 2.086162567138672e-05, 2.5227665901184082e-05, 2.9593706130981445e-05, 3.395974636077881e-05, 3.832578659057617e-05, 4.2691826820373535e-05, 4.70578670501709e-05, 5.142390727996826e-05, 5.5789947509765625e-05, 6.015598773956299e-05, 6.452202796936035e-05, 6.888806819915771e-05, 7.325410842895508e-05, 7.762014865875244e-05, 8.19861888885498e-05, 8.635222911834717e-05, 9.071826934814453e-05, 9.50843095779419e-05, 9.945034980773926e-05, 0.00010381639003753662, 0.00010818243026733398, 0.00011254847049713135, 0.00011691451072692871, 0.00012128055095672607, 0.00012564659118652344]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 3.0, 2.0, 9.0, 2.0, 10.0, 17.0, 18.0, 24.0, 41.0, 55.0, 102.0, 195.0, 371.0, 846.0, 1875.0, 4724.0, 14013.0, 60315.0, 637229.0, 279206.0, 33879.0, 9400.0, 3490.0, 1362.0, 650.0, 323.0, 156.0, 74.0, 66.0, 32.0, 16.0, 18.0, 12.0, 8.0, 7.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1912841796875, -0.1859455108642578, -0.18060684204101562, -0.17526817321777344, -0.16992950439453125, -0.16459083557128906, -0.15925216674804688, -0.1539134979248047, -0.1485748291015625, -0.1432361602783203, -0.13789749145507812, -0.13255882263183594, -0.12722015380859375, -0.12188148498535156, -0.11654281616210938, -0.11120414733886719, -0.105865478515625, -0.10052680969238281, -0.09518814086914062, -0.08984947204589844, -0.08451080322265625, -0.07917213439941406, -0.07383346557617188, -0.06849479675292969, -0.0631561279296875, -0.05781745910644531, -0.052478790283203125, -0.04714012145996094, -0.04180145263671875, -0.03646278381347656, -0.031124114990234375, -0.025785446166992188, -0.02044677734375, -0.015108108520507812, -0.009769439697265625, -0.0044307708740234375, 0.00090789794921875, 0.0062465667724609375, 0.011585235595703125, 0.016923904418945312, 0.0222625732421875, 0.027601242065429688, 0.032939910888671875, 0.03827857971191406, 0.04361724853515625, 0.04895591735839844, 0.054294586181640625, 0.05963325500488281, 0.064971923828125, 0.07031059265136719, 0.07564926147460938, 0.08098793029785156, 0.08632659912109375, 0.09166526794433594, 0.09700393676757812, 0.10234260559082031, 0.1076812744140625, 0.11301994323730469, 0.11835861206054688, 0.12369728088378906, 0.12903594970703125, 0.13437461853027344, 0.13971328735351562, 0.1450519561767578, 0.150390625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 4.0, 6.0, 1.0, 7.0, 10.0, 5.0, 20.0, 24.0, 41.0, 36.0, 57.0, 67.0, 70.0, 116.0, 144.0, 95.0, 60.0, 61.0, 37.0, 29.0, 18.0, 17.0, 15.0, 9.0, 7.0, 8.0, 7.0, 5.0, 5.0, 4.0, 6.0, 0.0, 0.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0290069580078125, -0.028013944625854492, -0.027020931243896484, -0.026027917861938477, -0.02503490447998047, -0.02404189109802246, -0.023048877716064453, -0.022055864334106445, -0.021062850952148438, -0.02006983757019043, -0.019076824188232422, -0.018083810806274414, -0.017090797424316406, -0.0160977840423584, -0.01510477066040039, -0.014111757278442383, -0.013118743896484375, -0.012125730514526367, -0.01113271713256836, -0.010139703750610352, -0.009146690368652344, -0.008153676986694336, -0.007160663604736328, -0.00616765022277832, -0.0051746368408203125, -0.004181623458862305, -0.003188610076904297, -0.002195596694946289, -0.0012025833129882812, -0.00020956993103027344, 0.0007834434509277344, 0.0017764568328857422, 0.00276947021484375, 0.003762483596801758, 0.004755496978759766, 0.0057485103607177734, 0.006741523742675781, 0.007734537124633789, 0.008727550506591797, 0.009720563888549805, 0.010713577270507812, 0.01170659065246582, 0.012699604034423828, 0.013692617416381836, 0.014685630798339844, 0.01567864418029785, 0.01667165756225586, 0.017664670944213867, 0.018657684326171875, 0.019650697708129883, 0.02064371109008789, 0.0216367244720459, 0.022629737854003906, 0.023622751235961914, 0.024615764617919922, 0.02560877799987793, 0.026601791381835938, 0.027594804763793945, 0.028587818145751953, 0.02958083152770996, 0.03057384490966797, 0.03156685829162598, 0.032559871673583984, 0.03355288505554199, 0.0345458984375]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 8.0, 16.0, 23.0, 63.0, 137.0, 276.0, 243.0, 123.0, 58.0, 29.0, 13.0, 6.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.240875244140625, -4.134738445281982, -4.02860164642334, -3.922464609146118, -3.8163275718688965, -3.710190773010254, -3.6040539741516113, -3.4979169368743896, -3.391779899597168, -3.2856431007385254, -3.1795060634613037, -3.073369264602661, -2.9672322273254395, -2.861095428466797, -2.7549586296081543, -2.6488215923309326, -2.54268479347229, -2.4365479946136475, -2.330410957336426, -2.224274158477783, -2.1181371212005615, -2.012000322341919, -1.9058634042739868, -1.7997264862060547, -1.6935895681381226, -1.5874526500701904, -1.4813157320022583, -1.3751788139343262, -1.2690420150756836, -1.162904977798462, -1.0567681789398193, -0.9506312608718872, -0.8444943428039551, -0.738357424736023, -0.6322205066680908, -0.5260836482048035, -0.41994673013687134, -0.3138098120689392, -0.20767295360565186, -0.10153603553771973, 0.004600882530212402, 0.11073778569698334, 0.21687468886375427, 0.323011577129364, 0.42914849519729614, 0.5352854132652283, 0.6414222717285156, 0.7475591897964478, 0.8536961078643799, 0.959833025932312, 1.0659699440002441, 1.1721067428588867, 1.2782437801361084, 1.384380578994751, 1.490517497062683, 1.5966544151306152, 1.7027913331985474, 1.8089282512664795, 1.9150651693344116, 2.0212020874023438, 2.1273388862609863, 2.233475923538208, 2.3396127223968506, 2.4457497596740723, 2.551886558532715]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 6.0, 12.0, 14.0, 47.0, 55.0, 80.0, 107.0, 117.0, 125.0, 130.0, 111.0, 79.0, 50.0, 28.0, 20.0, 14.0, 10.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5628656148910522, -1.4866338968276978, -1.4104021787643433, -1.3341704607009888, -1.2579387426376343, -1.1817070245742798, -1.1054753065109253, -1.0292435884475708, -0.9530118703842163, -0.8767801523208618, -0.8005484342575073, -0.7243167161941528, -0.6480849981307983, -0.5718532800674438, -0.49562156200408936, -0.41938984394073486, -0.34315812587738037, -0.2669264078140259, -0.1906946897506714, -0.1144629716873169, -0.0382312536239624, 0.03800046443939209, 0.11423218250274658, 0.19046390056610107, 0.26669561862945557, 0.34292733669281006, 0.41915905475616455, 0.49539077281951904, 0.5716224908828735, 0.647854208946228, 0.7240859270095825, 0.800317645072937, 0.876549243927002, 0.9527809619903564, 1.029012680053711, 1.1052443981170654, 1.18147611618042, 1.2577078342437744, 1.333939552307129, 1.4101712703704834, 1.486402988433838, 1.5626347064971924, 1.6388664245605469, 1.7150981426239014, 1.7913298606872559, 1.8675615787506104, 1.9437932968139648, 2.0200250148773193, 2.096256732940674, 2.1724884510040283, 2.248720169067383, 2.3249518871307373, 2.401183605194092, 2.4774153232574463, 2.553647041320801, 2.6298787593841553, 2.7061104774475098, 2.7823421955108643, 2.8585739135742188, 2.9348056316375732, 3.0110373497009277, 3.0872690677642822, 3.1635007858276367, 3.239732503890991, 3.3159642219543457]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 2.0, 3.0, 2.0, 5.0, 3.0, 2.0, 1.0, 0.0, 5.0, 8.0, 16.0, 32.0, 118.0, 469.0, 1653.0, 7448.0, 112744.0, 908152.0, 14005.0, 2856.0, 703.0, 209.0, 54.0, 16.0, 14.0, 8.0, 8.0, 3.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9453125, -4.7916259765625, -4.637939453125, -4.4842529296875, -4.33056640625, -4.1768798828125, -4.023193359375, -3.8695068359375, -3.7158203125, -3.5621337890625, -3.408447265625, -3.2547607421875, -3.10107421875, -2.9473876953125, -2.793701171875, -2.6400146484375, -2.486328125, -2.3326416015625, -2.178955078125, -2.0252685546875, -1.87158203125, -1.7178955078125, -1.564208984375, -1.4105224609375, -1.2568359375, -1.1031494140625, -0.949462890625, -0.7957763671875, -0.64208984375, -0.4884033203125, -0.334716796875, -0.1810302734375, -0.02734375, 0.1263427734375, 0.280029296875, 0.4337158203125, 0.58740234375, 0.7410888671875, 0.894775390625, 1.0484619140625, 1.2021484375, 1.3558349609375, 1.509521484375, 1.6632080078125, 1.81689453125, 1.9705810546875, 2.124267578125, 2.2779541015625, 2.431640625, 2.5853271484375, 2.739013671875, 2.8927001953125, 3.04638671875, 3.2000732421875, 3.353759765625, 3.5074462890625, 3.6611328125, 3.8148193359375, 3.968505859375, 4.1221923828125, 4.27587890625, 4.4295654296875, 4.583251953125, 4.7369384765625, 4.890625]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [7.0, 4.0, 6.0, 9.0, 8.0, 9.0, 29.0, 22.0, 44.0, 58.0, 58.0, 78.0, 90.0, 94.0, 94.0, 88.0, 64.0, 73.0, 55.0, 37.0, 28.0, 19.0, 14.0, 12.0, 10.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.650390625, -1.532684326171875, -1.41497802734375, -1.297271728515625, -1.1795654296875, -1.061859130859375, -0.94415283203125, -0.826446533203125, -0.708740234375, -0.591033935546875, -0.47332763671875, -0.355621337890625, -0.2379150390625, -0.120208740234375, -0.00250244140625, 0.115203857421875, 0.23291015625, 0.350616455078125, 0.46832275390625, 0.586029052734375, 0.7037353515625, 0.821441650390625, 0.93914794921875, 1.056854248046875, 1.174560546875, 1.292266845703125, 1.40997314453125, 1.527679443359375, 1.6453857421875, 1.763092041015625, 1.88079833984375, 1.998504638671875, 2.1162109375, 2.233917236328125, 2.35162353515625, 2.469329833984375, 2.5870361328125, 2.704742431640625, 2.82244873046875, 2.940155029296875, 3.057861328125, 3.175567626953125, 3.29327392578125, 3.410980224609375, 3.5286865234375, 3.646392822265625, 3.76409912109375, 3.881805419921875, 3.99951171875, 4.117218017578125, 4.23492431640625, 4.352630615234375, 4.4703369140625, 4.588043212890625, 4.70574951171875, 4.823455810546875, 4.941162109375, 5.058868408203125, 5.17657470703125, 5.294281005859375, 5.4119873046875, 5.529693603515625, 5.64739990234375, 5.765106201171875, 5.8828125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 7.0, 1.0, 5.0, 2.0, 2.0, 6.0, 6.0, 8.0, 6.0, 9.0, 13.0, 17.0, 11.0, 20.0, 27.0, 27.0, 32.0, 46.0, 41.0, 55.0, 71.0, 189.0, 754.0, 11338.0, 1022694.0, 11897.0, 708.0, 140.0, 76.0, 38.0, 46.0, 38.0, 33.0, 20.0, 30.0, 29.0, 12.0, 16.0, 15.0, 15.0, 12.0, 11.0, 13.0, 4.0, 9.0, 4.0, 2.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.1171875, -6.8839111328125, -6.650634765625, -6.4173583984375, -6.18408203125, -5.9508056640625, -5.717529296875, -5.4842529296875, -5.2509765625, -5.0177001953125, -4.784423828125, -4.5511474609375, -4.31787109375, -4.0845947265625, -3.851318359375, -3.6180419921875, -3.384765625, -3.1514892578125, -2.918212890625, -2.6849365234375, -2.45166015625, -2.2183837890625, -1.985107421875, -1.7518310546875, -1.5185546875, -1.2852783203125, -1.052001953125, -0.8187255859375, -0.58544921875, -0.3521728515625, -0.118896484375, 0.1143798828125, 0.34765625, 0.5809326171875, 0.814208984375, 1.0474853515625, 1.28076171875, 1.5140380859375, 1.747314453125, 1.9805908203125, 2.2138671875, 2.4471435546875, 2.680419921875, 2.9136962890625, 3.14697265625, 3.3802490234375, 3.613525390625, 3.8468017578125, 4.080078125, 4.3133544921875, 4.546630859375, 4.7799072265625, 5.01318359375, 5.2464599609375, 5.479736328125, 5.7130126953125, 5.9462890625, 6.1795654296875, 6.412841796875, 6.6461181640625, 6.87939453125, 7.1126708984375, 7.345947265625, 7.5792236328125, 7.8125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 2.0, 2.0, 6.0, 2.0, 2.0, 8.0, 7.0, 1.0, 10.0, 4.0, 9.0, 14.0, 18.0, 24.0, 15.0, 17.0, 16.0, 22.0, 44.0, 35.0, 25.0, 41.0, 34.0, 32.0, 32.0, 41.0, 39.0, 50.0, 40.0, 35.0, 37.0, 37.0, 28.0, 34.0, 29.0, 22.0, 29.0, 29.0, 17.0, 15.0, 15.0, 14.0, 9.0, 14.0, 16.0, 11.0, 5.0, 8.0, 5.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.615234375, -1.5607757568359375, -1.506317138671875, -1.4518585205078125, -1.39739990234375, -1.3429412841796875, -1.288482666015625, -1.2340240478515625, -1.1795654296875, -1.1251068115234375, -1.070648193359375, -1.0161895751953125, -0.96173095703125, -0.9072723388671875, -0.852813720703125, -0.7983551025390625, -0.743896484375, -0.6894378662109375, -0.634979248046875, -0.5805206298828125, -0.52606201171875, -0.4716033935546875, -0.417144775390625, -0.3626861572265625, -0.3082275390625, -0.2537689208984375, -0.199310302734375, -0.1448516845703125, -0.09039306640625, -0.0359344482421875, 0.018524169921875, 0.0729827880859375, 0.12744140625, 0.1819000244140625, 0.236358642578125, 0.2908172607421875, 0.34527587890625, 0.3997344970703125, 0.454193115234375, 0.5086517333984375, 0.5631103515625, 0.6175689697265625, 0.672027587890625, 0.7264862060546875, 0.78094482421875, 0.8354034423828125, 0.889862060546875, 0.9443206787109375, 0.998779296875, 1.0532379150390625, 1.107696533203125, 1.1621551513671875, 1.21661376953125, 1.2710723876953125, 1.325531005859375, 1.3799896240234375, 1.4344482421875, 1.4889068603515625, 1.543365478515625, 1.5978240966796875, 1.65228271484375, 1.7067413330078125, 1.761199951171875, 1.8156585693359375, 1.8701171875]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 6.0, 2.0, 4.0, 10.0, 12.0, 19.0, 24.0, 26.0, 36.0, 52.0, 58.0, 134.0, 245.0, 435.0, 959.0, 2551.0, 8551.0, 53586.0, 910460.0, 57741.0, 8911.0, 2646.0, 1007.0, 468.0, 220.0, 132.0, 74.0, 46.0, 31.0, 32.0, 17.0, 14.0, 12.0, 5.0, 6.0, 13.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0], "bins": [-0.6025390625, -0.5860366821289062, -0.5695343017578125, -0.5530319213867188, -0.536529541015625, -0.5200271606445312, -0.5035247802734375, -0.48702239990234375, -0.47052001953125, -0.45401763916015625, -0.4375152587890625, -0.42101287841796875, -0.404510498046875, -0.38800811767578125, -0.3715057373046875, -0.35500335693359375, -0.3385009765625, -0.32199859619140625, -0.3054962158203125, -0.28899383544921875, -0.272491455078125, -0.25598907470703125, -0.2394866943359375, -0.22298431396484375, -0.20648193359375, -0.18997955322265625, -0.1734771728515625, -0.15697479248046875, -0.140472412109375, -0.12397003173828125, -0.1074676513671875, -0.09096527099609375, -0.074462890625, -0.05796051025390625, -0.0414581298828125, -0.02495574951171875, -0.008453369140625, 0.00804901123046875, 0.0245513916015625, 0.04105377197265625, 0.05755615234375, 0.07405853271484375, 0.0905609130859375, 0.10706329345703125, 0.123565673828125, 0.14006805419921875, 0.1565704345703125, 0.17307281494140625, 0.1895751953125, 0.20607757568359375, 0.2225799560546875, 0.23908233642578125, 0.255584716796875, 0.27208709716796875, 0.2885894775390625, 0.30509185791015625, 0.32159423828125, 0.33809661865234375, 0.3545989990234375, 0.37110137939453125, 0.387603759765625, 0.40410614013671875, 0.4206085205078125, 0.43711090087890625, 0.45361328125]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 8.0, 6.0, 8.0, 13.0, 12.0, 15.0, 21.0, 44.0, 95.0, 194.0, 307.0, 100.0, 63.0, 29.0, 14.0, 18.0, 17.0, 7.0, 7.0, 6.0, 1.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.296966552734375e-05, -8.079409599304199e-05, -7.861852645874023e-05, -7.644295692443848e-05, -7.426738739013672e-05, -7.209181785583496e-05, -6.99162483215332e-05, -6.774067878723145e-05, -6.556510925292969e-05, -6.338953971862793e-05, -6.121397018432617e-05, -5.9038400650024414e-05, -5.6862831115722656e-05, -5.46872615814209e-05, -5.251169204711914e-05, -5.033612251281738e-05, -4.8160552978515625e-05, -4.598498344421387e-05, -4.380941390991211e-05, -4.163384437561035e-05, -3.9458274841308594e-05, -3.7282705307006836e-05, -3.510713577270508e-05, -3.293156623840332e-05, -3.075599670410156e-05, -2.8580427169799805e-05, -2.6404857635498047e-05, -2.422928810119629e-05, -2.205371856689453e-05, -1.9878149032592773e-05, -1.7702579498291016e-05, -1.5527009963989258e-05, -1.33514404296875e-05, -1.1175870895385742e-05, -9.000301361083984e-06, -6.8247318267822266e-06, -4.649162292480469e-06, -2.473592758178711e-06, -2.980232238769531e-07, 1.8775463104248047e-06, 4.0531158447265625e-06, 6.22868537902832e-06, 8.404254913330078e-06, 1.0579824447631836e-05, 1.2755393981933594e-05, 1.4930963516235352e-05, 1.710653305053711e-05, 1.9282102584838867e-05, 2.1457672119140625e-05, 2.3633241653442383e-05, 2.580881118774414e-05, 2.79843807220459e-05, 3.0159950256347656e-05, 3.2335519790649414e-05, 3.451108932495117e-05, 3.668665885925293e-05, 3.886222839355469e-05, 4.1037797927856445e-05, 4.32133674621582e-05, 4.538893699645996e-05, 4.756450653076172e-05, 4.9740076065063477e-05, 5.1915645599365234e-05, 5.409121513366699e-05, 5.626678466796875e-05]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 2.0, 3.0, 13.0, 10.0, 10.0, 22.0, 24.0, 46.0, 77.0, 175.0, 375.0, 972.0, 3599.0, 20136.0, 871043.0, 138548.0, 10056.0, 2186.0, 690.0, 271.0, 129.0, 64.0, 41.0, 16.0, 9.0, 8.0, 9.0, 7.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.63671875, -0.6153640747070312, -0.5940093994140625, -0.5726547241210938, -0.551300048828125, -0.5299453735351562, -0.5085906982421875, -0.48723602294921875, -0.46588134765625, -0.44452667236328125, -0.4231719970703125, -0.40181732177734375, -0.380462646484375, -0.35910797119140625, -0.3377532958984375, -0.31639862060546875, -0.2950439453125, -0.27368927001953125, -0.2523345947265625, -0.23097991943359375, -0.209625244140625, -0.18827056884765625, -0.1669158935546875, -0.14556121826171875, -0.12420654296875, -0.10285186767578125, -0.0814971923828125, -0.06014251708984375, -0.038787841796875, -0.01743316650390625, 0.0039215087890625, 0.02527618408203125, 0.046630859375, 0.06798553466796875, 0.0893402099609375, 0.11069488525390625, 0.132049560546875, 0.15340423583984375, 0.1747589111328125, 0.19611358642578125, 0.21746826171875, 0.23882293701171875, 0.2601776123046875, 0.28153228759765625, 0.302886962890625, 0.32424163818359375, 0.3455963134765625, 0.36695098876953125, 0.3883056640625, 0.40966033935546875, 0.4310150146484375, 0.45236968994140625, 0.473724365234375, 0.49507904052734375, 0.5164337158203125, 0.5377883911132812, 0.55914306640625, 0.5804977416992188, 0.6018524169921875, 0.6232070922851562, 0.644561767578125, 0.6659164428710938, 0.6872711181640625, 0.7086257934570312, 0.72998046875]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 2.0, 2.0, 3.0, 3.0, 7.0, 6.0, 18.0, 15.0, 18.0, 42.0, 75.0, 156.0, 255.0, 138.0, 76.0, 44.0, 30.0, 22.0, 26.0, 13.0, 7.0, 7.0, 6.0, 6.0, 8.0, 3.0, 1.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2115478515625, -0.2054290771484375, -0.199310302734375, -0.1931915283203125, -0.18707275390625, -0.1809539794921875, -0.174835205078125, -0.1687164306640625, -0.16259765625, -0.1564788818359375, -0.150360107421875, -0.1442413330078125, -0.13812255859375, -0.1320037841796875, -0.125885009765625, -0.1197662353515625, -0.1136474609375, -0.1075286865234375, -0.101409912109375, -0.0952911376953125, -0.08917236328125, -0.0830535888671875, -0.076934814453125, -0.0708160400390625, -0.064697265625, -0.0585784912109375, -0.052459716796875, -0.0463409423828125, -0.04022216796875, -0.0341033935546875, -0.027984619140625, -0.0218658447265625, -0.0157470703125, -0.0096282958984375, -0.003509521484375, 0.0026092529296875, 0.00872802734375, 0.0148468017578125, 0.020965576171875, 0.0270843505859375, 0.033203125, 0.0393218994140625, 0.045440673828125, 0.0515594482421875, 0.05767822265625, 0.0637969970703125, 0.069915771484375, 0.0760345458984375, 0.0821533203125, 0.0882720947265625, 0.094390869140625, 0.1005096435546875, 0.10662841796875, 0.1127471923828125, 0.118865966796875, 0.1249847412109375, 0.131103515625, 0.1372222900390625, 0.143341064453125, 0.1494598388671875, 0.15557861328125, 0.1616973876953125, 0.167816162109375, 0.1739349365234375, 0.1800537109375]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 7.0, 9.0, 16.0, 13.0, 30.0, 45.0, 75.0, 168.0, 215.0, 163.0, 91.0, 64.0, 42.0, 20.0, 11.0, 9.0, 9.0, 8.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.364039421081543, -5.232263565063477, -5.10048770904541, -4.9687113761901855, -4.836935520172119, -4.705159664154053, -4.573383808135986, -4.44160795211792, -4.309831619262695, -4.178055763244629, -4.0462799072265625, -3.914503812789917, -3.7827277183532715, -3.650951862335205, -3.5191760063171387, -3.3874001502990723, -3.255624294281006, -3.1238484382629395, -2.992072343826294, -2.8602964878082275, -2.728520393371582, -2.5967445373535156, -2.464968681335449, -2.333192825317383, -2.2014167308807373, -2.069640874862671, -1.9378647804260254, -1.806088924407959, -1.674312949180603, -1.542536973953247, -1.4107611179351807, -1.2789851427078247, -1.1472094058990479, -1.015433430671692, -0.8836575150489807, -0.7518815994262695, -0.6201056241989136, -0.4883296489715576, -0.35655373334884644, -0.22477781772613525, -0.0930018424987793, 0.03877410292625427, 0.17055004835128784, 0.3023259937763214, 0.434101939201355, 0.5658779144287109, 0.6976538300514221, 0.8294297456741333, 0.9612057209014893, 1.0929816961288452, 1.2247576713562012, 1.3565335273742676, 1.4883095026016235, 1.6200854778289795, 1.751861333847046, 1.8836373090744019, 2.015413284301758, 2.147189140319824, 2.2789652347564697, 2.410741090774536, 2.5425171852111816, 2.674293041229248, 2.8060688972473145, 2.937844753265381, 3.0696208477020264]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 7.0, 3.0, 5.0, 4.0, 8.0, 14.0, 14.0, 16.0, 26.0, 32.0, 33.0, 40.0, 45.0, 51.0, 50.0, 50.0, 64.0, 67.0, 56.0, 45.0, 65.0, 50.0, 47.0, 35.0, 41.0, 33.0, 25.0, 24.0, 18.0, 11.0, 8.0, 5.0, 7.0, 4.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.515451192855835, -2.3930253982543945, -2.270599842071533, -2.148174285888672, -2.0257484912872314, -1.9033228158950806, -1.7808971405029297, -1.6584714651107788, -1.536045789718628, -1.413620114326477, -1.2911944389343262, -1.1687687635421753, -1.0463430881500244, -0.9239174127578735, -0.8014917373657227, -0.6790660619735718, -0.5566403865814209, -0.43421471118927, -0.31178903579711914, -0.18936336040496826, -0.06693768501281738, 0.055487990379333496, 0.17791366577148438, 0.30033934116363525, 0.42276501655578613, 0.545190691947937, 0.6676163673400879, 0.7900420427322388, 0.9124677181243896, 1.0348933935165405, 1.1573190689086914, 1.2797447443008423, 1.402170181274414, 1.524595856666565, 1.6470215320587158, 1.7694472074508667, 1.8918728828430176, 2.014298439025879, 2.1367242336273193, 2.2591500282287598, 2.381575584411621, 2.5040011405944824, 2.626426935195923, 2.7488527297973633, 2.8712782859802246, 2.993703842163086, 3.1161296367645264, 3.238555431365967, 3.360980987548828, 3.4834065437316895, 3.60583233833313, 3.7282581329345703, 3.8506836891174316, 3.973109245300293, 4.0955352783203125, 4.217960834503174, 4.340386390686035, 4.4628119468688965, 4.585237503051758, 4.707663536071777, 4.830089092254639, 4.9525146484375, 5.0749406814575195, 5.197366237640381, 5.319791793823242]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 5.0, 1.0, 5.0, 7.0, 14.0, 10.0, 14.0, 8.0, 16.0, 12.0, 18.0, 33.0, 42.0, 39.0, 79.0, 114.0, 241.0, 461.0, 1210.0, 5910.0, 2078111.0, 2099369.0, 6270.0, 1184.0, 467.0, 220.0, 143.0, 78.0, 41.0, 32.0, 25.0, 19.0, 23.0, 11.0, 10.0, 3.0, 2.0, 10.0, 3.0, 6.0, 5.0, 4.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.359375, -6.14739990234375, -5.9354248046875, -5.72344970703125, -5.511474609375, -5.29949951171875, -5.0875244140625, -4.87554931640625, -4.66357421875, -4.45159912109375, -4.2396240234375, -4.02764892578125, -3.815673828125, -3.60369873046875, -3.3917236328125, -3.17974853515625, -2.9677734375, -2.75579833984375, -2.5438232421875, -2.33184814453125, -2.119873046875, -1.90789794921875, -1.6959228515625, -1.48394775390625, -1.27197265625, -1.05999755859375, -0.8480224609375, -0.63604736328125, -0.424072265625, -0.21209716796875, -0.0001220703125, 0.21185302734375, 0.423828125, 0.63580322265625, 0.8477783203125, 1.05975341796875, 1.271728515625, 1.48370361328125, 1.6956787109375, 1.90765380859375, 2.11962890625, 2.33160400390625, 2.5435791015625, 2.75555419921875, 2.967529296875, 3.17950439453125, 3.3914794921875, 3.60345458984375, 3.8154296875, 4.02740478515625, 4.2393798828125, 4.45135498046875, 4.663330078125, 4.87530517578125, 5.0872802734375, 5.29925537109375, 5.51123046875, 5.72320556640625, 5.9351806640625, 6.14715576171875, 6.359130859375, 6.57110595703125, 6.7830810546875, 6.99505615234375, 7.20703125]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 5.0, 11.0, 8.0, 16.0, 16.0, 18.0, 28.0, 25.0, 41.0, 40.0, 49.0, 53.0, 63.0, 68.0, 68.0, 57.0, 60.0, 64.0, 57.0, 54.0, 34.0, 38.0, 27.0, 23.0, 20.0, 12.0, 11.0, 10.0, 11.0, 6.0, 5.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.880859375, -1.8299560546875, -1.779052734375, -1.7281494140625, -1.67724609375, -1.6263427734375, -1.575439453125, -1.5245361328125, -1.4736328125, -1.4227294921875, -1.371826171875, -1.3209228515625, -1.27001953125, -1.2191162109375, -1.168212890625, -1.1173095703125, -1.06640625, -1.0155029296875, -0.964599609375, -0.9136962890625, -0.86279296875, -0.8118896484375, -0.760986328125, -0.7100830078125, -0.6591796875, -0.6082763671875, -0.557373046875, -0.5064697265625, -0.45556640625, -0.4046630859375, -0.353759765625, -0.3028564453125, -0.251953125, -0.2010498046875, -0.150146484375, -0.0992431640625, -0.04833984375, 0.0025634765625, 0.053466796875, 0.1043701171875, 0.1552734375, 0.2061767578125, 0.257080078125, 0.3079833984375, 0.35888671875, 0.4097900390625, 0.460693359375, 0.5115966796875, 0.5625, 0.6134033203125, 0.664306640625, 0.7152099609375, 0.76611328125, 0.8170166015625, 0.867919921875, 0.9188232421875, 0.9697265625, 1.0206298828125, 1.071533203125, 1.1224365234375, 1.17333984375, 1.2242431640625, 1.275146484375, 1.3260498046875, 1.376953125]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 7.0, 6.0, 9.0, 14.0, 20.0, 66.0, 208.0, 1175.0, 3583173.0, 608237.0, 991.0, 192.0, 71.0, 39.0, 27.0, 9.0, 10.0, 5.0, 8.0, 3.0, 1.0, 1.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.3515625, -13.9027099609375, -13.453857421875, -13.0050048828125, -12.55615234375, -12.1072998046875, -11.658447265625, -11.2095947265625, -10.7607421875, -10.3118896484375, -9.863037109375, -9.4141845703125, -8.96533203125, -8.5164794921875, -8.067626953125, -7.6187744140625, -7.169921875, -6.7210693359375, -6.272216796875, -5.8233642578125, -5.37451171875, -4.9256591796875, -4.476806640625, -4.0279541015625, -3.5791015625, -3.1302490234375, -2.681396484375, -2.2325439453125, -1.78369140625, -1.3348388671875, -0.885986328125, -0.4371337890625, 0.01171875, 0.4605712890625, 0.909423828125, 1.3582763671875, 1.80712890625, 2.2559814453125, 2.704833984375, 3.1536865234375, 3.6025390625, 4.0513916015625, 4.500244140625, 4.9490966796875, 5.39794921875, 5.8468017578125, 6.295654296875, 6.7445068359375, 7.193359375, 7.6422119140625, 8.091064453125, 8.5399169921875, 8.98876953125, 9.4376220703125, 9.886474609375, 10.3353271484375, 10.7841796875, 11.2330322265625, 11.681884765625, 12.1307373046875, 12.57958984375, 13.0284423828125, 13.477294921875, 13.9261474609375, 14.375]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 7.0, 12.0, 23.0, 36.0, 74.0, 260.0, 1573.0, 1606.0, 321.0, 86.0, 35.0, 15.0, 15.0, 6.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.376953125, -1.3364715576171875, -1.295989990234375, -1.2555084228515625, -1.21502685546875, -1.1745452880859375, -1.134063720703125, -1.0935821533203125, -1.0531005859375, -1.0126190185546875, -0.972137451171875, -0.9316558837890625, -0.89117431640625, -0.8506927490234375, -0.810211181640625, -0.7697296142578125, -0.729248046875, -0.6887664794921875, -0.648284912109375, -0.6078033447265625, -0.56732177734375, -0.5268402099609375, -0.486358642578125, -0.4458770751953125, -0.4053955078125, -0.3649139404296875, -0.324432373046875, -0.2839508056640625, -0.24346923828125, -0.2029876708984375, -0.162506103515625, -0.1220245361328125, -0.08154296875, -0.0410614013671875, -0.000579833984375, 0.0399017333984375, 0.08038330078125, 0.1208648681640625, 0.161346435546875, 0.2018280029296875, 0.2423095703125, 0.2827911376953125, 0.323272705078125, 0.3637542724609375, 0.40423583984375, 0.4447174072265625, 0.485198974609375, 0.5256805419921875, 0.566162109375, 0.6066436767578125, 0.647125244140625, 0.6876068115234375, 0.72808837890625, 0.7685699462890625, 0.809051513671875, 0.8495330810546875, 0.8900146484375, 0.9304962158203125, 0.970977783203125, 1.0114593505859375, 1.05194091796875, 1.0924224853515625, 1.132904052734375, 1.1733856201171875, 1.2138671875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 6.0, 2.0, 3.0, 10.0, 17.0, 24.0, 49.0, 77.0, 128.0, 197.0, 177.0, 124.0, 72.0, 48.0, 25.0, 17.0, 13.0, 3.0, 6.0, 8.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.4512486457824707, -3.3520452976226807, -3.2528417110443115, -3.1536383628845215, -3.0544350147247314, -2.9552314281463623, -2.8560280799865723, -2.756824493408203, -2.657621145248413, -2.558417797088623, -2.459214210510254, -2.360010862350464, -2.260807514190674, -2.1616039276123047, -2.0624005794525146, -1.963197112083435, -1.863993763923645, -1.7647902965545654, -1.6655869483947754, -1.5663834810256958, -1.4671800136566162, -1.3679766654968262, -1.2687731981277466, -1.169569730758667, -1.070366382598877, -0.9711629748344421, -0.8719595074653625, -0.7727560997009277, -0.6735526323318481, -0.5743492245674133, -0.4751458168029785, -0.3759423494338989, -0.27673888206481934, -0.17753544449806213, -0.07833202183246613, 0.020871400833129883, 0.12007483839988708, 0.2192782759666443, 0.3184816837310791, 0.4176851511001587, 0.5168885588645935, 0.6160919666290283, 0.7152954339981079, 0.8144988417625427, 0.9137022495269775, 1.0129057168960571, 1.1121091842651367, 1.2113125324249268, 1.3105159997940063, 1.409719467163086, 1.508922815322876, 1.6081262826919556, 1.7073297500610352, 1.8065330982208252, 1.9057365655899048, 2.0049400329589844, 2.1041433811187744, 2.2033467292785645, 2.3025503158569336, 2.4017536640167236, 2.5009570121765137, 2.600160598754883, 2.699363946914673, 2.798567295074463, 2.897770881652832]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 2.0, 5.0, 3.0, 5.0, 9.0, 16.0, 16.0, 19.0, 33.0, 32.0, 32.0, 52.0, 46.0, 42.0, 55.0, 58.0, 61.0, 53.0, 58.0, 61.0, 50.0, 43.0, 53.0, 45.0, 32.0, 25.0, 21.0, 24.0, 20.0, 8.0, 11.0, 5.0, 5.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7910429239273071, -1.7389572858810425, -1.6868716478347778, -1.6347860097885132, -1.5827003717422485, -1.5306147336959839, -1.4785289764404297, -1.426443338394165, -1.3743577003479004, -1.3222720623016357, -1.270186424255371, -1.2181007862091064, -1.1660151481628418, -1.1139295101165771, -1.0618438720703125, -1.0097582340240479, -0.9576725959777832, -0.9055869579315186, -0.8535013198852539, -0.8014156818389893, -0.7493300437927246, -0.69724440574646, -0.6451587080955505, -0.5930730700492859, -0.5409874320030212, -0.4889017939567566, -0.43681615591049194, -0.3847304880619049, -0.33264485001564026, -0.2805592119693756, -0.22847354412078857, -0.17638790607452393, -0.12430238723754883, -0.07221674174070358, -0.020131096243858337, 0.031954556703567505, 0.08404019474983215, 0.1361258327960968, 0.18821150064468384, 0.2402971386909485, 0.29238277673721313, 0.3444684147834778, 0.39655405282974243, 0.44863972067832947, 0.5007253885269165, 0.5528110265731812, 0.6048966646194458, 0.6569823026657104, 0.7090679407119751, 0.7611535787582397, 0.8132392168045044, 0.865324854850769, 0.9174104928970337, 0.9694961309432983, 1.0215818881988525, 1.0736675262451172, 1.1257531642913818, 1.1778388023376465, 1.2299244403839111, 1.2820100784301758, 1.3340957164764404, 1.386181354522705, 1.4382669925689697, 1.4903526306152344, 1.542438268661499]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 7.0, 5.0, 6.0, 7.0, 16.0, 17.0, 34.0, 64.0, 142.0, 350.0, 865.0, 2737.0, 10385.0, 70445.0, 909373.0, 42752.0, 7928.0, 2161.0, 718.0, 278.0, 126.0, 61.0, 30.0, 13.0, 10.0, 4.0, 6.0, 4.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.7236328125, -1.6762847900390625, -1.628936767578125, -1.5815887451171875, -1.53424072265625, -1.4868927001953125, -1.439544677734375, -1.3921966552734375, -1.3448486328125, -1.2975006103515625, -1.250152587890625, -1.2028045654296875, -1.15545654296875, -1.1081085205078125, -1.060760498046875, -1.0134124755859375, -0.966064453125, -0.9187164306640625, -0.871368408203125, -0.8240203857421875, -0.77667236328125, -0.7293243408203125, -0.681976318359375, -0.6346282958984375, -0.5872802734375, -0.5399322509765625, -0.492584228515625, -0.4452362060546875, -0.39788818359375, -0.3505401611328125, -0.303192138671875, -0.2558441162109375, -0.20849609375, -0.1611480712890625, -0.113800048828125, -0.0664520263671875, -0.01910400390625, 0.0282440185546875, 0.075592041015625, 0.1229400634765625, 0.1702880859375, 0.2176361083984375, 0.264984130859375, 0.3123321533203125, 0.35968017578125, 0.4070281982421875, 0.454376220703125, 0.5017242431640625, 0.549072265625, 0.5964202880859375, 0.643768310546875, 0.6911163330078125, 0.73846435546875, 0.7858123779296875, 0.833160400390625, 0.8805084228515625, 0.9278564453125, 0.9752044677734375, 1.022552490234375, 1.0699005126953125, 1.11724853515625, 1.1645965576171875, 1.211944580078125, 1.2592926025390625, 1.306640625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 7.0, 4.0, 6.0, 8.0, 18.0, 22.0, 27.0, 38.0, 53.0, 62.0, 72.0, 81.0, 85.0, 81.0, 92.0, 78.0, 60.0, 56.0, 39.0, 40.0, 19.0, 27.0, 12.0, 12.0, 7.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.74609375, -1.7027130126953125, -1.659332275390625, -1.6159515380859375, -1.57257080078125, -1.5291900634765625, -1.485809326171875, -1.4424285888671875, -1.3990478515625, -1.3556671142578125, -1.312286376953125, -1.2689056396484375, -1.22552490234375, -1.1821441650390625, -1.138763427734375, -1.0953826904296875, -1.052001953125, -1.0086212158203125, -0.965240478515625, -0.9218597412109375, -0.87847900390625, -0.8350982666015625, -0.791717529296875, -0.7483367919921875, -0.7049560546875, -0.6615753173828125, -0.618194580078125, -0.5748138427734375, -0.53143310546875, -0.4880523681640625, -0.444671630859375, -0.4012908935546875, -0.35791015625, -0.3145294189453125, -0.271148681640625, -0.2277679443359375, -0.18438720703125, -0.1410064697265625, -0.097625732421875, -0.0542449951171875, -0.0108642578125, 0.0325164794921875, 0.075897216796875, 0.1192779541015625, 0.16265869140625, 0.2060394287109375, 0.249420166015625, 0.2928009033203125, 0.336181640625, 0.3795623779296875, 0.422943115234375, 0.4663238525390625, 0.50970458984375, 0.5530853271484375, 0.596466064453125, 0.6398468017578125, 0.6832275390625, 0.7266082763671875, 0.769989013671875, 0.8133697509765625, 0.85675048828125, 0.9001312255859375, 0.943511962890625, 0.9868927001953125, 1.0302734375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 1.0, 4.0, 3.0, 13.0, 9.0, 12.0, 18.0, 33.0, 40.0, 88.0, 126.0, 216.0, 459.0, 826.0, 1847.0, 4413.0, 12832.0, 51023.0, 612549.0, 313743.0, 34027.0, 9528.0, 3621.0, 1485.0, 745.0, 383.0, 198.0, 110.0, 80.0, 34.0, 22.0, 24.0, 4.0, 6.0, 8.0, 7.0, 6.0, 1.0, 7.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.515625, -0.49892425537109375, -0.4822235107421875, -0.46552276611328125, -0.448822021484375, -0.43212127685546875, -0.4154205322265625, -0.39871978759765625, -0.38201904296875, -0.36531829833984375, -0.3486175537109375, -0.33191680908203125, -0.315216064453125, -0.29851531982421875, -0.2818145751953125, -0.26511383056640625, -0.2484130859375, -0.23171234130859375, -0.2150115966796875, -0.19831085205078125, -0.181610107421875, -0.16490936279296875, -0.1482086181640625, -0.13150787353515625, -0.11480712890625, -0.09810638427734375, -0.0814056396484375, -0.06470489501953125, -0.048004150390625, -0.03130340576171875, -0.0146026611328125, 0.00209808349609375, 0.018798828125, 0.03549957275390625, 0.0522003173828125, 0.06890106201171875, 0.085601806640625, 0.10230255126953125, 0.1190032958984375, 0.13570404052734375, 0.15240478515625, 0.16910552978515625, 0.1858062744140625, 0.20250701904296875, 0.219207763671875, 0.23590850830078125, 0.2526092529296875, 0.26930999755859375, 0.2860107421875, 0.30271148681640625, 0.3194122314453125, 0.33611297607421875, 0.352813720703125, 0.36951446533203125, 0.3862152099609375, 0.40291595458984375, 0.41961669921875, 0.43631744384765625, 0.4530181884765625, 0.46971893310546875, 0.486419677734375, 0.5031204223632812, 0.5198211669921875, 0.5365219116210938, 0.55322265625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 8.0, 6.0, 1.0, 8.0, 12.0, 16.0, 15.0, 16.0, 21.0, 27.0, 30.0, 44.0, 41.0, 49.0, 49.0, 42.0, 62.0, 55.0, 60.0, 47.0, 40.0, 54.0, 45.0, 47.0, 38.0, 39.0, 24.0, 11.0, 26.0, 15.0, 18.0, 7.0, 7.0, 7.0, 4.0, 7.0, 2.0, 2.0, 0.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.69140625, -1.6441192626953125, -1.596832275390625, -1.5495452880859375, -1.50225830078125, -1.4549713134765625, -1.407684326171875, -1.3603973388671875, -1.3131103515625, -1.2658233642578125, -1.218536376953125, -1.1712493896484375, -1.12396240234375, -1.0766754150390625, -1.029388427734375, -0.9821014404296875, -0.934814453125, -0.8875274658203125, -0.840240478515625, -0.7929534912109375, -0.74566650390625, -0.6983795166015625, -0.651092529296875, -0.6038055419921875, -0.5565185546875, -0.5092315673828125, -0.461944580078125, -0.4146575927734375, -0.36737060546875, -0.3200836181640625, -0.272796630859375, -0.2255096435546875, -0.17822265625, -0.1309356689453125, -0.083648681640625, -0.0363616943359375, 0.01092529296875, 0.0582122802734375, 0.105499267578125, 0.1527862548828125, 0.2000732421875, 0.2473602294921875, 0.294647216796875, 0.3419342041015625, 0.38922119140625, 0.4365081787109375, 0.483795166015625, 0.5310821533203125, 0.578369140625, 0.6256561279296875, 0.672943115234375, 0.7202301025390625, 0.76751708984375, 0.8148040771484375, 0.862091064453125, 0.9093780517578125, 0.9566650390625, 1.0039520263671875, 1.051239013671875, 1.0985260009765625, 1.14581298828125, 1.1930999755859375, 1.240386962890625, 1.2876739501953125, 1.3349609375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 5.0, 5.0, 10.0, 9.0, 18.0, 23.0, 36.0, 41.0, 71.0, 85.0, 136.0, 195.0, 343.0, 552.0, 1033.0, 2053.0, 5045.0, 16951.0, 111584.0, 782196.0, 102506.0, 16211.0, 4873.0, 2016.0, 1029.0, 539.0, 349.0, 185.0, 136.0, 85.0, 71.0, 47.0, 29.0, 27.0, 14.0, 11.0, 14.0, 8.0, 3.0, 5.0, 2.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.10308837890625, -0.09946918487548828, -0.09584999084472656, -0.09223079681396484, -0.08861160278320312, -0.0849924087524414, -0.08137321472167969, -0.07775402069091797, -0.07413482666015625, -0.07051563262939453, -0.06689643859863281, -0.0632772445678711, -0.059658050537109375, -0.056038856506347656, -0.05241966247558594, -0.04880046844482422, -0.0451812744140625, -0.04156208038330078, -0.03794288635253906, -0.034323692321777344, -0.030704498291015625, -0.027085304260253906, -0.023466110229492188, -0.01984691619873047, -0.01622772216796875, -0.012608528137207031, -0.008989334106445312, -0.005370140075683594, -0.001750946044921875, 0.0018682479858398438, 0.0054874420166015625, 0.009106636047363281, 0.012725830078125, 0.01634502410888672, 0.019964218139648438, 0.023583412170410156, 0.027202606201171875, 0.030821800231933594, 0.03444099426269531, 0.03806018829345703, 0.04167938232421875, 0.04529857635498047, 0.04891777038574219, 0.052536964416503906, 0.056156158447265625, 0.059775352478027344, 0.06339454650878906, 0.06701374053955078, 0.0706329345703125, 0.07425212860107422, 0.07787132263183594, 0.08149051666259766, 0.08510971069335938, 0.0887289047241211, 0.09234809875488281, 0.09596729278564453, 0.09958648681640625, 0.10320568084716797, 0.10682487487792969, 0.1104440689086914, 0.11406326293945312, 0.11768245697021484, 0.12130165100097656, 0.12492084503173828, 0.1285400390625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 4.0, 10.0, 10.0, 28.0, 32.0, 67.0, 118.0, 203.0, 184.0, 139.0, 86.0, 43.0, 29.0, 13.0, 8.0, 6.0, 7.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.562471389770508e-05, -6.311200559139252e-05, -6.0599297285079956e-05, -5.8086588978767395e-05, -5.5573880672454834e-05, -5.306117236614227e-05, -5.054846405982971e-05, -4.803575575351715e-05, -4.552304744720459e-05, -4.301033914089203e-05, -4.049763083457947e-05, -3.798492252826691e-05, -3.5472214221954346e-05, -3.2959505915641785e-05, -3.0446797609329224e-05, -2.7934089303016663e-05, -2.54213809967041e-05, -2.290867269039154e-05, -2.039596438407898e-05, -1.788325607776642e-05, -1.5370547771453857e-05, -1.2857839465141296e-05, -1.0345131158828735e-05, -7.832422852516174e-06, -5.319714546203613e-06, -2.8070062398910522e-06, -2.942979335784912e-07, 2.21841037273407e-06, 4.731118679046631e-06, 7.243826985359192e-06, 9.756535291671753e-06, 1.2269243597984314e-05, 1.4781951904296875e-05, 1.7294660210609436e-05, 1.9807368516921997e-05, 2.2320076823234558e-05, 2.483278512954712e-05, 2.734549343585968e-05, 2.985820174217224e-05, 3.23709100484848e-05, 3.488361835479736e-05, 3.7396326661109924e-05, 3.9909034967422485e-05, 4.2421743273735046e-05, 4.493445158004761e-05, 4.744715988636017e-05, 4.995986819267273e-05, 5.247257649898529e-05, 5.498528480529785e-05, 5.749799311161041e-05, 6.0010701417922974e-05, 6.252340972423553e-05, 6.50361180305481e-05, 6.754882633686066e-05, 7.006153464317322e-05, 7.257424294948578e-05, 7.508695125579834e-05, 7.75996595621109e-05, 8.011236786842346e-05, 8.262507617473602e-05, 8.513778448104858e-05, 8.765049278736115e-05, 9.01632010936737e-05, 9.267590939998627e-05, 9.518861770629883e-05]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 3.0, 6.0, 3.0, 10.0, 10.0, 12.0, 14.0, 37.0, 72.0, 245.0, 654.0, 2726.0, 30165.0, 990137.0, 21225.0, 2305.0, 573.0, 196.0, 70.0, 30.0, 17.0, 16.0, 7.0, 5.0, 1.0, 0.0, 4.0, 1.0, 5.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.3935546875, -0.38245391845703125, -0.3713531494140625, -0.36025238037109375, -0.349151611328125, -0.33805084228515625, -0.3269500732421875, -0.31584930419921875, -0.30474853515625, -0.29364776611328125, -0.2825469970703125, -0.27144622802734375, -0.260345458984375, -0.24924468994140625, -0.2381439208984375, -0.22704315185546875, -0.2159423828125, -0.20484161376953125, -0.1937408447265625, -0.18264007568359375, -0.171539306640625, -0.16043853759765625, -0.1493377685546875, -0.13823699951171875, -0.12713623046875, -0.11603546142578125, -0.1049346923828125, -0.09383392333984375, -0.082733154296875, -0.07163238525390625, -0.0605316162109375, -0.04943084716796875, -0.038330078125, -0.02722930908203125, -0.0161285400390625, -0.00502777099609375, 0.006072998046875, 0.01717376708984375, 0.0282745361328125, 0.03937530517578125, 0.05047607421875, 0.06157684326171875, 0.0726776123046875, 0.08377838134765625, 0.094879150390625, 0.10597991943359375, 0.1170806884765625, 0.12818145751953125, 0.1392822265625, 0.15038299560546875, 0.1614837646484375, 0.17258453369140625, 0.183685302734375, 0.19478607177734375, 0.2058868408203125, 0.21698760986328125, 0.22808837890625, 0.23918914794921875, 0.2502899169921875, 0.26139068603515625, 0.272491455078125, 0.28359222412109375, 0.2946929931640625, 0.30579376220703125, 0.31689453125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 3.0, 5.0, 4.0, 6.0, 5.0, 6.0, 7.0, 20.0, 29.0, 34.0, 31.0, 71.0, 103.0, 141.0, 133.0, 118.0, 80.0, 60.0, 35.0, 27.0, 18.0, 20.0, 11.0, 7.0, 6.0, 8.0, 2.0, 4.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0280914306640625, -0.027221202850341797, -0.026350975036621094, -0.02548074722290039, -0.024610519409179688, -0.023740291595458984, -0.02287006378173828, -0.021999835968017578, -0.021129608154296875, -0.020259380340576172, -0.01938915252685547, -0.018518924713134766, -0.017648696899414062, -0.01677846908569336, -0.015908241271972656, -0.015038013458251953, -0.01416778564453125, -0.013297557830810547, -0.012427330017089844, -0.01155710220336914, -0.010686874389648438, -0.009816646575927734, -0.008946418762207031, -0.008076190948486328, -0.007205963134765625, -0.006335735321044922, -0.005465507507324219, -0.004595279693603516, -0.0037250518798828125, -0.0028548240661621094, -0.0019845962524414062, -0.0011143684387207031, -0.000244140625, 0.0006260871887207031, 0.0014963150024414062, 0.0023665428161621094, 0.0032367706298828125, 0.004106998443603516, 0.004977226257324219, 0.005847454071044922, 0.006717681884765625, 0.007587909698486328, 0.008458137512207031, 0.009328365325927734, 0.010198593139648438, 0.01106882095336914, 0.011939048767089844, 0.012809276580810547, 0.01367950439453125, 0.014549732208251953, 0.015419960021972656, 0.01629018783569336, 0.017160415649414062, 0.018030643463134766, 0.01890087127685547, 0.019771099090576172, 0.020641326904296875, 0.021511554718017578, 0.02238178253173828, 0.023252010345458984, 0.024122238159179688, 0.02499246597290039, 0.025862693786621094, 0.026732921600341797, 0.0276031494140625]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 8.0, 16.0, 30.0, 53.0, 102.0, 263.0, 260.0, 140.0, 71.0, 23.0, 10.0, 11.0, 7.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.3868608474731445, -3.309995412826538, -3.2331299781799316, -3.1562647819519043, -3.079399347305298, -3.0025339126586914, -2.925668478012085, -2.8488030433654785, -2.771937847137451, -2.6950724124908447, -2.6182069778442383, -2.541341781616211, -2.4644763469696045, -2.387610912322998, -2.3107454776763916, -2.233880043029785, -2.1570146083831787, -2.0801491737365723, -2.003283739089966, -1.926418423652649, -1.849553108215332, -1.7726876735687256, -1.6958222389221191, -1.6189568042755127, -1.5420914888381958, -1.4652260541915894, -1.3883607387542725, -1.311495304107666, -1.2346298694610596, -1.1577645540237427, -1.0808991193771362, -1.0040338039398193, -0.9271682500839233, -0.8503028750419617, -0.7734375, -0.6965720653533936, -0.6197066903114319, -0.5428413152694702, -0.46597591042518616, -0.3891105055809021, -0.31224513053894043, -0.23537974059581757, -0.1585143506526947, -0.08164896070957184, -0.004783570766448975, 0.0720818042755127, 0.14894720911979675, 0.2258126139640808, 0.3026779890060425, 0.37954336404800415, 0.4564087688922882, 0.5332741737365723, 0.6101395487785339, 0.6870049238204956, 0.763870358467102, 0.8407357335090637, 0.9176011085510254, 0.9944664835929871, 1.0713318586349487, 1.1481972932815552, 1.225062608718872, 1.3019280433654785, 1.378793478012085, 1.4556589126586914, 1.5325242280960083]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 9.0, 6.0, 11.0, 13.0, 28.0, 33.0, 41.0, 57.0, 63.0, 55.0, 72.0, 84.0, 67.0, 90.0, 68.0, 58.0, 64.0, 39.0, 41.0, 35.0, 16.0, 23.0, 15.0, 6.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.5457602739334106, -1.5074880123138428, -1.4692156314849854, -1.430943250656128, -1.39267098903656, -1.3543987274169922, -1.3161263465881348, -1.2778539657592773, -1.2395817041397095, -1.2013094425201416, -1.1630370616912842, -1.1247646808624268, -1.0864924192428589, -1.048220157623291, -1.0099477767944336, -0.971675455570221, -0.9334031343460083, -0.8951308131217957, -0.856858491897583, -0.8185861706733704, -0.7803138494491577, -0.7420415282249451, -0.7037692070007324, -0.6654968857765198, -0.6272245645523071, -0.5889522433280945, -0.5506799221038818, -0.5124076008796692, -0.47413527965545654, -0.4358629584312439, -0.39759063720703125, -0.3593183159828186, -0.32104605436325073, -0.2827737331390381, -0.24450141191482544, -0.2062290906906128, -0.16795676946640015, -0.1296844482421875, -0.09141212701797485, -0.05313980579376221, -0.01486748456954956, 0.023404836654663086, 0.06167715787887573, 0.09994947910308838, 0.13822180032730103, 0.17649412155151367, 0.21476644277572632, 0.25303876399993896, 0.2913110852241516, 0.32958340644836426, 0.3678557276725769, 0.40612804889678955, 0.4444003701210022, 0.48267269134521484, 0.5209450125694275, 0.5592173337936401, 0.5974896550178528, 0.6357619762420654, 0.6740342974662781, 0.7123066186904907, 0.7505789399147034, 0.788851261138916, 0.8271235823631287, 0.8653959035873413, 0.903668224811554]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 7.0, 5.0, 13.0, 18.0, 44.0, 78.0, 140.0, 310.0, 805.0, 2258.0, 7211.0, 28975.0, 857963.0, 127729.0, 15924.0, 4493.0, 1500.0, 601.0, 245.0, 99.0, 41.0, 29.0, 19.0, 5.0, 9.0, 3.0, 4.0, 9.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.76953125, -2.676605224609375, -2.58367919921875, -2.490753173828125, -2.3978271484375, -2.304901123046875, -2.21197509765625, -2.119049072265625, -2.026123046875, -1.933197021484375, -1.84027099609375, -1.747344970703125, -1.6544189453125, -1.561492919921875, -1.46856689453125, -1.375640869140625, -1.28271484375, -1.189788818359375, -1.09686279296875, -1.003936767578125, -0.9110107421875, -0.818084716796875, -0.72515869140625, -0.632232666015625, -0.539306640625, -0.446380615234375, -0.35345458984375, -0.260528564453125, -0.1676025390625, -0.074676513671875, 0.01824951171875, 0.111175537109375, 0.2041015625, 0.297027587890625, 0.38995361328125, 0.482879638671875, 0.5758056640625, 0.668731689453125, 0.76165771484375, 0.854583740234375, 0.947509765625, 1.040435791015625, 1.13336181640625, 1.226287841796875, 1.3192138671875, 1.412139892578125, 1.50506591796875, 1.597991943359375, 1.69091796875, 1.783843994140625, 1.87677001953125, 1.969696044921875, 2.0626220703125, 2.155548095703125, 2.24847412109375, 2.341400146484375, 2.434326171875, 2.527252197265625, 2.62017822265625, 2.713104248046875, 2.8060302734375, 2.898956298828125, 2.99188232421875, 3.084808349609375, 3.177734375]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 0.0, 6.0, 6.0, 6.0, 13.0, 8.0, 15.0, 10.0, 26.0, 25.0, 18.0, 31.0, 33.0, 26.0, 46.0, 50.0, 48.0, 49.0, 47.0, 48.0, 61.0, 59.0, 55.0, 42.0, 42.0, 44.0, 35.0, 20.0, 32.0, 18.0, 11.0, 20.0, 11.0, 9.0, 9.0, 8.0, 5.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.6748046875, -1.6140289306640625, -1.553253173828125, -1.4924774169921875, -1.43170166015625, -1.3709259033203125, -1.310150146484375, -1.2493743896484375, -1.1885986328125, -1.1278228759765625, -1.067047119140625, -1.0062713623046875, -0.94549560546875, -0.8847198486328125, -0.823944091796875, -0.7631683349609375, -0.702392578125, -0.6416168212890625, -0.580841064453125, -0.5200653076171875, -0.45928955078125, -0.3985137939453125, -0.337738037109375, -0.2769622802734375, -0.2161865234375, -0.1554107666015625, -0.094635009765625, -0.0338592529296875, 0.02691650390625, 0.0876922607421875, 0.148468017578125, 0.2092437744140625, 0.27001953125, 0.3307952880859375, 0.391571044921875, 0.4523468017578125, 0.51312255859375, 0.5738983154296875, 0.634674072265625, 0.6954498291015625, 0.7562255859375, 0.8170013427734375, 0.877777099609375, 0.9385528564453125, 0.99932861328125, 1.0601043701171875, 1.120880126953125, 1.1816558837890625, 1.242431640625, 1.3032073974609375, 1.363983154296875, 1.4247589111328125, 1.48553466796875, 1.5463104248046875, 1.607086181640625, 1.6678619384765625, 1.7286376953125, 1.7894134521484375, 1.850189208984375, 1.9109649658203125, 1.97174072265625, 2.0325164794921875, 2.093292236328125, 2.1540679931640625, 2.21484375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 4.0, 2.0, 1.0, 3.0, 4.0, 5.0, 5.0, 7.0, 14.0, 12.0, 13.0, 26.0, 25.0, 15.0, 27.0, 23.0, 33.0, 42.0, 74.0, 86.0, 184.0, 479.0, 2553.0, 36455.0, 994964.0, 11429.0, 1236.0, 325.0, 147.0, 62.0, 57.0, 47.0, 34.0, 34.0, 18.0, 15.0, 17.0, 22.0, 12.0, 8.0, 13.0, 7.0, 8.0, 5.0, 4.0, 5.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.04296875, -5.86163330078125, -5.6802978515625, -5.49896240234375, -5.317626953125, -5.13629150390625, -4.9549560546875, -4.77362060546875, -4.59228515625, -4.41094970703125, -4.2296142578125, -4.04827880859375, -3.866943359375, -3.68560791015625, -3.5042724609375, -3.32293701171875, -3.1416015625, -2.96026611328125, -2.7789306640625, -2.59759521484375, -2.416259765625, -2.23492431640625, -2.0535888671875, -1.87225341796875, -1.69091796875, -1.50958251953125, -1.3282470703125, -1.14691162109375, -0.965576171875, -0.78424072265625, -0.6029052734375, -0.42156982421875, -0.240234375, -0.05889892578125, 0.1224365234375, 0.30377197265625, 0.485107421875, 0.66644287109375, 0.8477783203125, 1.02911376953125, 1.21044921875, 1.39178466796875, 1.5731201171875, 1.75445556640625, 1.935791015625, 2.11712646484375, 2.2984619140625, 2.47979736328125, 2.6611328125, 2.84246826171875, 3.0238037109375, 3.20513916015625, 3.386474609375, 3.56781005859375, 3.7491455078125, 3.93048095703125, 4.11181640625, 4.29315185546875, 4.4744873046875, 4.65582275390625, 4.837158203125, 5.01849365234375, 5.1998291015625, 5.38116455078125, 5.5625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 3.0, 3.0, 6.0, 5.0, 7.0, 6.0, 8.0, 13.0, 13.0, 24.0, 18.0, 21.0, 19.0, 26.0, 31.0, 34.0, 54.0, 44.0, 43.0, 54.0, 43.0, 58.0, 57.0, 56.0, 42.0, 35.0, 39.0, 31.0, 32.0, 30.0, 17.0, 21.0, 18.0, 19.0, 21.0, 10.0, 7.0, 7.0, 7.0, 13.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.708984375, -1.653228759765625, -1.59747314453125, -1.541717529296875, -1.4859619140625, -1.430206298828125, -1.37445068359375, -1.318695068359375, -1.262939453125, -1.207183837890625, -1.15142822265625, -1.095672607421875, -1.0399169921875, -0.984161376953125, -0.92840576171875, -0.872650146484375, -0.81689453125, -0.761138916015625, -0.70538330078125, -0.649627685546875, -0.5938720703125, -0.538116455078125, -0.48236083984375, -0.426605224609375, -0.370849609375, -0.315093994140625, -0.25933837890625, -0.203582763671875, -0.1478271484375, -0.092071533203125, -0.03631591796875, 0.019439697265625, 0.0751953125, 0.130950927734375, 0.18670654296875, 0.242462158203125, 0.2982177734375, 0.353973388671875, 0.40972900390625, 0.465484619140625, 0.521240234375, 0.576995849609375, 0.63275146484375, 0.688507080078125, 0.7442626953125, 0.800018310546875, 0.85577392578125, 0.911529541015625, 0.96728515625, 1.023040771484375, 1.07879638671875, 1.134552001953125, 1.1903076171875, 1.246063232421875, 1.30181884765625, 1.357574462890625, 1.413330078125, 1.469085693359375, 1.52484130859375, 1.580596923828125, 1.6363525390625, 1.692108154296875, 1.74786376953125, 1.803619384765625, 1.859375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 5.0, 4.0, 5.0, 4.0, 3.0, 8.0, 3.0, 8.0, 11.0, 18.0, 26.0, 30.0, 47.0, 94.0, 156.0, 341.0, 899.0, 2617.0, 10008.0, 217973.0, 798886.0, 12419.0, 2960.0, 1029.0, 465.0, 225.0, 97.0, 68.0, 39.0, 28.0, 24.0, 15.0, 11.0, 4.0, 11.0, 4.0, 3.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.99853515625, -0.9715957641601562, -0.9446563720703125, -0.9177169799804688, -0.890777587890625, -0.8638381958007812, -0.8368988037109375, -0.8099594116210938, -0.78302001953125, -0.7560806274414062, -0.7291412353515625, -0.7022018432617188, -0.675262451171875, -0.6483230590820312, -0.6213836669921875, -0.5944442749023438, -0.5675048828125, -0.5405654907226562, -0.5136260986328125, -0.48668670654296875, -0.459747314453125, -0.43280792236328125, -0.4058685302734375, -0.37892913818359375, -0.35198974609375, -0.32505035400390625, -0.2981109619140625, -0.27117156982421875, -0.244232177734375, -0.21729278564453125, -0.1903533935546875, -0.16341400146484375, -0.136474609375, -0.10953521728515625, -0.0825958251953125, -0.05565643310546875, -0.028717041015625, -0.00177764892578125, 0.0251617431640625, 0.05210113525390625, 0.07904052734375, 0.10597991943359375, 0.1329193115234375, 0.15985870361328125, 0.186798095703125, 0.21373748779296875, 0.2406768798828125, 0.26761627197265625, 0.2945556640625, 0.32149505615234375, 0.3484344482421875, 0.37537384033203125, 0.402313232421875, 0.42925262451171875, 0.4561920166015625, 0.48313140869140625, 0.51007080078125, 0.5370101928710938, 0.5639495849609375, 0.5908889770507812, 0.617828369140625, 0.6447677612304688, 0.6717071533203125, 0.6986465454101562, 0.7255859375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 8.0, 4.0, 3.0, 10.0, 9.0, 11.0, 35.0, 54.0, 138.0, 487.0, 109.0, 54.0, 19.0, 11.0, 6.0, 7.0, 5.0, 5.0, 1.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011342763900756836, -0.0001100366935133934, -0.00010664574801921844, -0.00010325480252504349, -9.986385703086853e-05, -9.647291153669357e-05, -9.308196604251862e-05, -8.969102054834366e-05, -8.63000750541687e-05, -8.290912955999374e-05, -7.951818406581879e-05, -7.612723857164383e-05, -7.273629307746887e-05, -6.934534758329391e-05, -6.595440208911896e-05, -6.2563456594944e-05, -5.917251110076904e-05, -5.5781565606594086e-05, -5.239062011241913e-05, -4.899967461824417e-05, -4.5608729124069214e-05, -4.2217783629894257e-05, -3.88268381357193e-05, -3.543589264154434e-05, -3.2044947147369385e-05, -2.8654001653194427e-05, -2.526305615901947e-05, -2.1872110664844513e-05, -1.8481165170669556e-05, -1.5090219676494598e-05, -1.1699274182319641e-05, -8.308328688144684e-06, -4.9173831939697266e-06, -1.5264376997947693e-06, 1.864507794380188e-06, 5.255453288555145e-06, 8.646398782730103e-06, 1.203734427690506e-05, 1.5428289771080017e-05, 1.8819235265254974e-05, 2.221018075942993e-05, 2.560112625360489e-05, 2.8992071747779846e-05, 3.2383017241954803e-05, 3.577396273612976e-05, 3.916490823030472e-05, 4.2555853724479675e-05, 4.594679921865463e-05, 4.933774471282959e-05, 5.272869020700455e-05, 5.6119635701179504e-05, 5.951058119535446e-05, 6.290152668952942e-05, 6.629247218370438e-05, 6.968341767787933e-05, 7.307436317205429e-05, 7.646530866622925e-05, 7.98562541604042e-05, 8.324719965457916e-05, 8.663814514875412e-05, 9.002909064292908e-05, 9.342003613710403e-05, 9.681098163127899e-05, 0.00010020192712545395, 0.0001035928726196289]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 11.0, 5.0, 9.0, 4.0, 17.0, 31.0, 53.0, 67.0, 143.0, 373.0, 974.0, 3387.0, 21421.0, 992084.0, 24486.0, 3724.0, 1029.0, 362.0, 165.0, 73.0, 47.0, 32.0, 19.0, 7.0, 6.0, 5.0, 6.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.96435546875, -0.9280014038085938, -0.8916473388671875, -0.8552932739257812, -0.818939208984375, -0.7825851440429688, -0.7462310791015625, -0.7098770141601562, -0.67352294921875, -0.6371688842773438, -0.6008148193359375, -0.5644607543945312, -0.528106689453125, -0.49175262451171875, -0.4553985595703125, -0.41904449462890625, -0.3826904296875, -0.34633636474609375, -0.3099822998046875, -0.27362823486328125, -0.237274169921875, -0.20092010498046875, -0.1645660400390625, -0.12821197509765625, -0.09185791015625, -0.05550384521484375, -0.0191497802734375, 0.01720428466796875, 0.053558349609375, 0.08991241455078125, 0.1262664794921875, 0.16262054443359375, 0.198974609375, 0.23532867431640625, 0.2716827392578125, 0.30803680419921875, 0.344390869140625, 0.38074493408203125, 0.4170989990234375, 0.45345306396484375, 0.48980712890625, 0.5261611938476562, 0.5625152587890625, 0.5988693237304688, 0.635223388671875, 0.6715774536132812, 0.7079315185546875, 0.7442855834960938, 0.7806396484375, 0.8169937133789062, 0.8533477783203125, 0.8897018432617188, 0.926055908203125, 0.9624099731445312, 0.9987640380859375, 1.0351181030273438, 1.07147216796875, 1.1078262329101562, 1.1441802978515625, 1.1805343627929688, 1.216888427734375, 1.2532424926757812, 1.2895965576171875, 1.3259506225585938, 1.3623046875]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 1.0, 2.0, 4.0, 4.0, 6.0, 8.0, 10.0, 15.0, 20.0, 53.0, 103.0, 380.0, 219.0, 72.0, 40.0, 17.0, 6.0, 6.0, 5.0, 5.0, 5.0, 1.0, 1.0, 3.0, 3.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.339599609375, -0.3306083679199219, -0.32161712646484375, -0.3126258850097656, -0.3036346435546875, -0.2946434020996094, -0.28565216064453125, -0.2766609191894531, -0.267669677734375, -0.2586784362792969, -0.24968719482421875, -0.24069595336914062, -0.2317047119140625, -0.22271347045898438, -0.21372222900390625, -0.20473098754882812, -0.19573974609375, -0.18674850463867188, -0.17775726318359375, -0.16876602172851562, -0.1597747802734375, -0.15078353881835938, -0.14179229736328125, -0.13280105590820312, -0.123809814453125, -0.11481857299804688, -0.10582733154296875, -0.09683609008789062, -0.0878448486328125, -0.07885360717773438, -0.06986236572265625, -0.060871124267578125, -0.0518798828125, -0.042888641357421875, -0.03389739990234375, -0.024906158447265625, -0.0159149169921875, -0.006923675537109375, 0.00206756591796875, 0.011058807373046875, 0.020050048828125, 0.029041290283203125, 0.03803253173828125, 0.047023773193359375, 0.0560150146484375, 0.06500625610351562, 0.07399749755859375, 0.08298873901367188, 0.09197998046875, 0.10097122192382812, 0.10996246337890625, 0.11895370483398438, 0.1279449462890625, 0.13693618774414062, 0.14592742919921875, 0.15491867065429688, 0.163909912109375, 0.17290115356445312, 0.18189239501953125, 0.19088363647460938, 0.1998748779296875, 0.20886611938476562, 0.21785736083984375, 0.22684860229492188, 0.23583984375]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 5.0, 22.0, 131.0, 596.0, 201.0, 45.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-22.348182678222656, -21.938617706298828, -21.529050827026367, -21.11948585510254, -20.709918975830078, -20.30035400390625, -19.89078712463379, -19.48122215270996, -19.0716552734375, -18.662090301513672, -18.25252342224121, -17.842958450317383, -17.433391571044922, -17.023826599121094, -16.614259719848633, -16.204694747924805, -15.795129776000977, -15.385563850402832, -14.975997924804688, -14.566431999206543, -14.156866073608398, -13.74730110168457, -13.33773422241211, -12.928169250488281, -12.51860237121582, -12.109036445617676, -11.699470520019531, -11.289904594421387, -10.880338668823242, -10.470773696899414, -10.061206817626953, -9.651641845703125, -9.242074966430664, -8.83250904083252, -8.422943115234375, -8.01337718963623, -7.603811740875244, -7.1942458152771, -6.784679889678955, -6.375114440917969, -5.965548515319824, -5.55598258972168, -5.146416664123535, -4.736850738525391, -4.327285289764404, -3.9177193641662598, -3.5081534385681152, -3.09858775138855, -2.6890218257904053, -2.2794559001922607, -1.8698902130126953, -1.4603242874145508, -1.0507584810256958, -0.6411926746368408, -0.2316267490386963, 0.17793893814086914, 0.5875048637390137, 0.9970706701278687, 1.4066364765167236, 1.8162024021148682, 2.2257680892944336, 2.635334014892578, 3.0448999404907227, 3.454465627670288, 3.8640315532684326]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 6.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 7.0, 7.0, 5.0, 9.0, 12.0, 12.0, 12.0, 14.0, 13.0, 27.0, 38.0, 23.0, 20.0, 33.0, 30.0, 41.0, 35.0, 52.0, 39.0, 38.0, 54.0, 51.0, 42.0, 34.0, 38.0, 26.0, 32.0, 20.0, 27.0, 30.0, 19.0, 25.0, 24.0, 27.0, 14.0, 16.0, 7.0, 9.0, 5.0, 10.0, 5.0, 2.0, 2.0, 4.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.0938031673431396, -3.0046226978302, -2.9154422283172607, -2.826261520385742, -2.7370810508728027, -2.6479005813598633, -2.558720111846924, -2.4695396423339844, -2.380359172821045, -2.2911787033081055, -2.201998233795166, -2.1128177642822266, -2.023637056350708, -1.9344565868377686, -1.845276117324829, -1.7560956478118896, -1.666914939880371, -1.5777344703674316, -1.4885538816452026, -1.3993734121322632, -1.3101928234100342, -1.2210123538970947, -1.1318318843841553, -1.0426514148712158, -0.9534708261489868, -0.8642902970314026, -0.7751097679138184, -0.6859292984008789, -0.5967487692832947, -0.5075682401657104, -0.418387770652771, -0.32920724153518677, -0.24002671241760254, -0.1508461982011795, -0.06166568398475647, 0.02751481533050537, 0.1166953444480896, 0.20587587356567383, 0.2950563430786133, 0.3842368721961975, 0.47341740131378174, 0.562597930431366, 0.6517784595489502, 0.7409589290618896, 0.8301394581794739, 0.9193199872970581, 1.0085004568099976, 1.0976810455322266, 1.186861515045166, 1.2760419845581055, 1.3652225732803345, 1.454403042793274, 1.543583631515503, 1.6327641010284424, 1.7219445705413818, 1.8111250400543213, 1.9003056287765503, 1.9894860982894897, 2.0786666870117188, 2.167847156524658, 2.2570276260375977, 2.346208095550537, 2.4353885650634766, 2.524569272994995, 2.6137497425079346]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 6.0, 6.0, 9.0, 15.0, 19.0, 34.0, 48.0, 69.0, 117.0, 178.0, 342.0, 609.0, 1176.0, 2565.0, 7696.0, 56772.0, 2193297.0, 1868468.0, 50135.0, 6914.0, 3087.0, 1183.0, 623.0, 354.0, 211.0, 124.0, 86.0, 41.0, 36.0, 20.0, 14.0, 10.0, 10.0, 3.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.60546875, -2.52880859375, -2.4521484375, -2.37548828125, -2.298828125, -2.22216796875, -2.1455078125, -2.06884765625, -1.9921875, -1.91552734375, -1.8388671875, -1.76220703125, -1.685546875, -1.60888671875, -1.5322265625, -1.45556640625, -1.37890625, -1.30224609375, -1.2255859375, -1.14892578125, -1.072265625, -0.99560546875, -0.9189453125, -0.84228515625, -0.765625, -0.68896484375, -0.6123046875, -0.53564453125, -0.458984375, -0.38232421875, -0.3056640625, -0.22900390625, -0.15234375, -0.07568359375, 0.0009765625, 0.07763671875, 0.154296875, 0.23095703125, 0.3076171875, 0.38427734375, 0.4609375, 0.53759765625, 0.6142578125, 0.69091796875, 0.767578125, 0.84423828125, 0.9208984375, 0.99755859375, 1.07421875, 1.15087890625, 1.2275390625, 1.30419921875, 1.380859375, 1.45751953125, 1.5341796875, 1.61083984375, 1.6875, 1.76416015625, 1.8408203125, 1.91748046875, 1.994140625, 2.07080078125, 2.1474609375, 2.22412109375, 2.30078125]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 3.0, 11.0, 9.0, 18.0, 22.0, 24.0, 48.0, 43.0, 45.0, 58.0, 74.0, 49.0, 76.0, 81.0, 63.0, 58.0, 67.0, 52.0, 52.0, 33.0, 28.0, 26.0, 20.0, 15.0, 6.0, 8.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8623046875, -1.8133697509765625, -1.764434814453125, -1.7154998779296875, -1.66656494140625, -1.6176300048828125, -1.568695068359375, -1.5197601318359375, -1.4708251953125, -1.4218902587890625, -1.372955322265625, -1.3240203857421875, -1.27508544921875, -1.2261505126953125, -1.177215576171875, -1.1282806396484375, -1.079345703125, -1.0304107666015625, -0.981475830078125, -0.9325408935546875, -0.88360595703125, -0.8346710205078125, -0.785736083984375, -0.7368011474609375, -0.6878662109375, -0.6389312744140625, -0.589996337890625, -0.5410614013671875, -0.49212646484375, -0.4431915283203125, -0.394256591796875, -0.3453216552734375, -0.29638671875, -0.2474517822265625, -0.198516845703125, -0.1495819091796875, -0.10064697265625, -0.0517120361328125, -0.002777099609375, 0.0461578369140625, 0.0950927734375, 0.1440277099609375, 0.192962646484375, 0.2418975830078125, 0.29083251953125, 0.3397674560546875, 0.388702392578125, 0.4376373291015625, 0.486572265625, 0.5355072021484375, 0.584442138671875, 0.6333770751953125, 0.68231201171875, 0.7312469482421875, 0.780181884765625, 0.8291168212890625, 0.8780517578125, 0.9269866943359375, 0.975921630859375, 1.0248565673828125, 1.07379150390625, 1.1227264404296875, 1.171661376953125, 1.2205963134765625, 1.26953125]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 1.0, 7.0, 12.0, 20.0, 31.0, 104.0, 274.0, 1266.0, 25191.0, 4161344.0, 5151.0, 580.0, 154.0, 59.0, 32.0, 23.0, 7.0, 12.0, 5.0, 0.0, 4.0, 6.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6640625, -10.34375, -10.0234375, -9.703125, -9.3828125, -9.0625, -8.7421875, -8.421875, -8.1015625, -7.78125, -7.4609375, -7.140625, -6.8203125, -6.5, -6.1796875, -5.859375, -5.5390625, -5.21875, -4.8984375, -4.578125, -4.2578125, -3.9375, -3.6171875, -3.296875, -2.9765625, -2.65625, -2.3359375, -2.015625, -1.6953125, -1.375, -1.0546875, -0.734375, -0.4140625, -0.09375, 0.2265625, 0.546875, 0.8671875, 1.1875, 1.5078125, 1.828125, 2.1484375, 2.46875, 2.7890625, 3.109375, 3.4296875, 3.75, 4.0703125, 4.390625, 4.7109375, 5.03125, 5.3515625, 5.671875, 5.9921875, 6.3125, 6.6328125, 6.953125, 7.2734375, 7.59375, 7.9140625, 8.234375, 8.5546875, 8.875, 9.1953125, 9.515625, 9.8359375]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 3.0, 0.0, 7.0, 8.0, 6.0, 12.0, 28.0, 30.0, 64.0, 179.0, 906.0, 2105.0, 512.0, 122.0, 45.0, 18.0, 10.0, 7.0, 1.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9482421875, -0.91796875, -0.8876953125, -0.857421875, -0.8271484375, -0.796875, -0.7666015625, -0.736328125, -0.7060546875, -0.67578125, -0.6455078125, -0.615234375, -0.5849609375, -0.5546875, -0.5244140625, -0.494140625, -0.4638671875, -0.43359375, -0.4033203125, -0.373046875, -0.3427734375, -0.3125, -0.2822265625, -0.251953125, -0.2216796875, -0.19140625, -0.1611328125, -0.130859375, -0.1005859375, -0.0703125, -0.0400390625, -0.009765625, 0.0205078125, 0.05078125, 0.0810546875, 0.111328125, 0.1416015625, 0.171875, 0.2021484375, 0.232421875, 0.2626953125, 0.29296875, 0.3232421875, 0.353515625, 0.3837890625, 0.4140625, 0.4443359375, 0.474609375, 0.5048828125, 0.53515625, 0.5654296875, 0.595703125, 0.6259765625, 0.65625, 0.6865234375, 0.716796875, 0.7470703125, 0.77734375, 0.8076171875, 0.837890625, 0.8681640625, 0.8984375, 0.9287109375, 0.958984375, 0.9892578125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 8.0, 5.0, 23.0, 34.0, 66.0, 143.0, 232.0, 228.0, 111.0, 69.0, 40.0, 11.0, 17.0, 9.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.052628517150879, -3.945894718170166, -3.8391611576080322, -3.7324273586273193, -3.6256935596466064, -3.5189599990844727, -3.4122262001037598, -3.305492401123047, -3.198758602142334, -3.092024803161621, -2.9852912425994873, -2.8785574436187744, -2.7718236446380615, -2.6650900840759277, -2.558356285095215, -2.451622486114502, -2.344888925552368, -2.2381551265716553, -2.1314215660095215, -2.0246877670288086, -1.9179539680480957, -1.8112202882766724, -1.704486608505249, -1.5977528095245361, -1.4910191297531128, -1.3842854499816895, -1.2775516510009766, -1.1708179712295532, -1.0640842914581299, -0.957350492477417, -0.8506168127059937, -0.7438830733299255, -0.6371493339538574, -0.5304155945777893, -0.4236818850040436, -0.31694817543029785, -0.21021443605422974, -0.10348069667816162, 0.0032529830932617188, 0.10998672246932983, 0.21672046184539795, 0.32345420122146606, 0.4301879107952118, 0.5369216203689575, 0.6436553597450256, 0.7503890991210938, 0.8571227788925171, 0.9638565182685852, 1.0705902576446533, 1.1773239374160767, 1.2840577363967896, 1.390791416168213, 1.4975252151489258, 1.6042588949203491, 1.7109925746917725, 1.8177263736724854, 1.9244600534439087, 2.031193733215332, 2.137927532196045, 2.244661331176758, 2.3513948917388916, 2.4581286907196045, 2.5648622512817383, 2.671596050262451, 2.778329849243164]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 3.0, 7.0, 8.0, 15.0, 22.0, 19.0, 30.0, 51.0, 39.0, 59.0, 65.0, 70.0, 64.0, 71.0, 88.0, 70.0, 66.0, 66.0, 48.0, 35.0, 34.0, 25.0, 15.0, 9.0, 10.0, 8.0, 4.0, 3.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.2870242595672607, -2.230461835861206, -2.1738996505737305, -2.117337226867676, -2.060774803161621, -2.0042126178741455, -1.9476501941680908, -1.8910878896713257, -1.8345255851745605, -1.7779632806777954, -1.7214008569717407, -1.6648385524749756, -1.6082762479782104, -1.5517139434814453, -1.4951515197753906, -1.4385892152786255, -1.3820269107818604, -1.3254646062850952, -1.2689021825790405, -1.2123398780822754, -1.1557775735855103, -1.0992152690887451, -1.0426528453826904, -0.9860905408859253, -0.9295281171798706, -0.8729657530784607, -0.8164034485816956, -0.7598410844802856, -0.7032787799835205, -0.6467164158821106, -0.5901540517807007, -0.5335917472839355, -0.4770294427871704, -0.4204671084880829, -0.36390477418899536, -0.30734241008758545, -0.2507801055908203, -0.1942177414894104, -0.13765540719032288, -0.08109307289123535, -0.024530738592147827, 0.032031599432229996, 0.08859393745660782, 0.14515627920627594, 0.20171861350536346, 0.2582809627056122, 0.3148432970046997, 0.37140563130378723, 0.42796796560287476, 0.4845302999019623, 0.5410926342010498, 0.5976549983024597, 0.6542173027992249, 0.7107796669006348, 0.7673419713973999, 0.8239043354988098, 0.8804666996002197, 0.9370290637016296, 0.9935913681983948, 1.0501537322998047, 1.1067160367965698, 1.163278341293335, 1.2198407649993896, 1.2764030694961548, 1.33296537399292]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 5.0, 4.0, 10.0, 10.0, 20.0, 31.0, 44.0, 57.0, 121.0, 219.0, 377.0, 759.0, 1781.0, 4496.0, 14461.0, 75425.0, 680279.0, 228599.0, 29365.0, 7514.0, 2662.0, 1157.0, 484.0, 295.0, 140.0, 73.0, 53.0, 38.0, 19.0, 10.0, 9.0, 7.0, 8.0, 4.0, 3.0, 7.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.336669921875, -0.3240776062011719, -0.31148529052734375, -0.2988929748535156, -0.2863006591796875, -0.2737083435058594, -0.26111602783203125, -0.24852371215820312, -0.235931396484375, -0.22333908081054688, -0.21074676513671875, -0.19815444946289062, -0.1855621337890625, -0.17296981811523438, -0.16037750244140625, -0.14778518676757812, -0.13519287109375, -0.12260055541992188, -0.11000823974609375, -0.09741592407226562, -0.0848236083984375, -0.07223129272460938, -0.05963897705078125, -0.047046661376953125, -0.034454345703125, -0.021862030029296875, -0.00926971435546875, 0.003322601318359375, 0.0159149169921875, 0.028507232666015625, 0.04109954833984375, 0.053691864013671875, 0.0662841796875, 0.07887649536132812, 0.09146881103515625, 0.10406112670898438, 0.1166534423828125, 0.12924575805664062, 0.14183807373046875, 0.15443038940429688, 0.167022705078125, 0.17961502075195312, 0.19220733642578125, 0.20479965209960938, 0.2173919677734375, 0.22998428344726562, 0.24257659912109375, 0.2551689147949219, 0.26776123046875, 0.2803535461425781, 0.29294586181640625, 0.3055381774902344, 0.3181304931640625, 0.3307228088378906, 0.34331512451171875, 0.3559074401855469, 0.368499755859375, 0.3810920715332031, 0.39368438720703125, 0.4062767028808594, 0.4188690185546875, 0.4314613342285156, 0.44405364990234375, 0.4566459655761719, 0.46923828125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 9.0, 17.0, 22.0, 33.0, 55.0, 69.0, 82.0, 99.0, 103.0, 118.0, 106.0, 85.0, 57.0, 54.0, 38.0, 22.0, 10.0, 12.0, 5.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0, -1.947418212890625, -1.89483642578125, -1.842254638671875, -1.7896728515625, -1.737091064453125, -1.68450927734375, -1.631927490234375, -1.579345703125, -1.526763916015625, -1.47418212890625, -1.421600341796875, -1.3690185546875, -1.316436767578125, -1.26385498046875, -1.211273193359375, -1.15869140625, -1.106109619140625, -1.05352783203125, -1.000946044921875, -0.9483642578125, -0.895782470703125, -0.84320068359375, -0.790618896484375, -0.738037109375, -0.685455322265625, -0.63287353515625, -0.580291748046875, -0.5277099609375, -0.475128173828125, -0.42254638671875, -0.369964599609375, -0.3173828125, -0.264801025390625, -0.21221923828125, -0.159637451171875, -0.1070556640625, -0.054473876953125, -0.00189208984375, 0.050689697265625, 0.103271484375, 0.155853271484375, 0.20843505859375, 0.261016845703125, 0.3135986328125, 0.366180419921875, 0.41876220703125, 0.471343994140625, 0.52392578125, 0.576507568359375, 0.62908935546875, 0.681671142578125, 0.7342529296875, 0.786834716796875, 0.83941650390625, 0.891998291015625, 0.944580078125, 0.997161865234375, 1.04974365234375, 1.102325439453125, 1.1549072265625, 1.207489013671875, 1.26007080078125, 1.312652587890625, 1.365234375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 9.0, 6.0, 7.0, 11.0, 10.0, 17.0, 34.0, 41.0, 63.0, 87.0, 123.0, 203.0, 263.0, 423.0, 633.0, 968.0, 1684.0, 3043.0, 6238.0, 13890.0, 35238.0, 108347.0, 406200.0, 329752.0, 87505.0, 29454.0, 11821.0, 5435.0, 2831.0, 1522.0, 887.0, 549.0, 389.0, 274.0, 174.0, 128.0, 109.0, 54.0, 40.0, 34.0, 22.0, 15.0, 11.0, 6.0, 3.0, 1.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.180419921875, -0.17476463317871094, -0.16910934448242188, -0.1634540557861328, -0.15779876708984375, -0.1521434783935547, -0.14648818969726562, -0.14083290100097656, -0.1351776123046875, -0.12952232360839844, -0.12386703491210938, -0.11821174621582031, -0.11255645751953125, -0.10690116882324219, -0.10124588012695312, -0.09559059143066406, -0.089935302734375, -0.08428001403808594, -0.07862472534179688, -0.07296943664550781, -0.06731414794921875, -0.06165885925292969, -0.056003570556640625, -0.05034828186035156, -0.0446929931640625, -0.03903770446777344, -0.033382415771484375, -0.027727127075195312, -0.02207183837890625, -0.016416549682617188, -0.010761260986328125, -0.0051059722900390625, 0.00054931640625, 0.0062046051025390625, 0.011859893798828125, 0.017515182495117188, 0.02317047119140625, 0.028825759887695312, 0.034481048583984375, 0.04013633728027344, 0.0457916259765625, 0.05144691467285156, 0.057102203369140625, 0.06275749206542969, 0.06841278076171875, 0.07406806945800781, 0.07972335815429688, 0.08537864685058594, 0.091033935546875, 0.09668922424316406, 0.10234451293945312, 0.10799980163574219, 0.11365509033203125, 0.11931037902832031, 0.12496566772460938, 0.13062095642089844, 0.1362762451171875, 0.14193153381347656, 0.14758682250976562, 0.1532421112060547, 0.15889739990234375, 0.1645526885986328, 0.17020797729492188, 0.17586326599121094, 0.1815185546875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 4.0, 6.0, 12.0, 9.0, 9.0, 17.0, 22.0, 20.0, 28.0, 40.0, 53.0, 52.0, 54.0, 42.0, 55.0, 71.0, 52.0, 65.0, 68.0, 52.0, 48.0, 42.0, 36.0, 24.0, 26.0, 20.0, 21.0, 20.0, 8.0, 12.0, 8.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.654296875, -1.5984344482421875, -1.542572021484375, -1.4867095947265625, -1.43084716796875, -1.3749847412109375, -1.319122314453125, -1.2632598876953125, -1.2073974609375, -1.1515350341796875, -1.095672607421875, -1.0398101806640625, -0.98394775390625, -0.9280853271484375, -0.872222900390625, -0.8163604736328125, -0.760498046875, -0.7046356201171875, -0.648773193359375, -0.5929107666015625, -0.53704833984375, -0.4811859130859375, -0.425323486328125, -0.3694610595703125, -0.3135986328125, -0.2577362060546875, -0.201873779296875, -0.1460113525390625, -0.09014892578125, -0.0342864990234375, 0.021575927734375, 0.0774383544921875, 0.13330078125, 0.1891632080078125, 0.245025634765625, 0.3008880615234375, 0.35675048828125, 0.4126129150390625, 0.468475341796875, 0.5243377685546875, 0.5802001953125, 0.6360626220703125, 0.691925048828125, 0.7477874755859375, 0.80364990234375, 0.8595123291015625, 0.915374755859375, 0.9712371826171875, 1.027099609375, 1.0829620361328125, 1.138824462890625, 1.1946868896484375, 1.25054931640625, 1.3064117431640625, 1.362274169921875, 1.4181365966796875, 1.4739990234375, 1.5298614501953125, 1.585723876953125, 1.6415863037109375, 1.69744873046875, 1.7533111572265625, 1.809173583984375, 1.8650360107421875, 1.9208984375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 6.0, 5.0, 13.0, 8.0, 21.0, 28.0, 29.0, 58.0, 78.0, 126.0, 193.0, 339.0, 772.0, 1447.0, 3128.0, 7886.0, 24737.0, 117379.0, 649130.0, 191485.0, 34275.0, 10130.0, 3816.0, 1645.0, 791.0, 419.0, 236.0, 122.0, 84.0, 51.0, 33.0, 24.0, 20.0, 9.0, 6.0, 7.0, 5.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.07354736328125, -0.07122135162353516, -0.06889533996582031, -0.06656932830810547, -0.06424331665039062, -0.06191730499267578, -0.05959129333496094, -0.057265281677246094, -0.05493927001953125, -0.052613258361816406, -0.05028724670410156, -0.04796123504638672, -0.045635223388671875, -0.04330921173095703, -0.04098320007324219, -0.038657188415527344, -0.0363311767578125, -0.034005165100097656, -0.03167915344238281, -0.02935314178466797, -0.027027130126953125, -0.02470111846923828, -0.022375106811523438, -0.020049095153808594, -0.01772308349609375, -0.015397071838378906, -0.013071060180664062, -0.010745048522949219, -0.008419036865234375, -0.006093025207519531, -0.0037670135498046875, -0.0014410018920898438, 0.000885009765625, 0.0032110214233398438, 0.0055370330810546875, 0.007863044738769531, 0.010189056396484375, 0.012515068054199219, 0.014841079711914062, 0.017167091369628906, 0.01949310302734375, 0.021819114685058594, 0.024145126342773438, 0.02647113800048828, 0.028797149658203125, 0.03112316131591797, 0.03344917297363281, 0.035775184631347656, 0.0381011962890625, 0.040427207946777344, 0.04275321960449219, 0.04507923126220703, 0.047405242919921875, 0.04973125457763672, 0.05205726623535156, 0.054383277893066406, 0.05670928955078125, 0.059035301208496094, 0.06136131286621094, 0.06368732452392578, 0.06601333618164062, 0.06833934783935547, 0.07066535949707031, 0.07299137115478516, 0.0753173828125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 3.0, 3.0, 14.0, 6.0, 14.0, 27.0, 21.0, 30.0, 45.0, 81.0, 84.0, 116.0, 147.0, 101.0, 82.0, 61.0, 38.0, 32.0, 20.0, 13.0, 13.0, 14.0, 11.0, 3.0, 6.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.707408905029297e-05, -3.5713426768779755e-05, -3.435276448726654e-05, -3.2992102205753326e-05, -3.163143992424011e-05, -3.0270777642726898e-05, -2.8910115361213684e-05, -2.754945307970047e-05, -2.6188790798187256e-05, -2.4828128516674042e-05, -2.3467466235160828e-05, -2.2106803953647614e-05, -2.07461416721344e-05, -1.9385479390621185e-05, -1.802481710910797e-05, -1.6664154827594757e-05, -1.5303492546081543e-05, -1.3942830264568329e-05, -1.2582167983055115e-05, -1.12215057015419e-05, -9.860843420028687e-06, -8.500181138515472e-06, -7.139518857002258e-06, -5.778856575489044e-06, -4.41819429397583e-06, -3.057532012462616e-06, -1.6968697309494019e-06, -3.3620744943618774e-07, 1.0244548320770264e-06, 2.3851171135902405e-06, 3.7457793951034546e-06, 5.106441676616669e-06, 6.467103958129883e-06, 7.827766239643097e-06, 9.188428521156311e-06, 1.0549090802669525e-05, 1.190975308418274e-05, 1.3270415365695953e-05, 1.4631077647209167e-05, 1.599173992872238e-05, 1.7352402210235596e-05, 1.871306449174881e-05, 2.0073726773262024e-05, 2.1434389054775238e-05, 2.2795051336288452e-05, 2.4155713617801666e-05, 2.551637589931488e-05, 2.6877038180828094e-05, 2.823770046234131e-05, 2.9598362743854523e-05, 3.095902502536774e-05, 3.231968730688095e-05, 3.3680349588394165e-05, 3.504101186990738e-05, 3.640167415142059e-05, 3.776233643293381e-05, 3.912299871444702e-05, 4.0483660995960236e-05, 4.184432327747345e-05, 4.3204985558986664e-05, 4.456564784049988e-05, 4.592631012201309e-05, 4.7286972403526306e-05, 4.864763468503952e-05, 5.0008296966552734e-05]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 3.0, 10.0, 9.0, 13.0, 25.0, 36.0, 46.0, 82.0, 168.0, 410.0, 966.0, 2814.0, 10819.0, 61322.0, 626469.0, 303313.0, 32262.0, 6591.0, 1906.0, 654.0, 296.0, 133.0, 72.0, 44.0, 25.0, 22.0, 15.0, 7.0, 7.0, 5.0, 7.0, 3.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.10919189453125, -0.10605716705322266, -0.10292243957519531, -0.09978771209716797, -0.09665298461914062, -0.09351825714111328, -0.09038352966308594, -0.0872488021850586, -0.08411407470703125, -0.0809793472290039, -0.07784461975097656, -0.07470989227294922, -0.07157516479492188, -0.06844043731689453, -0.06530570983886719, -0.062170982360839844, -0.0590362548828125, -0.055901527404785156, -0.05276679992675781, -0.04963207244873047, -0.046497344970703125, -0.04336261749267578, -0.04022789001464844, -0.037093162536621094, -0.03395843505859375, -0.030823707580566406, -0.027688980102539062, -0.02455425262451172, -0.021419525146484375, -0.01828479766845703, -0.015150070190429688, -0.012015342712402344, -0.008880615234375, -0.005745887756347656, -0.0026111602783203125, 0.0005235671997070312, 0.003658294677734375, 0.006793022155761719, 0.009927749633789062, 0.013062477111816406, 0.01619720458984375, 0.019331932067871094, 0.022466659545898438, 0.02560138702392578, 0.028736114501953125, 0.03187084197998047, 0.03500556945800781, 0.038140296936035156, 0.0412750244140625, 0.044409751892089844, 0.04754447937011719, 0.05067920684814453, 0.053813934326171875, 0.05694866180419922, 0.06008338928222656, 0.0632181167602539, 0.06635284423828125, 0.0694875717163086, 0.07262229919433594, 0.07575702667236328, 0.07889175415039062, 0.08202648162841797, 0.08516120910644531, 0.08829593658447266, 0.0914306640625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 6.0, 6.0, 8.0, 9.0, 10.0, 7.0, 21.0, 22.0, 16.0, 33.0, 33.0, 60.0, 49.0, 59.0, 88.0, 66.0, 67.0, 76.0, 73.0, 64.0, 65.0, 38.0, 27.0, 26.0, 16.0, 13.0, 17.0, 10.0, 5.0, 7.0, 1.0, 1.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01541900634765625, -0.014920353889465332, -0.014421701431274414, -0.013923048973083496, -0.013424396514892578, -0.01292574405670166, -0.012427091598510742, -0.011928439140319824, -0.011429786682128906, -0.010931134223937988, -0.01043248176574707, -0.009933829307556152, -0.009435176849365234, -0.008936524391174316, -0.008437871932983398, -0.00793921947479248, -0.0074405670166015625, -0.0069419145584106445, -0.0064432621002197266, -0.005944609642028809, -0.005445957183837891, -0.004947304725646973, -0.004448652267456055, -0.003949999809265137, -0.0034513473510742188, -0.0029526948928833008, -0.002454042434692383, -0.001955389976501465, -0.0014567375183105469, -0.0009580850601196289, -0.00045943260192871094, 3.921985626220703e-05, 0.000537872314453125, 0.001036524772644043, 0.001535177230834961, 0.002033829689025879, 0.002532482147216797, 0.003031134605407715, 0.003529787063598633, 0.004028439521789551, 0.004527091979980469, 0.005025744438171387, 0.005524396896362305, 0.006023049354553223, 0.006521701812744141, 0.007020354270935059, 0.0075190067291259766, 0.008017659187316895, 0.008516311645507812, 0.00901496410369873, 0.009513616561889648, 0.010012269020080566, 0.010510921478271484, 0.011009573936462402, 0.01150822639465332, 0.012006878852844238, 0.012505531311035156, 0.013004183769226074, 0.013502836227416992, 0.01400148868560791, 0.014500141143798828, 0.014998793601989746, 0.015497446060180664, 0.015996098518371582, 0.0164947509765625]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 3.0, 11.0, 17.0, 51.0, 143.0, 376.0, 252.0, 98.0, 23.0, 18.0, 7.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.140503406524658, -4.036479473114014, -3.932455062866211, -3.8284311294555664, -3.7244069576263428, -3.620382785797119, -3.5163586139678955, -3.412334442138672, -3.3083105087280273, -3.2042863368988037, -3.10026216506958, -2.9962382316589355, -2.892214059829712, -2.7881898880004883, -2.6841657161712646, -2.580141544342041, -2.4761176109313965, -2.372093439102173, -2.268069267272949, -2.1640453338623047, -2.060021162033081, -1.9559969902038574, -1.8519728183746338, -1.7479487657546997, -1.6439244747161865, -1.539900302886963, -1.4358762502670288, -1.3318520784378052, -1.227828025817871, -1.1238038539886475, -1.0197796821594238, -0.9157556295394897, -0.8117315769195557, -0.7077074646949768, -0.603683352470398, -0.4996592104434967, -0.39563509821891785, -0.2916109561920166, -0.18758684396743774, -0.08356273174285889, 0.02046138048171997, 0.12448550015687943, 0.22850961983203888, 0.33253374695777893, 0.4365578591823578, 0.540582001209259, 0.6446061134338379, 0.7486302256584167, 0.8526543378829956, 0.9566784501075745, 1.0607025623321533, 1.164726734161377, 1.268750786781311, 1.3727749586105347, 1.4767990112304688, 1.5808231830596924, 1.684847354888916, 1.7888715267181396, 1.8928955793380737, 1.9969197511672974, 2.1009438037872314, 2.204967975616455, 2.3089921474456787, 2.4130163192749023, 2.517040252685547]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 5.0, 2.0, 10.0, 9.0, 24.0, 32.0, 40.0, 54.0, 80.0, 87.0, 96.0, 97.0, 121.0, 82.0, 76.0, 64.0, 47.0, 32.0, 17.0, 12.0, 7.0, 7.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8105216026306152, -1.762357234954834, -1.7141928672790527, -1.6660284996032715, -1.6178641319274902, -1.569699764251709, -1.5215353965759277, -1.4733710289001465, -1.4252066612243652, -1.377042293548584, -1.3288779258728027, -1.2807135581970215, -1.2325491905212402, -1.184384822845459, -1.1362204551696777, -1.0880560874938965, -1.0398917198181152, -0.991727352142334, -0.9435629844665527, -0.8953986167907715, -0.8472342491149902, -0.799069881439209, -0.7509055137634277, -0.7027411460876465, -0.6545767784118652, -0.606412410736084, -0.5582480430603027, -0.5100836753845215, -0.46191930770874023, -0.413754940032959, -0.36559057235717773, -0.3174262046813965, -0.26926183700561523, -0.22109746932983398, -0.17293310165405273, -0.12476873397827148, -0.07660436630249023, -0.028439998626708984, 0.019724369049072266, 0.06788873672485352, 0.11605310440063477, 0.16421747207641602, 0.21238183975219727, 0.2605462074279785, 0.30871057510375977, 0.356874942779541, 0.40503931045532227, 0.4532036781311035, 0.5013680458068848, 0.549532413482666, 0.5976967811584473, 0.6458611488342285, 0.6940255165100098, 0.742189884185791, 0.7903542518615723, 0.8385186195373535, 0.8866829872131348, 0.934847354888916, 0.9830117225646973, 1.0311760902404785, 1.0793404579162598, 1.127504825592041, 1.1756691932678223, 1.2238335609436035, 1.2719979286193848]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 7.0, 8.0, 6.0, 19.0, 46.0, 182.0, 635.0, 3850.0, 153918.0, 883016.0, 5693.0, 869.0, 188.0, 54.0, 33.0, 9.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.55078125, -5.401123046875, -5.25146484375, -5.101806640625, -4.9521484375, -4.802490234375, -4.65283203125, -4.503173828125, -4.353515625, -4.203857421875, -4.05419921875, -3.904541015625, -3.7548828125, -3.605224609375, -3.45556640625, -3.305908203125, -3.15625, -3.006591796875, -2.85693359375, -2.707275390625, -2.5576171875, -2.407958984375, -2.25830078125, -2.108642578125, -1.958984375, -1.809326171875, -1.65966796875, -1.510009765625, -1.3603515625, -1.210693359375, -1.06103515625, -0.911376953125, -0.76171875, -0.612060546875, -0.46240234375, -0.312744140625, -0.1630859375, -0.013427734375, 0.13623046875, 0.285888671875, 0.435546875, 0.585205078125, 0.73486328125, 0.884521484375, 1.0341796875, 1.183837890625, 1.33349609375, 1.483154296875, 1.6328125, 1.782470703125, 1.93212890625, 2.081787109375, 2.2314453125, 2.381103515625, 2.53076171875, 2.680419921875, 2.830078125, 2.979736328125, 3.12939453125, 3.279052734375, 3.4287109375, 3.578369140625, 3.72802734375, 3.877685546875, 4.02734375]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 7.0, 18.0, 41.0, 52.0, 87.0, 148.0, 146.0, 184.0, 122.0, 85.0, 61.0, 23.0, 13.0, 10.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.560546875, -2.409027099609375, -2.25750732421875, -2.105987548828125, -1.9544677734375, -1.802947998046875, -1.65142822265625, -1.499908447265625, -1.348388671875, -1.196868896484375, -1.04534912109375, -0.893829345703125, -0.7423095703125, -0.590789794921875, -0.43927001953125, -0.287750244140625, -0.13623046875, 0.015289306640625, 0.16680908203125, 0.318328857421875, 0.4698486328125, 0.621368408203125, 0.77288818359375, 0.924407958984375, 1.075927734375, 1.227447509765625, 1.37896728515625, 1.530487060546875, 1.6820068359375, 1.833526611328125, 1.98504638671875, 2.136566162109375, 2.2880859375, 2.439605712890625, 2.59112548828125, 2.742645263671875, 2.8941650390625, 3.045684814453125, 3.19720458984375, 3.348724365234375, 3.500244140625, 3.651763916015625, 3.80328369140625, 3.954803466796875, 4.1063232421875, 4.257843017578125, 4.40936279296875, 4.560882568359375, 4.71240234375, 4.863922119140625, 5.01544189453125, 5.166961669921875, 5.3184814453125, 5.470001220703125, 5.62152099609375, 5.773040771484375, 5.924560546875, 6.076080322265625, 6.22760009765625, 6.379119873046875, 6.5306396484375, 6.682159423828125, 6.83367919921875, 6.985198974609375, 7.13671875]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 2.0, 0.0, 6.0, 5.0, 6.0, 7.0, 8.0, 21.0, 7.0, 19.0, 24.0, 36.0, 48.0, 48.0, 62.0, 82.0, 120.0, 193.0, 285.0, 536.0, 1225.0, 3680.0, 18013.0, 880941.0, 129064.0, 9440.0, 2419.0, 902.0, 449.0, 265.0, 141.0, 115.0, 96.0, 56.0, 55.0, 41.0, 32.0, 20.0, 18.0, 18.0, 15.0, 8.0, 7.0, 8.0, 5.0, 7.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.60546875, -2.532745361328125, -2.46002197265625, -2.387298583984375, -2.3145751953125, -2.241851806640625, -2.16912841796875, -2.096405029296875, -2.023681640625, -1.950958251953125, -1.87823486328125, -1.805511474609375, -1.7327880859375, -1.660064697265625, -1.58734130859375, -1.514617919921875, -1.44189453125, -1.369171142578125, -1.29644775390625, -1.223724365234375, -1.1510009765625, -1.078277587890625, -1.00555419921875, -0.932830810546875, -0.860107421875, -0.787384033203125, -0.71466064453125, -0.641937255859375, -0.5692138671875, -0.496490478515625, -0.42376708984375, -0.351043701171875, -0.2783203125, -0.205596923828125, -0.13287353515625, -0.060150146484375, 0.0125732421875, 0.085296630859375, 0.15802001953125, 0.230743408203125, 0.303466796875, 0.376190185546875, 0.44891357421875, 0.521636962890625, 0.5943603515625, 0.667083740234375, 0.73980712890625, 0.812530517578125, 0.88525390625, 0.957977294921875, 1.03070068359375, 1.103424072265625, 1.1761474609375, 1.248870849609375, 1.32159423828125, 1.394317626953125, 1.467041015625, 1.539764404296875, 1.61248779296875, 1.685211181640625, 1.7579345703125, 1.830657958984375, 1.90338134765625, 1.976104736328125, 2.048828125]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 5.0, 2.0, 3.0, 9.0, 10.0, 13.0, 8.0, 10.0, 18.0, 21.0, 23.0, 21.0, 24.0, 21.0, 28.0, 36.0, 47.0, 40.0, 49.0, 35.0, 38.0, 60.0, 40.0, 53.0, 36.0, 40.0, 32.0, 24.0, 33.0, 28.0, 24.0, 31.0, 22.0, 17.0, 19.0, 21.0, 9.0, 18.0, 7.0, 7.0, 5.0, 3.0, 4.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.4453125, -1.4024200439453125, -1.359527587890625, -1.3166351318359375, -1.27374267578125, -1.2308502197265625, -1.187957763671875, -1.1450653076171875, -1.1021728515625, -1.0592803955078125, -1.016387939453125, -0.9734954833984375, -0.93060302734375, -0.8877105712890625, -0.844818115234375, -0.8019256591796875, -0.759033203125, -0.7161407470703125, -0.673248291015625, -0.6303558349609375, -0.58746337890625, -0.5445709228515625, -0.501678466796875, -0.4587860107421875, -0.4158935546875, -0.3730010986328125, -0.330108642578125, -0.2872161865234375, -0.24432373046875, -0.2014312744140625, -0.158538818359375, -0.1156463623046875, -0.07275390625, -0.0298614501953125, 0.013031005859375, 0.0559234619140625, 0.09881591796875, 0.1417083740234375, 0.184600830078125, 0.2274932861328125, 0.2703857421875, 0.3132781982421875, 0.356170654296875, 0.3990631103515625, 0.44195556640625, 0.4848480224609375, 0.527740478515625, 0.5706329345703125, 0.613525390625, 0.6564178466796875, 0.699310302734375, 0.7422027587890625, 0.78509521484375, 0.8279876708984375, 0.870880126953125, 0.9137725830078125, 0.9566650390625, 0.9995574951171875, 1.042449951171875, 1.0853424072265625, 1.12823486328125, 1.1711273193359375, 1.214019775390625, 1.2569122314453125, 1.2998046875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 4.0, 1.0, 7.0, 7.0, 9.0, 13.0, 24.0, 29.0, 44.0, 72.0, 146.0, 268.0, 602.0, 1745.0, 7381.0, 64764.0, 913148.0, 51111.0, 6590.0, 1501.0, 551.0, 245.0, 105.0, 74.0, 37.0, 21.0, 21.0, 13.0, 5.0, 7.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29638671875, -0.2847442626953125, -0.273101806640625, -0.2614593505859375, -0.24981689453125, -0.2381744384765625, -0.226531982421875, -0.2148895263671875, -0.2032470703125, -0.1916046142578125, -0.179962158203125, -0.1683197021484375, -0.15667724609375, -0.1450347900390625, -0.133392333984375, -0.1217498779296875, -0.110107421875, -0.0984649658203125, -0.086822509765625, -0.0751800537109375, -0.06353759765625, -0.0518951416015625, -0.040252685546875, -0.0286102294921875, -0.0169677734375, -0.0053253173828125, 0.006317138671875, 0.0179595947265625, 0.02960205078125, 0.0412445068359375, 0.052886962890625, 0.0645294189453125, 0.076171875, 0.0878143310546875, 0.099456787109375, 0.1110992431640625, 0.12274169921875, 0.1343841552734375, 0.146026611328125, 0.1576690673828125, 0.1693115234375, 0.1809539794921875, 0.192596435546875, 0.2042388916015625, 0.21588134765625, 0.2275238037109375, 0.239166259765625, 0.2508087158203125, 0.262451171875, 0.2740936279296875, 0.285736083984375, 0.2973785400390625, 0.30902099609375, 0.3206634521484375, 0.332305908203125, 0.3439483642578125, 0.3555908203125, 0.3672332763671875, 0.378875732421875, 0.3905181884765625, 0.40216064453125, 0.4138031005859375, 0.425445556640625, 0.4370880126953125, 0.44873046875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 5.0, 11.0, 5.0, 12.0, 26.0, 25.0, 44.0, 93.0, 149.0, 207.0, 153.0, 100.0, 57.0, 28.0, 20.0, 11.0, 11.0, 10.0, 5.0, 8.0, 3.0, 3.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.082918167114258e-05, -3.9686448872089386e-05, -3.8543716073036194e-05, -3.7400983273983e-05, -3.625825047492981e-05, -3.511551767587662e-05, -3.3972784876823425e-05, -3.283005207777023e-05, -3.168731927871704e-05, -3.054458647966385e-05, -2.9401853680610657e-05, -2.8259120881557465e-05, -2.7116388082504272e-05, -2.597365528345108e-05, -2.4830922484397888e-05, -2.3688189685344696e-05, -2.2545456886291504e-05, -2.1402724087238312e-05, -2.025999128818512e-05, -1.9117258489131927e-05, -1.7974525690078735e-05, -1.6831792891025543e-05, -1.568906009197235e-05, -1.4546327292919159e-05, -1.3403594493865967e-05, -1.2260861694812775e-05, -1.1118128895759583e-05, -9.97539609670639e-06, -8.832663297653198e-06, -7.689930498600006e-06, -6.547197699546814e-06, -5.404464900493622e-06, -4.26173210144043e-06, -3.1189993023872375e-06, -1.9762665033340454e-06, -8.335337042808533e-07, 3.0919909477233887e-07, 1.451931893825531e-06, 2.594664692878723e-06, 3.7373974919319153e-06, 4.880130290985107e-06, 6.0228630900382996e-06, 7.165595889091492e-06, 8.308328688144684e-06, 9.451061487197876e-06, 1.0593794286251068e-05, 1.173652708530426e-05, 1.2879259884357452e-05, 1.4021992683410645e-05, 1.5164725482463837e-05, 1.630745828151703e-05, 1.745019108057022e-05, 1.8592923879623413e-05, 1.9735656678676605e-05, 2.0878389477729797e-05, 2.202112227678299e-05, 2.316385507583618e-05, 2.4306587874889374e-05, 2.5449320673942566e-05, 2.6592053472995758e-05, 2.773478627204895e-05, 2.8877519071102142e-05, 3.0020251870155334e-05, 3.1162984669208527e-05, 3.230571746826172e-05]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 12.0, 11.0, 15.0, 20.0, 35.0, 57.0, 77.0, 135.0, 204.0, 436.0, 952.0, 2307.0, 7574.0, 44677.0, 872694.0, 101725.0, 11885.0, 3242.0, 1199.0, 532.0, 290.0, 169.0, 95.0, 64.0, 41.0, 30.0, 18.0, 11.0, 10.0, 4.0, 8.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.343017578125, -0.3321800231933594, -0.32134246826171875, -0.3105049133300781, -0.2996673583984375, -0.2888298034667969, -0.27799224853515625, -0.2671546936035156, -0.256317138671875, -0.24547958374023438, -0.23464202880859375, -0.22380447387695312, -0.2129669189453125, -0.20212936401367188, -0.19129180908203125, -0.18045425415039062, -0.16961669921875, -0.15877914428710938, -0.14794158935546875, -0.13710403442382812, -0.1262664794921875, -0.11542892456054688, -0.10459136962890625, -0.09375381469726562, -0.082916259765625, -0.07207870483398438, -0.06124114990234375, -0.050403594970703125, -0.0395660400390625, -0.028728485107421875, -0.01789093017578125, -0.007053375244140625, 0.0037841796875, 0.014621734619140625, 0.02545928955078125, 0.036296844482421875, 0.0471343994140625, 0.057971954345703125, 0.06880950927734375, 0.07964706420898438, 0.090484619140625, 0.10132217407226562, 0.11215972900390625, 0.12299728393554688, 0.1338348388671875, 0.14467239379882812, 0.15550994873046875, 0.16634750366210938, 0.17718505859375, 0.18802261352539062, 0.19886016845703125, 0.20969772338867188, 0.2205352783203125, 0.23137283325195312, 0.24221038818359375, 0.2530479431152344, 0.263885498046875, 0.2747230529785156, 0.28556060791015625, 0.2963981628417969, 0.3072357177734375, 0.3180732727050781, 0.32891082763671875, 0.3397483825683594, 0.3505859375]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 8.0, 7.0, 6.0, 13.0, 14.0, 15.0, 29.0, 36.0, 57.0, 107.0, 169.0, 206.0, 144.0, 60.0, 34.0, 26.0, 20.0, 10.0, 12.0, 7.0, 7.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1260986328125, -0.12218761444091797, -0.11827659606933594, -0.1143655776977539, -0.11045455932617188, -0.10654354095458984, -0.10263252258300781, -0.09872150421142578, -0.09481048583984375, -0.09089946746826172, -0.08698844909667969, -0.08307743072509766, -0.07916641235351562, -0.0752553939819336, -0.07134437561035156, -0.06743335723876953, -0.0635223388671875, -0.05961132049560547, -0.05570030212402344, -0.051789283752441406, -0.047878265380859375, -0.043967247009277344, -0.04005622863769531, -0.03614521026611328, -0.03223419189453125, -0.02832317352294922, -0.024412155151367188, -0.020501136779785156, -0.016590118408203125, -0.012679100036621094, -0.008768081665039062, -0.004857063293457031, -0.000946044921875, 0.0029649734497070312, 0.0068759918212890625, 0.010787010192871094, 0.014698028564453125, 0.018609046936035156, 0.022520065307617188, 0.02643108367919922, 0.03034210205078125, 0.03425312042236328, 0.03816413879394531, 0.042075157165527344, 0.045986175537109375, 0.049897193908691406, 0.05380821228027344, 0.05771923065185547, 0.0616302490234375, 0.06554126739501953, 0.06945228576660156, 0.0733633041381836, 0.07727432250976562, 0.08118534088134766, 0.08509635925292969, 0.08900737762451172, 0.09291839599609375, 0.09682941436767578, 0.10074043273925781, 0.10465145111083984, 0.10856246948242188, 0.1124734878540039, 0.11638450622558594, 0.12029552459716797, 0.12420654296875]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 8.0, 10.0, 28.0, 79.0, 204.0, 351.0, 197.0, 66.0, 33.0, 12.0, 7.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.962121963500977, -7.778932094573975, -7.5957417488098145, -7.4125518798828125, -7.2293620109558105, -7.046172142028809, -6.862981796264648, -6.6797919273376465, -6.4966020584106445, -6.313412189483643, -6.130221843719482, -5.9470319747924805, -5.7638421058654785, -5.580652236938477, -5.397461891174316, -5.2142720222473145, -5.031081676483154, -4.847891807556152, -4.664701461791992, -4.48151159286499, -4.298321723937988, -4.115131378173828, -3.931941509246826, -3.748751640319824, -3.565561532974243, -3.382371425628662, -3.19918155670166, -3.015991449356079, -2.832801342010498, -2.649611473083496, -2.466421365737915, -2.283231258392334, -2.100041389465332, -1.9168514013290405, -1.733661413192749, -1.550471305847168, -1.3672813177108765, -1.184091329574585, -1.000901222229004, -0.8177112340927124, -0.6345212459564209, -0.451331228017807, -0.2681412100791931, -0.08495116233825684, 0.09823882579803467, 0.28142881393432617, 0.4646189212799072, 0.6478089094161987, 0.8309988975524902, 1.0141888856887817, 1.1973788738250732, 1.3805689811706543, 1.5637589693069458, 1.7469489574432373, 1.9301390647888184, 2.1133289337158203, 2.2965190410614014, 2.4797091484069824, 2.6628990173339844, 2.8460891246795654, 3.0292792320251465, 3.2124691009521484, 3.3956592082977295, 3.5788493156433105, 3.7620391845703125]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 2.0, 6.0, 5.0, 15.0, 23.0, 19.0, 32.0, 44.0, 52.0, 59.0, 59.0, 74.0, 82.0, 63.0, 73.0, 72.0, 68.0, 64.0, 44.0, 36.0, 41.0, 21.0, 21.0, 10.0, 8.0, 9.0, 3.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.457720994949341, -2.319880962371826, -2.1820411682128906, -2.044201374053955, -1.9063613414764404, -1.7685214281082153, -1.6306815147399902, -1.4928416013717651, -1.35500168800354, -1.217161774635315, -1.0793218612670898, -0.9414819478988647, -0.8036420345306396, -0.6658021211624146, -0.5279622077941895, -0.39012229442596436, -0.25228238105773926, -0.11444246768951416, 0.023397445678710938, 0.16123735904693604, 0.29907727241516113, 0.43691718578338623, 0.5747570991516113, 0.7125970125198364, 0.8504369258880615, 0.9882768392562866, 1.1261167526245117, 1.2639566659927368, 1.401796579360962, 1.539636492729187, 1.677476406097412, 1.8153163194656372, 1.9531564712524414, 2.090996265411377, 2.2288362979888916, 2.3666763305664062, 2.504516124725342, 2.6423559188842773, 2.780195951461792, 2.9180359840393066, 3.055875778198242, 3.1937155723571777, 3.3315556049346924, 3.469395637512207, 3.6072354316711426, 3.745075225830078, 3.8829152584075928, 4.020755290985107, 4.158595085144043, 4.2964348793029785, 4.434274673461914, 4.572114944458008, 4.709954738616943, 4.847794532775879, 4.985634803771973, 5.123474597930908, 5.261314392089844, 5.399154186248779, 5.536993980407715, 5.674834251403809, 5.812674045562744, 5.95051383972168, 6.088354110717773, 6.226193904876709, 6.3640336990356445]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 3.0, 4.0, 4.0, 2.0, 4.0, 3.0, 12.0, 16.0, 32.0, 32.0, 52.0, 112.0, 165.0, 290.0, 513.0, 1064.0, 2546.0, 7845.0, 82427.0, 3549404.0, 519146.0, 22727.0, 4165.0, 2004.0, 843.0, 373.0, 194.0, 102.0, 76.0, 47.0, 31.0, 21.0, 6.0, 7.0, 6.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.056640625, -2.975677490234375, -2.89471435546875, -2.813751220703125, -2.7327880859375, -2.651824951171875, -2.57086181640625, -2.489898681640625, -2.408935546875, -2.327972412109375, -2.24700927734375, -2.166046142578125, -2.0850830078125, -2.004119873046875, -1.92315673828125, -1.842193603515625, -1.76123046875, -1.680267333984375, -1.59930419921875, -1.518341064453125, -1.4373779296875, -1.356414794921875, -1.27545166015625, -1.194488525390625, -1.113525390625, -1.032562255859375, -0.95159912109375, -0.870635986328125, -0.7896728515625, -0.708709716796875, -0.62774658203125, -0.546783447265625, -0.4658203125, -0.384857177734375, -0.30389404296875, -0.222930908203125, -0.1419677734375, -0.061004638671875, 0.01995849609375, 0.100921630859375, 0.181884765625, 0.262847900390625, 0.34381103515625, 0.424774169921875, 0.5057373046875, 0.586700439453125, 0.66766357421875, 0.748626708984375, 0.82958984375, 0.910552978515625, 0.99151611328125, 1.072479248046875, 1.1534423828125, 1.234405517578125, 1.31536865234375, 1.396331787109375, 1.477294921875, 1.558258056640625, 1.63922119140625, 1.720184326171875, 1.8011474609375, 1.882110595703125, 1.96307373046875, 2.044036865234375, 2.125]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 7.0, 4.0, 6.0, 6.0, 10.0, 14.0, 18.0, 17.0, 34.0, 51.0, 59.0, 75.0, 78.0, 85.0, 106.0, 104.0, 81.0, 61.0, 64.0, 43.0, 29.0, 13.0, 14.0, 13.0, 4.0, 5.0, 6.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1796875, -2.12109375, -2.0625, -2.00390625, -1.9453125, -1.88671875, -1.828125, -1.76953125, -1.7109375, -1.65234375, -1.59375, -1.53515625, -1.4765625, -1.41796875, -1.359375, -1.30078125, -1.2421875, -1.18359375, -1.125, -1.06640625, -1.0078125, -0.94921875, -0.890625, -0.83203125, -0.7734375, -0.71484375, -0.65625, -0.59765625, -0.5390625, -0.48046875, -0.421875, -0.36328125, -0.3046875, -0.24609375, -0.1875, -0.12890625, -0.0703125, -0.01171875, 0.046875, 0.10546875, 0.1640625, 0.22265625, 0.28125, 0.33984375, 0.3984375, 0.45703125, 0.515625, 0.57421875, 0.6328125, 0.69140625, 0.75, 0.80859375, 0.8671875, 0.92578125, 0.984375, 1.04296875, 1.1015625, 1.16015625, 1.21875, 1.27734375, 1.3359375, 1.39453125, 1.453125, 1.51171875, 1.5703125]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 4.0, 13.0, 26.0, 55.0, 163.0, 632.0, 9759.0, 4178438.0, 4553.0, 441.0, 117.0, 32.0, 24.0, 12.0, 6.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.7734375, -15.4014892578125, -15.029541015625, -14.6575927734375, -14.28564453125, -13.9136962890625, -13.541748046875, -13.1697998046875, -12.7978515625, -12.4259033203125, -12.053955078125, -11.6820068359375, -11.31005859375, -10.9381103515625, -10.566162109375, -10.1942138671875, -9.822265625, -9.4503173828125, -9.078369140625, -8.7064208984375, -8.33447265625, -7.9625244140625, -7.590576171875, -7.2186279296875, -6.8466796875, -6.4747314453125, -6.102783203125, -5.7308349609375, -5.35888671875, -4.9869384765625, -4.614990234375, -4.2430419921875, -3.87109375, -3.4991455078125, -3.127197265625, -2.7552490234375, -2.38330078125, -2.0113525390625, -1.639404296875, -1.2674560546875, -0.8955078125, -0.5235595703125, -0.151611328125, 0.2203369140625, 0.59228515625, 0.9642333984375, 1.336181640625, 1.7081298828125, 2.080078125, 2.4520263671875, 2.823974609375, 3.1959228515625, 3.56787109375, 3.9398193359375, 4.311767578125, 4.6837158203125, 5.0556640625, 5.4276123046875, 5.799560546875, 6.1715087890625, 6.54345703125, 6.9154052734375, 7.287353515625, 7.6593017578125, 8.03125]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 13.0, 12.0, 31.0, 78.0, 422.0, 2589.0, 742.0, 99.0, 39.0, 21.0, 16.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8359375, -0.7972564697265625, -0.758575439453125, -0.7198944091796875, -0.68121337890625, -0.6425323486328125, -0.603851318359375, -0.5651702880859375, -0.5264892578125, -0.4878082275390625, -0.449127197265625, -0.4104461669921875, -0.37176513671875, -0.3330841064453125, -0.294403076171875, -0.2557220458984375, -0.217041015625, -0.1783599853515625, -0.139678955078125, -0.1009979248046875, -0.06231689453125, -0.0236358642578125, 0.015045166015625, 0.0537261962890625, 0.0924072265625, 0.1310882568359375, 0.169769287109375, 0.2084503173828125, 0.24713134765625, 0.2858123779296875, 0.324493408203125, 0.3631744384765625, 0.40185546875, 0.4405364990234375, 0.479217529296875, 0.5178985595703125, 0.55657958984375, 0.5952606201171875, 0.633941650390625, 0.6726226806640625, 0.7113037109375, 0.7499847412109375, 0.788665771484375, 0.8273468017578125, 0.86602783203125, 0.9047088623046875, 0.943389892578125, 0.9820709228515625, 1.020751953125, 1.0594329833984375, 1.098114013671875, 1.1367950439453125, 1.17547607421875, 1.2141571044921875, 1.252838134765625, 1.2915191650390625, 1.3302001953125, 1.3688812255859375, 1.407562255859375, 1.4462432861328125, 1.48492431640625, 1.5236053466796875, 1.562286376953125, 1.6009674072265625, 1.6396484375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 3.0, 7.0, 10.0, 19.0, 39.0, 74.0, 173.0, 277.0, 184.0, 105.0, 47.0, 34.0, 13.0, 7.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.185263633728027, -4.067671775817871, -3.9500796794891357, -3.8324875831604004, -3.714895486831665, -3.5973033905029297, -3.4797115325927734, -3.362119436264038, -3.2445273399353027, -3.1269352436065674, -3.009343385696411, -2.891751289367676, -2.7741591930389404, -2.656567096710205, -2.538975238800049, -2.4213831424713135, -2.3037912845611572, -2.186199188232422, -2.0686073303222656, -1.9510152339935303, -1.833423137664795, -1.7158311605453491, -1.5982391834259033, -1.480647087097168, -1.3630551099777222, -1.2454631328582764, -1.127871036529541, -1.0102790594100952, -0.8926870226860046, -0.7750949859619141, -0.6575030088424683, -0.5399109721183777, -0.4223191738128662, -0.30472713708877563, -0.18713513016700745, -0.06954312324523926, 0.04804891347885132, 0.1656409502029419, 0.2832329273223877, 0.40082496404647827, 0.5184170007705688, 0.6360090374946594, 0.75360107421875, 0.8711930513381958, 0.9887850880622864, 1.106377124786377, 1.2239691019058228, 1.3415610790252686, 1.459153175354004, 1.5767451524734497, 1.694337248802185, 1.8119292259216309, 1.9295213222503662, 2.0471134185791016, 2.164705276489258, 2.282297372817993, 2.3998894691467285, 2.517481565475464, 2.63507342338562, 2.7526655197143555, 2.870257616043091, 2.987849712371826, 3.1054415702819824, 3.2230336666107178, 3.340625524520874]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 8.0, 14.0, 8.0, 15.0, 18.0, 34.0, 38.0, 39.0, 51.0, 66.0, 67.0, 77.0, 76.0, 68.0, 75.0, 58.0, 65.0, 55.0, 49.0, 33.0, 24.0, 21.0, 11.0, 11.0, 6.0, 4.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0943245887756348, -2.038926124572754, -1.9835278987884521, -1.9281295537948608, -1.8727312088012695, -1.8173328638076782, -1.761934518814087, -1.7065361738204956, -1.6511378288269043, -1.595739483833313, -1.5403411388397217, -1.4849427938461304, -1.429544448852539, -1.3741461038589478, -1.3187477588653564, -1.2633494138717651, -1.2079510688781738, -1.1525527238845825, -1.0971543788909912, -1.0417560338974, -0.9863576889038086, -0.9309593439102173, -0.875560998916626, -0.8201626539230347, -0.7647643089294434, -0.709365963935852, -0.6539676189422607, -0.5985692739486694, -0.5431709289550781, -0.4877725839614868, -0.4323742389678955, -0.3769758939743042, -0.32157766819000244, -0.26617932319641113, -0.21078097820281982, -0.15538263320922852, -0.09998428821563721, -0.0445859432220459, 0.01081240177154541, 0.06621074676513672, 0.12160909175872803, 0.17700743675231934, 0.23240578174591064, 0.28780412673950195, 0.34320247173309326, 0.39860081672668457, 0.4539991617202759, 0.5093975067138672, 0.5647958517074585, 0.6201941967010498, 0.6755925416946411, 0.7309908866882324, 0.7863892316818237, 0.841787576675415, 0.8971859216690063, 0.9525842666625977, 1.007982611656189, 1.0633809566497803, 1.1187793016433716, 1.174177646636963, 1.2295759916305542, 1.2849743366241455, 1.3403726816177368, 1.3957710266113281, 1.4511693716049194]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 5.0, 3.0, 1.0, 2.0, 7.0, 6.0, 6.0, 14.0, 19.0, 30.0, 54.0, 78.0, 164.0, 301.0, 589.0, 1272.0, 2850.0, 7962.0, 33878.0, 671775.0, 296371.0, 22463.0, 6190.0, 2353.0, 1077.0, 495.0, 254.0, 137.0, 77.0, 41.0, 30.0, 18.0, 12.0, 5.0, 13.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.69091796875, -0.671112060546875, -0.65130615234375, -0.631500244140625, -0.6116943359375, -0.591888427734375, -0.57208251953125, -0.552276611328125, -0.532470703125, -0.512664794921875, -0.49285888671875, -0.473052978515625, -0.4532470703125, -0.433441162109375, -0.41363525390625, -0.393829345703125, -0.3740234375, -0.354217529296875, -0.33441162109375, -0.314605712890625, -0.2947998046875, -0.274993896484375, -0.25518798828125, -0.235382080078125, -0.215576171875, -0.195770263671875, -0.17596435546875, -0.156158447265625, -0.1363525390625, -0.116546630859375, -0.09674072265625, -0.076934814453125, -0.05712890625, -0.037322998046875, -0.01751708984375, 0.002288818359375, 0.0220947265625, 0.041900634765625, 0.06170654296875, 0.081512451171875, 0.101318359375, 0.121124267578125, 0.14093017578125, 0.160736083984375, 0.1805419921875, 0.200347900390625, 0.22015380859375, 0.239959716796875, 0.259765625, 0.279571533203125, 0.29937744140625, 0.319183349609375, 0.3389892578125, 0.358795166015625, 0.37860107421875, 0.398406982421875, 0.418212890625, 0.438018798828125, 0.45782470703125, 0.477630615234375, 0.4974365234375, 0.517242431640625, 0.53704833984375, 0.556854248046875, 0.57666015625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 6.0, 12.0, 11.0, 15.0, 23.0, 35.0, 38.0, 56.0, 86.0, 91.0, 108.0, 98.0, 86.0, 85.0, 66.0, 56.0, 46.0, 26.0, 19.0, 14.0, 11.0, 3.0, 6.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.07421875, -2.0261688232421875, -1.978118896484375, -1.9300689697265625, -1.88201904296875, -1.8339691162109375, -1.785919189453125, -1.7378692626953125, -1.6898193359375, -1.6417694091796875, -1.593719482421875, -1.5456695556640625, -1.49761962890625, -1.4495697021484375, -1.401519775390625, -1.3534698486328125, -1.305419921875, -1.2573699951171875, -1.209320068359375, -1.1612701416015625, -1.11322021484375, -1.0651702880859375, -1.017120361328125, -0.9690704345703125, -0.9210205078125, -0.8729705810546875, -0.824920654296875, -0.7768707275390625, -0.72882080078125, -0.6807708740234375, -0.632720947265625, -0.5846710205078125, -0.53662109375, -0.4885711669921875, -0.440521240234375, -0.3924713134765625, -0.34442138671875, -0.2963714599609375, -0.248321533203125, -0.2002716064453125, -0.1522216796875, -0.1041717529296875, -0.056121826171875, -0.0080718994140625, 0.03997802734375, 0.0880279541015625, 0.136077880859375, 0.1841278076171875, 0.232177734375, 0.2802276611328125, 0.328277587890625, 0.3763275146484375, 0.42437744140625, 0.4724273681640625, 0.520477294921875, 0.5685272216796875, 0.6165771484375, 0.6646270751953125, 0.712677001953125, 0.7607269287109375, 0.80877685546875, 0.8568267822265625, 0.904876708984375, 0.9529266357421875, 1.0009765625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 9.0, 8.0, 13.0, 12.0, 36.0, 40.0, 45.0, 57.0, 79.0, 124.0, 184.0, 283.0, 459.0, 649.0, 1008.0, 1651.0, 3000.0, 5629.0, 12389.0, 33426.0, 133220.0, 572796.0, 206510.0, 45924.0, 15471.0, 6828.0, 3461.0, 1925.0, 1170.0, 719.0, 486.0, 271.0, 198.0, 165.0, 79.0, 64.0, 42.0, 39.0, 21.0, 22.0, 17.0, 7.0, 10.0, 9.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2578125, -0.2499103546142578, -0.24200820922851562, -0.23410606384277344, -0.22620391845703125, -0.21830177307128906, -0.21039962768554688, -0.2024974822998047, -0.1945953369140625, -0.1866931915283203, -0.17879104614257812, -0.17088890075683594, -0.16298675537109375, -0.15508460998535156, -0.14718246459960938, -0.1392803192138672, -0.131378173828125, -0.12347602844238281, -0.11557388305664062, -0.10767173767089844, -0.09976959228515625, -0.09186744689941406, -0.08396530151367188, -0.07606315612792969, -0.0681610107421875, -0.06025886535644531, -0.052356719970703125, -0.04445457458496094, -0.03655242919921875, -0.028650283813476562, -0.020748138427734375, -0.012845993041992188, -0.00494384765625, 0.0029582977294921875, 0.010860443115234375, 0.018762588500976562, 0.02666473388671875, 0.03456687927246094, 0.042469024658203125, 0.05037117004394531, 0.0582733154296875, 0.06617546081542969, 0.07407760620117188, 0.08197975158691406, 0.08988189697265625, 0.09778404235839844, 0.10568618774414062, 0.11358833312988281, 0.121490478515625, 0.1293926239013672, 0.13729476928710938, 0.14519691467285156, 0.15309906005859375, 0.16100120544433594, 0.16890335083007812, 0.1768054962158203, 0.1847076416015625, 0.1926097869873047, 0.20051193237304688, 0.20841407775878906, 0.21631622314453125, 0.22421836853027344, 0.23212051391601562, 0.2400226593017578, 0.2479248046875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 6.0, 4.0, 9.0, 7.0, 11.0, 10.0, 17.0, 17.0, 22.0, 28.0, 27.0, 36.0, 34.0, 38.0, 45.0, 34.0, 54.0, 46.0, 56.0, 58.0, 57.0, 40.0, 33.0, 38.0, 39.0, 38.0, 30.0, 35.0, 23.0, 18.0, 13.0, 18.0, 9.0, 12.0, 9.0, 7.0, 6.0, 7.0, 7.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.708984375, -1.6570587158203125, -1.605133056640625, -1.5532073974609375, -1.50128173828125, -1.4493560791015625, -1.397430419921875, -1.3455047607421875, -1.2935791015625, -1.2416534423828125, -1.189727783203125, -1.1378021240234375, -1.08587646484375, -1.0339508056640625, -0.982025146484375, -0.9300994873046875, -0.878173828125, -0.8262481689453125, -0.774322509765625, -0.7223968505859375, -0.67047119140625, -0.6185455322265625, -0.566619873046875, -0.5146942138671875, -0.4627685546875, -0.4108428955078125, -0.358917236328125, -0.3069915771484375, -0.25506591796875, -0.2031402587890625, -0.151214599609375, -0.0992889404296875, -0.04736328125, 0.0045623779296875, 0.056488037109375, 0.1084136962890625, 0.16033935546875, 0.2122650146484375, 0.264190673828125, 0.3161163330078125, 0.3680419921875, 0.4199676513671875, 0.471893310546875, 0.5238189697265625, 0.57574462890625, 0.6276702880859375, 0.679595947265625, 0.7315216064453125, 0.783447265625, 0.8353729248046875, 0.887298583984375, 0.9392242431640625, 0.99114990234375, 1.0430755615234375, 1.095001220703125, 1.1469268798828125, 1.1988525390625, 1.2507781982421875, 1.302703857421875, 1.3546295166015625, 1.40655517578125, 1.4584808349609375, 1.510406494140625, 1.5623321533203125, 1.6142578125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 1.0, 2.0, 8.0, 12.0, 16.0, 14.0, 13.0, 29.0, 38.0, 65.0, 84.0, 113.0, 194.0, 318.0, 480.0, 866.0, 1527.0, 2990.0, 7101.0, 19018.0, 69654.0, 501464.0, 360428.0, 55683.0, 16161.0, 6054.0, 2779.0, 1413.0, 755.0, 426.0, 288.0, 172.0, 107.0, 81.0, 63.0, 46.0, 25.0, 16.0, 22.0, 8.0, 9.0, 3.0, 4.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.09039306640625, -0.08780479431152344, -0.08521652221679688, -0.08262825012207031, -0.08003997802734375, -0.07745170593261719, -0.07486343383789062, -0.07227516174316406, -0.0696868896484375, -0.06709861755371094, -0.06451034545898438, -0.06192207336425781, -0.05933380126953125, -0.05674552917480469, -0.054157257080078125, -0.05156898498535156, -0.048980712890625, -0.04639244079589844, -0.043804168701171875, -0.04121589660644531, -0.03862762451171875, -0.03603935241699219, -0.033451080322265625, -0.030862808227539062, -0.0282745361328125, -0.025686264038085938, -0.023097991943359375, -0.020509719848632812, -0.01792144775390625, -0.015333175659179688, -0.012744903564453125, -0.010156631469726562, -0.007568359375, -0.0049800872802734375, -0.002391815185546875, 0.0001964569091796875, 0.00278472900390625, 0.0053730010986328125, 0.007961273193359375, 0.010549545288085938, 0.0131378173828125, 0.015726089477539062, 0.018314361572265625, 0.020902633666992188, 0.02349090576171875, 0.026079177856445312, 0.028667449951171875, 0.03125572204589844, 0.033843994140625, 0.03643226623535156, 0.039020538330078125, 0.04160881042480469, 0.04419708251953125, 0.04678535461425781, 0.049373626708984375, 0.05196189880371094, 0.0545501708984375, 0.05713844299316406, 0.059726715087890625, 0.06231498718261719, 0.06490325927734375, 0.06749153137207031, 0.07007980346679688, 0.07266807556152344, 0.07525634765625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 2.0, 6.0, 5.0, 12.0, 9.0, 8.0, 17.0, 26.0, 44.0, 56.0, 94.0, 136.0, 187.0, 133.0, 75.0, 36.0, 42.0, 23.0, 23.0, 7.0, 10.0, 10.0, 3.0, 7.0, 6.0, 5.0, 2.0, 3.0, 6.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.227327346801758e-05, -5.043204873800278e-05, -4.8590824007987976e-05, -4.6749599277973175e-05, -4.4908374547958374e-05, -4.306714981794357e-05, -4.122592508792877e-05, -3.938470035791397e-05, -3.754347562789917e-05, -3.570225089788437e-05, -3.386102616786957e-05, -3.201980143785477e-05, -3.0178576707839966e-05, -2.8337351977825165e-05, -2.6496127247810364e-05, -2.4654902517795563e-05, -2.2813677787780762e-05, -2.097245305776596e-05, -1.913122832775116e-05, -1.729000359773636e-05, -1.5448778867721558e-05, -1.3607554137706757e-05, -1.1766329407691956e-05, -9.925104677677155e-06, -8.083879947662354e-06, -6.2426552176475525e-06, -4.4014304876327515e-06, -2.5602057576179504e-06, -7.189810276031494e-07, 1.1222437024116516e-06, 2.9634684324264526e-06, 4.804693162441254e-06, 6.645917892456055e-06, 8.487142622470856e-06, 1.0328367352485657e-05, 1.2169592082500458e-05, 1.4010816812515259e-05, 1.585204154253006e-05, 1.769326627254486e-05, 1.9534491002559662e-05, 2.1375715732574463e-05, 2.3216940462589264e-05, 2.5058165192604065e-05, 2.6899389922618866e-05, 2.8740614652633667e-05, 3.058183938264847e-05, 3.242306411266327e-05, 3.426428884267807e-05, 3.610551357269287e-05, 3.794673830270767e-05, 3.978796303272247e-05, 4.1629187762737274e-05, 4.3470412492752075e-05, 4.5311637222766876e-05, 4.715286195278168e-05, 4.899408668279648e-05, 5.083531141281128e-05, 5.267653614282608e-05, 5.451776087284088e-05, 5.635898560285568e-05, 5.8200210332870483e-05, 6.0041435062885284e-05, 6.188265979290009e-05, 6.372388452291489e-05, 6.556510925292969e-05]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 2.0, 4.0, 16.0, 14.0, 24.0, 32.0, 59.0, 97.0, 185.0, 349.0, 591.0, 1360.0, 3029.0, 8969.0, 41416.0, 623962.0, 328696.0, 28016.0, 6883.0, 2524.0, 1120.0, 544.0, 283.0, 145.0, 76.0, 56.0, 25.0, 25.0, 12.0, 13.0, 7.0, 2.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11419677734375, -0.11010265350341797, -0.10600852966308594, -0.1019144058227539, -0.09782028198242188, -0.09372615814208984, -0.08963203430175781, -0.08553791046142578, -0.08144378662109375, -0.07734966278076172, -0.07325553894042969, -0.06916141510009766, -0.06506729125976562, -0.060973167419433594, -0.05687904357910156, -0.05278491973876953, -0.0486907958984375, -0.04459667205810547, -0.04050254821777344, -0.036408424377441406, -0.032314300537109375, -0.028220176696777344, -0.024126052856445312, -0.02003192901611328, -0.01593780517578125, -0.011843681335449219, -0.0077495574951171875, -0.0036554336547851562, 0.000438690185546875, 0.004532814025878906, 0.008626937866210938, 0.012721061706542969, 0.016815185546875, 0.02090930938720703, 0.025003433227539062, 0.029097557067871094, 0.033191680908203125, 0.037285804748535156, 0.04137992858886719, 0.04547405242919922, 0.04956817626953125, 0.05366230010986328, 0.05775642395019531, 0.061850547790527344, 0.06594467163085938, 0.0700387954711914, 0.07413291931152344, 0.07822704315185547, 0.0823211669921875, 0.08641529083251953, 0.09050941467285156, 0.0946035385131836, 0.09869766235351562, 0.10279178619384766, 0.10688591003417969, 0.11098003387451172, 0.11507415771484375, 0.11916828155517578, 0.12326240539550781, 0.12735652923583984, 0.13145065307617188, 0.1355447769165039, 0.13963890075683594, 0.14373302459716797, 0.1478271484375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 6.0, 3.0, 5.0, 7.0, 4.0, 8.0, 12.0, 13.0, 18.0, 23.0, 35.0, 51.0, 65.0, 77.0, 100.0, 140.0, 98.0, 89.0, 64.0, 37.0, 31.0, 35.0, 17.0, 19.0, 9.0, 8.0, 9.0, 4.0, 7.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.024383544921875, -0.023694276809692383, -0.023005008697509766, -0.02231574058532715, -0.02162647247314453, -0.020937204360961914, -0.020247936248779297, -0.01955866813659668, -0.018869400024414062, -0.018180131912231445, -0.017490863800048828, -0.01680159568786621, -0.016112327575683594, -0.015423059463500977, -0.01473379135131836, -0.014044523239135742, -0.013355255126953125, -0.012665987014770508, -0.01197671890258789, -0.011287450790405273, -0.010598182678222656, -0.009908914566040039, -0.009219646453857422, -0.008530378341674805, -0.007841110229492188, -0.00715184211730957, -0.006462574005126953, -0.005773305892944336, -0.005084037780761719, -0.0043947696685791016, -0.0037055015563964844, -0.003016233444213867, -0.00232696533203125, -0.0016376972198486328, -0.0009484291076660156, -0.00025916099548339844, 0.00043010711669921875, 0.001119375228881836, 0.0018086433410644531, 0.0024979114532470703, 0.0031871795654296875, 0.0038764476776123047, 0.004565715789794922, 0.005254983901977539, 0.005944252014160156, 0.0066335201263427734, 0.007322788238525391, 0.008012056350708008, 0.008701324462890625, 0.009390592575073242, 0.01007986068725586, 0.010769128799438477, 0.011458396911621094, 0.012147665023803711, 0.012836933135986328, 0.013526201248168945, 0.014215469360351562, 0.01490473747253418, 0.015594005584716797, 0.016283273696899414, 0.01697254180908203, 0.01766180992126465, 0.018351078033447266, 0.019040346145629883, 0.0197296142578125]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 4.0, 5.0, 26.0, 48.0, 204.0, 433.0, 192.0, 55.0, 24.0, 4.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-5.729193687438965, -5.6084513664245605, -5.4877095222473145, -5.36696720123291, -5.246224880218506, -5.125482559204102, -5.0047407150268555, -4.883998394012451, -4.763256072998047, -4.642513751983643, -4.5217719078063965, -4.401029586791992, -4.280287265777588, -4.159544944763184, -4.0388031005859375, -3.918060779571533, -3.797318696975708, -3.676576614379883, -3.5558342933654785, -3.4350922107696533, -3.314349889755249, -3.193607807159424, -3.0728654861450195, -2.9521234035491943, -2.831381320953369, -2.710639238357544, -2.5898969173431396, -2.4691548347473145, -2.34841251373291, -2.227670431137085, -2.1069283485412598, -1.9861860275268555, -1.8654435873031616, -1.7447013854980469, -1.6239591836929321, -1.5032169818878174, -1.3824748992919922, -1.261732578277588, -1.1409904956817627, -1.020248293876648, -0.8995060920715332, -0.7787638902664185, -0.6580216884613037, -0.5372795462608337, -0.416537344455719, -0.29579514265060425, -0.17505300045013428, -0.05431079864501953, 0.06643140316009521, 0.18717359006404877, 0.3079157769680023, 0.4286579489707947, 0.5494001507759094, 0.6701423525810242, 0.7908844947814941, 0.9116266965866089, 1.0323688983917236, 1.1531111001968384, 1.2738533020019531, 1.3945953845977783, 1.5153377056121826, 1.6360797882080078, 1.7568219900131226, 1.8775641918182373, 1.998306393623352]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 4.0, 3.0, 2.0, 13.0, 11.0, 17.0, 21.0, 39.0, 49.0, 53.0, 83.0, 86.0, 102.0, 95.0, 82.0, 89.0, 56.0, 68.0, 47.0, 31.0, 19.0, 13.0, 9.0, 8.0, 3.0, 2.0, 4.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.9014041423797607, -1.8563053607940674, -1.811206579208374, -1.7661077976226807, -1.7210090160369873, -1.675910234451294, -1.6308114528656006, -1.5857127904891968, -1.5406140089035034, -1.49551522731781, -1.4504164457321167, -1.4053176641464233, -1.36021888256073, -1.3151202201843262, -1.2700214385986328, -1.2249226570129395, -1.179823875427246, -1.1347250938415527, -1.0896263122558594, -1.044527530670166, -0.9994288086891174, -0.9543300271034241, -0.9092312455177307, -0.8641325235366821, -0.8190336227416992, -0.7739348411560059, -0.7288360595703125, -0.6837372779846191, -0.6386385560035706, -0.5935397744178772, -0.5484409928321838, -0.5033422708511353, -0.4582434892654419, -0.41314470767974854, -0.36804595589637756, -0.3229471743106842, -0.27784842252731323, -0.23274964094161987, -0.1876508593559265, -0.14255210757255554, -0.09745332598686218, -0.05235455557703972, -0.007255785167217255, 0.03784298896789551, 0.08294175565242767, 0.12804052233695984, 0.1731393039226532, 0.21823805570602417, 0.26333683729171753, 0.3084356188774109, 0.35353437066078186, 0.3986331522464752, 0.4437319040298462, 0.48883068561553955, 0.5339294672012329, 0.5790282487869263, 0.6241270303726196, 0.669225811958313, 0.7143245935440063, 0.7594233751296997, 0.8045220971107483, 0.8496208786964417, 0.894719660282135, 0.9398183822631836, 0.984917163848877]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 7.0, 0.0, 4.0, 15.0, 15.0, 17.0, 37.0, 49.0, 107.0, 176.0, 421.0, 793.0, 1890.0, 5246.0, 23085.0, 703177.0, 290624.0, 15727.0, 4199.0, 1560.0, 678.0, 310.0, 182.0, 74.0, 56.0, 34.0, 21.0, 23.0, 12.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.892578125, -1.8426361083984375, -1.792694091796875, -1.7427520751953125, -1.69281005859375, -1.6428680419921875, -1.592926025390625, -1.5429840087890625, -1.4930419921875, -1.4430999755859375, -1.393157958984375, -1.3432159423828125, -1.29327392578125, -1.2433319091796875, -1.193389892578125, -1.1434478759765625, -1.093505859375, -1.0435638427734375, -0.993621826171875, -0.9436798095703125, -0.89373779296875, -0.8437957763671875, -0.793853759765625, -0.7439117431640625, -0.6939697265625, -0.6440277099609375, -0.594085693359375, -0.5441436767578125, -0.49420166015625, -0.4442596435546875, -0.394317626953125, -0.3443756103515625, -0.29443359375, -0.2444915771484375, -0.194549560546875, -0.1446075439453125, -0.09466552734375, -0.0447235107421875, 0.005218505859375, 0.0551605224609375, 0.1051025390625, 0.1550445556640625, 0.204986572265625, 0.2549285888671875, 0.30487060546875, 0.3548126220703125, 0.404754638671875, 0.4546966552734375, 0.504638671875, 0.5545806884765625, 0.604522705078125, 0.6544647216796875, 0.70440673828125, 0.7543487548828125, 0.804290771484375, 0.8542327880859375, 0.9041748046875, 0.9541168212890625, 1.004058837890625, 1.0540008544921875, 1.10394287109375, 1.1538848876953125, 1.203826904296875, 1.2537689208984375, 1.3037109375]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 6.0, 3.0, 11.0, 15.0, 21.0, 33.0, 55.0, 75.0, 118.0, 123.0, 139.0, 129.0, 93.0, 57.0, 56.0, 37.0, 11.0, 13.0, 7.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.576171875, -2.449005126953125, -2.32183837890625, -2.194671630859375, -2.0675048828125, -1.940338134765625, -1.81317138671875, -1.686004638671875, -1.558837890625, -1.431671142578125, -1.30450439453125, -1.177337646484375, -1.0501708984375, -0.923004150390625, -0.79583740234375, -0.668670654296875, -0.54150390625, -0.414337158203125, -0.28717041015625, -0.160003662109375, -0.0328369140625, 0.094329833984375, 0.22149658203125, 0.348663330078125, 0.475830078125, 0.602996826171875, 0.73016357421875, 0.857330322265625, 0.9844970703125, 1.111663818359375, 1.23883056640625, 1.365997314453125, 1.4931640625, 1.620330810546875, 1.74749755859375, 1.874664306640625, 2.0018310546875, 2.128997802734375, 2.25616455078125, 2.383331298828125, 2.510498046875, 2.637664794921875, 2.76483154296875, 2.891998291015625, 3.0191650390625, 3.146331787109375, 3.27349853515625, 3.400665283203125, 3.52783203125, 3.654998779296875, 3.78216552734375, 3.909332275390625, 4.0364990234375, 4.163665771484375, 4.29083251953125, 4.417999267578125, 4.545166015625, 4.672332763671875, 4.79949951171875, 4.926666259765625, 5.0538330078125, 5.180999755859375, 5.30816650390625, 5.435333251953125, 5.5625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 4.0, 1.0, 7.0, 4.0, 6.0, 10.0, 15.0, 13.0, 23.0, 44.0, 67.0, 69.0, 116.0, 202.0, 342.0, 598.0, 1440.0, 4065.0, 17497.0, 621294.0, 381574.0, 14793.0, 3621.0, 1311.0, 629.0, 322.0, 169.0, 116.0, 55.0, 38.0, 33.0, 25.0, 11.0, 13.0, 11.0, 6.0, 3.0, 5.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.5927734375, -1.54443359375, -1.49609375, -1.44775390625, -1.3994140625, -1.35107421875, -1.302734375, -1.25439453125, -1.2060546875, -1.15771484375, -1.109375, -1.06103515625, -1.0126953125, -0.96435546875, -0.916015625, -0.86767578125, -0.8193359375, -0.77099609375, -0.72265625, -0.67431640625, -0.6259765625, -0.57763671875, -0.529296875, -0.48095703125, -0.4326171875, -0.38427734375, -0.3359375, -0.28759765625, -0.2392578125, -0.19091796875, -0.142578125, -0.09423828125, -0.0458984375, 0.00244140625, 0.05078125, 0.09912109375, 0.1474609375, 0.19580078125, 0.244140625, 0.29248046875, 0.3408203125, 0.38916015625, 0.4375, 0.48583984375, 0.5341796875, 0.58251953125, 0.630859375, 0.67919921875, 0.7275390625, 0.77587890625, 0.82421875, 0.87255859375, 0.9208984375, 0.96923828125, 1.017578125, 1.06591796875, 1.1142578125, 1.16259765625, 1.2109375, 1.25927734375, 1.3076171875, 1.35595703125, 1.404296875, 1.45263671875, 1.5009765625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 5.0, 4.0, 5.0, 6.0, 4.0, 14.0, 11.0, 15.0, 15.0, 10.0, 21.0, 18.0, 17.0, 23.0, 31.0, 27.0, 28.0, 15.0, 34.0, 40.0, 53.0, 41.0, 36.0, 43.0, 34.0, 41.0, 39.0, 33.0, 41.0, 27.0, 29.0, 30.0, 19.0, 38.0, 22.0, 20.0, 19.0, 18.0, 13.0, 7.0, 10.0, 9.0, 9.0, 3.0, 4.0, 5.0, 4.0, 4.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0], "bins": [-1.505859375, -1.4591217041015625, -1.412384033203125, -1.3656463623046875, -1.31890869140625, -1.2721710205078125, -1.225433349609375, -1.1786956787109375, -1.1319580078125, -1.0852203369140625, -1.038482666015625, -0.9917449951171875, -0.94500732421875, -0.8982696533203125, -0.851531982421875, -0.8047943115234375, -0.758056640625, -0.7113189697265625, -0.664581298828125, -0.6178436279296875, -0.57110595703125, -0.5243682861328125, -0.477630615234375, -0.4308929443359375, -0.3841552734375, -0.3374176025390625, -0.290679931640625, -0.2439422607421875, -0.19720458984375, -0.1504669189453125, -0.103729248046875, -0.0569915771484375, -0.01025390625, 0.0364837646484375, 0.083221435546875, 0.1299591064453125, 0.17669677734375, 0.2234344482421875, 0.270172119140625, 0.3169097900390625, 0.3636474609375, 0.4103851318359375, 0.457122802734375, 0.5038604736328125, 0.55059814453125, 0.5973358154296875, 0.644073486328125, 0.6908111572265625, 0.737548828125, 0.7842864990234375, 0.831024169921875, 0.8777618408203125, 0.92449951171875, 0.9712371826171875, 1.017974853515625, 1.0647125244140625, 1.1114501953125, 1.1581878662109375, 1.204925537109375, 1.2516632080078125, 1.29840087890625, 1.3451385498046875, 1.391876220703125, 1.4386138916015625, 1.4853515625]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 7.0, 5.0, 6.0, 11.0, 11.0, 19.0, 32.0, 49.0, 61.0, 68.0, 125.0, 209.0, 328.0, 520.0, 1078.0, 2222.0, 5485.0, 19302.0, 253061.0, 724926.0, 28389.0, 7054.0, 2698.0, 1233.0, 630.0, 367.0, 208.0, 129.0, 108.0, 60.0, 39.0, 26.0, 28.0, 11.0, 6.0, 8.0, 8.0, 7.0, 4.0, 3.0, 4.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4541015625, -0.4403877258300781, -0.42667388916015625, -0.4129600524902344, -0.3992462158203125, -0.3855323791503906, -0.37181854248046875, -0.3581047058105469, -0.344390869140625, -0.3306770324707031, -0.31696319580078125, -0.3032493591308594, -0.2895355224609375, -0.2758216857910156, -0.26210784912109375, -0.24839401245117188, -0.23468017578125, -0.22096633911132812, -0.20725250244140625, -0.19353866577148438, -0.1798248291015625, -0.16611099243164062, -0.15239715576171875, -0.13868331909179688, -0.124969482421875, -0.11125564575195312, -0.09754180908203125, -0.08382797241210938, -0.0701141357421875, -0.056400299072265625, -0.04268646240234375, -0.028972625732421875, -0.0152587890625, -0.001544952392578125, 0.01216888427734375, 0.025882720947265625, 0.0395965576171875, 0.053310394287109375, 0.06702423095703125, 0.08073806762695312, 0.094451904296875, 0.10816574096679688, 0.12187957763671875, 0.13559341430664062, 0.1493072509765625, 0.16302108764648438, 0.17673492431640625, 0.19044876098632812, 0.20416259765625, 0.21787643432617188, 0.23159027099609375, 0.24530410766601562, 0.2590179443359375, 0.2727317810058594, 0.28644561767578125, 0.3001594543457031, 0.313873291015625, 0.3275871276855469, 0.34130096435546875, 0.3550148010253906, 0.3687286376953125, 0.3824424743652344, 0.39615631103515625, 0.4098701477050781, 0.423583984375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 6.0, 10.0, 15.0, 22.0, 38.0, 76.0, 153.0, 283.0, 174.0, 86.0, 49.0, 36.0, 14.0, 6.0, 6.0, 8.0, 4.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.4849853515625e-05, -6.266124546527863e-05, -6.047263741493225e-05, -5.8284029364585876e-05, -5.60954213142395e-05, -5.390681326389313e-05, -5.171820521354675e-05, -4.952959716320038e-05, -4.7340989112854004e-05, -4.515238106250763e-05, -4.2963773012161255e-05, -4.077516496181488e-05, -3.8586556911468506e-05, -3.639794886112213e-05, -3.420934081077576e-05, -3.202073276042938e-05, -2.9832124710083008e-05, -2.7643516659736633e-05, -2.545490860939026e-05, -2.3266300559043884e-05, -2.107769250869751e-05, -1.8889084458351135e-05, -1.670047640800476e-05, -1.4511868357658386e-05, -1.2323260307312012e-05, -1.0134652256965637e-05, -7.946044206619263e-06, -5.757436156272888e-06, -3.5688281059265137e-06, -1.3802200555801392e-06, 8.083879947662354e-07, 2.99699604511261e-06, 5.185604095458984e-06, 7.374212145805359e-06, 9.562820196151733e-06, 1.1751428246498108e-05, 1.3940036296844482e-05, 1.6128644347190857e-05, 1.831725239753723e-05, 2.0505860447883606e-05, 2.269446849822998e-05, 2.4883076548576355e-05, 2.707168459892273e-05, 2.9260292649269104e-05, 3.144890069961548e-05, 3.363750874996185e-05, 3.582611680030823e-05, 3.80147248506546e-05, 4.0203332901000977e-05, 4.239194095134735e-05, 4.4580549001693726e-05, 4.67691570520401e-05, 4.8957765102386475e-05, 5.114637315273285e-05, 5.3334981203079224e-05, 5.55235892534256e-05, 5.771219730377197e-05, 5.990080535411835e-05, 6.208941340446472e-05, 6.42780214548111e-05, 6.646662950515747e-05, 6.865523755550385e-05, 7.084384560585022e-05, 7.30324536561966e-05, 7.522106170654297e-05]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 8.0, 5.0, 8.0, 13.0, 6.0, 16.0, 22.0, 22.0, 62.0, 81.0, 147.0, 314.0, 679.0, 1864.0, 5856.0, 31259.0, 913260.0, 80837.0, 9608.0, 2692.0, 909.0, 411.0, 197.0, 100.0, 56.0, 27.0, 29.0, 16.0, 12.0, 7.0, 8.0, 4.0, 2.0, 5.0, 2.0, 5.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.6728515625, -0.6545028686523438, -0.6361541748046875, -0.6178054809570312, -0.599456787109375, -0.5811080932617188, -0.5627593994140625, -0.5444107055664062, -0.52606201171875, -0.5077133178710938, -0.4893646240234375, -0.47101593017578125, -0.452667236328125, -0.43431854248046875, -0.4159698486328125, -0.39762115478515625, -0.3792724609375, -0.36092376708984375, -0.3425750732421875, -0.32422637939453125, -0.305877685546875, -0.28752899169921875, -0.2691802978515625, -0.25083160400390625, -0.23248291015625, -0.21413421630859375, -0.1957855224609375, -0.17743682861328125, -0.159088134765625, -0.14073944091796875, -0.1223907470703125, -0.10404205322265625, -0.085693359375, -0.06734466552734375, -0.0489959716796875, -0.03064727783203125, -0.012298583984375, 0.00605010986328125, 0.0243988037109375, 0.04274749755859375, 0.06109619140625, 0.07944488525390625, 0.0977935791015625, 0.11614227294921875, 0.134490966796875, 0.15283966064453125, 0.1711883544921875, 0.18953704833984375, 0.2078857421875, 0.22623443603515625, 0.2445831298828125, 0.26293182373046875, 0.281280517578125, 0.29962921142578125, 0.3179779052734375, 0.33632659912109375, 0.35467529296875, 0.37302398681640625, 0.3913726806640625, 0.40972137451171875, 0.428070068359375, 0.44641876220703125, 0.4647674560546875, 0.48311614990234375, 0.50146484375]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 3.0, 4.0, 0.0, 2.0, 9.0, 12.0, 17.0, 24.0, 13.0, 32.0, 75.0, 137.0, 245.0, 188.0, 86.0, 42.0, 27.0, 18.0, 14.0, 15.0, 6.0, 8.0, 4.0, 6.0, 1.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.174072265625, -0.16821861267089844, -0.16236495971679688, -0.1565113067626953, -0.15065765380859375, -0.1448040008544922, -0.13895034790039062, -0.13309669494628906, -0.1272430419921875, -0.12138938903808594, -0.11553573608398438, -0.10968208312988281, -0.10382843017578125, -0.09797477722167969, -0.09212112426757812, -0.08626747131347656, -0.080413818359375, -0.07456016540527344, -0.06870651245117188, -0.06285285949707031, -0.05699920654296875, -0.05114555358886719, -0.045291900634765625, -0.03943824768066406, -0.0335845947265625, -0.027730941772460938, -0.021877288818359375, -0.016023635864257812, -0.01016998291015625, -0.0043163299560546875, 0.001537322998046875, 0.0073909759521484375, 0.01324462890625, 0.019098281860351562, 0.024951934814453125, 0.030805587768554688, 0.03665924072265625, 0.04251289367675781, 0.048366546630859375, 0.05422019958496094, 0.0600738525390625, 0.06592750549316406, 0.07178115844726562, 0.07763481140136719, 0.08348846435546875, 0.08934211730957031, 0.09519577026367188, 0.10104942321777344, 0.106903076171875, 0.11275672912597656, 0.11861038208007812, 0.12446403503417969, 0.13031768798828125, 0.1361713409423828, 0.14202499389648438, 0.14787864685058594, 0.1537322998046875, 0.15958595275878906, 0.16543960571289062, 0.1712932586669922, 0.17714691162109375, 0.1830005645751953, 0.18885421752929688, 0.19470787048339844, 0.2005615234375]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 6.0, 3.0, 8.0, 17.0, 29.0, 47.0, 96.0, 216.0, 258.0, 149.0, 87.0, 42.0, 19.0, 12.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.628633975982666, -4.489284515380859, -4.349935054779053, -4.210585594177246, -4.0712361335754395, -3.931886672973633, -3.792536973953247, -3.6531875133514404, -3.513838052749634, -3.374488592147827, -3.2351391315460205, -3.095789670944214, -2.956439971923828, -2.8170905113220215, -2.677741050720215, -2.538391590118408, -2.3990421295166016, -2.259692668914795, -2.1203432083129883, -1.980993628501892, -1.8416441679000854, -1.7022947072982788, -1.5629451274871826, -1.423595666885376, -1.2842462062835693, -1.1448967456817627, -1.005547285079956, -0.8661977052688599, -0.7268482446670532, -0.5874987840652466, -0.44814926385879517, -0.30879974365234375, -0.1694507598876953, -0.030101269483566284, 0.10924822092056274, 0.24859771132469177, 0.3879472017288208, 0.5272966623306274, 0.6666461825370789, 0.8059957027435303, 0.9453451633453369, 1.0846946239471436, 1.2240440845489502, 1.3633936643600464, 1.502743124961853, 1.6420925855636597, 1.7814421653747559, 1.9207916259765625, 2.060141086578369, 2.199490547180176, 2.3388400077819824, 2.478189468383789, 2.6175389289855957, 2.7568883895874023, 2.896238088607788, 3.0355875492095947, 3.1749370098114014, 3.314286470413208, 3.4536359310150146, 3.5929853916168213, 3.732335090637207, 3.8716845512390137, 4.01103401184082, 4.150383472442627, 4.289732933044434]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 4.0, 10.0, 11.0, 15.0, 20.0, 18.0, 24.0, 32.0, 22.0, 37.0, 41.0, 49.0, 62.0, 52.0, 50.0, 64.0, 78.0, 53.0, 68.0, 31.0, 50.0, 36.0, 32.0, 35.0, 33.0, 23.0, 21.0, 9.0, 5.0, 5.0, 3.0, 7.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9645183086395264, -2.838589668273926, -2.7126612663269043, -2.5867326259613037, -2.4608042240142822, -2.3348755836486816, -2.20894718170166, -2.0830185413360596, -1.9570900201797485, -1.8311614990234375, -1.7052329778671265, -1.5793044567108154, -1.4533758163452148, -1.3274474143981934, -1.2015187740325928, -1.0755902528762817, -0.9496617317199707, -0.8237332105636597, -0.6978046894073486, -0.5718761086463928, -0.4459475874900818, -0.32001906633377075, -0.19409048557281494, -0.0681619644165039, 0.05776655673980713, 0.18369509279727936, 0.3096236288547516, 0.435552179813385, 0.561480700969696, 0.6874092221260071, 0.8133378028869629, 0.9392663240432739, 1.065195083618164, 1.191123604774475, 1.3170521259307861, 1.4429807662963867, 1.5689091682434082, 1.6948378086090088, 1.8207663297653198, 1.9466948509216309, 2.0726232528686523, 2.198551893234253, 2.3244802951812744, 2.450408935546875, 2.5763373374938965, 2.702265977859497, 2.8281946182250977, 2.954123020172119, 3.0800516605377197, 3.2059803009033203, 3.331908702850342, 3.4578373432159424, 3.583765745162964, 3.7096943855285645, 3.835622787475586, 3.9615514278411865, 4.087480068206787, 4.213408470153809, 4.339337348937988, 4.46526575088501, 4.591194152832031, 4.717122554779053, 4.843051433563232, 4.968979835510254, 5.094908237457275]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 5.0, 9.0, 8.0, 11.0, 28.0, 29.0, 47.0, 79.0, 174.0, 269.0, 567.0, 1381.0, 5354.0, 120878.0, 3994405.0, 63151.0, 4865.0, 1897.0, 537.0, 245.0, 136.0, 80.0, 46.0, 30.0, 21.0, 12.0, 8.0, 2.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-5.203125, -5.08331298828125, -4.9635009765625, -4.84368896484375, -4.723876953125, -4.60406494140625, -4.4842529296875, -4.36444091796875, -4.24462890625, -4.12481689453125, -4.0050048828125, -3.88519287109375, -3.765380859375, -3.64556884765625, -3.5257568359375, -3.40594482421875, -3.2861328125, -3.16632080078125, -3.0465087890625, -2.92669677734375, -2.806884765625, -2.68707275390625, -2.5672607421875, -2.44744873046875, -2.32763671875, -2.20782470703125, -2.0880126953125, -1.96820068359375, -1.848388671875, -1.72857666015625, -1.6087646484375, -1.48895263671875, -1.369140625, -1.24932861328125, -1.1295166015625, -1.00970458984375, -0.889892578125, -0.77008056640625, -0.6502685546875, -0.53045654296875, -0.41064453125, -0.29083251953125, -0.1710205078125, -0.05120849609375, 0.068603515625, 0.18841552734375, 0.3082275390625, 0.42803955078125, 0.5478515625, 0.66766357421875, 0.7874755859375, 0.90728759765625, 1.027099609375, 1.14691162109375, 1.2667236328125, 1.38653564453125, 1.50634765625, 1.62615966796875, 1.7459716796875, 1.86578369140625, 1.985595703125, 2.10540771484375, 2.2252197265625, 2.34503173828125, 2.46484375]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 3.0, 8.0, 8.0, 7.0, 15.0, 24.0, 46.0, 50.0, 56.0, 84.0, 90.0, 109.0, 100.0, 87.0, 87.0, 62.0, 56.0, 35.0, 23.0, 12.0, 17.0, 7.0, 6.0, 4.0, 0.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.322265625, -2.2640838623046875, -2.205902099609375, -2.1477203369140625, -2.08953857421875, -2.0313568115234375, -1.973175048828125, -1.9149932861328125, -1.8568115234375, -1.7986297607421875, -1.740447998046875, -1.6822662353515625, -1.62408447265625, -1.5659027099609375, -1.507720947265625, -1.4495391845703125, -1.391357421875, -1.3331756591796875, -1.274993896484375, -1.2168121337890625, -1.15863037109375, -1.1004486083984375, -1.042266845703125, -0.9840850830078125, -0.9259033203125, -0.8677215576171875, -0.809539794921875, -0.7513580322265625, -0.69317626953125, -0.6349945068359375, -0.576812744140625, -0.5186309814453125, -0.46044921875, -0.4022674560546875, -0.344085693359375, -0.2859039306640625, -0.22772216796875, -0.1695404052734375, -0.111358642578125, -0.0531768798828125, 0.0050048828125, 0.0631866455078125, 0.121368408203125, 0.1795501708984375, 0.23773193359375, 0.2959136962890625, 0.354095458984375, 0.4122772216796875, 0.470458984375, 0.5286407470703125, 0.586822509765625, 0.6450042724609375, 0.70318603515625, 0.7613677978515625, 0.819549560546875, 0.8777313232421875, 0.9359130859375, 0.9940948486328125, 1.052276611328125, 1.1104583740234375, 1.16864013671875, 1.2268218994140625, 1.285003662109375, 1.3431854248046875, 1.4013671875]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 4.0, 7.0, 15.0, 9.0, 18.0, 35.0, 75.0, 116.0, 259.0, 594.0, 1912.0, 8790.0, 271441.0, 3890439.0, 16413.0, 2678.0, 808.0, 311.0, 143.0, 85.0, 48.0, 23.0, 19.0, 11.0, 12.0, 2.0, 5.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.06640625, -4.936981201171875, -4.80755615234375, -4.678131103515625, -4.5487060546875, -4.419281005859375, -4.28985595703125, -4.160430908203125, -4.031005859375, -3.901580810546875, -3.77215576171875, -3.642730712890625, -3.5133056640625, -3.383880615234375, -3.25445556640625, -3.125030517578125, -2.99560546875, -2.866180419921875, -2.73675537109375, -2.607330322265625, -2.4779052734375, -2.348480224609375, -2.21905517578125, -2.089630126953125, -1.960205078125, -1.830780029296875, -1.70135498046875, -1.571929931640625, -1.4425048828125, -1.313079833984375, -1.18365478515625, -1.054229736328125, -0.9248046875, -0.795379638671875, -0.66595458984375, -0.536529541015625, -0.4071044921875, -0.277679443359375, -0.14825439453125, -0.018829345703125, 0.110595703125, 0.240020751953125, 0.36944580078125, 0.498870849609375, 0.6282958984375, 0.757720947265625, 0.88714599609375, 1.016571044921875, 1.14599609375, 1.275421142578125, 1.40484619140625, 1.534271240234375, 1.6636962890625, 1.793121337890625, 1.92254638671875, 2.051971435546875, 2.181396484375, 2.310821533203125, 2.44024658203125, 2.569671630859375, 2.6990966796875, 2.828521728515625, 2.95794677734375, 3.087371826171875, 3.216796875]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 10.0, 3.0, 16.0, 19.0, 14.0, 34.0, 73.0, 307.0, 1480.0, 1544.0, 376.0, 97.0, 44.0, 14.0, 13.0, 8.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69873046875, -0.6707687377929688, -0.6428070068359375, -0.6148452758789062, -0.586883544921875, -0.5589218139648438, -0.5309600830078125, -0.5029983520507812, -0.47503662109375, -0.44707489013671875, -0.4191131591796875, -0.39115142822265625, -0.363189697265625, -0.33522796630859375, -0.3072662353515625, -0.27930450439453125, -0.2513427734375, -0.22338104248046875, -0.1954193115234375, -0.16745758056640625, -0.139495849609375, -0.11153411865234375, -0.0835723876953125, -0.05561065673828125, -0.02764892578125, 0.00031280517578125, 0.0282745361328125, 0.05623626708984375, 0.084197998046875, 0.11215972900390625, 0.1401214599609375, 0.16808319091796875, 0.196044921875, 0.22400665283203125, 0.2519683837890625, 0.27993011474609375, 0.307891845703125, 0.33585357666015625, 0.3638153076171875, 0.39177703857421875, 0.41973876953125, 0.44770050048828125, 0.4756622314453125, 0.5036239624023438, 0.531585693359375, 0.5595474243164062, 0.5875091552734375, 0.6154708862304688, 0.6434326171875, 0.6713943481445312, 0.6993560791015625, 0.7273178100585938, 0.755279541015625, 0.7832412719726562, 0.8112030029296875, 0.8391647338867188, 0.86712646484375, 0.8950881958007812, 0.9230499267578125, 0.9510116577148438, 0.978973388671875, 1.0069351196289062, 1.0348968505859375, 1.0628585815429688, 1.0908203125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 6.0, 3.0, 4.0, 12.0, 16.0, 39.0, 62.0, 142.0, 231.0, 237.0, 126.0, 50.0, 28.0, 21.0, 10.0, 11.0, 1.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.6737101078033447, -3.565480947494507, -3.457251787185669, -3.349022626876831, -3.2407937049865723, -3.1325645446777344, -3.0243353843688965, -2.9161062240600586, -2.8078770637512207, -2.699647903442383, -2.591418743133545, -2.483189582824707, -2.374960422515869, -2.2667312622070312, -2.1585023403167725, -2.0502731800079346, -1.9420440196990967, -1.8338148593902588, -1.725585699081421, -1.6173566579818726, -1.5091274976730347, -1.4008983373641968, -1.2926692962646484, -1.1844401359558105, -1.0762109756469727, -0.9679818153381348, -0.8597527146339417, -0.7515236139297485, -0.6432944536209106, -0.5350652933120728, -0.42683619260787964, -0.3186070919036865, -0.21037769317626953, -0.10214856266975403, 0.006080567836761475, 0.11430969834327698, 0.22253882884979248, 0.33076798915863037, 0.4389970898628235, 0.5472261905670166, 0.6554553508758545, 0.7636845111846924, 0.8719136118888855, 0.9801427125930786, 1.0883718729019165, 1.1966010332107544, 1.3048300743103027, 1.4130592346191406, 1.5212883949279785, 1.6295175552368164, 1.7377467155456543, 1.8459757566452026, 1.9542049169540405, 2.062434196472168, 2.1706631183624268, 2.2788922786712646, 2.3871214389801025, 2.4953505992889404, 2.6035797595977783, 2.711808919906616, 2.820037841796875, 2.928267002105713, 3.036496162414551, 3.1447253227233887, 3.2529544830322266]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 4.0, 6.0, 17.0, 12.0, 21.0, 29.0, 32.0, 41.0, 70.0, 62.0, 66.0, 82.0, 80.0, 88.0, 66.0, 73.0, 63.0, 56.0, 37.0, 37.0, 16.0, 14.0, 9.0, 5.0, 6.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9855552911758423, -1.9296249151229858, -1.8736945390701294, -1.817764163017273, -1.7618337869644165, -1.70590341091156, -1.6499730348587036, -1.5940426588058472, -1.5381122827529907, -1.4821819067001343, -1.4262515306472778, -1.3703211545944214, -1.314390778541565, -1.2584604024887085, -1.202530026435852, -1.1465996503829956, -1.0906693935394287, -1.0347390174865723, -0.9788086414337158, -0.9228782653808594, -0.8669478893280029, -0.8110175132751465, -0.75508713722229, -0.6991567611694336, -0.6432263851165771, -0.5872960090637207, -0.5313656330108643, -0.4754352569580078, -0.41950488090515137, -0.3635745346546173, -0.30764415860176086, -0.2517137825489044, -0.19578337669372559, -0.13985300064086914, -0.08392263203859329, -0.027992263436317444, 0.027938112616539, 0.08386847376823425, 0.1397988498210907, 0.19572922587394714, 0.2516596019268036, 0.30758997797966003, 0.3635203540325165, 0.41945070028305054, 0.475381076335907, 0.5313114523887634, 0.5872418284416199, 0.6431722044944763, 0.6991025805473328, 0.7550329566001892, 0.8109633326530457, 0.8668937087059021, 0.9228240847587585, 0.9787544012069702, 1.0346847772598267, 1.090615153312683, 1.1465455293655396, 1.202475905418396, 1.2584062814712524, 1.3143366575241089, 1.3702670335769653, 1.4261974096298218, 1.4821277856826782, 1.5380581617355347, 1.5939885377883911]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 11.0, 5.0, 9.0, 12.0, 10.0, 17.0, 27.0, 41.0, 55.0, 66.0, 128.0, 223.0, 491.0, 1025.0, 2941.0, 8834.0, 33302.0, 193004.0, 658880.0, 116154.0, 22947.0, 6427.0, 2202.0, 843.0, 400.0, 183.0, 119.0, 61.0, 47.0, 28.0, 15.0, 11.0, 12.0, 8.0, 9.0, 6.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.240478515625, -0.23200225830078125, -0.2235260009765625, -0.21504974365234375, -0.206573486328125, -0.19809722900390625, -0.1896209716796875, -0.18114471435546875, -0.17266845703125, -0.16419219970703125, -0.1557159423828125, -0.14723968505859375, -0.138763427734375, -0.13028717041015625, -0.1218109130859375, -0.11333465576171875, -0.1048583984375, -0.09638214111328125, -0.0879058837890625, -0.07942962646484375, -0.070953369140625, -0.06247711181640625, -0.0540008544921875, -0.04552459716796875, -0.03704833984375, -0.02857208251953125, -0.0200958251953125, -0.01161956787109375, -0.003143310546875, 0.00533294677734375, 0.0138092041015625, 0.02228546142578125, 0.03076171875, 0.03923797607421875, 0.0477142333984375, 0.05619049072265625, 0.064666748046875, 0.07314300537109375, 0.0816192626953125, 0.09009552001953125, 0.09857177734375, 0.10704803466796875, 0.1155242919921875, 0.12400054931640625, 0.132476806640625, 0.14095306396484375, 0.1494293212890625, 0.15790557861328125, 0.1663818359375, 0.17485809326171875, 0.1833343505859375, 0.19181060791015625, 0.200286865234375, 0.20876312255859375, 0.2172393798828125, 0.22571563720703125, 0.23419189453125, 0.24266815185546875, 0.2511444091796875, 0.25962066650390625, 0.268096923828125, 0.27657318115234375, 0.2850494384765625, 0.29352569580078125, 0.302001953125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 11.0, 7.0, 8.0, 20.0, 23.0, 36.0, 49.0, 70.0, 79.0, 97.0, 120.0, 98.0, 113.0, 84.0, 69.0, 42.0, 33.0, 17.0, 10.0, 10.0, 6.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.060546875, -2.0111541748046875, -1.961761474609375, -1.9123687744140625, -1.86297607421875, -1.8135833740234375, -1.764190673828125, -1.7147979736328125, -1.6654052734375, -1.6160125732421875, -1.566619873046875, -1.5172271728515625, -1.46783447265625, -1.4184417724609375, -1.369049072265625, -1.3196563720703125, -1.270263671875, -1.2208709716796875, -1.171478271484375, -1.1220855712890625, -1.07269287109375, -1.0233001708984375, -0.973907470703125, -0.9245147705078125, -0.8751220703125, -0.8257293701171875, -0.776336669921875, -0.7269439697265625, -0.67755126953125, -0.6281585693359375, -0.578765869140625, -0.5293731689453125, -0.47998046875, -0.4305877685546875, -0.381195068359375, -0.3318023681640625, -0.28240966796875, -0.2330169677734375, -0.183624267578125, -0.1342315673828125, -0.0848388671875, -0.0354461669921875, 0.013946533203125, 0.0633392333984375, 0.11273193359375, 0.1621246337890625, 0.211517333984375, 0.2609100341796875, 0.310302734375, 0.3596954345703125, 0.409088134765625, 0.4584808349609375, 0.50787353515625, 0.5572662353515625, 0.606658935546875, 0.6560516357421875, 0.7054443359375, 0.7548370361328125, 0.804229736328125, 0.8536224365234375, 0.90301513671875, 0.9524078369140625, 1.001800537109375, 1.0511932373046875, 1.1005859375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 4.0, 5.0, 11.0, 11.0, 17.0, 17.0, 34.0, 36.0, 49.0, 78.0, 114.0, 184.0, 265.0, 418.0, 681.0, 1276.0, 2469.0, 5341.0, 12929.0, 36642.0, 124762.0, 505197.0, 257423.0, 64055.0, 20859.0, 7931.0, 3522.0, 1780.0, 876.0, 546.0, 326.0, 224.0, 142.0, 96.0, 61.0, 47.0, 37.0, 25.0, 16.0, 17.0, 8.0, 8.0, 2.0, 7.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1485595703125, -0.1433887481689453, -0.13821792602539062, -0.13304710388183594, -0.12787628173828125, -0.12270545959472656, -0.11753463745117188, -0.11236381530761719, -0.1071929931640625, -0.10202217102050781, -0.09685134887695312, -0.09168052673339844, -0.08650970458984375, -0.08133888244628906, -0.07616806030273438, -0.07099723815917969, -0.065826416015625, -0.06065559387207031, -0.055484771728515625, -0.05031394958496094, -0.04514312744140625, -0.03997230529785156, -0.034801483154296875, -0.029630661010742188, -0.0244598388671875, -0.019289016723632812, -0.014118194580078125, -0.008947372436523438, -0.00377655029296875, 0.0013942718505859375, 0.006565093994140625, 0.011735916137695312, 0.01690673828125, 0.022077560424804688, 0.027248382568359375, 0.03241920471191406, 0.03759002685546875, 0.04276084899902344, 0.047931671142578125, 0.05310249328613281, 0.0582733154296875, 0.06344413757324219, 0.06861495971679688, 0.07378578186035156, 0.07895660400390625, 0.08412742614746094, 0.08929824829101562, 0.09446907043457031, 0.099639892578125, 0.10481071472167969, 0.10998153686523438, 0.11515235900878906, 0.12032318115234375, 0.12549400329589844, 0.13066482543945312, 0.1358356475830078, 0.1410064697265625, 0.1461772918701172, 0.15134811401367188, 0.15651893615722656, 0.16168975830078125, 0.16686058044433594, 0.17203140258789062, 0.1772022247314453, 0.182373046875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 4.0, 7.0, 11.0, 11.0, 14.0, 14.0, 10.0, 21.0, 12.0, 26.0, 25.0, 24.0, 31.0, 29.0, 27.0, 33.0, 44.0, 50.0, 63.0, 59.0, 50.0, 56.0, 55.0, 41.0, 30.0, 40.0, 43.0, 28.0, 29.0, 22.0, 15.0, 17.0, 13.0, 14.0, 6.0, 4.0, 9.0, 3.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2197265625, -1.1776580810546875, -1.135589599609375, -1.0935211181640625, -1.05145263671875, -1.0093841552734375, -0.967315673828125, -0.9252471923828125, -0.8831787109375, -0.8411102294921875, -0.799041748046875, -0.7569732666015625, -0.71490478515625, -0.6728363037109375, -0.630767822265625, -0.5886993408203125, -0.546630859375, -0.5045623779296875, -0.462493896484375, -0.4204254150390625, -0.37835693359375, -0.3362884521484375, -0.294219970703125, -0.2521514892578125, -0.2100830078125, -0.1680145263671875, -0.125946044921875, -0.0838775634765625, -0.04180908203125, 0.0002593994140625, 0.042327880859375, 0.0843963623046875, 0.12646484375, 0.1685333251953125, 0.210601806640625, 0.2526702880859375, 0.29473876953125, 0.3368072509765625, 0.378875732421875, 0.4209442138671875, 0.4630126953125, 0.5050811767578125, 0.547149658203125, 0.5892181396484375, 0.63128662109375, 0.6733551025390625, 0.715423583984375, 0.7574920654296875, 0.799560546875, 0.8416290283203125, 0.883697509765625, 0.9257659912109375, 0.96783447265625, 1.0099029541015625, 1.051971435546875, 1.0940399169921875, 1.1361083984375, 1.1781768798828125, 1.220245361328125, 1.2623138427734375, 1.30438232421875, 1.3464508056640625, 1.388519287109375, 1.4305877685546875, 1.47265625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 9.0, 6.0, 14.0, 13.0, 16.0, 29.0, 51.0, 53.0, 89.0, 191.0, 265.0, 478.0, 985.0, 2166.0, 5905.0, 20534.0, 123271.0, 733148.0, 129521.0, 21549.0, 5891.0, 2161.0, 1016.0, 460.0, 301.0, 143.0, 92.0, 66.0, 39.0, 27.0, 15.0, 19.0, 15.0, 5.0, 7.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0618896484375, -0.059861183166503906, -0.05783271789550781, -0.05580425262451172, -0.053775787353515625, -0.05174732208251953, -0.04971885681152344, -0.047690391540527344, -0.04566192626953125, -0.043633460998535156, -0.04160499572753906, -0.03957653045654297, -0.037548065185546875, -0.03551959991455078, -0.03349113464355469, -0.031462669372558594, -0.0294342041015625, -0.027405738830566406, -0.025377273559570312, -0.02334880828857422, -0.021320343017578125, -0.01929187774658203, -0.017263412475585938, -0.015234947204589844, -0.01320648193359375, -0.011178016662597656, -0.009149551391601562, -0.007121086120605469, -0.005092620849609375, -0.0030641555786132812, -0.0010356903076171875, 0.0009927749633789062, 0.003021240234375, 0.005049705505371094, 0.0070781707763671875, 0.009106636047363281, 0.011135101318359375, 0.013163566589355469, 0.015192031860351562, 0.017220497131347656, 0.01924896240234375, 0.021277427673339844, 0.023305892944335938, 0.02533435821533203, 0.027362823486328125, 0.02939128875732422, 0.03141975402832031, 0.033448219299316406, 0.0354766845703125, 0.037505149841308594, 0.03953361511230469, 0.04156208038330078, 0.043590545654296875, 0.04561901092529297, 0.04764747619628906, 0.049675941467285156, 0.05170440673828125, 0.053732872009277344, 0.05576133728027344, 0.05778980255126953, 0.059818267822265625, 0.06184673309326172, 0.06387519836425781, 0.0659036636352539, 0.06793212890625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 2.0, 9.0, 11.0, 16.0, 22.0, 37.0, 62.0, 122.0, 170.0, 214.0, 147.0, 88.0, 44.0, 27.0, 11.0, 9.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.574392318725586e-05, -6.418582051992416e-05, -6.262771785259247e-05, -6.106961518526077e-05, -5.951151251792908e-05, -5.795340985059738e-05, -5.6395307183265686e-05, -5.483720451593399e-05, -5.3279101848602295e-05, -5.17209991812706e-05, -5.0162896513938904e-05, -4.860479384660721e-05, -4.704669117927551e-05, -4.548858851194382e-05, -4.393048584461212e-05, -4.2372383177280426e-05, -4.081428050994873e-05, -3.9256177842617035e-05, -3.769807517528534e-05, -3.6139972507953644e-05, -3.458186984062195e-05, -3.302376717329025e-05, -3.146566450595856e-05, -2.990756183862686e-05, -2.8349459171295166e-05, -2.679135650396347e-05, -2.5233253836631775e-05, -2.367515116930008e-05, -2.2117048501968384e-05, -2.0558945834636688e-05, -1.9000843167304993e-05, -1.7442740499973297e-05, -1.58846378326416e-05, -1.4326535165309906e-05, -1.276843249797821e-05, -1.1210329830646515e-05, -9.65222716331482e-06, -8.094124495983124e-06, -6.536021828651428e-06, -4.977919161319733e-06, -3.419816493988037e-06, -1.8617138266563416e-06, -3.03611159324646e-07, 1.2544915080070496e-06, 2.812594175338745e-06, 4.370696842670441e-06, 5.928799510002136e-06, 7.486902177333832e-06, 9.045004844665527e-06, 1.0603107511997223e-05, 1.2161210179328918e-05, 1.3719312846660614e-05, 1.527741551399231e-05, 1.6835518181324005e-05, 1.83936208486557e-05, 1.9951723515987396e-05, 2.1509826183319092e-05, 2.3067928850650787e-05, 2.4626031517982483e-05, 2.618413418531418e-05, 2.7742236852645874e-05, 2.930033951997757e-05, 3.0858442187309265e-05, 3.241654485464096e-05, 3.3974647521972656e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 6.0, 3.0, 10.0, 12.0, 21.0, 21.0, 32.0, 37.0, 62.0, 105.0, 165.0, 249.0, 422.0, 701.0, 1285.0, 2485.0, 5369.0, 13566.0, 40479.0, 169521.0, 561103.0, 184145.0, 43317.0, 14034.0, 5588.0, 2537.0, 1419.0, 727.0, 413.0, 262.0, 164.0, 91.0, 66.0, 38.0, 21.0, 23.0, 22.0, 5.0, 4.0, 6.0, 5.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.046112060546875, -0.0446014404296875, -0.0430908203125, -0.0415802001953125, -0.040069580078125, -0.0385589599609375, -0.03704833984375, -0.0355377197265625, -0.034027099609375, -0.0325164794921875, -0.031005859375, -0.0294952392578125, -0.027984619140625, -0.0264739990234375, -0.02496337890625, -0.0234527587890625, -0.021942138671875, -0.0204315185546875, -0.0189208984375, -0.0174102783203125, -0.015899658203125, -0.0143890380859375, -0.01287841796875, -0.0113677978515625, -0.009857177734375, -0.0083465576171875, -0.0068359375, -0.0053253173828125, -0.003814697265625, -0.0023040771484375, -0.00079345703125, 0.0007171630859375, 0.002227783203125, 0.0037384033203125, 0.0052490234375, 0.0067596435546875, 0.008270263671875, 0.0097808837890625, 0.01129150390625, 0.0128021240234375, 0.014312744140625, 0.0158233642578125, 0.017333984375, 0.0188446044921875, 0.020355224609375, 0.0218658447265625, 0.02337646484375, 0.0248870849609375, 0.026397705078125, 0.0279083251953125, 0.0294189453125, 0.0309295654296875, 0.032440185546875, 0.0339508056640625, 0.03546142578125, 0.0369720458984375, 0.038482666015625, 0.0399932861328125, 0.04150390625, 0.0430145263671875, 0.044525146484375, 0.0460357666015625, 0.04754638671875, 0.0490570068359375, 0.050567626953125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 3.0, 3.0, 4.0, 5.0, 6.0, 4.0, 8.0, 15.0, 12.0, 25.0, 29.0, 41.0, 46.0, 56.0, 58.0, 81.0, 84.0, 87.0, 73.0, 66.0, 56.0, 58.0, 27.0, 32.0, 24.0, 30.0, 16.0, 9.0, 7.0, 10.0, 7.0, 3.0, 4.0, 3.0, 5.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.013031005859375, -0.012640237808227539, -0.012249469757080078, -0.011858701705932617, -0.011467933654785156, -0.011077165603637695, -0.010686397552490234, -0.010295629501342773, -0.009904861450195312, -0.009514093399047852, -0.00912332534790039, -0.00873255729675293, -0.008341789245605469, -0.007951021194458008, -0.007560253143310547, -0.007169485092163086, -0.006778717041015625, -0.006387948989868164, -0.005997180938720703, -0.005606412887573242, -0.005215644836425781, -0.00482487678527832, -0.004434108734130859, -0.0040433406829833984, -0.0036525726318359375, -0.0032618045806884766, -0.0028710365295410156, -0.0024802684783935547, -0.0020895004272460938, -0.0016987323760986328, -0.0013079643249511719, -0.0009171962738037109, -0.00052642822265625, -0.00013566017150878906, 0.0002551078796386719, 0.0006458759307861328, 0.0010366439819335938, 0.0014274120330810547, 0.0018181800842285156, 0.0022089481353759766, 0.0025997161865234375, 0.0029904842376708984, 0.0033812522888183594, 0.0037720203399658203, 0.004162788391113281, 0.004553556442260742, 0.004944324493408203, 0.005335092544555664, 0.005725860595703125, 0.006116628646850586, 0.006507396697998047, 0.006898164749145508, 0.007288932800292969, 0.00767970085144043, 0.00807046890258789, 0.008461236953735352, 0.008852005004882812, 0.009242773056030273, 0.009633541107177734, 0.010024309158325195, 0.010415077209472656, 0.010805845260620117, 0.011196613311767578, 0.011587381362915039, 0.0119781494140625]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 8.0, 11.0, 20.0, 76.0, 219.0, 443.0, 151.0, 42.0, 17.0, 11.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-5.538624286651611, -5.421570777893066, -5.3045172691345215, -5.187463760375977, -5.070409774780273, -4.9533562660217285, -4.836302757263184, -4.719249248504639, -4.602195739746094, -4.485142230987549, -4.368088722229004, -4.251034736633301, -4.133981227874756, -4.016927719116211, -3.899874210357666, -3.782820701599121, -3.665766716003418, -3.548713207244873, -3.431659460067749, -3.314605951309204, -3.197552442550659, -3.080498695373535, -2.9634451866149902, -2.8463916778564453, -2.7293381690979004, -2.6122846603393555, -2.4952309131622314, -2.3781774044036865, -2.2611238956451416, -2.1440701484680176, -2.0270166397094727, -1.9099630117416382, -1.7929093837738037, -1.6758557558059692, -1.5588022470474243, -1.4417486190795898, -1.3246949911117554, -1.207641363143921, -1.090587854385376, -0.9735342264175415, -0.8564806580543518, -0.7394270896911621, -0.6223734617233276, -0.5053198933601379, -0.38826629519462585, -0.27121269702911377, -0.15415912866592407, -0.0371055006980896, 0.0799480676651001, 0.19700166583061218, 0.31405526399612427, 0.43110883235931396, 0.5481624603271484, 0.6652160286903381, 0.7822695970535278, 0.8993232250213623, 1.0163767337799072, 1.1334303617477417, 1.2504838705062866, 1.367537498474121, 1.4845911264419556, 1.60164475440979, 1.718698263168335, 1.8357518911361694, 1.952805519104004]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 12.0, 10.0, 11.0, 26.0, 33.0, 39.0, 61.0, 84.0, 87.0, 101.0, 103.0, 105.0, 81.0, 74.0, 63.0, 37.0, 25.0, 16.0, 11.0, 8.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8379266262054443, -1.7933305501937866, -1.7487343549728394, -1.7041382789611816, -1.6595420837402344, -1.6149460077285767, -1.570349931716919, -1.5257537364959717, -1.4811575412750244, -1.4365614652633667, -1.3919652700424194, -1.3473691940307617, -1.3027729988098145, -1.2581769227981567, -1.213580846786499, -1.1689846515655518, -1.124388575553894, -1.0797924995422363, -1.035196304321289, -0.9906002283096313, -0.9460040330886841, -0.9014079570770264, -0.8568118214607239, -0.8122156858444214, -0.7676195502281189, -0.7230234146118164, -0.6784272789955139, -0.6338311433792114, -0.5892350673675537, -0.5446388721466064, -0.5000427961349487, -0.45544666051864624, -0.41085052490234375, -0.36625438928604126, -0.32165825366973877, -0.27706214785575867, -0.23246601223945618, -0.1878698766231537, -0.14327377080917358, -0.0986776351928711, -0.054081499576568604, -0.00948537141084671, 0.03511075675487518, 0.07970687747001648, 0.12430301308631897, 0.16889914870262146, 0.21349525451660156, 0.25809139013290405, 0.30268752574920654, 0.34728366136550903, 0.3918797969818115, 0.4364759027957916, 0.4810720384120941, 0.5256681442260742, 0.5702642798423767, 0.6148604154586792, 0.6594565510749817, 0.7040526866912842, 0.7486488223075867, 0.7932449579238892, 0.8378410339355469, 0.8824372291564941, 0.9270333051681519, 0.9716294407844543, 1.0162255764007568]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 4.0, 5.0, 7.0, 14.0, 16.0, 23.0, 35.0, 35.0, 57.0, 76.0, 106.0, 171.0, 255.0, 391.0, 586.0, 967.0, 1604.0, 2866.0, 5421.0, 11688.0, 31004.0, 206334.0, 692358.0, 60578.0, 17201.0, 7445.0, 3817.0, 2066.0, 1245.0, 767.0, 448.0, 285.0, 211.0, 135.0, 100.0, 57.0, 53.0, 33.0, 28.0, 18.0, 10.0, 8.0, 8.0, 9.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.17578125, -1.1403961181640625, -1.105010986328125, -1.0696258544921875, -1.03424072265625, -0.9988555908203125, -0.963470458984375, -0.9280853271484375, -0.8927001953125, -0.8573150634765625, -0.821929931640625, -0.7865447998046875, -0.75115966796875, -0.7157745361328125, -0.680389404296875, -0.6450042724609375, -0.609619140625, -0.5742340087890625, -0.538848876953125, -0.5034637451171875, -0.46807861328125, -0.4326934814453125, -0.397308349609375, -0.3619232177734375, -0.3265380859375, -0.2911529541015625, -0.255767822265625, -0.2203826904296875, -0.18499755859375, -0.1496124267578125, -0.114227294921875, -0.0788421630859375, -0.04345703125, -0.0080718994140625, 0.027313232421875, 0.0626983642578125, 0.09808349609375, 0.1334686279296875, 0.168853759765625, 0.2042388916015625, 0.2396240234375, 0.2750091552734375, 0.310394287109375, 0.3457794189453125, 0.38116455078125, 0.4165496826171875, 0.451934814453125, 0.4873199462890625, 0.522705078125, 0.5580902099609375, 0.593475341796875, 0.6288604736328125, 0.66424560546875, 0.6996307373046875, 0.735015869140625, 0.7704010009765625, 0.8057861328125, 0.8411712646484375, 0.876556396484375, 0.9119415283203125, 0.94732666015625, 0.9827117919921875, 1.018096923828125, 1.0534820556640625, 1.0888671875]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 6.0, 7.0, 6.0, 8.0, 12.0, 19.0, 17.0, 34.0, 28.0, 50.0, 57.0, 51.0, 70.0, 77.0, 89.0, 83.0, 80.0, 64.0, 46.0, 43.0, 50.0, 27.0, 21.0, 14.0, 14.0, 5.0, 7.0, 9.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.19140625, -2.117218017578125, -2.04302978515625, -1.968841552734375, -1.8946533203125, -1.820465087890625, -1.74627685546875, -1.672088623046875, -1.597900390625, -1.523712158203125, -1.44952392578125, -1.375335693359375, -1.3011474609375, -1.226959228515625, -1.15277099609375, -1.078582763671875, -1.00439453125, -0.930206298828125, -0.85601806640625, -0.781829833984375, -0.7076416015625, -0.633453369140625, -0.55926513671875, -0.485076904296875, -0.410888671875, -0.336700439453125, -0.26251220703125, -0.188323974609375, -0.1141357421875, -0.039947509765625, 0.03424072265625, 0.108428955078125, 0.1826171875, 0.256805419921875, 0.33099365234375, 0.405181884765625, 0.4793701171875, 0.553558349609375, 0.62774658203125, 0.701934814453125, 0.776123046875, 0.850311279296875, 0.92449951171875, 0.998687744140625, 1.0728759765625, 1.147064208984375, 1.22125244140625, 1.295440673828125, 1.36962890625, 1.443817138671875, 1.51800537109375, 1.592193603515625, 1.6663818359375, 1.740570068359375, 1.81475830078125, 1.888946533203125, 1.963134765625, 2.037322998046875, 2.11151123046875, 2.185699462890625, 2.2598876953125, 2.334075927734375, 2.40826416015625, 2.482452392578125, 2.556640625]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 8.0, 8.0, 10.0, 11.0, 12.0, 16.0, 29.0, 38.0, 43.0, 59.0, 98.0, 141.0, 241.0, 427.0, 845.0, 1945.0, 5255.0, 18788.0, 142750.0, 808032.0, 52579.0, 10753.0, 3432.0, 1420.0, 646.0, 342.0, 196.0, 117.0, 100.0, 57.0, 42.0, 31.0, 16.0, 16.0, 19.0, 10.0, 7.0, 5.0, 6.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.396484375, -1.35577392578125, -1.3150634765625, -1.27435302734375, -1.233642578125, -1.19293212890625, -1.1522216796875, -1.11151123046875, -1.07080078125, -1.03009033203125, -0.9893798828125, -0.94866943359375, -0.907958984375, -0.86724853515625, -0.8265380859375, -0.78582763671875, -0.7451171875, -0.70440673828125, -0.6636962890625, -0.62298583984375, -0.582275390625, -0.54156494140625, -0.5008544921875, -0.46014404296875, -0.41943359375, -0.37872314453125, -0.3380126953125, -0.29730224609375, -0.256591796875, -0.21588134765625, -0.1751708984375, -0.13446044921875, -0.09375, -0.05303955078125, -0.0123291015625, 0.02838134765625, 0.069091796875, 0.10980224609375, 0.1505126953125, 0.19122314453125, 0.23193359375, 0.27264404296875, 0.3133544921875, 0.35406494140625, 0.394775390625, 0.43548583984375, 0.4761962890625, 0.51690673828125, 0.5576171875, 0.59832763671875, 0.6390380859375, 0.67974853515625, 0.720458984375, 0.76116943359375, 0.8018798828125, 0.84259033203125, 0.88330078125, 0.92401123046875, 0.9647216796875, 1.00543212890625, 1.046142578125, 1.08685302734375, 1.1275634765625, 1.16827392578125, 1.208984375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 3.0, 2.0, 9.0, 4.0, 9.0, 10.0, 16.0, 11.0, 13.0, 16.0, 16.0, 19.0, 21.0, 24.0, 29.0, 19.0, 27.0, 35.0, 33.0, 40.0, 34.0, 39.0, 57.0, 45.0, 47.0, 48.0, 32.0, 29.0, 30.0, 27.0, 27.0, 24.0, 28.0, 18.0, 23.0, 27.0, 28.0, 13.0, 10.0, 12.0, 9.0, 8.0, 7.0, 8.0, 4.0, 9.0, 4.0, 1.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.4931640625, -1.447998046875, -1.40283203125, -1.357666015625, -1.3125, -1.267333984375, -1.22216796875, -1.177001953125, -1.1318359375, -1.086669921875, -1.04150390625, -0.996337890625, -0.951171875, -0.906005859375, -0.86083984375, -0.815673828125, -0.7705078125, -0.725341796875, -0.68017578125, -0.635009765625, -0.58984375, -0.544677734375, -0.49951171875, -0.454345703125, -0.4091796875, -0.364013671875, -0.31884765625, -0.273681640625, -0.228515625, -0.183349609375, -0.13818359375, -0.093017578125, -0.0478515625, -0.002685546875, 0.04248046875, 0.087646484375, 0.1328125, 0.177978515625, 0.22314453125, 0.268310546875, 0.3134765625, 0.358642578125, 0.40380859375, 0.448974609375, 0.494140625, 0.539306640625, 0.58447265625, 0.629638671875, 0.6748046875, 0.719970703125, 0.76513671875, 0.810302734375, 0.85546875, 0.900634765625, 0.94580078125, 0.990966796875, 1.0361328125, 1.081298828125, 1.12646484375, 1.171630859375, 1.216796875, 1.261962890625, 1.30712890625, 1.352294921875, 1.3974609375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 5.0, 4.0, 9.0, 13.0, 17.0, 15.0, 27.0, 33.0, 47.0, 104.0, 183.0, 345.0, 679.0, 1735.0, 5620.0, 28669.0, 892448.0, 102019.0, 11429.0, 3060.0, 1013.0, 465.0, 237.0, 128.0, 83.0, 65.0, 34.0, 18.0, 11.0, 14.0, 7.0, 2.0, 2.0, 6.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.765625, -0.7358856201171875, -0.706146240234375, -0.6764068603515625, -0.64666748046875, -0.6169281005859375, -0.587188720703125, -0.5574493408203125, -0.5277099609375, -0.4979705810546875, -0.468231201171875, -0.4384918212890625, -0.40875244140625, -0.3790130615234375, -0.349273681640625, -0.3195343017578125, -0.289794921875, -0.2600555419921875, -0.230316162109375, -0.2005767822265625, -0.17083740234375, -0.1410980224609375, -0.111358642578125, -0.0816192626953125, -0.0518798828125, -0.0221405029296875, 0.007598876953125, 0.0373382568359375, 0.06707763671875, 0.0968170166015625, 0.126556396484375, 0.1562957763671875, 0.18603515625, 0.2157745361328125, 0.245513916015625, 0.2752532958984375, 0.30499267578125, 0.3347320556640625, 0.364471435546875, 0.3942108154296875, 0.4239501953125, 0.4536895751953125, 0.483428955078125, 0.5131683349609375, 0.54290771484375, 0.5726470947265625, 0.602386474609375, 0.6321258544921875, 0.661865234375, 0.6916046142578125, 0.721343994140625, 0.7510833740234375, 0.78082275390625, 0.8105621337890625, 0.840301513671875, 0.8700408935546875, 0.8997802734375, 0.9295196533203125, 0.959259033203125, 0.9889984130859375, 1.01873779296875, 1.0484771728515625, 1.078216552734375, 1.1079559326171875, 1.1376953125]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 8.0, 15.0, 27.0, 29.0, 66.0, 241.0, 414.0, 85.0, 42.0, 27.0, 16.0, 12.0, 5.0, 5.0, 6.0, 0.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0002275705337524414, -0.00022274907678365707, -0.00021792761981487274, -0.0002131061628460884, -0.00020828470587730408, -0.00020346324890851974, -0.0001986417919397354, -0.00019382033497095108, -0.00018899887800216675, -0.00018417742103338242, -0.00017935596406459808, -0.00017453450709581375, -0.00016971305012702942, -0.0001648915931582451, -0.00016007013618946075, -0.00015524867922067642, -0.0001504272222518921, -0.00014560576528310776, -0.00014078430831432343, -0.0001359628513455391, -0.00013114139437675476, -0.00012631993740797043, -0.0001214984804391861, -0.00011667702347040176, -0.00011185556650161743, -0.0001070341095328331, -0.00010221265256404877, -9.739119559526443e-05, -9.25697386264801e-05, -8.774828165769577e-05, -8.292682468891144e-05, -7.81053677201271e-05, -7.328391075134277e-05, -6.846245378255844e-05, -6.364099681377411e-05, -5.8819539844989777e-05, -5.3998082876205444e-05, -4.917662590742111e-05, -4.435516893863678e-05, -3.953371196985245e-05, -3.4712255001068115e-05, -2.9890798032283783e-05, -2.506934106349945e-05, -2.024788409471512e-05, -1.5426427125930786e-05, -1.0604970157146454e-05, -5.783513188362122e-06, -9.620562195777893e-07, 3.859400749206543e-06, 8.680857717990875e-06, 1.3502314686775208e-05, 1.832377165555954e-05, 2.3145228624343872e-05, 2.7966685593128204e-05, 3.278814256191254e-05, 3.760959953069687e-05, 4.24310564994812e-05, 4.7252513468265533e-05, 5.2073970437049866e-05, 5.68954274058342e-05, 6.171688437461853e-05, 6.653834134340286e-05, 7.13597983121872e-05, 7.618125528097153e-05, 8.100271224975586e-05]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 0.0, 4.0, 4.0, 5.0, 6.0, 3.0, 5.0, 5.0, 7.0, 11.0, 20.0, 31.0, 48.0, 92.0, 156.0, 260.0, 512.0, 1051.0, 2506.0, 6495.0, 24248.0, 479521.0, 497582.0, 24652.0, 6736.0, 2417.0, 1052.0, 473.0, 232.0, 130.0, 75.0, 65.0, 40.0, 20.0, 21.0, 18.0, 8.0, 10.0, 8.0, 8.0, 6.0, 3.0, 5.0, 0.0, 3.0, 3.0, 4.0, 0.0, 1.0], "bins": [-0.83251953125, -0.8100204467773438, -0.7875213623046875, -0.7650222778320312, -0.742523193359375, -0.7200241088867188, -0.6975250244140625, -0.6750259399414062, -0.65252685546875, -0.6300277709960938, -0.6075286865234375, -0.5850296020507812, -0.562530517578125, -0.5400314331054688, -0.5175323486328125, -0.49503326416015625, -0.4725341796875, -0.45003509521484375, -0.4275360107421875, -0.40503692626953125, -0.382537841796875, -0.36003875732421875, -0.3375396728515625, -0.31504058837890625, -0.29254150390625, -0.27004241943359375, -0.2475433349609375, -0.22504425048828125, -0.202545166015625, -0.18004608154296875, -0.1575469970703125, -0.13504791259765625, -0.112548828125, -0.09004974365234375, -0.0675506591796875, -0.04505157470703125, -0.022552490234375, -5.340576171875e-05, 0.0224456787109375, 0.04494476318359375, 0.06744384765625, 0.08994293212890625, 0.1124420166015625, 0.13494110107421875, 0.157440185546875, 0.17993927001953125, 0.2024383544921875, 0.22493743896484375, 0.2474365234375, 0.26993560791015625, 0.2924346923828125, 0.31493377685546875, 0.337432861328125, 0.35993194580078125, 0.3824310302734375, 0.40493011474609375, 0.42742919921875, 0.44992828369140625, 0.4724273681640625, 0.49492645263671875, 0.517425537109375, 0.5399246215820312, 0.5624237060546875, 0.5849227905273438, 0.607421875]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 6.0, 0.0, 9.0, 7.0, 8.0, 6.0, 7.0, 23.0, 15.0, 19.0, 30.0, 57.0, 95.0, 278.0, 185.0, 78.0, 33.0, 38.0, 19.0, 20.0, 8.0, 10.0, 12.0, 12.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.23193359375, -0.22328567504882812, -0.21463775634765625, -0.20598983764648438, -0.1973419189453125, -0.18869400024414062, -0.18004608154296875, -0.17139816284179688, -0.162750244140625, -0.15410232543945312, -0.14545440673828125, -0.13680648803710938, -0.1281585693359375, -0.11951065063476562, -0.11086273193359375, -0.10221481323242188, -0.09356689453125, -0.08491897583007812, -0.07627105712890625, -0.06762313842773438, -0.0589752197265625, -0.050327301025390625, -0.04167938232421875, -0.033031463623046875, -0.024383544921875, -0.015735626220703125, -0.00708770751953125, 0.001560211181640625, 0.0102081298828125, 0.018856048583984375, 0.02750396728515625, 0.036151885986328125, 0.0447998046875, 0.053447723388671875, 0.06209564208984375, 0.07074356079101562, 0.0793914794921875, 0.08803939819335938, 0.09668731689453125, 0.10533523559570312, 0.113983154296875, 0.12263107299804688, 0.13127899169921875, 0.13992691040039062, 0.1485748291015625, 0.15722274780273438, 0.16587066650390625, 0.17451858520507812, 0.18316650390625, 0.19181442260742188, 0.20046234130859375, 0.20911026000976562, 0.2177581787109375, 0.22640609741210938, 0.23505401611328125, 0.24370193481445312, 0.252349853515625, 0.2609977722167969, 0.26964569091796875, 0.2782936096191406, 0.2869415283203125, 0.2955894470214844, 0.30423736572265625, 0.3128852844238281, 0.321533203125]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 8.0, 37.0, 166.0, 544.0, 175.0, 46.0, 18.0, 5.0, 1.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5871992111206055, -5.2689971923828125, -4.9507951736450195, -4.632593631744385, -4.314391613006592, -3.996189594268799, -3.677987813949585, -3.359786033630371, -3.041584014892578, -2.723381996154785, -2.4051802158355713, -2.0869784355163574, -1.7687764167785645, -1.450574517250061, -1.1323726177215576, -0.8141708374023438, -0.4959688186645508, -0.17776691913604736, 0.14043498039245605, 0.4586368799209595, 0.7768387794494629, 1.0950406789779663, 1.4132425785064697, 1.7314443588256836, 2.0496463775634766, 2.3678483963012695, 2.6860501766204834, 3.0042519569396973, 3.3224539756774902, 3.640655994415283, 3.958857774734497, 4.277059555053711, 4.5952606201171875, 4.9134626388549805, 5.231664657592773, 5.549866199493408, 5.868068218231201, 6.186270236968994, 6.504471778869629, 6.822673797607422, 7.140875816345215, 7.459077835083008, 7.777279853820801, 8.095481872558594, 8.41368293762207, 8.731884956359863, 9.050086975097656, 9.36828899383545, 9.686491012573242, 10.004693031311035, 10.322895050048828, 10.641097068786621, 10.959299087524414, 11.27750015258789, 11.595702171325684, 11.913904190063477, 12.23210620880127, 12.550308227539062, 12.868510246276855, 13.186712265014648, 13.504913330078125, 13.823115348815918, 14.141317367553711, 14.459519386291504, 14.777721405029297]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 4.0, 4.0, 5.0, 8.0, 8.0, 9.0, 22.0, 20.0, 15.0, 21.0, 25.0, 34.0, 31.0, 22.0, 37.0, 32.0, 42.0, 45.0, 40.0, 45.0, 50.0, 48.0, 55.0, 51.0, 48.0, 31.0, 29.0, 39.0, 21.0, 23.0, 28.0, 27.0, 18.0, 15.0, 17.0, 9.0, 6.0, 4.0, 6.0, 4.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.7176430225372314, -2.6250250339508057, -2.53240704536438, -2.439789295196533, -2.3471713066101074, -2.2545533180236816, -2.161935329437256, -2.06931734085083, -1.9766995906829834, -1.8840816020965576, -1.7914637327194214, -1.6988457441329956, -1.6062278747558594, -1.5136098861694336, -1.4209918975830078, -1.3283740282058716, -1.2357560396194458, -1.14313805103302, -1.0505201816558838, -0.957902193069458, -0.8652843236923218, -0.772666335105896, -0.680048406124115, -0.587430477142334, -0.494812548160553, -0.402194619178772, -0.30957669019699097, -0.21695873141288757, -0.12434080243110657, -0.03172287344932556, 0.06089508533477783, 0.15351301431655884, 0.24613094329833984, 0.33874887228012085, 0.43136680126190186, 0.5239847898483276, 0.6166026592254639, 0.7092206478118896, 0.8018385767936707, 0.8944565057754517, 0.9870744347572327, 1.0796923637390137, 1.1723103523254395, 1.2649282217025757, 1.3575462102890015, 1.4501640796661377, 1.5427820682525635, 1.6354000568389893, 1.7280179262161255, 1.8206359148025513, 1.9132537841796875, 2.0058717727661133, 2.098489761352539, 2.1911075115203857, 2.2837255001068115, 2.3763434886932373, 2.468961477279663, 2.561579465866089, 2.6541974544525146, 2.7468152046203613, 2.839433193206787, 2.932051181793213, 3.0246691703796387, 3.1172871589660645, 3.209904909133911]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 6.0, 8.0, 15.0, 21.0, 35.0, 53.0, 78.0, 146.0, 248.0, 621.0, 2846.0, 79248.0, 4097327.0, 11391.0, 1447.0, 404.0, 141.0, 97.0, 43.0, 43.0, 16.0, 13.0, 14.0, 8.0, 4.0, 5.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.6953125, -8.4847412109375, -8.274169921875, -8.0635986328125, -7.85302734375, -7.6424560546875, -7.431884765625, -7.2213134765625, -7.0107421875, -6.8001708984375, -6.589599609375, -6.3790283203125, -6.16845703125, -5.9578857421875, -5.747314453125, -5.5367431640625, -5.326171875, -5.1156005859375, -4.905029296875, -4.6944580078125, -4.48388671875, -4.2733154296875, -4.062744140625, -3.8521728515625, -3.6416015625, -3.4310302734375, -3.220458984375, -3.0098876953125, -2.79931640625, -2.5887451171875, -2.378173828125, -2.1676025390625, -1.95703125, -1.7464599609375, -1.535888671875, -1.3253173828125, -1.11474609375, -0.9041748046875, -0.693603515625, -0.4830322265625, -0.2724609375, -0.0618896484375, 0.148681640625, 0.3592529296875, 0.56982421875, 0.7803955078125, 0.990966796875, 1.2015380859375, 1.412109375, 1.6226806640625, 1.833251953125, 2.0438232421875, 2.25439453125, 2.4649658203125, 2.675537109375, 2.8861083984375, 3.0966796875, 3.3072509765625, 3.517822265625, 3.7283935546875, 3.93896484375, 4.1495361328125, 4.360107421875, 4.5706787109375, 4.78125]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 6.0, 9.0, 15.0, 20.0, 26.0, 36.0, 49.0, 57.0, 79.0, 89.0, 113.0, 126.0, 86.0, 80.0, 64.0, 46.0, 34.0, 23.0, 18.0, 11.0, 5.0, 5.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.294921875, -2.2374420166015625, -2.179962158203125, -2.1224822998046875, -2.06500244140625, -2.0075225830078125, -1.950042724609375, -1.8925628662109375, -1.8350830078125, -1.7776031494140625, -1.720123291015625, -1.6626434326171875, -1.60516357421875, -1.5476837158203125, -1.490203857421875, -1.4327239990234375, -1.375244140625, -1.3177642822265625, -1.260284423828125, -1.2028045654296875, -1.14532470703125, -1.0878448486328125, -1.030364990234375, -0.9728851318359375, -0.9154052734375, -0.8579254150390625, -0.800445556640625, -0.7429656982421875, -0.68548583984375, -0.6280059814453125, -0.570526123046875, -0.5130462646484375, -0.45556640625, -0.3980865478515625, -0.340606689453125, -0.2831268310546875, -0.22564697265625, -0.1681671142578125, -0.110687255859375, -0.0532073974609375, 0.0042724609375, 0.0617523193359375, 0.119232177734375, 0.1767120361328125, 0.23419189453125, 0.2916717529296875, 0.349151611328125, 0.4066314697265625, 0.464111328125, 0.5215911865234375, 0.579071044921875, 0.6365509033203125, 0.69403076171875, 0.7515106201171875, 0.808990478515625, 0.8664703369140625, 0.9239501953125, 0.9814300537109375, 1.038909912109375, 1.0963897705078125, 1.15386962890625, 1.2113494873046875, 1.268829345703125, 1.3263092041015625, 1.3837890625]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 1.0, 4.0, 6.0, 3.0, 5.0, 8.0, 10.0, 10.0, 21.0, 30.0, 35.0, 73.0, 101.0, 158.0, 314.0, 554.0, 1172.0, 2778.0, 7993.0, 35155.0, 2764463.0, 1340196.0, 29375.0, 7044.0, 2490.0, 1096.0, 515.0, 255.0, 150.0, 84.0, 62.0, 41.0, 24.0, 16.0, 14.0, 9.0, 4.0, 10.0, 0.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0], "bins": [-2.84375, -2.7725830078125, -2.701416015625, -2.6302490234375, -2.55908203125, -2.4879150390625, -2.416748046875, -2.3455810546875, -2.2744140625, -2.2032470703125, -2.132080078125, -2.0609130859375, -1.98974609375, -1.9185791015625, -1.847412109375, -1.7762451171875, -1.705078125, -1.6339111328125, -1.562744140625, -1.4915771484375, -1.42041015625, -1.3492431640625, -1.278076171875, -1.2069091796875, -1.1357421875, -1.0645751953125, -0.993408203125, -0.9222412109375, -0.85107421875, -0.7799072265625, -0.708740234375, -0.6375732421875, -0.56640625, -0.4952392578125, -0.424072265625, -0.3529052734375, -0.28173828125, -0.2105712890625, -0.139404296875, -0.0682373046875, 0.0029296875, 0.0740966796875, 0.145263671875, 0.2164306640625, 0.28759765625, 0.3587646484375, 0.429931640625, 0.5010986328125, 0.572265625, 0.6434326171875, 0.714599609375, 0.7857666015625, 0.85693359375, 0.9281005859375, 0.999267578125, 1.0704345703125, 1.1416015625, 1.2127685546875, 1.283935546875, 1.3551025390625, 1.42626953125, 1.4974365234375, 1.568603515625, 1.6397705078125, 1.7109375]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 6.0, 7.0, 9.0, 11.0, 11.0, 18.0, 19.0, 54.0, 111.0, 310.0, 900.0, 1506.0, 613.0, 236.0, 91.0, 46.0, 26.0, 23.0, 19.0, 13.0, 13.0, 4.0, 4.0, 7.0, 2.0, 6.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45556640625, -0.4361114501953125, -0.416656494140625, -0.3972015380859375, -0.37774658203125, -0.3582916259765625, -0.338836669921875, -0.3193817138671875, -0.2999267578125, -0.2804718017578125, -0.261016845703125, -0.2415618896484375, -0.22210693359375, -0.2026519775390625, -0.183197021484375, -0.1637420654296875, -0.144287109375, -0.1248321533203125, -0.105377197265625, -0.0859222412109375, -0.06646728515625, -0.0470123291015625, -0.027557373046875, -0.0081024169921875, 0.0113525390625, 0.0308074951171875, 0.050262451171875, 0.0697174072265625, 0.08917236328125, 0.1086273193359375, 0.128082275390625, 0.1475372314453125, 0.1669921875, 0.1864471435546875, 0.205902099609375, 0.2253570556640625, 0.24481201171875, 0.2642669677734375, 0.283721923828125, 0.3031768798828125, 0.3226318359375, 0.3420867919921875, 0.361541748046875, 0.3809967041015625, 0.40045166015625, 0.4199066162109375, 0.439361572265625, 0.4588165283203125, 0.478271484375, 0.4977264404296875, 0.517181396484375, 0.5366363525390625, 0.55609130859375, 0.5755462646484375, 0.595001220703125, 0.6144561767578125, 0.6339111328125, 0.6533660888671875, 0.672821044921875, 0.6922760009765625, 0.71173095703125, 0.7311859130859375, 0.750640869140625, 0.7700958251953125, 0.78955078125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 16.0, 6.0, 13.0, 16.0, 30.0, 68.0, 112.0, 182.0, 240.0, 133.0, 74.0, 36.0, 24.0, 20.0, 12.0, 3.0, 5.0, 7.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-2.897313117980957, -2.8127846717834473, -2.7282562255859375, -2.6437277793884277, -2.559199571609497, -2.4746711254119873, -2.3901426792144775, -2.3056142330169678, -2.221086025238037, -2.1365575790405273, -2.0520291328430176, -1.9675008058547974, -1.8829724788665771, -1.7984440326690674, -1.7139155864715576, -1.6293871402740479, -1.544858694076538, -1.4603302478790283, -1.375801920890808, -1.2912734746932983, -1.2067451477050781, -1.1222167015075684, -1.0376882553100586, -0.9531598687171936, -0.8686314821243286, -0.7841030955314636, -0.6995747089385986, -0.6150462627410889, -0.5305178761482239, -0.4459894895553589, -0.3614610433578491, -0.27693265676498413, -0.19240450859069824, -0.10787610709667206, -0.023347705602645874, 0.061180710792541504, 0.1457090973854065, 0.23023748397827148, 0.31476593017578125, 0.39929431676864624, 0.48382270336151123, 0.5683510899543762, 0.6528794765472412, 0.737407922744751, 0.821936309337616, 0.906464695930481, 0.9909931421279907, 1.075521469116211, 1.1600499153137207, 1.2445783615112305, 1.3291066884994507, 1.4136351346969604, 1.4981634616851807, 1.5826919078826904, 1.6672203540802002, 1.75174880027771, 1.8362771272659302, 1.92080557346344, 2.00533390045166, 2.08986234664917, 2.1743907928466797, 2.2589192390441895, 2.343447685241699, 2.42797589302063, 2.5125043392181396]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 5.0, 4.0, 13.0, 18.0, 27.0, 34.0, 35.0, 57.0, 51.0, 66.0, 78.0, 85.0, 74.0, 69.0, 76.0, 71.0, 48.0, 42.0, 36.0, 35.0, 31.0, 20.0, 7.0, 7.0, 7.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.907869815826416, -1.8558416366577148, -1.8038134574890137, -1.7517852783203125, -1.6997569799423218, -1.6477288007736206, -1.5957006216049194, -1.5436724424362183, -1.491644263267517, -1.439616084098816, -1.3875879049301147, -1.335559606552124, -1.2835314273834229, -1.2315032482147217, -1.1794750690460205, -1.1274468898773193, -1.0754187107086182, -1.023390531539917, -0.971362292766571, -0.9193341135978699, -0.8673059344291687, -0.8152776956558228, -0.7632495164871216, -0.7112213373184204, -0.6591930389404297, -0.6071648597717285, -0.5551366209983826, -0.5031084418296814, -0.4510802626609802, -0.39905205368995667, -0.3470238447189331, -0.29499566555023193, -0.24296748638153076, -0.1909392923116684, -0.13891109824180603, -0.08688288927078247, -0.034854695200920105, 0.01717349886894226, 0.06920170783996582, 0.12122988700866699, 0.17325809597969055, 0.22528629004955292, 0.2773144841194153, 0.32934269309043884, 0.3813709020614624, 0.4333990812301636, 0.48542729020118713, 0.5374554395675659, 0.5894836783409119, 0.641511857509613, 0.693540096282959, 0.7455682754516602, 0.7975964546203613, 0.8496246337890625, 0.9016528725624084, 0.9536810517311096, 1.0057092905044556, 1.0577374696731567, 1.109765648841858, 1.1617939472198486, 1.2138221263885498, 1.265850305557251, 1.3178784847259521, 1.3699066638946533, 1.4219348430633545]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 9.0, 13.0, 11.0, 29.0, 44.0, 73.0, 90.0, 170.0, 293.0, 606.0, 1302.0, 3725.0, 15752.0, 146734.0, 784529.0, 79224.0, 10818.0, 2946.0, 1075.0, 502.0, 263.0, 141.0, 79.0, 46.0, 21.0, 19.0, 9.0, 5.0, 7.0, 7.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31005859375, -0.2967987060546875, -0.283538818359375, -0.2702789306640625, -0.25701904296875, -0.2437591552734375, -0.230499267578125, -0.2172393798828125, -0.2039794921875, -0.1907196044921875, -0.177459716796875, -0.1641998291015625, -0.15093994140625, -0.1376800537109375, -0.124420166015625, -0.1111602783203125, -0.097900390625, -0.0846405029296875, -0.071380615234375, -0.0581207275390625, -0.04486083984375, -0.0316009521484375, -0.018341064453125, -0.0050811767578125, 0.0081787109375, 0.0214385986328125, 0.034698486328125, 0.0479583740234375, 0.06121826171875, 0.0744781494140625, 0.087738037109375, 0.1009979248046875, 0.1142578125, 0.1275177001953125, 0.140777587890625, 0.1540374755859375, 0.16729736328125, 0.1805572509765625, 0.193817138671875, 0.2070770263671875, 0.2203369140625, 0.2335968017578125, 0.246856689453125, 0.2601165771484375, 0.27337646484375, 0.2866363525390625, 0.299896240234375, 0.3131561279296875, 0.326416015625, 0.3396759033203125, 0.352935791015625, 0.3661956787109375, 0.37945556640625, 0.3927154541015625, 0.405975341796875, 0.4192352294921875, 0.4324951171875, 0.4457550048828125, 0.459014892578125, 0.4722747802734375, 0.48553466796875, 0.4987945556640625, 0.512054443359375, 0.5253143310546875, 0.53857421875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 6.0, 11.0, 13.0, 15.0, 39.0, 28.0, 56.0, 59.0, 75.0, 106.0, 103.0, 100.0, 83.0, 85.0, 56.0, 49.0, 39.0, 29.0, 25.0, 4.0, 4.0, 10.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.763671875, -1.7196197509765625, -1.675567626953125, -1.6315155029296875, -1.58746337890625, -1.5434112548828125, -1.499359130859375, -1.4553070068359375, -1.4112548828125, -1.3672027587890625, -1.323150634765625, -1.2790985107421875, -1.23504638671875, -1.1909942626953125, -1.146942138671875, -1.1028900146484375, -1.058837890625, -1.0147857666015625, -0.970733642578125, -0.9266815185546875, -0.88262939453125, -0.8385772705078125, -0.794525146484375, -0.7504730224609375, -0.7064208984375, -0.6623687744140625, -0.618316650390625, -0.5742645263671875, -0.53021240234375, -0.4861602783203125, -0.442108154296875, -0.3980560302734375, -0.35400390625, -0.3099517822265625, -0.265899658203125, -0.2218475341796875, -0.17779541015625, -0.1337432861328125, -0.089691162109375, -0.0456390380859375, -0.0015869140625, 0.0424652099609375, 0.086517333984375, 0.1305694580078125, 0.17462158203125, 0.2186737060546875, 0.262725830078125, 0.3067779541015625, 0.350830078125, 0.3948822021484375, 0.438934326171875, 0.4829864501953125, 0.52703857421875, 0.5710906982421875, 0.615142822265625, 0.6591949462890625, 0.7032470703125, 0.7472991943359375, 0.791351318359375, 0.8354034423828125, 0.87945556640625, 0.9235076904296875, 0.967559814453125, 1.0116119384765625, 1.0556640625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 4.0, 7.0, 2.0, 16.0, 15.0, 11.0, 18.0, 30.0, 56.0, 63.0, 102.0, 161.0, 192.0, 328.0, 447.0, 740.0, 1143.0, 1885.0, 3493.0, 7001.0, 16099.0, 42615.0, 144353.0, 472674.0, 247016.0, 66114.0, 23128.0, 9718.0, 4658.0, 2493.0, 1371.0, 893.0, 523.0, 382.0, 223.0, 152.0, 126.0, 83.0, 68.0, 49.0, 20.0, 19.0, 20.0, 18.0, 11.0, 6.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.16162109375, -0.15652084350585938, -0.15142059326171875, -0.14632034301757812, -0.1412200927734375, -0.13611984252929688, -0.13101959228515625, -0.12591934204101562, -0.120819091796875, -0.11571884155273438, -0.11061859130859375, -0.10551834106445312, -0.1004180908203125, -0.09531784057617188, -0.09021759033203125, -0.08511734008789062, -0.08001708984375, -0.07491683959960938, -0.06981658935546875, -0.06471633911132812, -0.0596160888671875, -0.054515838623046875, -0.04941558837890625, -0.044315338134765625, -0.039215087890625, -0.034114837646484375, -0.02901458740234375, -0.023914337158203125, -0.0188140869140625, -0.013713836669921875, -0.00861358642578125, -0.003513336181640625, 0.0015869140625, 0.006687164306640625, 0.01178741455078125, 0.016887664794921875, 0.0219879150390625, 0.027088165283203125, 0.03218841552734375, 0.037288665771484375, 0.042388916015625, 0.047489166259765625, 0.05258941650390625, 0.057689666748046875, 0.0627899169921875, 0.06789016723632812, 0.07299041748046875, 0.07809066772460938, 0.08319091796875, 0.08829116821289062, 0.09339141845703125, 0.09849166870117188, 0.1035919189453125, 0.10869216918945312, 0.11379241943359375, 0.11889266967773438, 0.123992919921875, 0.12909317016601562, 0.13419342041015625, 0.13929367065429688, 0.1443939208984375, 0.14949417114257812, 0.15459442138671875, 0.15969467163085938, 0.164794921875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 5.0, 8.0, 5.0, 7.0, 9.0, 13.0, 8.0, 12.0, 13.0, 23.0, 28.0, 25.0, 32.0, 35.0, 33.0, 31.0, 43.0, 52.0, 38.0, 53.0, 38.0, 42.0, 52.0, 51.0, 34.0, 39.0, 33.0, 33.0, 24.0, 29.0, 22.0, 17.0, 17.0, 18.0, 17.0, 11.0, 12.0, 9.0, 9.0, 8.0, 3.0, 5.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1953125, -1.15576171875, -1.1162109375, -1.07666015625, -1.037109375, -0.99755859375, -0.9580078125, -0.91845703125, -0.87890625, -0.83935546875, -0.7998046875, -0.76025390625, -0.720703125, -0.68115234375, -0.6416015625, -0.60205078125, -0.5625, -0.52294921875, -0.4833984375, -0.44384765625, -0.404296875, -0.36474609375, -0.3251953125, -0.28564453125, -0.24609375, -0.20654296875, -0.1669921875, -0.12744140625, -0.087890625, -0.04833984375, -0.0087890625, 0.03076171875, 0.0703125, 0.10986328125, 0.1494140625, 0.18896484375, 0.228515625, 0.26806640625, 0.3076171875, 0.34716796875, 0.38671875, 0.42626953125, 0.4658203125, 0.50537109375, 0.544921875, 0.58447265625, 0.6240234375, 0.66357421875, 0.703125, 0.74267578125, 0.7822265625, 0.82177734375, 0.861328125, 0.90087890625, 0.9404296875, 0.97998046875, 1.01953125, 1.05908203125, 1.0986328125, 1.13818359375, 1.177734375, 1.21728515625, 1.2568359375, 1.29638671875, 1.3359375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 8.0, 5.0, 3.0, 7.0, 12.0, 16.0, 18.0, 16.0, 20.0, 39.0, 50.0, 84.0, 109.0, 167.0, 244.0, 440.0, 701.0, 1223.0, 2083.0, 4150.0, 9221.0, 25285.0, 101484.0, 531550.0, 289017.0, 52666.0, 16187.0, 6436.0, 3086.0, 1655.0, 958.0, 542.0, 349.0, 220.0, 159.0, 101.0, 56.0, 49.0, 36.0, 27.0, 30.0, 17.0, 8.0, 6.0, 8.0, 6.0, 8.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.051971435546875, -0.05038642883300781, -0.048801422119140625, -0.04721641540527344, -0.04563140869140625, -0.04404640197753906, -0.042461395263671875, -0.04087638854980469, -0.0392913818359375, -0.03770637512207031, -0.036121368408203125, -0.03453636169433594, -0.03295135498046875, -0.03136634826660156, -0.029781341552734375, -0.028196334838867188, -0.026611328125, -0.025026321411132812, -0.023441314697265625, -0.021856307983398438, -0.02027130126953125, -0.018686294555664062, -0.017101287841796875, -0.015516281127929688, -0.0139312744140625, -0.012346267700195312, -0.010761260986328125, -0.009176254272460938, -0.00759124755859375, -0.0060062408447265625, -0.004421234130859375, -0.0028362274169921875, -0.001251220703125, 0.0003337860107421875, 0.001918792724609375, 0.0035037994384765625, 0.00508880615234375, 0.0066738128662109375, 0.008258819580078125, 0.009843826293945312, 0.0114288330078125, 0.013013839721679688, 0.014598846435546875, 0.016183853149414062, 0.01776885986328125, 0.019353866577148438, 0.020938873291015625, 0.022523880004882812, 0.02410888671875, 0.025693893432617188, 0.027278900146484375, 0.028863906860351562, 0.03044891357421875, 0.03203392028808594, 0.033618927001953125, 0.03520393371582031, 0.0367889404296875, 0.03837394714355469, 0.039958953857421875, 0.04154396057128906, 0.04312896728515625, 0.04471397399902344, 0.046298980712890625, 0.04788398742675781, 0.049468994140625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 5.0, 8.0, 11.0, 11.0, 18.0, 26.0, 49.0, 94.0, 118.0, 154.0, 163.0, 113.0, 80.0, 46.0, 32.0, 30.0, 13.0, 7.0, 3.0, 4.0, 4.0, 5.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.2988529205322266e-05, -5.137734115123749e-05, -4.976615309715271e-05, -4.815496504306793e-05, -4.6543776988983154e-05, -4.4932588934898376e-05, -4.33214008808136e-05, -4.171021282672882e-05, -4.009902477264404e-05, -3.8487836718559265e-05, -3.687664866447449e-05, -3.526546061038971e-05, -3.365427255630493e-05, -3.2043084502220154e-05, -3.0431896448135376e-05, -2.8820708394050598e-05, -2.720952033996582e-05, -2.5598332285881042e-05, -2.3987144231796265e-05, -2.2375956177711487e-05, -2.076476812362671e-05, -1.915358006954193e-05, -1.7542392015457153e-05, -1.5931203961372375e-05, -1.4320015907287598e-05, -1.270882785320282e-05, -1.1097639799118042e-05, -9.486451745033264e-06, -7.875263690948486e-06, -6.2640756368637085e-06, -4.652887582778931e-06, -3.041699528694153e-06, -1.430511474609375e-06, 1.8067657947540283e-07, 1.7918646335601807e-06, 3.4030526876449585e-06, 5.014240741729736e-06, 6.625428795814514e-06, 8.236616849899292e-06, 9.84780490398407e-06, 1.1458992958068848e-05, 1.3070181012153625e-05, 1.4681369066238403e-05, 1.629255712032318e-05, 1.790374517440796e-05, 1.9514933228492737e-05, 2.1126121282577515e-05, 2.2737309336662292e-05, 2.434849739074707e-05, 2.5959685444831848e-05, 2.7570873498916626e-05, 2.9182061553001404e-05, 3.079324960708618e-05, 3.240443766117096e-05, 3.401562571525574e-05, 3.5626813769340515e-05, 3.723800182342529e-05, 3.884918987751007e-05, 4.046037793159485e-05, 4.2071565985679626e-05, 4.3682754039764404e-05, 4.529394209384918e-05, 4.690513014793396e-05, 4.851631820201874e-05, 5.0127506256103516e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 6.0, 13.0, 13.0, 20.0, 20.0, 40.0, 57.0, 68.0, 114.0, 129.0, 227.0, 351.0, 586.0, 925.0, 1762.0, 3307.0, 6981.0, 16810.0, 49474.0, 189472.0, 495007.0, 198672.0, 51857.0, 17590.0, 7307.0, 3398.0, 1762.0, 961.0, 569.0, 374.0, 210.0, 144.0, 94.0, 76.0, 42.0, 35.0, 20.0, 17.0, 11.0, 11.0, 4.0, 7.0, 5.0, 2.0, 3.0, 3.0, 1.0, 0.0, 3.0, 2.0], "bins": [-0.04522705078125, -0.04391670227050781, -0.042606353759765625, -0.04129600524902344, -0.03998565673828125, -0.03867530822753906, -0.037364959716796875, -0.03605461120605469, -0.0347442626953125, -0.03343391418457031, -0.032123565673828125, -0.030813217163085938, -0.02950286865234375, -0.028192520141601562, -0.026882171630859375, -0.025571823120117188, -0.024261474609375, -0.022951126098632812, -0.021640777587890625, -0.020330429077148438, -0.01902008056640625, -0.017709732055664062, -0.016399383544921875, -0.015089035034179688, -0.0137786865234375, -0.012468338012695312, -0.011157989501953125, -0.009847640991210938, -0.00853729248046875, -0.0072269439697265625, -0.005916595458984375, -0.0046062469482421875, -0.0032958984375, -0.0019855499267578125, -0.000675201416015625, 0.0006351470947265625, 0.00194549560546875, 0.0032558441162109375, 0.004566192626953125, 0.0058765411376953125, 0.0071868896484375, 0.008497238159179688, 0.009807586669921875, 0.011117935180664062, 0.01242828369140625, 0.013738632202148438, 0.015048980712890625, 0.016359329223632812, 0.017669677734375, 0.018980026245117188, 0.020290374755859375, 0.021600723266601562, 0.02291107177734375, 0.024221420288085938, 0.025531768798828125, 0.026842117309570312, 0.0281524658203125, 0.029462814331054688, 0.030773162841796875, 0.03208351135253906, 0.03339385986328125, 0.03470420837402344, 0.036014556884765625, 0.03732490539550781, 0.03863525390625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 5.0, 3.0, 7.0, 8.0, 12.0, 2.0, 13.0, 17.0, 28.0, 27.0, 46.0, 37.0, 52.0, 64.0, 70.0, 69.0, 78.0, 90.0, 62.0, 74.0, 38.0, 42.0, 29.0, 24.0, 25.0, 22.0, 10.0, 17.0, 10.0, 6.0, 6.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.010894775390625, -0.010493159294128418, -0.010091543197631836, -0.009689927101135254, -0.009288311004638672, -0.00888669490814209, -0.008485078811645508, -0.008083462715148926, -0.007681846618652344, -0.007280230522155762, -0.00687861442565918, -0.006476998329162598, -0.006075382232666016, -0.005673766136169434, -0.0052721500396728516, -0.0048705339431762695, -0.0044689178466796875, -0.0040673017501831055, -0.0036656856536865234, -0.0032640695571899414, -0.0028624534606933594, -0.0024608373641967773, -0.0020592212677001953, -0.0016576051712036133, -0.0012559890747070312, -0.0008543729782104492, -0.0004527568817138672, -5.1140785217285156e-05, 0.0003504753112792969, 0.0007520914077758789, 0.001153707504272461, 0.001555323600769043, 0.001956939697265625, 0.002358555793762207, 0.002760171890258789, 0.003161787986755371, 0.003563404083251953, 0.003965020179748535, 0.004366636276245117, 0.004768252372741699, 0.005169868469238281, 0.005571484565734863, 0.005973100662231445, 0.006374716758728027, 0.006776332855224609, 0.007177948951721191, 0.0075795650482177734, 0.007981181144714355, 0.008382797241210938, 0.00878441333770752, 0.009186029434204102, 0.009587645530700684, 0.009989261627197266, 0.010390877723693848, 0.01079249382019043, 0.011194109916687012, 0.011595726013183594, 0.011997342109680176, 0.012398958206176758, 0.01280057430267334, 0.013202190399169922, 0.013603806495666504, 0.014005422592163086, 0.014407038688659668, 0.01480865478515625]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 6.0, 31.0, 54.0, 267.0, 478.0, 112.0, 37.0, 9.0, 4.0, 5.0, 2.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.457675933837891, -4.319665431976318, -4.181655406951904, -4.043644905090332, -3.905634641647339, -3.7676243782043457, -3.6296138763427734, -3.4916036128997803, -3.353593349456787, -3.215583086013794, -3.077572822570801, -2.9395623207092285, -2.8015520572662354, -2.663541793823242, -2.52553129196167, -2.3875210285186768, -2.2495107650756836, -2.1115005016326904, -1.9734901189804077, -1.835479736328125, -1.6974694728851318, -1.5594592094421387, -1.421448826789856, -1.2834384441375732, -1.14542818069458, -1.007417917251587, -0.8694075345993042, -0.7313972115516663, -0.5933868885040283, -0.4553765654563904, -0.31736624240875244, -0.1793559193611145, -0.04134511947631836, 0.09666520357131958, 0.23467552661895752, 0.37268584966659546, 0.5106961727142334, 0.6487064957618713, 0.7867168188095093, 0.9247271418571472, 1.0627374649047852, 1.2007477283477783, 1.338758111000061, 1.4767684936523438, 1.614778757095337, 1.75278902053833, 1.8907994031906128, 2.0288097858428955, 2.1668200492858887, 2.304830312728882, 2.442840576171875, 2.5808510780334473, 2.7188613414764404, 2.8568716049194336, 2.994882106781006, 3.132892370223999, 3.270902633666992, 3.4089128971099854, 3.5469231605529785, 3.684933662414551, 3.822943925857544, 3.960954189300537, 4.098964691162109, 4.236974716186523, 4.374985218048096]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 8.0, 13.0, 19.0, 24.0, 51.0, 44.0, 75.0, 80.0, 102.0, 99.0, 104.0, 95.0, 78.0, 65.0, 43.0, 34.0, 35.0, 10.0, 6.0, 10.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8624941110610962, -1.8180227279663086, -1.7735512256622314, -1.7290798425674438, -1.6846084594726562, -1.640136957168579, -1.5956655740737915, -1.551194190979004, -1.5067226886749268, -1.4622513055801392, -1.417779803276062, -1.3733084201812744, -1.3288370370864868, -1.2843656539916992, -1.239894151687622, -1.1954227685928345, -1.1509513854980469, -1.1064800024032593, -1.0620085000991821, -1.0175371170043945, -0.9730657339096069, -0.9285942912101746, -0.8841228485107422, -0.8396514654159546, -0.7951800227165222, -0.7507085800170898, -0.7062371969223022, -0.6617657542228699, -0.6172943115234375, -0.5728229284286499, -0.5283514857292175, -0.48388007283210754, -0.4394086003303528, -0.3949371874332428, -0.3504657745361328, -0.30599433183670044, -0.26152291893959045, -0.21705150604248047, -0.1725800633430481, -0.1281086504459381, -0.08363723754882812, -0.03916581720113754, 0.0053056031465530396, 0.04977703094482422, 0.0942484438419342, 0.1387198567390442, 0.18319129943847656, 0.22766271233558655, 0.27213412523269653, 0.3166055381298065, 0.3610769510269165, 0.4055483937263489, 0.45001980662345886, 0.49449121952056885, 0.5389626622200012, 0.5834341049194336, 0.6279054880142212, 0.6723769307136536, 0.7168483138084412, 0.7613197565078735, 0.8057911396026611, 0.8502625823020935, 0.8947340250015259, 0.9392054080963135, 0.9836768507957458]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 4.0, 4.0, 12.0, 9.0, 17.0, 28.0, 39.0, 71.0, 125.0, 198.0, 386.0, 860.0, 2464.0, 11431.0, 390462.0, 624198.0, 13527.0, 2881.0, 949.0, 369.0, 200.0, 115.0, 76.0, 47.0, 31.0, 18.0, 14.0, 3.0, 4.0, 2.0, 2.0, 0.0, 3.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7783203125, -1.727569580078125, -1.67681884765625, -1.626068115234375, -1.5753173828125, -1.524566650390625, -1.47381591796875, -1.423065185546875, -1.372314453125, -1.321563720703125, -1.27081298828125, -1.220062255859375, -1.1693115234375, -1.118560791015625, -1.06781005859375, -1.017059326171875, -0.96630859375, -0.915557861328125, -0.86480712890625, -0.814056396484375, -0.7633056640625, -0.712554931640625, -0.66180419921875, -0.611053466796875, -0.560302734375, -0.509552001953125, -0.45880126953125, -0.408050537109375, -0.3572998046875, -0.306549072265625, -0.25579833984375, -0.205047607421875, -0.154296875, -0.103546142578125, -0.05279541015625, -0.002044677734375, 0.0487060546875, 0.099456787109375, 0.15020751953125, 0.200958251953125, 0.251708984375, 0.302459716796875, 0.35321044921875, 0.403961181640625, 0.4547119140625, 0.505462646484375, 0.55621337890625, 0.606964111328125, 0.65771484375, 0.708465576171875, 0.75921630859375, 0.809967041015625, 0.8607177734375, 0.911468505859375, 0.96221923828125, 1.012969970703125, 1.063720703125, 1.114471435546875, 1.16522216796875, 1.215972900390625, 1.2667236328125, 1.317474365234375, 1.36822509765625, 1.418975830078125, 1.4697265625]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 7.0, 6.0, 15.0, 18.0, 28.0, 39.0, 38.0, 56.0, 69.0, 89.0, 83.0, 95.0, 91.0, 75.0, 67.0, 60.0, 47.0, 31.0, 25.0, 25.0, 15.0, 3.0, 5.0, 6.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.640625, -2.56219482421875, -2.4837646484375, -2.40533447265625, -2.326904296875, -2.24847412109375, -2.1700439453125, -2.09161376953125, -2.01318359375, -1.93475341796875, -1.8563232421875, -1.77789306640625, -1.699462890625, -1.62103271484375, -1.5426025390625, -1.46417236328125, -1.3857421875, -1.30731201171875, -1.2288818359375, -1.15045166015625, -1.072021484375, -0.99359130859375, -0.9151611328125, -0.83673095703125, -0.75830078125, -0.67987060546875, -0.6014404296875, -0.52301025390625, -0.444580078125, -0.36614990234375, -0.2877197265625, -0.20928955078125, -0.130859375, -0.05242919921875, 0.0260009765625, 0.10443115234375, 0.182861328125, 0.26129150390625, 0.3397216796875, 0.41815185546875, 0.49658203125, 0.57501220703125, 0.6534423828125, 0.73187255859375, 0.810302734375, 0.88873291015625, 0.9671630859375, 1.04559326171875, 1.1240234375, 1.20245361328125, 1.2808837890625, 1.35931396484375, 1.437744140625, 1.51617431640625, 1.5946044921875, 1.67303466796875, 1.75146484375, 1.82989501953125, 1.9083251953125, 1.98675537109375, 2.065185546875, 2.14361572265625, 2.2220458984375, 2.30047607421875, 2.37890625]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 10.0, 3.0, 10.0, 4.0, 16.0, 13.0, 21.0, 25.0, 31.0, 66.0, 92.0, 125.0, 220.0, 314.0, 591.0, 975.0, 1654.0, 3594.0, 10190.0, 99596.0, 873907.0, 43284.0, 7294.0, 2893.0, 1432.0, 794.0, 486.0, 283.0, 189.0, 133.0, 77.0, 62.0, 44.0, 34.0, 20.0, 13.0, 10.0, 16.0, 9.0, 5.0, 4.0, 1.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0], "bins": [-1.0166015625, -0.9870223999023438, -0.9574432373046875, -0.9278640747070312, -0.898284912109375, -0.8687057495117188, -0.8391265869140625, -0.8095474243164062, -0.77996826171875, -0.7503890991210938, -0.7208099365234375, -0.6912307739257812, -0.661651611328125, -0.6320724487304688, -0.6024932861328125, -0.5729141235351562, -0.5433349609375, -0.5137557983398438, -0.4841766357421875, -0.45459747314453125, -0.425018310546875, -0.39543914794921875, -0.3658599853515625, -0.33628082275390625, -0.30670166015625, -0.27712249755859375, -0.2475433349609375, -0.21796417236328125, -0.188385009765625, -0.15880584716796875, -0.1292266845703125, -0.09964752197265625, -0.070068359375, -0.04048919677734375, -0.0109100341796875, 0.01866912841796875, 0.048248291015625, 0.07782745361328125, 0.1074066162109375, 0.13698577880859375, 0.16656494140625, 0.19614410400390625, 0.2257232666015625, 0.25530242919921875, 0.284881591796875, 0.31446075439453125, 0.3440399169921875, 0.37361907958984375, 0.4031982421875, 0.43277740478515625, 0.4623565673828125, 0.49193572998046875, 0.521514892578125, 0.5510940551757812, 0.5806732177734375, 0.6102523803710938, 0.63983154296875, 0.6694107055664062, 0.6989898681640625, 0.7285690307617188, 0.758148193359375, 0.7877273559570312, 0.8173065185546875, 0.8468856811523438, 0.87646484375]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 1.0, 4.0, 5.0, 5.0, 7.0, 10.0, 12.0, 23.0, 10.0, 14.0, 15.0, 25.0, 26.0, 28.0, 41.0, 37.0, 44.0, 42.0, 43.0, 47.0, 38.0, 36.0, 38.0, 35.0, 41.0, 46.0, 34.0, 52.0, 34.0, 16.0, 25.0, 30.0, 25.0, 16.0, 17.0, 13.0, 14.0, 17.0, 7.0, 9.0, 7.0, 4.0, 5.0, 1.0, 1.0, 3.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.47265625, -1.4248809814453125, -1.377105712890625, -1.3293304443359375, -1.28155517578125, -1.2337799072265625, -1.186004638671875, -1.1382293701171875, -1.0904541015625, -1.0426788330078125, -0.994903564453125, -0.9471282958984375, -0.89935302734375, -0.8515777587890625, -0.803802490234375, -0.7560272216796875, -0.708251953125, -0.6604766845703125, -0.612701416015625, -0.5649261474609375, -0.51715087890625, -0.4693756103515625, -0.421600341796875, -0.3738250732421875, -0.3260498046875, -0.2782745361328125, -0.230499267578125, -0.1827239990234375, -0.13494873046875, -0.0871734619140625, -0.039398193359375, 0.0083770751953125, 0.05615234375, 0.1039276123046875, 0.151702880859375, 0.1994781494140625, 0.24725341796875, 0.2950286865234375, 0.342803955078125, 0.3905792236328125, 0.4383544921875, 0.4861297607421875, 0.533905029296875, 0.5816802978515625, 0.62945556640625, 0.6772308349609375, 0.725006103515625, 0.7727813720703125, 0.820556640625, 0.8683319091796875, 0.916107177734375, 0.9638824462890625, 1.01165771484375, 1.0594329833984375, 1.107208251953125, 1.1549835205078125, 1.2027587890625, 1.2505340576171875, 1.298309326171875, 1.3460845947265625, 1.39385986328125, 1.4416351318359375, 1.489410400390625, 1.5371856689453125, 1.5849609375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 7.0, 5.0, 12.0, 16.0, 14.0, 25.0, 51.0, 58.0, 96.0, 222.0, 423.0, 1072.0, 3416.0, 21238.0, 895455.0, 115656.0, 7585.0, 1873.0, 647.0, 307.0, 139.0, 108.0, 43.0, 27.0, 19.0, 12.0, 12.0, 4.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.67431640625, -0.6549148559570312, -0.6355133056640625, -0.6161117553710938, -0.596710205078125, -0.5773086547851562, -0.5579071044921875, -0.5385055541992188, -0.51910400390625, -0.49970245361328125, -0.4803009033203125, -0.46089935302734375, -0.441497802734375, -0.42209625244140625, -0.4026947021484375, -0.38329315185546875, -0.3638916015625, -0.34449005126953125, -0.3250885009765625, -0.30568695068359375, -0.286285400390625, -0.26688385009765625, -0.2474822998046875, -0.22808074951171875, -0.20867919921875, -0.18927764892578125, -0.1698760986328125, -0.15047454833984375, -0.131072998046875, -0.11167144775390625, -0.0922698974609375, -0.07286834716796875, -0.053466796875, -0.03406524658203125, -0.0146636962890625, 0.00473785400390625, 0.024139404296875, 0.04354095458984375, 0.0629425048828125, 0.08234405517578125, 0.10174560546875, 0.12114715576171875, 0.1405487060546875, 0.15995025634765625, 0.179351806640625, 0.19875335693359375, 0.2181549072265625, 0.23755645751953125, 0.2569580078125, 0.27635955810546875, 0.2957611083984375, 0.31516265869140625, 0.334564208984375, 0.35396575927734375, 0.3733673095703125, 0.39276885986328125, 0.41217041015625, 0.43157196044921875, 0.4509735107421875, 0.47037506103515625, 0.489776611328125, 0.5091781616210938, 0.5285797119140625, 0.5479812622070312, 0.5673828125]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 5.0, 12.0, 20.0, 28.0, 46.0, 130.0, 386.0, 215.0, 72.0, 45.0, 15.0, 16.0, 8.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00018095970153808594, -0.00017732474952936172, -0.0001736897975206375, -0.0001700548455119133, -0.0001664198935031891, -0.00016278494149446487, -0.00015914998948574066, -0.00015551503747701645, -0.00015188008546829224, -0.00014824513345956802, -0.0001446101814508438, -0.0001409752294421196, -0.00013734027743339539, -0.00013370532542467117, -0.00013007037341594696, -0.00012643542140722275, -0.00012280046939849854, -0.00011916551738977432, -0.00011553056538105011, -0.0001118956133723259, -0.00010826066136360168, -0.00010462570935487747, -0.00010099075734615326, -9.735580533742905e-05, -9.372085332870483e-05, -9.008590131998062e-05, -8.645094931125641e-05, -8.28159973025322e-05, -7.918104529380798e-05, -7.554609328508377e-05, -7.191114127635956e-05, -6.827618926763535e-05, -6.464123725891113e-05, -6.100628525018692e-05, -5.737133324146271e-05, -5.3736381232738495e-05, -5.010142922401428e-05, -4.646647721529007e-05, -4.283152520656586e-05, -3.9196573197841644e-05, -3.556162118911743e-05, -3.192666918039322e-05, -2.8291717171669006e-05, -2.4656765162944794e-05, -2.102181315422058e-05, -1.738686114549637e-05, -1.3751909136772156e-05, -1.0116957128047943e-05, -6.4820051193237305e-06, -2.847053110599518e-06, 7.878988981246948e-07, 4.4228509068489075e-06, 8.05780291557312e-06, 1.1692754924297333e-05, 1.5327706933021545e-05, 1.8962658941745758e-05, 2.259761095046997e-05, 2.6232562959194183e-05, 2.9867514967918396e-05, 3.350246697664261e-05, 3.713741898536682e-05, 4.0772370994091034e-05, 4.4407323002815247e-05, 4.804227501153946e-05, 5.167722702026367e-05]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 3.0, 5.0, 12.0, 23.0, 26.0, 37.0, 80.0, 142.0, 299.0, 616.0, 1531.0, 4692.0, 23567.0, 858957.0, 142973.0, 10695.0, 3024.0, 944.0, 447.0, 216.0, 92.0, 54.0, 34.0, 24.0, 13.0, 9.0, 6.0, 9.0, 6.0, 4.0, 2.0, 6.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.483154296875, -0.4651222229003906, -0.44709014892578125, -0.4290580749511719, -0.4110260009765625, -0.3929939270019531, -0.37496185302734375, -0.3569297790527344, -0.338897705078125, -0.3208656311035156, -0.30283355712890625, -0.2848014831542969, -0.2667694091796875, -0.24873733520507812, -0.23070526123046875, -0.21267318725585938, -0.19464111328125, -0.17660903930664062, -0.15857696533203125, -0.14054489135742188, -0.1225128173828125, -0.10448074340820312, -0.08644866943359375, -0.06841659545898438, -0.050384521484375, -0.032352447509765625, -0.01432037353515625, 0.003711700439453125, 0.0217437744140625, 0.039775848388671875, 0.05780792236328125, 0.07583999633789062, 0.0938720703125, 0.11190414428710938, 0.12993621826171875, 0.14796829223632812, 0.1660003662109375, 0.18403244018554688, 0.20206451416015625, 0.22009658813476562, 0.238128662109375, 0.2561607360839844, 0.27419281005859375, 0.2922248840332031, 0.3102569580078125, 0.3282890319824219, 0.34632110595703125, 0.3643531799316406, 0.38238525390625, 0.4004173278808594, 0.41844940185546875, 0.4364814758300781, 0.4545135498046875, 0.4725456237792969, 0.49057769775390625, 0.5086097717285156, 0.526641845703125, 0.5446739196777344, 0.5627059936523438, 0.5807380676269531, 0.5987701416015625, 0.6168022155761719, 0.6348342895507812, 0.6528663635253906, 0.6708984375]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 5.0, 3.0, 1.0, 1.0, 7.0, 5.0, 5.0, 20.0, 13.0, 29.0, 38.0, 57.0, 112.0, 171.0, 228.0, 97.0, 67.0, 51.0, 22.0, 14.0, 15.0, 9.0, 6.0, 4.0, 3.0, 2.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.2041015625, -0.19887542724609375, -0.1936492919921875, -0.18842315673828125, -0.183197021484375, -0.17797088623046875, -0.1727447509765625, -0.16751861572265625, -0.16229248046875, -0.15706634521484375, -0.1518402099609375, -0.14661407470703125, -0.141387939453125, -0.13616180419921875, -0.1309356689453125, -0.12570953369140625, -0.1204833984375, -0.11525726318359375, -0.1100311279296875, -0.10480499267578125, -0.099578857421875, -0.09435272216796875, -0.0891265869140625, -0.08390045166015625, -0.07867431640625, -0.07344818115234375, -0.0682220458984375, -0.06299591064453125, -0.057769775390625, -0.05254364013671875, -0.0473175048828125, -0.04209136962890625, -0.036865234375, -0.03163909912109375, -0.0264129638671875, -0.02118682861328125, -0.015960693359375, -0.01073455810546875, -0.0055084228515625, -0.00028228759765625, 0.00494384765625, 0.01016998291015625, 0.0153961181640625, 0.02062225341796875, 0.025848388671875, 0.03107452392578125, 0.0363006591796875, 0.04152679443359375, 0.0467529296875, 0.05197906494140625, 0.0572052001953125, 0.06243133544921875, 0.067657470703125, 0.07288360595703125, 0.0781097412109375, 0.08333587646484375, 0.08856201171875, 0.09378814697265625, 0.0990142822265625, 0.10424041748046875, 0.109466552734375, 0.11469268798828125, 0.1199188232421875, 0.12514495849609375, 0.13037109375]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 9.0, 16.0, 25.0, 46.0, 101.0, 196.0, 310.0, 149.0, 66.0, 34.0, 24.0, 6.0, 5.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.903681993484497, -2.7609798908233643, -2.6182777881622314, -2.4755756855010986, -2.3328733444213867, -2.190171241760254, -2.047469139099121, -1.9047670364379883, -1.7620649337768555, -1.6193628311157227, -1.4766607284545898, -1.3339585065841675, -1.1912564039230347, -1.0485543012619019, -0.9058521389961243, -0.7631499767303467, -0.6204478740692139, -0.47774574160575867, -0.33504360914230347, -0.19234147667884827, -0.049639344215393066, 0.09306275844573975, 0.23576492071151733, 0.3784670829772949, 0.5211691856384277, 0.6638712882995605, 0.8065734505653381, 0.9492756128311157, 1.0919777154922485, 1.2346798181533813, 1.3773820400238037, 1.5200841426849365, 1.6627860069274902, 1.805488109588623, 1.9481902122497559, 2.0908923149108887, 2.2335944175720215, 2.3762965202331543, 2.518998861312866, 2.661700963973999, 2.804403066635132, 2.9471051692962646, 3.0898072719573975, 3.2325093746185303, 3.375211715698242, 3.517913818359375, 3.660615921020508, 3.8033180236816406, 3.9460201263427734, 4.088722229003906, 4.231424331665039, 4.374126434326172, 4.516828536987305, 4.6595306396484375, 4.80223274230957, 4.944934844970703, 5.087636947631836, 5.230339050292969, 5.373041152954102, 5.515743255615234, 5.658445358276367, 5.8011474609375, 5.943849563598633, 6.086551666259766, 6.229254245758057]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 6.0, 10.0, 6.0, 5.0, 19.0, 17.0, 17.0, 24.0, 33.0, 29.0, 34.0, 51.0, 49.0, 44.0, 60.0, 47.0, 62.0, 52.0, 45.0, 58.0, 40.0, 51.0, 36.0, 42.0, 36.0, 27.0, 26.0, 23.0, 15.0, 15.0, 8.0, 5.0, 4.0, 5.0, 3.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0103719234466553, -2.907381772994995, -2.804391384124756, -2.7014012336730957, -2.5984108448028564, -2.4954206943511963, -2.392430305480957, -2.289440155029297, -2.1864500045776367, -2.0834598541259766, -1.9804694652557373, -1.8774793148040771, -1.7744890451431274, -1.6714987754821777, -1.568508505821228, -1.4655182361602783, -1.3625279664993286, -1.259537696838379, -1.1565474271774292, -1.0535571575164795, -0.9505670070648193, -0.8475767374038696, -0.7445864677429199, -0.641596257686615, -0.5386059880256653, -0.43561574816703796, -0.33262550830841064, -0.22963523864746094, -0.12664499878883362, -0.0236547589302063, 0.07933551073074341, 0.18232572078704834, 0.28531599044799805, 0.38830623030662537, 0.4912964701652527, 0.5942867398262024, 0.6972769498825073, 0.800267219543457, 0.9032574892044067, 1.0062477588653564, 1.1092379093170166, 1.2122281789779663, 1.315218448638916, 1.4182085990905762, 1.5211988687515259, 1.6241891384124756, 1.7271794080734253, 1.830169677734375, 1.9331599473953247, 2.0361502170562744, 2.1391403675079346, 2.242130756378174, 2.345120906829834, 2.448111057281494, 2.5511014461517334, 2.6540915966033936, 2.757081985473633, 2.860072135925293, 2.9630625247955322, 3.0660526752471924, 3.1690430641174316, 3.272033214569092, 3.375023365020752, 3.478013753890991, 3.5810039043426514]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 8.0, 5.0, 3.0, 2.0, 5.0, 9.0, 11.0, 11.0, 9.0, 12.0, 23.0, 34.0, 45.0, 68.0, 98.0, 160.0, 296.0, 461.0, 778.0, 1639.0, 3986.0, 15256.0, 213345.0, 3794245.0, 140270.0, 14421.0, 4736.0, 2041.0, 918.0, 490.0, 292.0, 203.0, 111.0, 88.0, 62.0, 39.0, 40.0, 25.0, 11.0, 8.0, 9.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-3.111328125, -3.0324859619140625, -2.953643798828125, -2.8748016357421875, -2.79595947265625, -2.7171173095703125, -2.638275146484375, -2.5594329833984375, -2.4805908203125, -2.4017486572265625, -2.322906494140625, -2.2440643310546875, -2.16522216796875, -2.0863800048828125, -2.007537841796875, -1.9286956787109375, -1.849853515625, -1.7710113525390625, -1.692169189453125, -1.6133270263671875, -1.53448486328125, -1.4556427001953125, -1.376800537109375, -1.2979583740234375, -1.2191162109375, -1.1402740478515625, -1.061431884765625, -0.9825897216796875, -0.90374755859375, -0.8249053955078125, -0.746063232421875, -0.6672210693359375, -0.58837890625, -0.5095367431640625, -0.430694580078125, -0.3518524169921875, -0.27301025390625, -0.1941680908203125, -0.115325927734375, -0.0364837646484375, 0.0423583984375, 0.1212005615234375, 0.200042724609375, 0.2788848876953125, 0.35772705078125, 0.4365692138671875, 0.515411376953125, 0.5942535400390625, 0.673095703125, 0.7519378662109375, 0.830780029296875, 0.9096221923828125, 0.98846435546875, 1.0673065185546875, 1.146148681640625, 1.2249908447265625, 1.3038330078125, 1.3826751708984375, 1.461517333984375, 1.5403594970703125, 1.61920166015625, 1.6980438232421875, 1.776885986328125, 1.8557281494140625, 1.9345703125]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 2.0, 10.0, 6.0, 14.0, 22.0, 30.0, 42.0, 54.0, 65.0, 95.0, 110.0, 94.0, 93.0, 85.0, 71.0, 61.0, 38.0, 26.0, 26.0, 24.0, 13.0, 5.0, 9.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8837890625, -1.833709716796875, -1.78363037109375, -1.733551025390625, -1.6834716796875, -1.633392333984375, -1.58331298828125, -1.533233642578125, -1.483154296875, -1.433074951171875, -1.38299560546875, -1.332916259765625, -1.2828369140625, -1.232757568359375, -1.18267822265625, -1.132598876953125, -1.08251953125, -1.032440185546875, -0.98236083984375, -0.932281494140625, -0.8822021484375, -0.832122802734375, -0.78204345703125, -0.731964111328125, -0.681884765625, -0.631805419921875, -0.58172607421875, -0.531646728515625, -0.4815673828125, -0.431488037109375, -0.38140869140625, -0.331329345703125, -0.28125, -0.231170654296875, -0.18109130859375, -0.131011962890625, -0.0809326171875, -0.030853271484375, 0.01922607421875, 0.069305419921875, 0.119384765625, 0.169464111328125, 0.21954345703125, 0.269622802734375, 0.3197021484375, 0.369781494140625, 0.41986083984375, 0.469940185546875, 0.52001953125, 0.570098876953125, 0.62017822265625, 0.670257568359375, 0.7203369140625, 0.770416259765625, 0.82049560546875, 0.870574951171875, 0.920654296875, 0.970733642578125, 1.02081298828125, 1.070892333984375, 1.1209716796875, 1.171051025390625, 1.22113037109375, 1.271209716796875, 1.3212890625]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 9.0, 7.0, 5.0, 13.0, 16.0, 18.0, 31.0, 43.0, 55.0, 70.0, 112.0, 193.0, 336.0, 555.0, 1086.0, 2335.0, 5272.0, 15379.0, 82500.0, 3821435.0, 227651.0, 23966.0, 7162.0, 2847.0, 1383.0, 765.0, 379.0, 231.0, 149.0, 88.0, 56.0, 43.0, 22.0, 17.0, 12.0, 15.0, 7.0, 7.0, 5.0, 4.0, 2.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.923828125, -1.861083984375, -1.79833984375, -1.735595703125, -1.6728515625, -1.610107421875, -1.54736328125, -1.484619140625, -1.421875, -1.359130859375, -1.29638671875, -1.233642578125, -1.1708984375, -1.108154296875, -1.04541015625, -0.982666015625, -0.919921875, -0.857177734375, -0.79443359375, -0.731689453125, -0.6689453125, -0.606201171875, -0.54345703125, -0.480712890625, -0.41796875, -0.355224609375, -0.29248046875, -0.229736328125, -0.1669921875, -0.104248046875, -0.04150390625, 0.021240234375, 0.083984375, 0.146728515625, 0.20947265625, 0.272216796875, 0.3349609375, 0.397705078125, 0.46044921875, 0.523193359375, 0.5859375, 0.648681640625, 0.71142578125, 0.774169921875, 0.8369140625, 0.899658203125, 0.96240234375, 1.025146484375, 1.087890625, 1.150634765625, 1.21337890625, 1.276123046875, 1.3388671875, 1.401611328125, 1.46435546875, 1.527099609375, 1.58984375, 1.652587890625, 1.71533203125, 1.778076171875, 1.8408203125, 1.903564453125, 1.96630859375, 2.029052734375, 2.091796875]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 7.0, 3.0, 3.0, 10.0, 5.0, 8.0, 17.0, 12.0, 18.0, 29.0, 36.0, 83.0, 191.0, 476.0, 1287.0, 1072.0, 434.0, 161.0, 70.0, 43.0, 24.0, 17.0, 16.0, 10.0, 7.0, 4.0, 6.0, 4.0, 2.0, 2.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.61767578125, -0.5994491577148438, -0.5812225341796875, -0.5629959106445312, -0.544769287109375, -0.5265426635742188, -0.5083160400390625, -0.49008941650390625, -0.47186279296875, -0.45363616943359375, -0.4354095458984375, -0.41718292236328125, -0.398956298828125, -0.38072967529296875, -0.3625030517578125, -0.34427642822265625, -0.3260498046875, -0.30782318115234375, -0.2895965576171875, -0.27136993408203125, -0.253143310546875, -0.23491668701171875, -0.2166900634765625, -0.19846343994140625, -0.18023681640625, -0.16201019287109375, -0.1437835693359375, -0.12555694580078125, -0.107330322265625, -0.08910369873046875, -0.0708770751953125, -0.05265045166015625, -0.034423828125, -0.01619720458984375, 0.0020294189453125, 0.02025604248046875, 0.038482666015625, 0.05670928955078125, 0.0749359130859375, 0.09316253662109375, 0.11138916015625, 0.12961578369140625, 0.1478424072265625, 0.16606903076171875, 0.184295654296875, 0.20252227783203125, 0.2207489013671875, 0.23897552490234375, 0.2572021484375, 0.27542877197265625, 0.2936553955078125, 0.31188201904296875, 0.330108642578125, 0.34833526611328125, 0.3665618896484375, 0.38478851318359375, 0.40301513671875, 0.42124176025390625, 0.4394683837890625, 0.45769500732421875, 0.475921630859375, 0.49414825439453125, 0.5123748779296875, 0.5306015014648438, 0.548828125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 7.0, 4.0, 2.0, 1.0, 4.0, 5.0, 8.0, 19.0, 17.0, 52.0, 51.0, 103.0, 130.0, 176.0, 158.0, 100.0, 59.0, 34.0, 29.0, 16.0, 8.0, 7.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7705849409103394, -1.701843023300171, -1.6331011056900024, -1.564359188079834, -1.495617151260376, -1.4268752336502075, -1.358133316040039, -1.2893913984298706, -1.2206494808197021, -1.1519075632095337, -1.0831656455993652, -1.0144236087799072, -0.9456816911697388, -0.8769397735595703, -0.8081978559494019, -0.7394559383392334, -0.6707139015197754, -0.6019719839096069, -0.5332300066947937, -0.46448808908462524, -0.3957461416721344, -0.32700419425964355, -0.2582622766494751, -0.18952032923698425, -0.12077838182449341, -0.05203644186258316, 0.016705498099327087, 0.08544743061065674, 0.15418937802314758, 0.22293132543563843, 0.2916732430458069, 0.36041519045829773, 0.4291572570800781, 0.49789920449256897, 0.5666411519050598, 0.6353830695152283, 0.7041250467300415, 0.77286696434021, 0.8416088819503784, 0.9103507995605469, 0.9790927767753601, 1.0478347539901733, 1.1165766716003418, 1.1853185892105103, 1.2540605068206787, 1.3228025436401367, 1.3915443420410156, 1.4602863788604736, 1.529028296470642, 1.5977702140808105, 1.666512131690979, 1.7352540493011475, 1.8039960861206055, 1.872738003730774, 1.9414799213409424, 2.0102219581604004, 2.0789637565612793, 2.1477057933807373, 2.216447591781616, 2.285189628601074, 2.353931427001953, 2.422673463821411, 2.491415500640869, 2.560157299041748, 2.628899335861206]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 4.0, 3.0, 9.0, 1.0, 12.0, 13.0, 20.0, 22.0, 30.0, 42.0, 36.0, 41.0, 52.0, 69.0, 67.0, 65.0, 61.0, 55.0, 57.0, 61.0, 41.0, 53.0, 32.0, 43.0, 24.0, 27.0, 23.0, 9.0, 16.0, 12.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4072253704071045, -1.364511489868164, -1.3217976093292236, -1.2790837287902832, -1.2363698482513428, -1.1936559677124023, -1.150942087173462, -1.1082282066345215, -1.065514326095581, -1.0228004455566406, -0.9800865650177002, -0.9373726844787598, -0.8946588039398193, -0.8519449234008789, -0.8092310428619385, -0.766517162322998, -0.7238032817840576, -0.6810894012451172, -0.6383755207061768, -0.5956616401672363, -0.5529477596282959, -0.5102338790893555, -0.46751999855041504, -0.4248061180114746, -0.3820922374725342, -0.33937835693359375, -0.2966644763946533, -0.2539505958557129, -0.21123671531677246, -0.16852283477783203, -0.1258089542388916, -0.08309507369995117, -0.04038119316101074, 0.0023326873779296875, 0.04504656791687012, 0.08776044845581055, 0.13047432899475098, 0.1731882095336914, 0.21590209007263184, 0.25861597061157227, 0.3013298511505127, 0.3440437316894531, 0.38675761222839355, 0.429471492767334, 0.4721853733062744, 0.5148992538452148, 0.5576131343841553, 0.6003270149230957, 0.6430408954620361, 0.6857547760009766, 0.728468656539917, 0.7711825370788574, 0.8138964176177979, 0.8566102981567383, 0.8993241786956787, 0.9420380592346191, 0.9847519397735596, 1.0274658203125, 1.0701797008514404, 1.1128935813903809, 1.1556074619293213, 1.1983213424682617, 1.2410352230072021, 1.2837491035461426, 1.326462984085083]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [4.0, 3.0, 0.0, 3.0, 1.0, 1.0, 5.0, 3.0, 3.0, 5.0, 2.0, 4.0, 13.0, 17.0, 23.0, 56.0, 82.0, 151.0, 290.0, 519.0, 1208.0, 3037.0, 9980.0, 69193.0, 847330.0, 98462.0, 12087.0, 3389.0, 1388.0, 643.0, 299.0, 150.0, 65.0, 40.0, 36.0, 33.0, 11.0, 13.0, 6.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45068359375, -0.43233489990234375, -0.4139862060546875, -0.39563751220703125, -0.377288818359375, -0.35894012451171875, -0.3405914306640625, -0.32224273681640625, -0.30389404296875, -0.28554534912109375, -0.2671966552734375, -0.24884796142578125, -0.230499267578125, -0.21215057373046875, -0.1938018798828125, -0.17545318603515625, -0.1571044921875, -0.13875579833984375, -0.1204071044921875, -0.10205841064453125, -0.083709716796875, -0.06536102294921875, -0.0470123291015625, -0.02866363525390625, -0.01031494140625, 0.00803375244140625, 0.0263824462890625, 0.04473114013671875, 0.063079833984375, 0.08142852783203125, 0.0997772216796875, 0.11812591552734375, 0.136474609375, 0.15482330322265625, 0.1731719970703125, 0.19152069091796875, 0.209869384765625, 0.22821807861328125, 0.2465667724609375, 0.26491546630859375, 0.28326416015625, 0.30161285400390625, 0.3199615478515625, 0.33831024169921875, 0.356658935546875, 0.37500762939453125, 0.3933563232421875, 0.41170501708984375, 0.4300537109375, 0.44840240478515625, 0.4667510986328125, 0.48509979248046875, 0.503448486328125, 0.5217971801757812, 0.5401458740234375, 0.5584945678710938, 0.57684326171875, 0.5951919555664062, 0.6135406494140625, 0.6318893432617188, 0.650238037109375, 0.6685867309570312, 0.6869354248046875, 0.7052841186523438, 0.7236328125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 6.0, 4.0, 2.0, 4.0, 8.0, 11.0, 16.0, 23.0, 43.0, 51.0, 48.0, 73.0, 87.0, 105.0, 103.0, 87.0, 80.0, 73.0, 50.0, 42.0, 28.0, 24.0, 23.0, 14.0, 8.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.6376953125, -1.5970611572265625, -1.556427001953125, -1.5157928466796875, -1.47515869140625, -1.4345245361328125, -1.393890380859375, -1.3532562255859375, -1.3126220703125, -1.2719879150390625, -1.231353759765625, -1.1907196044921875, -1.15008544921875, -1.1094512939453125, -1.068817138671875, -1.0281829833984375, -0.987548828125, -0.9469146728515625, -0.906280517578125, -0.8656463623046875, -0.82501220703125, -0.7843780517578125, -0.743743896484375, -0.7031097412109375, -0.6624755859375, -0.6218414306640625, -0.581207275390625, -0.5405731201171875, -0.49993896484375, -0.4593048095703125, -0.418670654296875, -0.3780364990234375, -0.33740234375, -0.2967681884765625, -0.256134033203125, -0.2154998779296875, -0.17486572265625, -0.1342315673828125, -0.093597412109375, -0.0529632568359375, -0.0123291015625, 0.0283050537109375, 0.068939208984375, 0.1095733642578125, 0.15020751953125, 0.1908416748046875, 0.231475830078125, 0.2721099853515625, 0.312744140625, 0.3533782958984375, 0.394012451171875, 0.4346466064453125, 0.47528076171875, 0.5159149169921875, 0.556549072265625, 0.5971832275390625, 0.6378173828125, 0.6784515380859375, 0.719085693359375, 0.7597198486328125, 0.80035400390625, 0.8409881591796875, 0.881622314453125, 0.9222564697265625, 0.962890625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 3.0, 5.0, 7.0, 5.0, 5.0, 8.0, 20.0, 22.0, 27.0, 56.0, 73.0, 144.0, 220.0, 299.0, 552.0, 942.0, 1705.0, 3222.0, 7259.0, 21659.0, 112437.0, 694756.0, 161212.0, 27231.0, 8364.0, 3823.0, 1815.0, 1053.0, 620.0, 343.0, 217.0, 149.0, 98.0, 64.0, 42.0, 23.0, 24.0, 14.0, 13.0, 6.0, 3.0, 2.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.281982421875, -0.2727622985839844, -0.26354217529296875, -0.2543220520019531, -0.2451019287109375, -0.23588180541992188, -0.22666168212890625, -0.21744155883789062, -0.208221435546875, -0.19900131225585938, -0.18978118896484375, -0.18056106567382812, -0.1713409423828125, -0.16212081909179688, -0.15290069580078125, -0.14368057250976562, -0.13446044921875, -0.12524032592773438, -0.11602020263671875, -0.10680007934570312, -0.0975799560546875, -0.08835983276367188, -0.07913970947265625, -0.06991958618164062, -0.060699462890625, -0.051479339599609375, -0.04225921630859375, -0.033039093017578125, -0.0238189697265625, -0.014598846435546875, -0.00537872314453125, 0.003841400146484375, 0.0130615234375, 0.022281646728515625, 0.03150177001953125, 0.040721893310546875, 0.0499420166015625, 0.059162139892578125, 0.06838226318359375, 0.07760238647460938, 0.086822509765625, 0.09604263305664062, 0.10526275634765625, 0.11448287963867188, 0.1237030029296875, 0.13292312622070312, 0.14214324951171875, 0.15136337280273438, 0.16058349609375, 0.16980361938476562, 0.17902374267578125, 0.18824386596679688, 0.1974639892578125, 0.20668411254882812, 0.21590423583984375, 0.22512435913085938, 0.234344482421875, 0.24356460571289062, 0.25278472900390625, 0.2620048522949219, 0.2712249755859375, 0.2804450988769531, 0.28966522216796875, 0.2988853454589844, 0.30810546875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 1.0, 6.0, 3.0, 10.0, 4.0, 11.0, 7.0, 10.0, 14.0, 15.0, 29.0, 18.0, 25.0, 31.0, 38.0, 34.0, 35.0, 52.0, 40.0, 46.0, 56.0, 38.0, 49.0, 35.0, 47.0, 40.0, 38.0, 48.0, 30.0, 29.0, 30.0, 19.0, 23.0, 20.0, 9.0, 8.0, 7.0, 10.0, 12.0, 3.0, 9.0, 6.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0634765625, -1.0264739990234375, -0.989471435546875, -0.9524688720703125, -0.91546630859375, -0.8784637451171875, -0.841461181640625, -0.8044586181640625, -0.7674560546875, -0.7304534912109375, -0.693450927734375, -0.6564483642578125, -0.61944580078125, -0.5824432373046875, -0.545440673828125, -0.5084381103515625, -0.471435546875, -0.4344329833984375, -0.397430419921875, -0.3604278564453125, -0.32342529296875, -0.2864227294921875, -0.249420166015625, -0.2124176025390625, -0.1754150390625, -0.1384124755859375, -0.101409912109375, -0.0644073486328125, -0.02740478515625, 0.0095977783203125, 0.046600341796875, 0.0836029052734375, 0.12060546875, 0.1576080322265625, 0.194610595703125, 0.2316131591796875, 0.26861572265625, 0.3056182861328125, 0.342620849609375, 0.3796234130859375, 0.4166259765625, 0.4536285400390625, 0.490631103515625, 0.5276336669921875, 0.56463623046875, 0.6016387939453125, 0.638641357421875, 0.6756439208984375, 0.712646484375, 0.7496490478515625, 0.786651611328125, 0.8236541748046875, 0.86065673828125, 0.8976593017578125, 0.934661865234375, 0.9716644287109375, 1.0086669921875, 1.0456695556640625, 1.082672119140625, 1.1196746826171875, 1.15667724609375, 1.1936798095703125, 1.230682373046875, 1.2676849365234375, 1.3046875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 5.0, 10.0, 13.0, 15.0, 23.0, 31.0, 71.0, 130.0, 241.0, 640.0, 1949.0, 8591.0, 86737.0, 883729.0, 56718.0, 6816.0, 1680.0, 605.0, 234.0, 116.0, 77.0, 38.0, 39.0, 16.0, 12.0, 7.0, 2.0, 3.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13232421875, -0.1275005340576172, -0.12267684936523438, -0.11785316467285156, -0.11302947998046875, -0.10820579528808594, -0.10338211059570312, -0.09855842590332031, -0.0937347412109375, -0.08891105651855469, -0.08408737182617188, -0.07926368713378906, -0.07444000244140625, -0.06961631774902344, -0.06479263305664062, -0.05996894836425781, -0.055145263671875, -0.05032157897949219, -0.045497894287109375, -0.04067420959472656, -0.03585052490234375, -0.031026840209960938, -0.026203155517578125, -0.021379470825195312, -0.0165557861328125, -0.011732101440429688, -0.006908416748046875, -0.0020847320556640625, 0.00273895263671875, 0.0075626373291015625, 0.012386322021484375, 0.017210006713867188, 0.02203369140625, 0.026857376098632812, 0.031681060791015625, 0.03650474548339844, 0.04132843017578125, 0.04615211486816406, 0.050975799560546875, 0.05579948425292969, 0.0606231689453125, 0.06544685363769531, 0.07027053833007812, 0.07509422302246094, 0.07991790771484375, 0.08474159240722656, 0.08956527709960938, 0.09438896179199219, 0.099212646484375, 0.10403633117675781, 0.10886001586914062, 0.11368370056152344, 0.11850738525390625, 0.12333106994628906, 0.12815475463867188, 0.1329784393310547, 0.1378021240234375, 0.1426258087158203, 0.14744949340820312, 0.15227317810058594, 0.15709686279296875, 0.16192054748535156, 0.16674423217773438, 0.1715679168701172, 0.1763916015625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 5.0, 5.0, 5.0, 9.0, 9.0, 32.0, 57.0, 148.0, 276.0, 254.0, 115.0, 41.0, 12.0, 13.0, 10.0, 6.0, 1.0, 2.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011628866195678711, -0.00011304859071969986, -0.00010980851948261261, -0.00010656844824552536, -0.00010332837700843811, -0.00010008830577135086, -9.684823453426361e-05, -9.360816329717636e-05, -9.036809206008911e-05, -8.712802082300186e-05, -8.388794958591461e-05, -8.064787834882736e-05, -7.740780711174011e-05, -7.416773587465286e-05, -7.092766463756561e-05, -6.768759340047836e-05, -6.444752216339111e-05, -6.120745092630386e-05, -5.7967379689216614e-05, -5.4727308452129364e-05, -5.1487237215042114e-05, -4.8247165977954865e-05, -4.5007094740867615e-05, -4.1767023503780365e-05, -3.8526952266693115e-05, -3.5286881029605865e-05, -3.2046809792518616e-05, -2.8806738555431366e-05, -2.5566667318344116e-05, -2.2326596081256866e-05, -1.9086524844169617e-05, -1.5846453607082367e-05, -1.2606382369995117e-05, -9.366311132907867e-06, -6.126239895820618e-06, -2.886168658733368e-06, 3.5390257835388184e-07, 3.5939738154411316e-06, 6.834045052528381e-06, 1.0074116289615631e-05, 1.3314187526702881e-05, 1.655425876379013e-05, 1.979433000087738e-05, 2.303440123796463e-05, 2.627447247505188e-05, 2.951454371213913e-05, 3.275461494922638e-05, 3.599468618631363e-05, 3.923475742340088e-05, 4.247482866048813e-05, 4.571489989757538e-05, 4.895497113466263e-05, 5.219504237174988e-05, 5.543511360883713e-05, 5.867518484592438e-05, 6.191525608301163e-05, 6.515532732009888e-05, 6.839539855718613e-05, 7.163546979427338e-05, 7.487554103136063e-05, 7.811561226844788e-05, 8.135568350553513e-05, 8.459575474262238e-05, 8.783582597970963e-05, 9.107589721679688e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 0.0, 3.0, 7.0, 4.0, 8.0, 8.0, 8.0, 13.0, 18.0, 35.0, 40.0, 52.0, 74.0, 107.0, 169.0, 240.0, 379.0, 580.0, 980.0, 1519.0, 2935.0, 5630.0, 13212.0, 41811.0, 213342.0, 585486.0, 130760.0, 29874.0, 10464.0, 4631.0, 2353.0, 1390.0, 813.0, 537.0, 345.0, 209.0, 138.0, 112.0, 78.0, 44.0, 44.0, 28.0, 19.0, 10.0, 23.0, 6.0, 5.0, 3.0, 5.0, 5.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.07244873046875, -0.07021045684814453, -0.06797218322753906, -0.0657339096069336, -0.06349563598632812, -0.061257362365722656, -0.05901908874511719, -0.05678081512451172, -0.05454254150390625, -0.05230426788330078, -0.05006599426269531, -0.047827720642089844, -0.045589447021484375, -0.043351173400878906, -0.04111289978027344, -0.03887462615966797, -0.0366363525390625, -0.03439807891845703, -0.03215980529785156, -0.029921531677246094, -0.027683258056640625, -0.025444984436035156, -0.023206710815429688, -0.02096843719482422, -0.01873016357421875, -0.01649188995361328, -0.014253616333007812, -0.012015342712402344, -0.009777069091796875, -0.007538795471191406, -0.0053005218505859375, -0.0030622482299804688, -0.000823974609375, 0.0014142990112304688, 0.0036525726318359375, 0.005890846252441406, 0.008129119873046875, 0.010367393493652344, 0.012605667114257812, 0.014843940734863281, 0.01708221435546875, 0.01932048797607422, 0.021558761596679688, 0.023797035217285156, 0.026035308837890625, 0.028273582458496094, 0.030511856079101562, 0.03275012969970703, 0.0349884033203125, 0.03722667694091797, 0.03946495056152344, 0.041703224182128906, 0.043941497802734375, 0.046179771423339844, 0.04841804504394531, 0.05065631866455078, 0.05289459228515625, 0.05513286590576172, 0.05737113952636719, 0.059609413146972656, 0.061847686767578125, 0.0640859603881836, 0.06632423400878906, 0.06856250762939453, 0.07080078125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 6.0, 9.0, 9.0, 18.0, 14.0, 26.0, 41.0, 51.0, 94.0, 117.0, 140.0, 123.0, 89.0, 77.0, 56.0, 43.0, 25.0, 17.0, 10.0, 8.0, 5.0, 4.0, 2.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.024139404296875, -0.02335071563720703, -0.022562026977539062, -0.021773338317871094, -0.020984649658203125, -0.020195960998535156, -0.019407272338867188, -0.01861858367919922, -0.01782989501953125, -0.01704120635986328, -0.016252517700195312, -0.015463829040527344, -0.014675140380859375, -0.013886451721191406, -0.013097763061523438, -0.012309074401855469, -0.0115203857421875, -0.010731697082519531, -0.009943008422851562, -0.009154319763183594, -0.008365631103515625, -0.007576942443847656, -0.0067882537841796875, -0.005999565124511719, -0.00521087646484375, -0.004422187805175781, -0.0036334991455078125, -0.0028448104858398438, -0.002056121826171875, -0.0012674331665039062, -0.0004787445068359375, 0.00030994415283203125, 0.0010986328125, 0.0018873214721679688, 0.0026760101318359375, 0.0034646987915039062, 0.004253387451171875, 0.005042076110839844, 0.0058307647705078125, 0.006619453430175781, 0.00740814208984375, 0.008196830749511719, 0.008985519409179688, 0.009774208068847656, 0.010562896728515625, 0.011351585388183594, 0.012140274047851562, 0.012928962707519531, 0.0137176513671875, 0.014506340026855469, 0.015295028686523438, 0.016083717346191406, 0.016872406005859375, 0.017661094665527344, 0.018449783325195312, 0.01923847198486328, 0.02002716064453125, 0.02081584930419922, 0.021604537963867188, 0.022393226623535156, 0.023181915283203125, 0.023970603942871094, 0.024759292602539062, 0.02554798126220703, 0.026336669921875]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 6.0, 4.0, 16.0, 50.0, 109.0, 299.0, 309.0, 125.0, 47.0, 13.0, 13.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.703280448913574, -3.613175392150879, -3.5230703353881836, -3.4329652786254883, -3.342860221862793, -3.2527554035186768, -3.1626503467559814, -3.072545289993286, -2.982440233230591, -2.8923351764678955, -2.8022301197052, -2.712125062942505, -2.6220202445983887, -2.5319151878356934, -2.441810131072998, -2.3517050743103027, -2.2616000175476074, -2.171494960784912, -2.081389904022217, -1.991284966468811, -1.9011799097061157, -1.8110748529434204, -1.7209699153900146, -1.6308648586273193, -1.540759801864624, -1.4506547451019287, -1.3605496883392334, -1.2704447507858276, -1.1803396940231323, -1.090234637260437, -1.0001296997070312, -0.9100246429443359, -0.8199193477630615, -0.7298142910003662, -0.6397092938423157, -0.5496042966842651, -0.4594992399215698, -0.3693942129611969, -0.279289186000824, -0.18918418884277344, -0.09907913208007812, -0.0089741051197052, 0.08113092184066772, 0.17123594880104065, 0.2613409757614136, 0.3514460027217865, 0.4415510296821594, 0.53165602684021, 0.6217610836029053, 0.7118661403656006, 0.8019711375236511, 0.8920761346817017, 0.982181191444397, 1.0722862482070923, 1.162391185760498, 1.2524962425231934, 1.3426012992858887, 1.432706356048584, 1.5228114128112793, 1.612916350364685, 1.7030214071273804, 1.7931264638900757, 1.8832314014434814, 1.9733364582061768, 2.063441514968872]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 7.0, 6.0, 17.0, 19.0, 26.0, 41.0, 52.0, 55.0, 64.0, 102.0, 96.0, 78.0, 81.0, 78.0, 66.0, 55.0, 41.0, 36.0, 29.0, 23.0, 16.0, 9.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.436684250831604, -1.4001200199127197, -1.3635557889938354, -1.3269915580749512, -1.2904272079467773, -1.253862977027893, -1.2172987461090088, -1.1807345151901245, -1.1441702842712402, -1.107606053352356, -1.0710418224334717, -1.0344775915145874, -0.9979133009910583, -0.9613490700721741, -0.924784779548645, -0.8882205486297607, -0.8516563177108765, -0.8150920867919922, -0.7785278558731079, -0.7419635653495789, -0.7053993344306946, -0.6688351035118103, -0.6322708129882812, -0.595706582069397, -0.5591423511505127, -0.5225781202316284, -0.48601385951042175, -0.4494495987892151, -0.4128853678703308, -0.37632113695144653, -0.33975687623023987, -0.3031926155090332, -0.2666285037994385, -0.230064257979393, -0.19350001215934753, -0.15693576633930206, -0.12037152051925659, -0.08380727469921112, -0.04724302887916565, -0.010678768157958984, 0.025885462760925293, 0.062449708580970764, 0.09901395440101624, 0.1355782002210617, 0.17214244604110718, 0.20870669186115265, 0.24527093768119812, 0.2818351984024048, 0.31839942932128906, 0.35496366024017334, 0.39152792096138, 0.42809218168258667, 0.46465641260147095, 0.5012206435203552, 0.5377849340438843, 0.5743491649627686, 0.6109133958816528, 0.6474776268005371, 0.6840418577194214, 0.7206061482429504, 0.7571703791618347, 0.793734610080719, 0.830298900604248, 0.8668631315231323, 0.9034273624420166]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 3.0, 5.0, 17.0, 21.0, 32.0, 36.0, 54.0, 101.0, 137.0, 227.0, 414.0, 719.0, 1419.0, 3575.0, 9913.0, 41643.0, 758965.0, 196415.0, 23149.0, 6718.0, 2482.0, 1082.0, 561.0, 301.0, 207.0, 113.0, 83.0, 50.0, 34.0, 22.0, 11.0, 13.0, 5.0, 8.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.802734375, -0.7775039672851562, -0.7522735595703125, -0.7270431518554688, -0.701812744140625, -0.6765823364257812, -0.6513519287109375, -0.6261215209960938, -0.60089111328125, -0.5756607055664062, -0.5504302978515625, -0.5251998901367188, -0.499969482421875, -0.47473907470703125, -0.4495086669921875, -0.42427825927734375, -0.3990478515625, -0.37381744384765625, -0.3485870361328125, -0.32335662841796875, -0.298126220703125, -0.27289581298828125, -0.2476654052734375, -0.22243499755859375, -0.19720458984375, -0.17197418212890625, -0.1467437744140625, -0.12151336669921875, -0.096282958984375, -0.07105255126953125, -0.0458221435546875, -0.02059173583984375, 0.004638671875, 0.02986907958984375, 0.0550994873046875, 0.08032989501953125, 0.105560302734375, 0.13079071044921875, 0.1560211181640625, 0.18125152587890625, 0.20648193359375, 0.23171234130859375, 0.2569427490234375, 0.28217315673828125, 0.307403564453125, 0.33263397216796875, 0.3578643798828125, 0.38309478759765625, 0.4083251953125, 0.43355560302734375, 0.4587860107421875, 0.48401641845703125, 0.509246826171875, 0.5344772338867188, 0.5597076416015625, 0.5849380493164062, 0.61016845703125, 0.6353988647460938, 0.6606292724609375, 0.6858596801757812, 0.711090087890625, 0.7363204956054688, 0.7615509033203125, 0.7867813110351562, 0.81201171875]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 6.0, 5.0, 6.0, 5.0, 8.0, 24.0, 19.0, 29.0, 31.0, 44.0, 46.0, 61.0, 80.0, 81.0, 87.0, 72.0, 76.0, 68.0, 52.0, 48.0, 32.0, 24.0, 26.0, 25.0, 14.0, 16.0, 10.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.048828125, -1.984466552734375, -1.92010498046875, -1.855743408203125, -1.7913818359375, -1.727020263671875, -1.66265869140625, -1.598297119140625, -1.533935546875, -1.469573974609375, -1.40521240234375, -1.340850830078125, -1.2764892578125, -1.212127685546875, -1.14776611328125, -1.083404541015625, -1.01904296875, -0.954681396484375, -0.89031982421875, -0.825958251953125, -0.7615966796875, -0.697235107421875, -0.63287353515625, -0.568511962890625, -0.504150390625, -0.439788818359375, -0.37542724609375, -0.311065673828125, -0.2467041015625, -0.182342529296875, -0.11798095703125, -0.053619384765625, 0.0107421875, 0.075103759765625, 0.13946533203125, 0.203826904296875, 0.2681884765625, 0.332550048828125, 0.39691162109375, 0.461273193359375, 0.525634765625, 0.589996337890625, 0.65435791015625, 0.718719482421875, 0.7830810546875, 0.847442626953125, 0.91180419921875, 0.976165771484375, 1.04052734375, 1.104888916015625, 1.16925048828125, 1.233612060546875, 1.2979736328125, 1.362335205078125, 1.42669677734375, 1.491058349609375, 1.555419921875, 1.619781494140625, 1.68414306640625, 1.748504638671875, 1.8128662109375, 1.877227783203125, 1.94158935546875, 2.005950927734375, 2.0703125]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 4.0, 4.0, 8.0, 7.0, 10.0, 16.0, 24.0, 30.0, 31.0, 46.0, 54.0, 77.0, 237.0, 1648.0, 75516.0, 966168.0, 3843.0, 398.0, 126.0, 81.0, 49.0, 37.0, 35.0, 26.0, 19.0, 14.0, 22.0, 10.0, 3.0, 5.0, 7.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.87890625, -1.8011474609375, -1.723388671875, -1.6456298828125, -1.56787109375, -1.4901123046875, -1.412353515625, -1.3345947265625, -1.2568359375, -1.1790771484375, -1.101318359375, -1.0235595703125, -0.94580078125, -0.8680419921875, -0.790283203125, -0.7125244140625, -0.634765625, -0.5570068359375, -0.479248046875, -0.4014892578125, -0.32373046875, -0.2459716796875, -0.168212890625, -0.0904541015625, -0.0126953125, 0.0650634765625, 0.142822265625, 0.2205810546875, 0.29833984375, 0.3760986328125, 0.453857421875, 0.5316162109375, 0.609375, 0.6871337890625, 0.764892578125, 0.8426513671875, 0.92041015625, 0.9981689453125, 1.075927734375, 1.1536865234375, 1.2314453125, 1.3092041015625, 1.386962890625, 1.4647216796875, 1.54248046875, 1.6202392578125, 1.697998046875, 1.7757568359375, 1.853515625, 1.9312744140625, 2.009033203125, 2.0867919921875, 2.16455078125, 2.2423095703125, 2.320068359375, 2.3978271484375, 2.4755859375, 2.5533447265625, 2.631103515625, 2.7088623046875, 2.78662109375, 2.8643798828125, 2.942138671875, 3.0198974609375, 3.09765625]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 5.0, 2.0, 6.0, 8.0, 7.0, 14.0, 16.0, 27.0, 29.0, 32.0, 53.0, 41.0, 58.0, 49.0, 50.0, 57.0, 72.0, 65.0, 48.0, 78.0, 52.0, 42.0, 36.0, 32.0, 24.0, 25.0, 21.0, 17.0, 9.0, 11.0, 7.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.404296875, -1.34649658203125, -1.2886962890625, -1.23089599609375, -1.173095703125, -1.11529541015625, -1.0574951171875, -0.99969482421875, -0.94189453125, -0.88409423828125, -0.8262939453125, -0.76849365234375, -0.710693359375, -0.65289306640625, -0.5950927734375, -0.53729248046875, -0.4794921875, -0.42169189453125, -0.3638916015625, -0.30609130859375, -0.248291015625, -0.19049072265625, -0.1326904296875, -0.07489013671875, -0.01708984375, 0.04071044921875, 0.0985107421875, 0.15631103515625, 0.214111328125, 0.27191162109375, 0.3297119140625, 0.38751220703125, 0.4453125, 0.50311279296875, 0.5609130859375, 0.61871337890625, 0.676513671875, 0.73431396484375, 0.7921142578125, 0.84991455078125, 0.90771484375, 0.96551513671875, 1.0233154296875, 1.08111572265625, 1.138916015625, 1.19671630859375, 1.2545166015625, 1.31231689453125, 1.3701171875, 1.42791748046875, 1.4857177734375, 1.54351806640625, 1.601318359375, 1.65911865234375, 1.7169189453125, 1.77471923828125, 1.83251953125, 1.89031982421875, 1.9481201171875, 2.00592041015625, 2.063720703125, 2.12152099609375, 2.1793212890625, 2.23712158203125, 2.294921875]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 7.0, 2.0, 5.0, 4.0, 6.0, 14.0, 11.0, 17.0, 25.0, 41.0, 65.0, 108.0, 184.0, 371.0, 775.0, 1686.0, 4969.0, 26331.0, 921795.0, 79576.0, 7987.0, 2447.0, 1020.0, 491.0, 241.0, 141.0, 79.0, 43.0, 32.0, 21.0, 24.0, 7.0, 10.0, 4.0, 11.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 1.0], "bins": [-0.55810546875, -0.5432968139648438, -0.5284881591796875, -0.5136795043945312, -0.498870849609375, -0.48406219482421875, -0.4692535400390625, -0.45444488525390625, -0.43963623046875, -0.42482757568359375, -0.4100189208984375, -0.39521026611328125, -0.380401611328125, -0.36559295654296875, -0.3507843017578125, -0.33597564697265625, -0.3211669921875, -0.30635833740234375, -0.2915496826171875, -0.27674102783203125, -0.261932373046875, -0.24712371826171875, -0.2323150634765625, -0.21750640869140625, -0.20269775390625, -0.18788909912109375, -0.1730804443359375, -0.15827178955078125, -0.143463134765625, -0.12865447998046875, -0.1138458251953125, -0.09903717041015625, -0.084228515625, -0.06941986083984375, -0.0546112060546875, -0.03980255126953125, -0.024993896484375, -0.01018524169921875, 0.0046234130859375, 0.01943206787109375, 0.03424072265625, 0.04904937744140625, 0.0638580322265625, 0.07866668701171875, 0.093475341796875, 0.10828399658203125, 0.1230926513671875, 0.13790130615234375, 0.1527099609375, 0.16751861572265625, 0.1823272705078125, 0.19713592529296875, 0.211944580078125, 0.22675323486328125, 0.2415618896484375, 0.25637054443359375, 0.27117919921875, 0.28598785400390625, 0.3007965087890625, 0.31560516357421875, 0.330413818359375, 0.34522247314453125, 0.3600311279296875, 0.37483978271484375, 0.3896484375]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 7.0, 6.0, 5.0, 11.0, 21.0, 24.0, 45.0, 96.0, 381.0, 216.0, 83.0, 38.0, 24.0, 17.0, 15.0, 3.0, 1.0, 3.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.599592208862305e-05, -7.368717342615128e-05, -7.13784247636795e-05, -6.906967610120773e-05, -6.676092743873596e-05, -6.445217877626419e-05, -6.214343011379242e-05, -5.983468145132065e-05, -5.752593278884888e-05, -5.5217184126377106e-05, -5.2908435463905334e-05, -5.059968680143356e-05, -4.829093813896179e-05, -4.598218947649002e-05, -4.367344081401825e-05, -4.136469215154648e-05, -3.905594348907471e-05, -3.6747194826602936e-05, -3.4438446164131165e-05, -3.212969750165939e-05, -2.9820948839187622e-05, -2.751220017671585e-05, -2.520345151424408e-05, -2.289470285177231e-05, -2.0585954189300537e-05, -1.8277205526828766e-05, -1.5968456864356995e-05, -1.3659708201885223e-05, -1.1350959539413452e-05, -9.042210876941681e-06, -6.73346221446991e-06, -4.4247135519981384e-06, -2.115964889526367e-06, 1.9278377294540405e-07, 2.5015324354171753e-06, 4.8102810978889465e-06, 7.119029760360718e-06, 9.427778422832489e-06, 1.173652708530426e-05, 1.4045275747776031e-05, 1.6354024410247803e-05, 1.8662773072719574e-05, 2.0971521735191345e-05, 2.3280270397663116e-05, 2.5589019060134888e-05, 2.789776772260666e-05, 3.020651638507843e-05, 3.25152650475502e-05, 3.482401371002197e-05, 3.7132762372493744e-05, 3.9441511034965515e-05, 4.1750259697437286e-05, 4.405900835990906e-05, 4.636775702238083e-05, 4.86765056848526e-05, 5.098525434732437e-05, 5.329400300979614e-05, 5.5602751672267914e-05, 5.7911500334739685e-05, 6.0220248997211456e-05, 6.252899765968323e-05, 6.4837746322155e-05, 6.714649498462677e-05, 6.945524364709854e-05, 7.176399230957031e-05]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 4.0, 7.0, 10.0, 11.0, 19.0, 21.0, 35.0, 42.0, 78.0, 98.0, 145.0, 222.0, 385.0, 721.0, 1488.0, 4754.0, 26597.0, 925338.0, 76092.0, 8075.0, 2232.0, 906.0, 491.0, 249.0, 180.0, 110.0, 80.0, 49.0, 35.0, 29.0, 18.0, 8.0, 7.0, 7.0, 3.0, 1.0, 4.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.438232421875, -0.4211692810058594, -0.40410614013671875, -0.3870429992675781, -0.3699798583984375, -0.3529167175292969, -0.33585357666015625, -0.3187904357910156, -0.301727294921875, -0.2846641540527344, -0.26760101318359375, -0.2505378723144531, -0.2334747314453125, -0.21641159057617188, -0.19934844970703125, -0.18228530883789062, -0.16522216796875, -0.14815902709960938, -0.13109588623046875, -0.11403274536132812, -0.0969696044921875, -0.07990646362304688, -0.06284332275390625, -0.045780181884765625, -0.028717041015625, -0.011653900146484375, 0.00540924072265625, 0.022472381591796875, 0.0395355224609375, 0.056598663330078125, 0.07366180419921875, 0.09072494506835938, 0.1077880859375, 0.12485122680664062, 0.14191436767578125, 0.15897750854492188, 0.1760406494140625, 0.19310379028320312, 0.21016693115234375, 0.22723007202148438, 0.244293212890625, 0.2613563537597656, 0.27841949462890625, 0.2954826354980469, 0.3125457763671875, 0.3296089172363281, 0.34667205810546875, 0.3637351989746094, 0.38079833984375, 0.3978614807128906, 0.41492462158203125, 0.4319877624511719, 0.4490509033203125, 0.4661140441894531, 0.48317718505859375, 0.5002403259277344, 0.517303466796875, 0.5343666076660156, 0.5514297485351562, 0.5684928894042969, 0.5855560302734375, 0.6026191711425781, 0.6196823120117188, 0.6367454528808594, 0.65380859375]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 3.0, 6.0, 5.0, 18.0, 31.0, 50.0, 137.0, 531.0, 109.0, 40.0, 32.0, 11.0, 7.0, 12.0, 6.0, 4.0, 4.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.333251953125, -0.3245868682861328, -0.3159217834472656, -0.30725669860839844, -0.29859161376953125, -0.28992652893066406, -0.2812614440917969, -0.2725963592529297, -0.2639312744140625, -0.2552661895751953, -0.24660110473632812, -0.23793601989746094, -0.22927093505859375, -0.22060585021972656, -0.21194076538085938, -0.2032756805419922, -0.194610595703125, -0.1859455108642578, -0.17728042602539062, -0.16861534118652344, -0.15995025634765625, -0.15128517150878906, -0.14262008666992188, -0.1339550018310547, -0.1252899169921875, -0.11662483215332031, -0.10795974731445312, -0.09929466247558594, -0.09062957763671875, -0.08196449279785156, -0.07329940795898438, -0.06463432312011719, -0.05596923828125, -0.04730415344238281, -0.038639068603515625, -0.029973983764648438, -0.02130889892578125, -0.012643814086914062, -0.003978729248046875, 0.0046863555908203125, 0.0133514404296875, 0.022016525268554688, 0.030681610107421875, 0.03934669494628906, 0.04801177978515625, 0.05667686462402344, 0.06534194946289062, 0.07400703430175781, 0.082672119140625, 0.09133720397949219, 0.10000228881835938, 0.10866737365722656, 0.11733245849609375, 0.12599754333496094, 0.13466262817382812, 0.1433277130126953, 0.1519927978515625, 0.1606578826904297, 0.16932296752929688, 0.17798805236816406, 0.18665313720703125, 0.19531822204589844, 0.20398330688476562, 0.2126483917236328, 0.2213134765625]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 7.0, 10.0, 16.0, 42.0, 108.0, 314.0, 312.0, 121.0, 42.0, 18.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-9.555488586425781, -9.352388381958008, -9.149288177490234, -8.946187019348145, -8.743086814880371, -8.539986610412598, -8.336885452270508, -8.133785247802734, -7.930685043334961, -7.7275848388671875, -7.524484157562256, -7.321383476257324, -7.118283271789551, -6.915183067321777, -6.712082386016846, -6.508981704711914, -6.305881500244141, -6.102781295776367, -5.8996806144714355, -5.696579933166504, -5.4934797286987305, -5.290379524230957, -5.087278842926025, -4.884178161621094, -4.68107795715332, -4.477977752685547, -4.274877071380615, -4.071776390075684, -3.86867618560791, -3.6655757427215576, -3.462475299835205, -3.2593748569488525, -3.056274890899658, -2.8531744480133057, -2.650074005126953, -2.4469735622406006, -2.243873119354248, -2.0407726764678955, -1.837672233581543, -1.6345717906951904, -1.431471347808838, -1.2283709049224854, -1.0252704620361328, -0.8221700191497803, -0.6190695762634277, -0.4159691333770752, -0.21286869049072266, -0.009768247604370117, 0.19333219528198242, 0.39643263816833496, 0.5995330810546875, 0.80263352394104, 1.0057339668273926, 1.2088344097137451, 1.4119348526000977, 1.6150352954864502, 1.8181357383728027, 2.0212361812591553, 2.224336624145508, 2.4274370670318604, 2.630537509918213, 2.8336379528045654, 3.036738395690918, 3.2398388385772705, 3.442939281463623]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 4.0, 12.0, 3.0, 7.0, 7.0, 19.0, 9.0, 16.0, 18.0, 24.0, 27.0, 26.0, 31.0, 32.0, 21.0, 41.0, 36.0, 47.0, 41.0, 54.0, 34.0, 40.0, 47.0, 43.0, 40.0, 32.0, 39.0, 37.0, 27.0, 27.0, 19.0, 19.0, 22.0, 12.0, 20.0, 13.0, 7.0, 8.0, 9.0, 8.0, 6.0, 3.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.3098936080932617, -2.2411890029907227, -2.1724843978881836, -2.1037797927856445, -2.0350751876831055, -1.9663704633712769, -1.8976657390594482, -1.8289611339569092, -1.7602565288543701, -1.691551923751831, -1.622847318649292, -1.5541425943374634, -1.4854379892349243, -1.4167333841323853, -1.3480286598205566, -1.2793240547180176, -1.2106194496154785, -1.1419148445129395, -1.0732102394104004, -1.0045055150985718, -0.9358009099960327, -0.8670963048934937, -0.7983916401863098, -0.729686975479126, -0.6609823703765869, -0.5922777652740479, -0.523573100566864, -0.45486846566200256, -0.3861638307571411, -0.31745919585227966, -0.2487545609474182, -0.18004992604255676, -0.11134552955627441, -0.042640894651412964, 0.026063740253448486, 0.09476837515830994, 0.1634730100631714, 0.23217764496803284, 0.3008822798728943, 0.36958691477775574, 0.4382915496826172, 0.5069961547851562, 0.5757008194923401, 0.6444054841995239, 0.713110089302063, 0.781814694404602, 0.8505193591117859, 0.9192240238189697, 0.9879286289215088, 1.0566332340240479, 1.125337839126587, 1.1940425634384155, 1.2627471685409546, 1.3314517736434937, 1.4001564979553223, 1.4688611030578613, 1.5375657081604004, 1.6062703132629395, 1.6749749183654785, 1.7436796426773071, 1.8123842477798462, 1.8810888528823853, 1.9497935771942139, 2.018498182296753, 2.087202787399292]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 6.0, 2.0, 0.0, 9.0, 7.0, 8.0, 10.0, 17.0, 38.0, 48.0, 69.0, 119.0, 167.0, 263.0, 523.0, 918.0, 2076.0, 6992.0, 67754.0, 3995969.0, 105785.0, 8640.0, 2476.0, 1033.0, 532.0, 309.0, 178.0, 103.0, 76.0, 52.0, 29.0, 23.0, 21.0, 10.0, 2.0, 7.0, 4.0, 4.0, 7.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.35546875, -3.255462646484375, -3.15545654296875, -3.055450439453125, -2.9554443359375, -2.855438232421875, -2.75543212890625, -2.655426025390625, -2.555419921875, -2.455413818359375, -2.35540771484375, -2.255401611328125, -2.1553955078125, -2.055389404296875, -1.95538330078125, -1.855377197265625, -1.75537109375, -1.655364990234375, -1.55535888671875, -1.455352783203125, -1.3553466796875, -1.255340576171875, -1.15533447265625, -1.055328369140625, -0.955322265625, -0.855316162109375, -0.75531005859375, -0.655303955078125, -0.5552978515625, -0.455291748046875, -0.35528564453125, -0.255279541015625, -0.1552734375, -0.055267333984375, 0.04473876953125, 0.144744873046875, 0.2447509765625, 0.344757080078125, 0.44476318359375, 0.544769287109375, 0.644775390625, 0.744781494140625, 0.84478759765625, 0.944793701171875, 1.0447998046875, 1.144805908203125, 1.24481201171875, 1.344818115234375, 1.44482421875, 1.544830322265625, 1.64483642578125, 1.744842529296875, 1.8448486328125, 1.944854736328125, 2.04486083984375, 2.144866943359375, 2.244873046875, 2.344879150390625, 2.44488525390625, 2.544891357421875, 2.6448974609375, 2.744903564453125, 2.84490966796875, 2.944915771484375, 3.044921875]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 4.0, 11.0, 3.0, 6.0, 12.0, 17.0, 29.0, 30.0, 48.0, 47.0, 57.0, 77.0, 92.0, 98.0, 76.0, 95.0, 66.0, 50.0, 39.0, 38.0, 38.0, 22.0, 24.0, 9.0, 8.0, 5.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2275390625, -1.1889190673828125, -1.150299072265625, -1.1116790771484375, -1.07305908203125, -1.0344390869140625, -0.995819091796875, -0.9571990966796875, -0.9185791015625, -0.8799591064453125, -0.841339111328125, -0.8027191162109375, -0.76409912109375, -0.7254791259765625, -0.686859130859375, -0.6482391357421875, -0.609619140625, -0.5709991455078125, -0.532379150390625, -0.4937591552734375, -0.45513916015625, -0.4165191650390625, -0.377899169921875, -0.3392791748046875, -0.3006591796875, -0.2620391845703125, -0.223419189453125, -0.1847991943359375, -0.14617919921875, -0.1075592041015625, -0.068939208984375, -0.0303192138671875, 0.00830078125, 0.0469207763671875, 0.085540771484375, 0.1241607666015625, 0.16278076171875, 0.2014007568359375, 0.240020751953125, 0.2786407470703125, 0.3172607421875, 0.3558807373046875, 0.394500732421875, 0.4331207275390625, 0.47174072265625, 0.5103607177734375, 0.548980712890625, 0.5876007080078125, 0.626220703125, 0.6648406982421875, 0.703460693359375, 0.7420806884765625, 0.78070068359375, 0.8193206787109375, 0.857940673828125, 0.8965606689453125, 0.9351806640625, 0.9738006591796875, 1.012420654296875, 1.0510406494140625, 1.08966064453125, 1.1282806396484375, 1.166900634765625, 1.2055206298828125, 1.244140625]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 9.0, 7.0, 6.0, 12.0, 9.0, 24.0, 41.0, 66.0, 145.0, 261.0, 585.0, 1511.0, 4606.0, 22111.0, 741533.0, 3382705.0, 31462.0, 6049.0, 1757.0, 732.0, 311.0, 151.0, 70.0, 49.0, 23.0, 21.0, 8.0, 5.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.16015625, -3.074951171875, -2.98974609375, -2.904541015625, -2.8193359375, -2.734130859375, -2.64892578125, -2.563720703125, -2.478515625, -2.393310546875, -2.30810546875, -2.222900390625, -2.1376953125, -2.052490234375, -1.96728515625, -1.882080078125, -1.796875, -1.711669921875, -1.62646484375, -1.541259765625, -1.4560546875, -1.370849609375, -1.28564453125, -1.200439453125, -1.115234375, -1.030029296875, -0.94482421875, -0.859619140625, -0.7744140625, -0.689208984375, -0.60400390625, -0.518798828125, -0.43359375, -0.348388671875, -0.26318359375, -0.177978515625, -0.0927734375, -0.007568359375, 0.07763671875, 0.162841796875, 0.248046875, 0.333251953125, 0.41845703125, 0.503662109375, 0.5888671875, 0.674072265625, 0.75927734375, 0.844482421875, 0.9296875, 1.014892578125, 1.10009765625, 1.185302734375, 1.2705078125, 1.355712890625, 1.44091796875, 1.526123046875, 1.611328125, 1.696533203125, 1.78173828125, 1.866943359375, 1.9521484375, 2.037353515625, 2.12255859375, 2.207763671875, 2.29296875]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 2.0, 2.0, 2.0, 8.0, 8.0, 12.0, 9.0, 19.0, 24.0, 25.0, 60.0, 122.0, 305.0, 953.0, 1550.0, 536.0, 207.0, 86.0, 43.0, 31.0, 19.0, 17.0, 7.0, 9.0, 5.0, 4.0, 4.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5546875, -0.5350570678710938, -0.5154266357421875, -0.49579620361328125, -0.476165771484375, -0.45653533935546875, -0.4369049072265625, -0.41727447509765625, -0.39764404296875, -0.37801361083984375, -0.3583831787109375, -0.33875274658203125, -0.319122314453125, -0.29949188232421875, -0.2798614501953125, -0.26023101806640625, -0.2406005859375, -0.22097015380859375, -0.2013397216796875, -0.18170928955078125, -0.162078857421875, -0.14244842529296875, -0.1228179931640625, -0.10318756103515625, -0.08355712890625, -0.06392669677734375, -0.0442962646484375, -0.02466583251953125, -0.005035400390625, 0.01459503173828125, 0.0342254638671875, 0.05385589599609375, 0.073486328125, 0.09311676025390625, 0.1127471923828125, 0.13237762451171875, 0.152008056640625, 0.17163848876953125, 0.1912689208984375, 0.21089935302734375, 0.23052978515625, 0.25016021728515625, 0.2697906494140625, 0.28942108154296875, 0.309051513671875, 0.32868194580078125, 0.3483123779296875, 0.36794281005859375, 0.3875732421875, 0.40720367431640625, 0.4268341064453125, 0.44646453857421875, 0.466094970703125, 0.48572540283203125, 0.5053558349609375, 0.5249862670898438, 0.54461669921875, 0.5642471313476562, 0.5838775634765625, 0.6035079956054688, 0.623138427734375, 0.6427688598632812, 0.6623992919921875, 0.6820297241210938, 0.70166015625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 8.0, 4.0, 10.0, 19.0, 32.0, 47.0, 89.0, 143.0, 198.0, 194.0, 97.0, 59.0, 38.0, 23.0, 15.0, 15.0, 3.0, 7.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3228342533111572, -3.2410762310028076, -3.159317970275879, -3.0775599479675293, -2.9958016872406006, -2.914043664932251, -2.8322854042053223, -2.7505273818969727, -2.668769359588623, -2.5870113372802734, -2.5052530765533447, -2.423495054244995, -2.3417367935180664, -2.259978771209717, -2.178220748901367, -2.0964624881744385, -2.0147042274475098, -1.9329460859298706, -1.8511879444122314, -1.7694299221038818, -1.6876717805862427, -1.6059136390686035, -1.5241554975509644, -1.4423973560333252, -1.3606393337249756, -1.2788811922073364, -1.1971230506896973, -1.1153650283813477, -1.0336068868637085, -0.9518487453460693, -0.8700906038284302, -0.7883325219154358, -0.7065744400024414, -0.6248162984848022, -0.5430582165718079, -0.4613000750541687, -0.37954196333885193, -0.29778385162353516, -0.216025710105896, -0.1342676281929016, -0.05250948667526245, 0.029248632490634918, 0.11100675165653229, 0.19276487827301025, 0.274522989988327, 0.3562811017036438, 0.43803924322128296, 0.5197973251342773, 0.6015554666519165, 0.6833136081695557, 0.76507169008255, 0.8468298316001892, 0.9285879135131836, 1.0103460550308228, 1.092104196548462, 1.1738622188568115, 1.2556204795837402, 1.3373786211013794, 1.4191367626190186, 1.5008947849273682, 1.5826529264450073, 1.6644110679626465, 1.7461692094802856, 1.8279273509979248, 1.9096853733062744]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 6.0, 3.0, 7.0, 3.0, 11.0, 15.0, 15.0, 15.0, 28.0, 29.0, 27.0, 41.0, 29.0, 49.0, 56.0, 60.0, 44.0, 53.0, 50.0, 53.0, 61.0, 48.0, 46.0, 45.0, 38.0, 34.0, 32.0, 22.0, 15.0, 14.0, 13.0, 8.0, 12.0, 11.0, 4.0, 3.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0057085752487183, -0.9715639352798462, -0.9374192357063293, -0.9032745957374573, -0.8691298961639404, -0.8349852561950684, -0.8008406162261963, -0.7666959762573242, -0.7325512766838074, -0.6984066367149353, -0.6642619371414185, -0.6301172971725464, -0.5959726572036743, -0.5618279576301575, -0.5276833176612854, -0.49353864789009094, -0.4593939781188965, -0.425249308347702, -0.39110463857650757, -0.3569599986076355, -0.32281532883644104, -0.2886706590652466, -0.2545260190963745, -0.22038134932518005, -0.1862366795539856, -0.15209200978279114, -0.11794735491275787, -0.08380269259214401, -0.04965803027153015, -0.015513360500335693, 0.01863129436969757, 0.052775949239730835, 0.08692061901092529, 0.12106528133153915, 0.15520994365215302, 0.18935459852218628, 0.22349926829338074, 0.2576439380645752, 0.29178857803344727, 0.3259332478046417, 0.3600779175758362, 0.39422258734703064, 0.4283672571182251, 0.46251189708709717, 0.4966565668582916, 0.5308012366294861, 0.5649458765983582, 0.599090576171875, 0.6332352161407471, 0.6673798561096191, 0.701524555683136, 0.7356691956520081, 0.7698138952255249, 0.803958535194397, 0.838103175163269, 0.8722478151321411, 0.906392514705658, 0.94053715467453, 0.9746818542480469, 1.008826494216919, 1.042971134185791, 1.077115774154663, 1.1112605333328247, 1.1454051733016968, 1.1795498132705688]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 2.0, 6.0, 1.0, 8.0, 8.0, 18.0, 27.0, 38.0, 51.0, 125.0, 188.0, 320.0, 610.0, 1244.0, 2685.0, 7043.0, 25783.0, 331371.0, 629034.0, 35328.0, 8512.0, 3169.0, 1397.0, 681.0, 358.0, 229.0, 115.0, 68.0, 50.0, 24.0, 23.0, 16.0, 7.0, 6.0, 7.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7705078125, -0.747222900390625, -0.72393798828125, -0.700653076171875, -0.6773681640625, -0.654083251953125, -0.63079833984375, -0.607513427734375, -0.584228515625, -0.560943603515625, -0.53765869140625, -0.514373779296875, -0.4910888671875, -0.467803955078125, -0.44451904296875, -0.421234130859375, -0.39794921875, -0.374664306640625, -0.35137939453125, -0.328094482421875, -0.3048095703125, -0.281524658203125, -0.25823974609375, -0.234954833984375, -0.211669921875, -0.188385009765625, -0.16510009765625, -0.141815185546875, -0.1185302734375, -0.095245361328125, -0.07196044921875, -0.048675537109375, -0.025390625, -0.002105712890625, 0.02117919921875, 0.044464111328125, 0.0677490234375, 0.091033935546875, 0.11431884765625, 0.137603759765625, 0.160888671875, 0.184173583984375, 0.20745849609375, 0.230743408203125, 0.2540283203125, 0.277313232421875, 0.30059814453125, 0.323883056640625, 0.34716796875, 0.370452880859375, 0.39373779296875, 0.417022705078125, 0.4403076171875, 0.463592529296875, 0.48687744140625, 0.510162353515625, 0.533447265625, 0.556732177734375, 0.58001708984375, 0.603302001953125, 0.6265869140625, 0.649871826171875, 0.67315673828125, 0.696441650390625, 0.7197265625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 6.0, 6.0, 7.0, 11.0, 13.0, 11.0, 27.0, 27.0, 45.0, 40.0, 36.0, 69.0, 75.0, 69.0, 69.0, 65.0, 72.0, 61.0, 62.0, 56.0, 47.0, 32.0, 25.0, 15.0, 10.0, 17.0, 14.0, 9.0, 5.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0458984375, -1.0159378051757812, -0.9859771728515625, -0.9560165405273438, -0.926055908203125, -0.8960952758789062, -0.8661346435546875, -0.8361740112304688, -0.80621337890625, -0.7762527465820312, -0.7462921142578125, -0.7163314819335938, -0.686370849609375, -0.6564102172851562, -0.6264495849609375, -0.5964889526367188, -0.5665283203125, -0.5365676879882812, -0.5066070556640625, -0.47664642333984375, -0.446685791015625, -0.41672515869140625, -0.3867645263671875, -0.35680389404296875, -0.32684326171875, -0.29688262939453125, -0.2669219970703125, -0.23696136474609375, -0.207000732421875, -0.17704010009765625, -0.1470794677734375, -0.11711883544921875, -0.087158203125, -0.05719757080078125, -0.0272369384765625, 0.00272369384765625, 0.032684326171875, 0.06264495849609375, 0.0926055908203125, 0.12256622314453125, 0.15252685546875, 0.18248748779296875, 0.2124481201171875, 0.24240875244140625, 0.272369384765625, 0.30233001708984375, 0.3322906494140625, 0.36225128173828125, 0.3922119140625, 0.42217254638671875, 0.4521331787109375, 0.48209381103515625, 0.512054443359375, 0.5420150756835938, 0.5719757080078125, 0.6019363403320312, 0.63189697265625, 0.6618576049804688, 0.6918182373046875, 0.7217788696289062, 0.751739501953125, 0.7817001342773438, 0.8116607666015625, 0.8416213989257812, 0.87158203125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 1.0, 6.0, 4.0, 7.0, 6.0, 4.0, 10.0, 13.0, 26.0, 29.0, 46.0, 78.0, 130.0, 210.0, 355.0, 686.0, 1357.0, 3040.0, 7381.0, 23880.0, 174959.0, 726814.0, 83043.0, 16053.0, 5517.0, 2391.0, 1089.0, 612.0, 326.0, 157.0, 97.0, 66.0, 42.0, 23.0, 29.0, 9.0, 17.0, 8.0, 5.0, 5.0, 3.0, 4.0, 3.0, 4.0, 3.0, 1.0, 1.0, 4.0, 3.0, 0.0, 1.0], "bins": [-0.46728515625, -0.45368194580078125, -0.4400787353515625, -0.42647552490234375, -0.412872314453125, -0.39926910400390625, -0.3856658935546875, -0.37206268310546875, -0.35845947265625, -0.34485626220703125, -0.3312530517578125, -0.31764984130859375, -0.304046630859375, -0.29044342041015625, -0.2768402099609375, -0.26323699951171875, -0.2496337890625, -0.23603057861328125, -0.2224273681640625, -0.20882415771484375, -0.195220947265625, -0.18161773681640625, -0.1680145263671875, -0.15441131591796875, -0.14080810546875, -0.12720489501953125, -0.1136016845703125, -0.09999847412109375, -0.086395263671875, -0.07279205322265625, -0.0591888427734375, -0.04558563232421875, -0.031982421875, -0.01837921142578125, -0.0047760009765625, 0.00882720947265625, 0.022430419921875, 0.03603363037109375, 0.0496368408203125, 0.06324005126953125, 0.07684326171875, 0.09044647216796875, 0.1040496826171875, 0.11765289306640625, 0.131256103515625, 0.14485931396484375, 0.1584625244140625, 0.17206573486328125, 0.1856689453125, 0.19927215576171875, 0.2128753662109375, 0.22647857666015625, 0.240081787109375, 0.25368499755859375, 0.2672882080078125, 0.28089141845703125, 0.29449462890625, 0.30809783935546875, 0.3217010498046875, 0.33530426025390625, 0.348907470703125, 0.36251068115234375, 0.3761138916015625, 0.38971710205078125, 0.4033203125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 10.0, 6.0, 7.0, 7.0, 10.0, 8.0, 19.0, 24.0, 20.0, 18.0, 32.0, 29.0, 29.0, 37.0, 44.0, 47.0, 44.0, 39.0, 46.0, 46.0, 58.0, 34.0, 42.0, 45.0, 27.0, 49.0, 46.0, 27.0, 30.0, 26.0, 24.0, 13.0, 13.0, 8.0, 12.0, 9.0, 8.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.212890625, -1.1720123291015625, -1.131134033203125, -1.0902557373046875, -1.04937744140625, -1.0084991455078125, -0.967620849609375, -0.9267425537109375, -0.8858642578125, -0.8449859619140625, -0.804107666015625, -0.7632293701171875, -0.72235107421875, -0.6814727783203125, -0.640594482421875, -0.5997161865234375, -0.558837890625, -0.5179595947265625, -0.477081298828125, -0.4362030029296875, -0.39532470703125, -0.3544464111328125, -0.313568115234375, -0.2726898193359375, -0.2318115234375, -0.1909332275390625, -0.150054931640625, -0.1091766357421875, -0.06829833984375, -0.0274200439453125, 0.013458251953125, 0.0543365478515625, 0.09521484375, 0.1360931396484375, 0.176971435546875, 0.2178497314453125, 0.25872802734375, 0.2996063232421875, 0.340484619140625, 0.3813629150390625, 0.4222412109375, 0.4631195068359375, 0.503997802734375, 0.5448760986328125, 0.58575439453125, 0.6266326904296875, 0.667510986328125, 0.7083892822265625, 0.749267578125, 0.7901458740234375, 0.831024169921875, 0.8719024658203125, 0.91278076171875, 0.9536590576171875, 0.994537353515625, 1.0354156494140625, 1.0762939453125, 1.1171722412109375, 1.158050537109375, 1.1989288330078125, 1.23980712890625, 1.2806854248046875, 1.321563720703125, 1.3624420166015625, 1.4033203125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 5.0, 3.0, 7.0, 10.0, 8.0, 14.0, 18.0, 41.0, 43.0, 78.0, 94.0, 165.0, 232.0, 332.0, 567.0, 945.0, 1649.0, 3130.0, 6716.0, 19275.0, 84589.0, 621443.0, 248304.0, 39653.0, 11095.0, 4596.0, 2179.0, 1256.0, 768.0, 430.0, 314.0, 197.0, 106.0, 88.0, 61.0, 47.0, 30.0, 22.0, 12.0, 12.0, 10.0, 5.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07757568359375, -0.07505416870117188, -0.07253265380859375, -0.07001113891601562, -0.0674896240234375, -0.06496810913085938, -0.06244659423828125, -0.059925079345703125, -0.057403564453125, -0.054882049560546875, -0.05236053466796875, -0.049839019775390625, -0.0473175048828125, -0.044795989990234375, -0.04227447509765625, -0.039752960205078125, -0.0372314453125, -0.034709930419921875, -0.03218841552734375, -0.029666900634765625, -0.0271453857421875, -0.024623870849609375, -0.02210235595703125, -0.019580841064453125, -0.017059326171875, -0.014537811279296875, -0.01201629638671875, -0.009494781494140625, -0.0069732666015625, -0.004451751708984375, -0.00193023681640625, 0.000591278076171875, 0.00311279296875, 0.005634307861328125, 0.00815582275390625, 0.010677337646484375, 0.0131988525390625, 0.015720367431640625, 0.01824188232421875, 0.020763397216796875, 0.023284912109375, 0.025806427001953125, 0.02832794189453125, 0.030849456787109375, 0.0333709716796875, 0.035892486572265625, 0.03841400146484375, 0.040935516357421875, 0.04345703125, 0.045978546142578125, 0.04850006103515625, 0.051021575927734375, 0.0535430908203125, 0.056064605712890625, 0.05858612060546875, 0.061107635498046875, 0.063629150390625, 0.06615066528320312, 0.06867218017578125, 0.07119369506835938, 0.0737152099609375, 0.07623672485351562, 0.07875823974609375, 0.08127975463867188, 0.08380126953125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 3.0, 2.0, 3.0, 8.0, 5.0, 7.0, 20.0, 33.0, 54.0, 79.0, 107.0, 198.0, 174.0, 126.0, 62.0, 35.0, 30.0, 13.0, 11.0, 13.0, 4.0, 7.0, 1.0, 4.0, 0.0, 4.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.97834587097168e-05, -5.797017365694046e-05, -5.6156888604164124e-05, -5.434360355138779e-05, -5.253031849861145e-05, -5.0717033445835114e-05, -4.890374839305878e-05, -4.709046334028244e-05, -4.5277178287506104e-05, -4.346389323472977e-05, -4.165060818195343e-05, -3.9837323129177094e-05, -3.802403807640076e-05, -3.621075302362442e-05, -3.4397467970848083e-05, -3.258418291807175e-05, -3.077089786529541e-05, -2.8957612812519073e-05, -2.7144327759742737e-05, -2.53310427069664e-05, -2.3517757654190063e-05, -2.1704472601413727e-05, -1.989118754863739e-05, -1.8077902495861053e-05, -1.6264617443084717e-05, -1.445133239030838e-05, -1.2638047337532043e-05, -1.0824762284755707e-05, -9.01147723197937e-06, -7.1981921792030334e-06, -5.384907126426697e-06, -3.57162207365036e-06, -1.7583370208740234e-06, 5.494803190231323e-08, 1.86823308467865e-06, 3.6815181374549866e-06, 5.494803190231323e-06, 7.30808824300766e-06, 9.121373295783997e-06, 1.0934658348560333e-05, 1.274794340133667e-05, 1.4561228454113007e-05, 1.6374513506889343e-05, 1.818779855966568e-05, 2.0001083612442017e-05, 2.1814368665218353e-05, 2.362765371799469e-05, 2.5440938770771027e-05, 2.7254223823547363e-05, 2.90675088763237e-05, 3.088079392910004e-05, 3.269407898187637e-05, 3.450736403465271e-05, 3.632064908742905e-05, 3.813393414020538e-05, 3.994721919298172e-05, 4.176050424575806e-05, 4.357378929853439e-05, 4.538707435131073e-05, 4.720035940408707e-05, 4.90136444568634e-05, 5.082692950963974e-05, 5.264021456241608e-05, 5.445349961519241e-05, 5.626678466796875e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 8.0, 10.0, 13.0, 15.0, 29.0, 25.0, 33.0, 55.0, 92.0, 151.0, 218.0, 341.0, 528.0, 986.0, 1756.0, 3372.0, 6967.0, 16221.0, 44395.0, 156668.0, 530194.0, 198350.0, 53153.0, 18460.0, 7972.0, 3808.0, 1944.0, 1099.0, 610.0, 373.0, 232.0, 152.0, 98.0, 70.0, 53.0, 28.0, 23.0, 16.0, 4.0, 7.0, 6.0, 5.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.07537841796875, -0.07325983047485352, -0.07114124298095703, -0.06902265548706055, -0.06690406799316406, -0.06478548049926758, -0.0626668930053711, -0.06054830551147461, -0.058429718017578125, -0.05631113052368164, -0.054192543029785156, -0.05207395553588867, -0.04995536804199219, -0.0478367805480957, -0.04571819305419922, -0.043599605560302734, -0.04148101806640625, -0.039362430572509766, -0.03724384307861328, -0.0351252555847168, -0.03300666809082031, -0.030888080596923828, -0.028769493103027344, -0.02665090560913086, -0.024532318115234375, -0.02241373062133789, -0.020295143127441406, -0.018176555633544922, -0.016057968139648438, -0.013939380645751953, -0.011820793151855469, -0.009702205657958984, -0.0075836181640625, -0.005465030670166016, -0.0033464431762695312, -0.0012278556823730469, 0.0008907318115234375, 0.003009319305419922, 0.005127906799316406, 0.007246494293212891, 0.009365081787109375, 0.01148366928100586, 0.013602256774902344, 0.015720844268798828, 0.017839431762695312, 0.019958019256591797, 0.02207660675048828, 0.024195194244384766, 0.02631378173828125, 0.028432369232177734, 0.03055095672607422, 0.0326695442199707, 0.03478813171386719, 0.03690671920776367, 0.039025306701660156, 0.04114389419555664, 0.043262481689453125, 0.04538106918334961, 0.047499656677246094, 0.04961824417114258, 0.05173683166503906, 0.05385541915893555, 0.05597400665283203, 0.058092594146728516, 0.060211181640625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 6.0, 6.0, 3.0, 6.0, 16.0, 19.0, 11.0, 18.0, 37.0, 39.0, 44.0, 54.0, 57.0, 88.0, 104.0, 120.0, 75.0, 60.0, 49.0, 30.0, 31.0, 20.0, 21.0, 20.0, 11.0, 7.0, 10.0, 10.0, 8.0, 2.0, 2.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0186614990234375, -0.018013715744018555, -0.01736593246459961, -0.016718149185180664, -0.01607036590576172, -0.015422582626342773, -0.014774799346923828, -0.014127016067504883, -0.013479232788085938, -0.012831449508666992, -0.012183666229248047, -0.011535882949829102, -0.010888099670410156, -0.010240316390991211, -0.009592533111572266, -0.00894474983215332, -0.008296966552734375, -0.00764918327331543, -0.007001399993896484, -0.006353616714477539, -0.005705833435058594, -0.0050580501556396484, -0.004410266876220703, -0.003762483596801758, -0.0031147003173828125, -0.002466917037963867, -0.0018191337585449219, -0.0011713504791259766, -0.0005235671997070312, 0.00012421607971191406, 0.0007719993591308594, 0.0014197826385498047, 0.00206756591796875, 0.0027153491973876953, 0.0033631324768066406, 0.004010915756225586, 0.004658699035644531, 0.0053064823150634766, 0.005954265594482422, 0.006602048873901367, 0.0072498321533203125, 0.007897615432739258, 0.008545398712158203, 0.009193181991577148, 0.009840965270996094, 0.010488748550415039, 0.011136531829833984, 0.01178431510925293, 0.012432098388671875, 0.01307988166809082, 0.013727664947509766, 0.014375448226928711, 0.015023231506347656, 0.0156710147857666, 0.016318798065185547, 0.016966581344604492, 0.017614364624023438, 0.018262147903442383, 0.018909931182861328, 0.019557714462280273, 0.02020549774169922, 0.020853281021118164, 0.02150106430053711, 0.022148847579956055, 0.022796630859375]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 6.0, 8.0, 13.0, 10.0, 27.0, 41.0, 52.0, 81.0, 124.0, 143.0, 146.0, 111.0, 73.0, 49.0, 30.0, 17.0, 19.0, 10.0, 12.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.304758071899414, -1.2662726640701294, -1.2277873754501343, -1.1893019676208496, -1.150816559791565, -1.1123311519622803, -1.0738458633422852, -1.0353604555130005, -0.9968751072883606, -0.9583897590637207, -0.919904351234436, -0.8814190030097961, -0.8429336547851562, -0.8044482469558716, -0.7659628987312317, -0.7274775505065918, -0.6889921426773071, -0.6505067944526672, -0.6120213866233826, -0.5735360383987427, -0.535050630569458, -0.4965652823448181, -0.4580799341201782, -0.41959455609321594, -0.38110917806625366, -0.3426238000392914, -0.3041384220123291, -0.2656530737876892, -0.22716769576072693, -0.18868231773376465, -0.15019695460796356, -0.11171159148216248, -0.07322633266448975, -0.03474096208810806, 0.0037444084882736206, 0.042229779064655304, 0.08071514964103699, 0.11920052766799927, 0.15768589079380035, 0.19617125391960144, 0.23465663194656372, 0.273142009973526, 0.3116273880004883, 0.3501127362251282, 0.38859811425209045, 0.42708349227905273, 0.4655688405036926, 0.5040541887283325, 0.5425395965576172, 0.5810249447822571, 0.6195103526115417, 0.6579957008361816, 0.6964811086654663, 0.7349664568901062, 0.7734518051147461, 0.8119372129440308, 0.8504225611686707, 0.8889079093933105, 0.9273933172225952, 0.9658786654472351, 1.004364013671875, 1.0428494215011597, 1.0813348293304443, 1.1198201179504395, 1.1583055257797241]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 6.0, 10.0, 5.0, 8.0, 19.0, 9.0, 17.0, 28.0, 32.0, 37.0, 44.0, 43.0, 67.0, 67.0, 56.0, 56.0, 63.0, 69.0, 62.0, 45.0, 58.0, 39.0, 39.0, 31.0, 20.0, 9.0, 19.0, 19.0, 8.0, 9.0, 9.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.9158645868301392, -0.8896703720092773, -0.8634761571884155, -0.8372819423675537, -0.8110877275466919, -0.7848935127258301, -0.7586992383003235, -0.7325050234794617, -0.7063108086585999, -0.680116593837738, -0.6539223790168762, -0.6277281641960144, -0.6015338897705078, -0.575339674949646, -0.5491454601287842, -0.5229512453079224, -0.49675703048706055, -0.47056281566619873, -0.4443686008453369, -0.4181743562221527, -0.3919801414012909, -0.3657859265804291, -0.3395916819572449, -0.31339746713638306, -0.28720325231552124, -0.2610090374946594, -0.2348148077726364, -0.2086205780506134, -0.1824263632297516, -0.15623214840888977, -0.13003791868686676, -0.10384368896484375, -0.07764947414398193, -0.05145525187253952, -0.025261029601097107, 0.0009331926703453064, 0.02712741494178772, 0.053321629762649536, 0.07951585948467255, 0.10571008920669556, 0.13190430402755737, 0.1580985188484192, 0.1842927485704422, 0.2104869782924652, 0.23668119311332703, 0.26287540793418884, 0.28906965255737305, 0.31526386737823486, 0.3414580821990967, 0.3676522970199585, 0.3938465118408203, 0.4200407564640045, 0.44623497128486633, 0.47242918610572815, 0.49862343072891235, 0.5248176455497742, 0.551011860370636, 0.5772060751914978, 0.6034002900123596, 0.6295945048332214, 0.655788779258728, 0.6819829940795898, 0.7081772089004517, 0.7343714237213135, 0.7605656385421753]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 11.0, 9.0, 14.0, 17.0, 25.0, 25.0, 48.0, 71.0, 105.0, 158.0, 245.0, 367.0, 578.0, 1086.0, 2016.0, 4324.0, 10959.0, 40761.0, 422892.0, 500046.0, 43922.0, 11549.0, 4357.0, 2091.0, 1102.0, 659.0, 378.0, 236.0, 164.0, 90.0, 71.0, 50.0, 27.0, 30.0, 17.0, 17.0, 12.0, 10.0, 3.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.75732421875, -0.7343902587890625, -0.711456298828125, -0.6885223388671875, -0.66558837890625, -0.6426544189453125, -0.619720458984375, -0.5967864990234375, -0.5738525390625, -0.5509185791015625, -0.527984619140625, -0.5050506591796875, -0.48211669921875, -0.4591827392578125, -0.436248779296875, -0.4133148193359375, -0.390380859375, -0.3674468994140625, -0.344512939453125, -0.3215789794921875, -0.29864501953125, -0.2757110595703125, -0.252777099609375, -0.2298431396484375, -0.2069091796875, -0.1839752197265625, -0.161041259765625, -0.1381072998046875, -0.11517333984375, -0.0922393798828125, -0.069305419921875, -0.0463714599609375, -0.0234375, -0.0005035400390625, 0.022430419921875, 0.0453643798828125, 0.06829833984375, 0.0912322998046875, 0.114166259765625, 0.1371002197265625, 0.1600341796875, 0.1829681396484375, 0.205902099609375, 0.2288360595703125, 0.25177001953125, 0.2747039794921875, 0.297637939453125, 0.3205718994140625, 0.343505859375, 0.3664398193359375, 0.389373779296875, 0.4123077392578125, 0.43524169921875, 0.4581756591796875, 0.481109619140625, 0.5040435791015625, 0.5269775390625, 0.5499114990234375, 0.572845458984375, 0.5957794189453125, 0.61871337890625, 0.6416473388671875, 0.664581298828125, 0.6875152587890625, 0.71044921875]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 7.0, 3.0, 3.0, 10.0, 8.0, 13.0, 12.0, 19.0, 23.0, 26.0, 38.0, 44.0, 38.0, 55.0, 55.0, 56.0, 45.0, 73.0, 81.0, 60.0, 55.0, 49.0, 48.0, 34.0, 31.0, 26.0, 17.0, 20.0, 8.0, 9.0, 12.0, 9.0, 5.0, 6.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-1.6640625, -1.61419677734375, -1.5643310546875, -1.51446533203125, -1.464599609375, -1.41473388671875, -1.3648681640625, -1.31500244140625, -1.26513671875, -1.21527099609375, -1.1654052734375, -1.11553955078125, -1.065673828125, -1.01580810546875, -0.9659423828125, -0.91607666015625, -0.8662109375, -0.81634521484375, -0.7664794921875, -0.71661376953125, -0.666748046875, -0.61688232421875, -0.5670166015625, -0.51715087890625, -0.46728515625, -0.41741943359375, -0.3675537109375, -0.31768798828125, -0.267822265625, -0.21795654296875, -0.1680908203125, -0.11822509765625, -0.068359375, -0.01849365234375, 0.0313720703125, 0.08123779296875, 0.131103515625, 0.18096923828125, 0.2308349609375, 0.28070068359375, 0.33056640625, 0.38043212890625, 0.4302978515625, 0.48016357421875, 0.530029296875, 0.57989501953125, 0.6297607421875, 0.67962646484375, 0.7294921875, 0.77935791015625, 0.8292236328125, 0.87908935546875, 0.928955078125, 0.97882080078125, 1.0286865234375, 1.07855224609375, 1.12841796875, 1.17828369140625, 1.2281494140625, 1.27801513671875, 1.327880859375, 1.37774658203125, 1.4276123046875, 1.47747802734375, 1.52734375]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 6.0, 4.0, 10.0, 11.0, 13.0, 11.0, 16.0, 19.0, 14.0, 21.0, 16.0, 29.0, 45.0, 54.0, 73.0, 175.0, 335.0, 1132.0, 8879.0, 956885.0, 76253.0, 3299.0, 582.0, 237.0, 111.0, 74.0, 34.0, 38.0, 34.0, 25.0, 22.0, 19.0, 10.0, 20.0, 10.0, 7.0, 11.0, 5.0, 5.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.275390625, -2.20147705078125, -2.1275634765625, -2.05364990234375, -1.979736328125, -1.90582275390625, -1.8319091796875, -1.75799560546875, -1.68408203125, -1.61016845703125, -1.5362548828125, -1.46234130859375, -1.388427734375, -1.31451416015625, -1.2406005859375, -1.16668701171875, -1.0927734375, -1.01885986328125, -0.9449462890625, -0.87103271484375, -0.797119140625, -0.72320556640625, -0.6492919921875, -0.57537841796875, -0.50146484375, -0.42755126953125, -0.3536376953125, -0.27972412109375, -0.205810546875, -0.13189697265625, -0.0579833984375, 0.01593017578125, 0.08984375, 0.16375732421875, 0.2376708984375, 0.31158447265625, 0.385498046875, 0.45941162109375, 0.5333251953125, 0.60723876953125, 0.68115234375, 0.75506591796875, 0.8289794921875, 0.90289306640625, 0.976806640625, 1.05072021484375, 1.1246337890625, 1.19854736328125, 1.2724609375, 1.34637451171875, 1.4202880859375, 1.49420166015625, 1.568115234375, 1.64202880859375, 1.7159423828125, 1.78985595703125, 1.86376953125, 1.93768310546875, 2.0115966796875, 2.08551025390625, 2.159423828125, 2.23333740234375, 2.3072509765625, 2.38116455078125, 2.455078125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 2.0, 10.0, 11.0, 8.0, 16.0, 10.0, 9.0, 20.0, 24.0, 24.0, 28.0, 28.0, 31.0, 38.0, 31.0, 36.0, 42.0, 39.0, 35.0, 54.0, 56.0, 45.0, 45.0, 41.0, 38.0, 27.0, 42.0, 29.0, 30.0, 26.0, 23.0, 11.0, 17.0, 15.0, 13.0, 13.0, 9.0, 6.0, 4.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.4541015625, -1.4105987548828125, -1.367095947265625, -1.3235931396484375, -1.28009033203125, -1.2365875244140625, -1.193084716796875, -1.1495819091796875, -1.1060791015625, -1.0625762939453125, -1.019073486328125, -0.9755706787109375, -0.93206787109375, -0.8885650634765625, -0.845062255859375, -0.8015594482421875, -0.758056640625, -0.7145538330078125, -0.671051025390625, -0.6275482177734375, -0.58404541015625, -0.5405426025390625, -0.497039794921875, -0.4535369873046875, -0.4100341796875, -0.3665313720703125, -0.323028564453125, -0.2795257568359375, -0.23602294921875, -0.1925201416015625, -0.149017333984375, -0.1055145263671875, -0.06201171875, -0.0185089111328125, 0.024993896484375, 0.0684967041015625, 0.11199951171875, 0.1555023193359375, 0.199005126953125, 0.2425079345703125, 0.2860107421875, 0.3295135498046875, 0.373016357421875, 0.4165191650390625, 0.46002197265625, 0.5035247802734375, 0.547027587890625, 0.5905303955078125, 0.634033203125, 0.6775360107421875, 0.721038818359375, 0.7645416259765625, 0.80804443359375, 0.8515472412109375, 0.895050048828125, 0.9385528564453125, 0.9820556640625, 1.0255584716796875, 1.069061279296875, 1.1125640869140625, 1.15606689453125, 1.1995697021484375, 1.243072509765625, 1.2865753173828125, 1.330078125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 2.0, 4.0, 5.0, 5.0, 11.0, 10.0, 20.0, 24.0, 46.0, 76.0, 172.0, 364.0, 948.0, 2925.0, 12579.0, 139968.0, 849730.0, 33564.0, 5507.0, 1490.0, 537.0, 253.0, 111.0, 61.0, 39.0, 25.0, 20.0, 16.0, 9.0, 10.0, 4.0, 9.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3818359375, -0.3703498840332031, -0.35886383056640625, -0.3473777770996094, -0.3358917236328125, -0.3244056701660156, -0.31291961669921875, -0.3014335632324219, -0.289947509765625, -0.2784614562988281, -0.26697540283203125, -0.2554893493652344, -0.2440032958984375, -0.23251724243164062, -0.22103118896484375, -0.20954513549804688, -0.19805908203125, -0.18657302856445312, -0.17508697509765625, -0.16360092163085938, -0.1521148681640625, -0.14062881469726562, -0.12914276123046875, -0.11765670776367188, -0.106170654296875, -0.09468460083007812, -0.08319854736328125, -0.07171249389648438, -0.0602264404296875, -0.048740386962890625, -0.03725433349609375, -0.025768280029296875, -0.0142822265625, -0.002796173095703125, 0.00868988037109375, 0.020175933837890625, 0.0316619873046875, 0.043148040771484375, 0.05463409423828125, 0.06612014770507812, 0.077606201171875, 0.08909225463867188, 0.10057830810546875, 0.11206436157226562, 0.1235504150390625, 0.13503646850585938, 0.14652252197265625, 0.15800857543945312, 0.16949462890625, 0.18098068237304688, 0.19246673583984375, 0.20395278930664062, 0.2154388427734375, 0.22692489624023438, 0.23841094970703125, 0.24989700317382812, 0.261383056640625, 0.2728691101074219, 0.28435516357421875, 0.2958412170410156, 0.3073272705078125, 0.3188133239746094, 0.33029937744140625, 0.3417854309082031, 0.353271484375]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 1.0, 6.0, 8.0, 11.0, 18.0, 34.0, 43.0, 91.0, 256.0, 301.0, 91.0, 54.0, 28.0, 13.0, 12.0, 12.0, 8.0, 3.0, 2.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.240606307983398e-05, -6.0395337641239166e-05, -5.838461220264435e-05, -5.637388676404953e-05, -5.436316132545471e-05, -5.2352435886859894e-05, -5.0341710448265076e-05, -4.833098500967026e-05, -4.632025957107544e-05, -4.430953413248062e-05, -4.22988086938858e-05, -4.0288083255290985e-05, -3.827735781669617e-05, -3.626663237810135e-05, -3.425590693950653e-05, -3.224518150091171e-05, -3.0234456062316895e-05, -2.8223730623722076e-05, -2.6213005185127258e-05, -2.420227974653244e-05, -2.2191554307937622e-05, -2.0180828869342804e-05, -1.8170103430747986e-05, -1.6159377992153168e-05, -1.414865255355835e-05, -1.2137927114963531e-05, -1.0127201676368713e-05, -8.116476237773895e-06, -6.105750799179077e-06, -4.095025360584259e-06, -2.084299921989441e-06, -7.35744833946228e-08, 1.9371509552001953e-06, 3.9478763937950134e-06, 5.9586018323898315e-06, 7.96932727098465e-06, 9.980052709579468e-06, 1.1990778148174286e-05, 1.4001503586769104e-05, 1.6012229025363922e-05, 1.802295446395874e-05, 2.003367990255356e-05, 2.2044405341148376e-05, 2.4055130779743195e-05, 2.6065856218338013e-05, 2.807658165693283e-05, 3.008730709552765e-05, 3.209803253412247e-05, 3.4108757972717285e-05, 3.61194834113121e-05, 3.813020884990692e-05, 4.014093428850174e-05, 4.215165972709656e-05, 4.4162385165691376e-05, 4.6173110604286194e-05, 4.818383604288101e-05, 5.019456148147583e-05, 5.220528692007065e-05, 5.4216012358665466e-05, 5.6226737797260284e-05, 5.82374632358551e-05, 6.024818867444992e-05, 6.225891411304474e-05, 6.426963955163956e-05, 6.628036499023438e-05]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 10.0, 7.0, 9.0, 20.0, 22.0, 36.0, 53.0, 60.0, 148.0, 271.0, 562.0, 1355.0, 5568.0, 44041.0, 915266.0, 71124.0, 6955.0, 1655.0, 626.0, 314.0, 177.0, 104.0, 59.0, 37.0, 19.0, 16.0, 11.0, 2.0, 9.0, 7.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.36767578125, -0.35384368896484375, -0.3400115966796875, -0.32617950439453125, -0.312347412109375, -0.29851531982421875, -0.2846832275390625, -0.27085113525390625, -0.25701904296875, -0.24318695068359375, -0.2293548583984375, -0.21552276611328125, -0.201690673828125, -0.18785858154296875, -0.1740264892578125, -0.16019439697265625, -0.1463623046875, -0.13253021240234375, -0.1186981201171875, -0.10486602783203125, -0.091033935546875, -0.07720184326171875, -0.0633697509765625, -0.04953765869140625, -0.03570556640625, -0.02187347412109375, -0.0080413818359375, 0.00579071044921875, 0.019622802734375, 0.03345489501953125, 0.0472869873046875, 0.06111907958984375, 0.074951171875, 0.08878326416015625, 0.1026153564453125, 0.11644744873046875, 0.130279541015625, 0.14411163330078125, 0.1579437255859375, 0.17177581787109375, 0.18560791015625, 0.19944000244140625, 0.2132720947265625, 0.22710418701171875, 0.240936279296875, 0.25476837158203125, 0.2686004638671875, 0.28243255615234375, 0.2962646484375, 0.31009674072265625, 0.3239288330078125, 0.33776092529296875, 0.351593017578125, 0.36542510986328125, 0.3792572021484375, 0.39308929443359375, 0.40692138671875, 0.42075347900390625, 0.4345855712890625, 0.44841766357421875, 0.462249755859375, 0.47608184814453125, 0.4899139404296875, 0.5037460327148438, 0.517578125]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 2.0, 1.0, 6.0, 12.0, 13.0, 20.0, 48.0, 77.0, 178.0, 373.0, 141.0, 59.0, 35.0, 22.0, 12.0, 7.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2626953125, -0.2556629180908203, -0.24863052368164062, -0.24159812927246094, -0.23456573486328125, -0.22753334045410156, -0.22050094604492188, -0.2134685516357422, -0.2064361572265625, -0.1994037628173828, -0.19237136840820312, -0.18533897399902344, -0.17830657958984375, -0.17127418518066406, -0.16424179077148438, -0.1572093963623047, -0.150177001953125, -0.1431446075439453, -0.13611221313476562, -0.12907981872558594, -0.12204742431640625, -0.11501502990722656, -0.10798263549804688, -0.10095024108886719, -0.0939178466796875, -0.08688545227050781, -0.07985305786132812, -0.07282066345214844, -0.06578826904296875, -0.05875587463378906, -0.051723480224609375, -0.04469108581542969, -0.03765869140625, -0.030626296997070312, -0.023593902587890625, -0.016561508178710938, -0.00952911376953125, -0.0024967193603515625, 0.004535675048828125, 0.011568069458007812, 0.0186004638671875, 0.025632858276367188, 0.032665252685546875, 0.03969764709472656, 0.04673004150390625, 0.05376243591308594, 0.060794830322265625, 0.06782722473144531, 0.074859619140625, 0.08189201354980469, 0.08892440795898438, 0.09595680236816406, 0.10298919677734375, 0.11002159118652344, 0.11705398559570312, 0.12408638000488281, 0.1311187744140625, 0.1381511688232422, 0.14518356323242188, 0.15221595764160156, 0.15924835205078125, 0.16628074645996094, 0.17331314086914062, 0.1803455352783203, 0.1873779296875]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 12.0, 18.0, 39.0, 100.0, 234.0, 312.0, 151.0, 64.0, 35.0, 17.0, 16.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0284457206726074, -2.8633882999420166, -2.698330879211426, -2.533273696899414, -2.3682162761688232, -2.2031588554382324, -2.0381014347076416, -1.8730441331863403, -1.7079867124557495, -1.5429292917251587, -1.3778719902038574, -1.2128145694732666, -1.0477571487426758, -0.8826998472213745, -0.7176424264907837, -0.5525851249694824, -0.3875277042388916, -0.22247032821178436, -0.057412952184677124, 0.10764443874359131, 0.27270179986953735, 0.4377591609954834, 0.6028165817260742, 0.7678738832473755, 0.9329313039779663, 1.0979887247085571, 1.2630460262298584, 1.4281034469604492, 1.59316086769104, 1.7582181692123413, 1.9232755899429321, 2.0883328914642334, 2.253390312194824, 2.418447732925415, 2.583505153656006, 2.7485623359680176, 2.9136197566986084, 3.078677177429199, 3.24373459815979, 3.408792018890381, 3.5738492012023926, 3.7389066219329834, 3.903964042663574, 4.069021224975586, 4.234078884124756, 4.399136066436768, 4.5641937255859375, 4.729250907897949, 4.894308090209961, 5.059365272521973, 5.224422931671143, 5.389480113983154, 5.554537773132324, 5.719594955444336, 5.884652137756348, 6.049709796905518, 6.2147674560546875, 6.379824638366699, 6.544882297515869, 6.709939479827881, 6.874997138977051, 7.0400543212890625, 7.205111503601074, 7.370169162750244, 7.535226345062256]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 6.0, 5.0, 8.0, 11.0, 8.0, 14.0, 12.0, 13.0, 22.0, 20.0, 17.0, 26.0, 26.0, 28.0, 26.0, 32.0, 28.0, 29.0, 28.0, 51.0, 34.0, 33.0, 33.0, 45.0, 38.0, 40.0, 31.0, 26.0, 43.0, 31.0, 32.0, 29.0, 27.0, 14.0, 23.0, 12.0, 10.0, 14.0, 15.0, 11.0, 12.0, 10.0, 6.0, 10.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-1.9444060325622559, -1.8847922086715698, -1.8251783847808838, -1.7655645608901978, -1.7059507369995117, -1.6463369131088257, -1.5867230892181396, -1.5271092653274536, -1.4674954414367676, -1.4078816175460815, -1.3482677936553955, -1.2886539697647095, -1.2290401458740234, -1.1694263219833374, -1.1098124980926514, -1.0501986742019653, -0.9905848503112793, -0.9309710264205933, -0.8713572025299072, -0.8117433786392212, -0.7521295547485352, -0.6925157308578491, -0.6329019069671631, -0.573288083076477, -0.513674259185791, -0.454060435295105, -0.39444661140441895, -0.3348327875137329, -0.2752189636230469, -0.21560513973236084, -0.1559913158416748, -0.09637749195098877, -0.036763668060302734, 0.0228501558303833, 0.08246397972106934, 0.14207780361175537, 0.2016916275024414, 0.26130545139312744, 0.3209192752838135, 0.3805330991744995, 0.44014692306518555, 0.4997607469558716, 0.5593745708465576, 0.6189883947372437, 0.6786022186279297, 0.7382160425186157, 0.7978298664093018, 0.8574436902999878, 0.9170575141906738, 0.9766713380813599, 1.036285161972046, 1.095898985862732, 1.155512809753418, 1.215126633644104, 1.27474045753479, 1.334354281425476, 1.393968105316162, 1.4535819292068481, 1.5131957530975342, 1.5728095769882202, 1.6324234008789062, 1.6920372247695923, 1.7516510486602783, 1.8112648725509644, 1.8708786964416504]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 6.0, 2.0, 9.0, 7.0, 16.0, 18.0, 38.0, 35.0, 62.0, 96.0, 151.0, 259.0, 437.0, 757.0, 1415.0, 2520.0, 5225.0, 17767.0, 150203.0, 3615512.0, 364729.0, 21289.0, 7154.0, 2983.0, 1485.0, 818.0, 485.0, 290.0, 170.0, 108.0, 77.0, 47.0, 42.0, 21.0, 17.0, 7.0, 6.0, 6.0, 5.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9072265625, -1.846893310546875, -1.78656005859375, -1.726226806640625, -1.6658935546875, -1.605560302734375, -1.54522705078125, -1.484893798828125, -1.424560546875, -1.364227294921875, -1.30389404296875, -1.243560791015625, -1.1832275390625, -1.122894287109375, -1.06256103515625, -1.002227783203125, -0.94189453125, -0.881561279296875, -0.82122802734375, -0.760894775390625, -0.7005615234375, -0.640228271484375, -0.57989501953125, -0.519561767578125, -0.459228515625, -0.398895263671875, -0.33856201171875, -0.278228759765625, -0.2178955078125, -0.157562255859375, -0.09722900390625, -0.036895751953125, 0.0234375, 0.083770751953125, 0.14410400390625, 0.204437255859375, 0.2647705078125, 0.325103759765625, 0.38543701171875, 0.445770263671875, 0.506103515625, 0.566436767578125, 0.62677001953125, 0.687103271484375, 0.7474365234375, 0.807769775390625, 0.86810302734375, 0.928436279296875, 0.98876953125, 1.049102783203125, 1.10943603515625, 1.169769287109375, 1.2301025390625, 1.290435791015625, 1.35076904296875, 1.411102294921875, 1.471435546875, 1.531768798828125, 1.59210205078125, 1.652435302734375, 1.7127685546875, 1.773101806640625, 1.83343505859375, 1.893768310546875, 1.9541015625]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 7.0, 2.0, 6.0, 8.0, 10.0, 20.0, 19.0, 21.0, 34.0, 47.0, 47.0, 66.0, 60.0, 76.0, 76.0, 77.0, 69.0, 68.0, 65.0, 55.0, 47.0, 29.0, 22.0, 28.0, 17.0, 9.0, 6.0, 8.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.208984375, -1.1755828857421875, -1.142181396484375, -1.1087799072265625, -1.07537841796875, -1.0419769287109375, -1.008575439453125, -0.9751739501953125, -0.9417724609375, -0.9083709716796875, -0.874969482421875, -0.8415679931640625, -0.80816650390625, -0.7747650146484375, -0.741363525390625, -0.7079620361328125, -0.674560546875, -0.6411590576171875, -0.607757568359375, -0.5743560791015625, -0.54095458984375, -0.5075531005859375, -0.474151611328125, -0.4407501220703125, -0.4073486328125, -0.3739471435546875, -0.340545654296875, -0.3071441650390625, -0.27374267578125, -0.2403411865234375, -0.206939697265625, -0.1735382080078125, -0.14013671875, -0.1067352294921875, -0.073333740234375, -0.0399322509765625, -0.00653076171875, 0.0268707275390625, 0.060272216796875, 0.0936737060546875, 0.1270751953125, 0.1604766845703125, 0.193878173828125, 0.2272796630859375, 0.26068115234375, 0.2940826416015625, 0.327484130859375, 0.3608856201171875, 0.394287109375, 0.4276885986328125, 0.461090087890625, 0.4944915771484375, 0.52789306640625, 0.5612945556640625, 0.594696044921875, 0.6280975341796875, 0.6614990234375, 0.6949005126953125, 0.728302001953125, 0.7617034912109375, 0.79510498046875, 0.8285064697265625, 0.861907958984375, 0.8953094482421875, 0.9287109375]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 6.0, 4.0, 4.0, 23.0, 18.0, 23.0, 33.0, 39.0, 69.0, 105.0, 195.0, 360.0, 838.0, 2448.0, 8412.0, 45247.0, 3793443.0, 314737.0, 20619.0, 4856.0, 1591.0, 549.0, 247.0, 133.0, 79.0, 61.0, 43.0, 28.0, 20.0, 14.0, 5.0, 7.0, 5.0, 6.0, 3.0, 2.0, 4.0, 3.0, 3.0, 1.0, 0.0, 3.0], "bins": [-3.47265625, -3.38311767578125, -3.2935791015625, -3.20404052734375, -3.114501953125, -3.02496337890625, -2.9354248046875, -2.84588623046875, -2.75634765625, -2.66680908203125, -2.5772705078125, -2.48773193359375, -2.398193359375, -2.30865478515625, -2.2191162109375, -2.12957763671875, -2.0400390625, -1.95050048828125, -1.8609619140625, -1.77142333984375, -1.681884765625, -1.59234619140625, -1.5028076171875, -1.41326904296875, -1.32373046875, -1.23419189453125, -1.1446533203125, -1.05511474609375, -0.965576171875, -0.87603759765625, -0.7864990234375, -0.69696044921875, -0.607421875, -0.51788330078125, -0.4283447265625, -0.33880615234375, -0.249267578125, -0.15972900390625, -0.0701904296875, 0.01934814453125, 0.10888671875, 0.19842529296875, 0.2879638671875, 0.37750244140625, 0.467041015625, 0.55657958984375, 0.6461181640625, 0.73565673828125, 0.8251953125, 0.91473388671875, 1.0042724609375, 1.09381103515625, 1.183349609375, 1.27288818359375, 1.3624267578125, 1.45196533203125, 1.54150390625, 1.63104248046875, 1.7205810546875, 1.81011962890625, 1.899658203125, 1.98919677734375, 2.0787353515625, 2.16827392578125, 2.2578125]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 7.0, 3.0, 6.0, 15.0, 27.0, 16.0, 29.0, 52.0, 81.0, 245.0, 743.0, 1649.0, 747.0, 249.0, 74.0, 32.0, 31.0, 13.0, 10.0, 10.0, 7.0, 6.0, 3.0, 3.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.486572265625, -0.4628105163574219, -0.43904876708984375, -0.4152870178222656, -0.3915252685546875, -0.3677635192871094, -0.34400177001953125, -0.3202400207519531, -0.296478271484375, -0.2727165222167969, -0.24895477294921875, -0.22519302368164062, -0.2014312744140625, -0.17766952514648438, -0.15390777587890625, -0.13014602661132812, -0.10638427734375, -0.08262252807617188, -0.05886077880859375, -0.035099029541015625, -0.0113372802734375, 0.012424468994140625, 0.03618621826171875, 0.059947967529296875, 0.083709716796875, 0.10747146606445312, 0.13123321533203125, 0.15499496459960938, 0.1787567138671875, 0.20251846313476562, 0.22628021240234375, 0.2500419616699219, 0.2738037109375, 0.2975654602050781, 0.32132720947265625, 0.3450889587402344, 0.3688507080078125, 0.3926124572753906, 0.41637420654296875, 0.4401359558105469, 0.463897705078125, 0.4876594543457031, 0.5114212036132812, 0.5351829528808594, 0.5589447021484375, 0.5827064514160156, 0.6064682006835938, 0.6302299499511719, 0.65399169921875, 0.6777534484863281, 0.7015151977539062, 0.7252769470214844, 0.7490386962890625, 0.7728004455566406, 0.7965621948242188, 0.8203239440917969, 0.844085693359375, 0.8678474426269531, 0.8916091918945312, 0.9153709411621094, 0.9391326904296875, 0.9628944396972656, 0.9866561889648438, 1.0104179382324219, 1.0341796875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 1.0, 7.0, 6.0, 12.0, 15.0, 27.0, 33.0, 53.0, 78.0, 115.0, 139.0, 139.0, 124.0, 81.0, 59.0, 41.0, 22.0, 18.0, 12.0, 8.0, 2.0, 1.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.62961483001709, -2.5625107288360596, -2.4954066276550293, -2.428302526473999, -2.3611984252929688, -2.2940940856933594, -2.226990222930908, -2.159885883331299, -2.0927817821502686, -2.0256776809692383, -1.958573579788208, -1.8914694786071777, -1.824365258216858, -1.7572611570358276, -1.6901570558547974, -1.623052954673767, -1.5559488534927368, -1.4888447523117065, -1.4217406511306763, -1.3546364307403564, -1.2875323295593262, -1.220428228378296, -1.1533241271972656, -1.0862200260162354, -1.019115924835205, -0.9520118236541748, -0.8849076628684998, -0.8178035616874695, -0.7506994009017944, -0.6835952997207642, -0.6164911985397339, -0.5493870973587036, -0.48228275775909424, -0.4151786267757416, -0.3480744957923889, -0.28097039461135864, -0.21386626362800598, -0.14676213264465332, -0.07965803146362305, -0.012553900480270386, 0.054550230503082275, 0.12165435403585434, 0.1887584775686264, 0.25586259365081787, 0.32296672463417053, 0.3900708556175232, 0.45717495679855347, 0.5242791175842285, 0.5913832187652588, 0.6584873199462891, 0.7255914807319641, 0.7926955819129944, 0.8597997426986694, 0.9269038438796997, 0.99400794506073, 1.0611120462417603, 1.12821626663208, 1.1953203678131104, 1.2624244689941406, 1.329528570175171, 1.3966327905654907, 1.463736891746521, 1.5308409929275513, 1.5979450941085815, 1.6650491952896118]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 4.0, 3.0, 5.0, 5.0, 6.0, 7.0, 8.0, 11.0, 10.0, 24.0, 25.0, 27.0, 40.0, 31.0, 39.0, 53.0, 40.0, 43.0, 43.0, 45.0, 57.0, 49.0, 41.0, 46.0, 60.0, 36.0, 31.0, 34.0, 21.0, 28.0, 29.0, 26.0, 8.0, 12.0, 11.0, 10.0, 12.0, 7.0, 5.0, 7.0, 0.0, 7.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9882547855377197, -0.9553248286247253, -0.922394871711731, -0.8894649147987366, -0.8565349578857422, -0.823604941368103, -0.7906749844551086, -0.7577450275421143, -0.7248150706291199, -0.6918851137161255, -0.6589551568031311, -0.6260251998901367, -0.5930951833724976, -0.560165286064148, -0.5272352695465088, -0.4943053126335144, -0.46137535572052, -0.42844539880752563, -0.39551544189453125, -0.3625854551792145, -0.3296554982662201, -0.2967255413532257, -0.26379555463790894, -0.23086559772491455, -0.19793564081192017, -0.16500568389892578, -0.1320757120847702, -0.09914574772119522, -0.06621578335762024, -0.033285826444625854, -0.0003558546304702759, 0.0325741171836853, 0.06550419330596924, 0.09843415766954422, 0.1313641220331192, 0.16429409384727478, 0.19722405076026917, 0.23015400767326355, 0.2630839943885803, 0.2960139513015747, 0.3289439082145691, 0.3618738651275635, 0.39480382204055786, 0.42773380875587463, 0.460663765668869, 0.4935937225818634, 0.5265237092971802, 0.5594536662101746, 0.592383623123169, 0.6253135800361633, 0.6582435369491577, 0.6911734938621521, 0.7241034507751465, 0.7570334672927856, 0.78996342420578, 0.8228933811187744, 0.8558233380317688, 0.8887532949447632, 0.9216832518577576, 0.954613208770752, 0.9875432252883911, 1.0204731225967407, 1.0534031391143799, 1.0863330364227295, 1.1192630529403687]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 12.0, 8.0, 12.0, 21.0, 35.0, 45.0, 53.0, 102.0, 161.0, 223.0, 372.0, 706.0, 1299.0, 2778.0, 6736.0, 23649.0, 217912.0, 719673.0, 55169.0, 11492.0, 4061.0, 1772.0, 922.0, 491.0, 298.0, 182.0, 103.0, 92.0, 61.0, 38.0, 26.0, 15.0, 9.0, 9.0, 6.0, 5.0, 2.0, 3.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.626953125, -0.6062164306640625, -0.585479736328125, -0.5647430419921875, -0.54400634765625, -0.5232696533203125, -0.502532958984375, -0.4817962646484375, -0.4610595703125, -0.4403228759765625, -0.419586181640625, -0.3988494873046875, -0.37811279296875, -0.3573760986328125, -0.336639404296875, -0.3159027099609375, -0.295166015625, -0.2744293212890625, -0.253692626953125, -0.2329559326171875, -0.21221923828125, -0.1914825439453125, -0.170745849609375, -0.1500091552734375, -0.1292724609375, -0.1085357666015625, -0.087799072265625, -0.0670623779296875, -0.04632568359375, -0.0255889892578125, -0.004852294921875, 0.0158843994140625, 0.03662109375, 0.0573577880859375, 0.078094482421875, 0.0988311767578125, 0.11956787109375, 0.1403045654296875, 0.161041259765625, 0.1817779541015625, 0.2025146484375, 0.2232513427734375, 0.243988037109375, 0.2647247314453125, 0.28546142578125, 0.3061981201171875, 0.326934814453125, 0.3476715087890625, 0.368408203125, 0.3891448974609375, 0.409881591796875, 0.4306182861328125, 0.45135498046875, 0.4720916748046875, 0.492828369140625, 0.5135650634765625, 0.5343017578125, 0.5550384521484375, 0.575775146484375, 0.5965118408203125, 0.61724853515625, 0.6379852294921875, 0.658721923828125, 0.6794586181640625, 0.7001953125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 4.0, 5.0, 1.0, 5.0, 11.0, 16.0, 14.0, 24.0, 16.0, 28.0, 39.0, 39.0, 60.0, 57.0, 62.0, 56.0, 68.0, 68.0, 64.0, 63.0, 52.0, 47.0, 39.0, 32.0, 30.0, 29.0, 17.0, 11.0, 11.0, 14.0, 8.0, 7.0, 4.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7861328125, -0.7613601684570312, -0.7365875244140625, -0.7118148803710938, -0.687042236328125, -0.6622695922851562, -0.6374969482421875, -0.6127243041992188, -0.58795166015625, -0.5631790161132812, -0.5384063720703125, -0.5136337280273438, -0.488861083984375, -0.46408843994140625, -0.4393157958984375, -0.41454315185546875, -0.3897705078125, -0.36499786376953125, -0.3402252197265625, -0.31545257568359375, -0.290679931640625, -0.26590728759765625, -0.2411346435546875, -0.21636199951171875, -0.19158935546875, -0.16681671142578125, -0.1420440673828125, -0.11727142333984375, -0.092498779296875, -0.06772613525390625, -0.0429534912109375, -0.01818084716796875, 0.006591796875, 0.03136444091796875, 0.0561370849609375, 0.08090972900390625, 0.105682373046875, 0.13045501708984375, 0.1552276611328125, 0.18000030517578125, 0.20477294921875, 0.22954559326171875, 0.2543182373046875, 0.27909088134765625, 0.303863525390625, 0.32863616943359375, 0.3534088134765625, 0.37818145751953125, 0.4029541015625, 0.42772674560546875, 0.4524993896484375, 0.47727203369140625, 0.502044677734375, 0.5268173217773438, 0.5515899658203125, 0.5763626098632812, 0.60113525390625, 0.6259078979492188, 0.6506805419921875, 0.6754531860351562, 0.700225830078125, 0.7249984741210938, 0.7497711181640625, 0.7745437622070312, 0.79931640625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 6.0, 5.0, 10.0, 20.0, 34.0, 58.0, 116.0, 201.0, 431.0, 926.0, 2478.0, 8355.0, 43527.0, 558814.0, 389976.0, 32953.0, 6829.0, 2185.0, 887.0, 347.0, 173.0, 85.0, 44.0, 30.0, 17.0, 11.0, 12.0, 7.0, 5.0, 2.0, 2.0, 0.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.461181640625, -0.4471778869628906, -0.43317413330078125, -0.4191703796386719, -0.4051666259765625, -0.3911628723144531, -0.37715911865234375, -0.3631553649902344, -0.349151611328125, -0.3351478576660156, -0.32114410400390625, -0.3071403503417969, -0.2931365966796875, -0.2791328430175781, -0.26512908935546875, -0.2511253356933594, -0.23712158203125, -0.22311782836914062, -0.20911407470703125, -0.19511032104492188, -0.1811065673828125, -0.16710281372070312, -0.15309906005859375, -0.13909530639648438, -0.125091552734375, -0.11108779907226562, -0.09708404541015625, -0.08308029174804688, -0.0690765380859375, -0.055072784423828125, -0.04106903076171875, -0.027065277099609375, -0.0130615234375, 0.000942230224609375, 0.01494598388671875, 0.028949737548828125, 0.0429534912109375, 0.056957244873046875, 0.07096099853515625, 0.08496475219726562, 0.098968505859375, 0.11297225952148438, 0.12697601318359375, 0.14097976684570312, 0.1549835205078125, 0.16898727416992188, 0.18299102783203125, 0.19699478149414062, 0.21099853515625, 0.22500228881835938, 0.23900604248046875, 0.2530097961425781, 0.2670135498046875, 0.2810173034667969, 0.29502105712890625, 0.3090248107910156, 0.323028564453125, 0.3370323181152344, 0.35103607177734375, 0.3650398254394531, 0.3790435791015625, 0.3930473327636719, 0.40705108642578125, 0.4210548400878906, 0.43505859375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 7.0, 1.0, 3.0, 8.0, 5.0, 7.0, 9.0, 15.0, 13.0, 16.0, 15.0, 25.0, 20.0, 31.0, 32.0, 26.0, 42.0, 45.0, 36.0, 51.0, 48.0, 53.0, 52.0, 75.0, 41.0, 39.0, 37.0, 35.0, 30.0, 31.0, 25.0, 18.0, 21.0, 20.0, 11.0, 13.0, 7.0, 7.0, 11.0, 8.0, 10.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.3486328125, -1.3122634887695312, -1.2758941650390625, -1.2395248413085938, -1.203155517578125, -1.1667861938476562, -1.1304168701171875, -1.0940475463867188, -1.05767822265625, -1.0213088989257812, -0.9849395751953125, -0.9485702514648438, -0.912200927734375, -0.8758316040039062, -0.8394622802734375, -0.8030929565429688, -0.7667236328125, -0.7303543090820312, -0.6939849853515625, -0.6576156616210938, -0.621246337890625, -0.5848770141601562, -0.5485076904296875, -0.5121383666992188, -0.47576904296875, -0.43939971923828125, -0.4030303955078125, -0.36666107177734375, -0.330291748046875, -0.29392242431640625, -0.2575531005859375, -0.22118377685546875, -0.184814453125, -0.14844512939453125, -0.1120758056640625, -0.07570648193359375, -0.039337158203125, -0.00296783447265625, 0.0334014892578125, 0.06977081298828125, 0.10614013671875, 0.14250946044921875, 0.1788787841796875, 0.21524810791015625, 0.251617431640625, 0.28798675537109375, 0.3243560791015625, 0.36072540283203125, 0.3970947265625, 0.43346405029296875, 0.4698333740234375, 0.5062026977539062, 0.542572021484375, 0.5789413452148438, 0.6153106689453125, 0.6516799926757812, 0.68804931640625, 0.7244186401367188, 0.7607879638671875, 0.7971572875976562, 0.833526611328125, 0.8698959350585938, 0.9062652587890625, 0.9426345825195312, 0.97900390625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 7.0, 5.0, 9.0, 7.0, 15.0, 14.0, 29.0, 42.0, 74.0, 83.0, 140.0, 226.0, 352.0, 640.0, 1293.0, 2747.0, 6982.0, 21630.0, 99719.0, 662744.0, 199559.0, 34613.0, 10045.0, 3909.0, 1664.0, 831.0, 480.0, 235.0, 168.0, 96.0, 62.0, 40.0, 29.0, 21.0, 11.0, 14.0, 8.0, 4.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10595703125, -0.10261154174804688, -0.09926605224609375, -0.09592056274414062, -0.0925750732421875, -0.08922958374023438, -0.08588409423828125, -0.08253860473632812, -0.079193115234375, -0.07584762573242188, -0.07250213623046875, -0.06915664672851562, -0.0658111572265625, -0.062465667724609375, -0.05912017822265625, -0.055774688720703125, -0.05242919921875, -0.049083709716796875, -0.04573822021484375, -0.042392730712890625, -0.0390472412109375, -0.035701751708984375, -0.03235626220703125, -0.029010772705078125, -0.025665283203125, -0.022319793701171875, -0.01897430419921875, -0.015628814697265625, -0.0122833251953125, -0.008937835693359375, -0.00559234619140625, -0.002246856689453125, 0.0010986328125, 0.004444122314453125, 0.00778961181640625, 0.011135101318359375, 0.0144805908203125, 0.017826080322265625, 0.02117156982421875, 0.024517059326171875, 0.027862548828125, 0.031208038330078125, 0.03455352783203125, 0.037899017333984375, 0.0412445068359375, 0.044589996337890625, 0.04793548583984375, 0.051280975341796875, 0.05462646484375, 0.057971954345703125, 0.06131744384765625, 0.06466293334960938, 0.0680084228515625, 0.07135391235351562, 0.07469940185546875, 0.07804489135742188, 0.081390380859375, 0.08473587036132812, 0.08808135986328125, 0.09142684936523438, 0.0947723388671875, 0.09811782836914062, 0.10146331787109375, 0.10480880737304688, 0.108154296875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 4.0, 9.0, 10.0, 11.0, 17.0, 25.0, 40.0, 54.0, 85.0, 113.0, 192.0, 154.0, 81.0, 49.0, 39.0, 27.0, 32.0, 9.0, 11.0, 9.0, 13.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.539987564086914e-05, -7.350090891122818e-05, -7.160194218158722e-05, -6.970297545194626e-05, -6.78040087223053e-05, -6.590504199266434e-05, -6.400607526302338e-05, -6.210710853338242e-05, -6.0208141803741455e-05, -5.8309175074100494e-05, -5.6410208344459534e-05, -5.451124161481857e-05, -5.261227488517761e-05, -5.071330815553665e-05, -4.881434142589569e-05, -4.691537469625473e-05, -4.501640796661377e-05, -4.311744123697281e-05, -4.121847450733185e-05, -3.931950777769089e-05, -3.742054104804993e-05, -3.5521574318408966e-05, -3.3622607588768005e-05, -3.1723640859127045e-05, -2.9824674129486084e-05, -2.7925707399845123e-05, -2.6026740670204163e-05, -2.4127773940563202e-05, -2.222880721092224e-05, -2.032984048128128e-05, -1.843087375164032e-05, -1.653190702199936e-05, -1.4632940292358398e-05, -1.2733973562717438e-05, -1.0835006833076477e-05, -8.936040103435516e-06, -7.037073373794556e-06, -5.138106644153595e-06, -3.2391399145126343e-06, -1.3401731848716736e-06, 5.587935447692871e-07, 2.457760274410248e-06, 4.3567270040512085e-06, 6.255693733692169e-06, 8.15466046333313e-06, 1.005362719297409e-05, 1.1952593922615051e-05, 1.3851560652256012e-05, 1.5750527381896973e-05, 1.7649494111537933e-05, 1.9548460841178894e-05, 2.1447427570819855e-05, 2.3346394300460815e-05, 2.5245361030101776e-05, 2.7144327759742737e-05, 2.9043294489383698e-05, 3.094226121902466e-05, 3.284122794866562e-05, 3.474019467830658e-05, 3.663916140794754e-05, 3.85381281375885e-05, 4.043709486722946e-05, 4.233606159687042e-05, 4.423502832651138e-05, 4.6133995056152344e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 5.0, 2.0, 11.0, 11.0, 14.0, 14.0, 28.0, 36.0, 59.0, 96.0, 171.0, 209.0, 344.0, 593.0, 978.0, 1552.0, 2726.0, 5051.0, 9586.0, 19531.0, 43465.0, 113458.0, 389513.0, 298276.0, 90794.0, 36319.0, 16905.0, 8282.0, 4415.0, 2454.0, 1446.0, 805.0, 533.0, 272.0, 204.0, 144.0, 80.0, 45.0, 47.0, 28.0, 17.0, 14.0, 8.0, 5.0, 4.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.06494140625, -0.06276893615722656, -0.060596466064453125, -0.05842399597167969, -0.05625152587890625, -0.05407905578613281, -0.051906585693359375, -0.04973411560058594, -0.0475616455078125, -0.04538917541503906, -0.043216705322265625, -0.04104423522949219, -0.03887176513671875, -0.03669929504394531, -0.034526824951171875, -0.03235435485839844, -0.030181884765625, -0.028009414672851562, -0.025836944580078125, -0.023664474487304688, -0.02149200439453125, -0.019319534301757812, -0.017147064208984375, -0.014974594116210938, -0.0128021240234375, -0.010629653930664062, -0.008457183837890625, -0.0062847137451171875, -0.00411224365234375, -0.0019397735595703125, 0.000232696533203125, 0.0024051666259765625, 0.00457763671875, 0.0067501068115234375, 0.008922576904296875, 0.011095046997070312, 0.01326751708984375, 0.015439987182617188, 0.017612457275390625, 0.019784927368164062, 0.0219573974609375, 0.024129867553710938, 0.026302337646484375, 0.028474807739257812, 0.03064727783203125, 0.03281974792480469, 0.034992218017578125, 0.03716468811035156, 0.039337158203125, 0.04150962829589844, 0.043682098388671875, 0.04585456848144531, 0.04802703857421875, 0.05019950866699219, 0.052371978759765625, 0.05454444885253906, 0.0567169189453125, 0.05888938903808594, 0.061061859130859375, 0.06323432922363281, 0.06540679931640625, 0.06757926940917969, 0.06975173950195312, 0.07192420959472656, 0.0740966796875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 7.0, 2.0, 10.0, 6.0, 8.0, 10.0, 15.0, 18.0, 23.0, 24.0, 23.0, 29.0, 39.0, 59.0, 64.0, 62.0, 89.0, 83.0, 83.0, 59.0, 51.0, 41.0, 38.0, 37.0, 19.0, 17.0, 16.0, 16.0, 13.0, 7.0, 7.0, 10.0, 4.0, 3.0, 5.0, 1.0, 2.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0210113525390625, -0.02039480209350586, -0.01977825164794922, -0.019161701202392578, -0.018545150756835938, -0.017928600311279297, -0.017312049865722656, -0.016695499420166016, -0.016078948974609375, -0.015462398529052734, -0.014845848083496094, -0.014229297637939453, -0.013612747192382812, -0.012996196746826172, -0.012379646301269531, -0.01176309585571289, -0.01114654541015625, -0.01052999496459961, -0.009913444519042969, -0.009296894073486328, -0.008680343627929688, -0.008063793182373047, -0.007447242736816406, -0.006830692291259766, -0.006214141845703125, -0.005597591400146484, -0.004981040954589844, -0.004364490509033203, -0.0037479400634765625, -0.003131389617919922, -0.0025148391723632812, -0.0018982887268066406, -0.00128173828125, -0.0006651878356933594, -4.863739013671875e-05, 0.0005679130554199219, 0.0011844635009765625, 0.0018010139465332031, 0.0024175643920898438, 0.0030341148376464844, 0.003650665283203125, 0.004267215728759766, 0.004883766174316406, 0.005500316619873047, 0.0061168670654296875, 0.006733417510986328, 0.007349967956542969, 0.00796651840209961, 0.00858306884765625, 0.00919961929321289, 0.009816169738769531, 0.010432720184326172, 0.011049270629882812, 0.011665821075439453, 0.012282371520996094, 0.012898921966552734, 0.013515472412109375, 0.014132022857666016, 0.014748573303222656, 0.015365123748779297, 0.015981674194335938, 0.016598224639892578, 0.01721477508544922, 0.01783132553100586, 0.0184478759765625]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 9.0, 7.0, 8.0, 6.0, 16.0, 34.0, 35.0, 58.0, 68.0, 110.0, 137.0, 140.0, 116.0, 69.0, 60.0, 46.0, 27.0, 18.0, 10.0, 7.0, 7.0, 2.0, 3.0, 5.0, 7.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.1575431823730469, -1.1226516962051392, -1.087760090827942, -1.0528686046600342, -1.0179771184921265, -0.9830855131149292, -0.9481940269470215, -0.913302481174469, -0.8784109354019165, -0.843519389629364, -0.8086279034614563, -0.7737363576889038, -0.7388448119163513, -0.7039532661437988, -0.6690617799758911, -0.6341702342033386, -0.5992787480354309, -0.5643872022628784, -0.5294957160949707, -0.4946041703224182, -0.4597126245498657, -0.4248211085796356, -0.3899295926094055, -0.355038046836853, -0.3201465308666229, -0.2852550148963928, -0.25036346912384033, -0.21547195315361023, -0.18058042228221893, -0.14568889141082764, -0.11079737544059753, -0.07590584456920624, -0.04101431369781494, -0.0061227865517139435, 0.028768740594387054, 0.06366026401519775, 0.09855179488658905, 0.13344332575798035, 0.16833484172821045, 0.20322637259960175, 0.23811790347099304, 0.27300941944122314, 0.30790096521377563, 0.34279248118400574, 0.37768399715423584, 0.41257554292678833, 0.44746705889701843, 0.48235857486724854, 0.517250120639801, 0.5521416664123535, 0.5870331525802612, 0.6219246983528137, 0.6568162441253662, 0.6917077302932739, 0.7265992760658264, 0.7614908218383789, 0.7963823080062866, 0.8312738537788391, 0.8661653399467468, 0.9010568857192993, 0.9359484314918518, 0.9708399772644043, 1.005731463432312, 1.0406229496002197, 1.075514554977417]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 6.0, 7.0, 6.0, 7.0, 12.0, 15.0, 13.0, 35.0, 38.0, 45.0, 46.0, 63.0, 68.0, 56.0, 71.0, 74.0, 61.0, 77.0, 56.0, 50.0, 37.0, 36.0, 36.0, 22.0, 13.0, 18.0, 12.0, 8.0, 9.0, 5.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9620012044906616, -0.9360266327857971, -0.9100520610809326, -0.8840775489807129, -0.8581029772758484, -0.8321284055709839, -0.8061538934707642, -0.7801793217658997, -0.7542047500610352, -0.7282301783561707, -0.7022556066513062, -0.6762810945510864, -0.6503065228462219, -0.6243319511413574, -0.5983574390411377, -0.5723828673362732, -0.5464082956314087, -0.5204337239265442, -0.4944591820240021, -0.46848464012145996, -0.44251006841659546, -0.41653549671173096, -0.39056095480918884, -0.36458641290664673, -0.3386118412017822, -0.3126372694969177, -0.2866627275943756, -0.2606881856918335, -0.234713613986969, -0.20873905718326569, -0.18276450037956238, -0.15678994357585907, -0.13081538677215576, -0.10484082996845245, -0.07886627316474915, -0.05289171636104584, -0.02691715955734253, -0.0009426027536392212, 0.025031954050064087, 0.051006510853767395, 0.0769810676574707, 0.10295562446117401, 0.12893018126487732, 0.15490473806858063, 0.18087929487228394, 0.20685385167598724, 0.23282840847969055, 0.25880295038223267, 0.28477752208709717, 0.31075209379196167, 0.3367266356945038, 0.3627011775970459, 0.3886757493019104, 0.4146503210067749, 0.440624862909317, 0.46659940481185913, 0.49257397651672363, 0.5185485482215881, 0.5445231199264526, 0.5704976320266724, 0.5964722037315369, 0.6224467754364014, 0.6484212875366211, 0.6743958592414856, 0.7003704309463501]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 6.0, 8.0, 4.0, 16.0, 27.0, 22.0, 43.0, 73.0, 118.0, 198.0, 325.0, 635.0, 1197.0, 2264.0, 5187.0, 14524.0, 94261.0, 842424.0, 65874.0, 12410.0, 4610.0, 2062.0, 989.0, 517.0, 292.0, 191.0, 99.0, 64.0, 34.0, 23.0, 19.0, 20.0, 4.0, 8.0, 4.0, 0.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2939453125, -1.2387237548828125, -1.183502197265625, -1.1282806396484375, -1.07305908203125, -1.0178375244140625, -0.962615966796875, -0.9073944091796875, -0.8521728515625, -0.7969512939453125, -0.741729736328125, -0.6865081787109375, -0.63128662109375, -0.5760650634765625, -0.520843505859375, -0.4656219482421875, -0.410400390625, -0.3551788330078125, -0.299957275390625, -0.2447357177734375, -0.18951416015625, -0.1342926025390625, -0.079071044921875, -0.0238494873046875, 0.0313720703125, 0.0865936279296875, 0.141815185546875, 0.1970367431640625, 0.25225830078125, 0.3074798583984375, 0.362701416015625, 0.4179229736328125, 0.47314453125, 0.5283660888671875, 0.583587646484375, 0.6388092041015625, 0.69403076171875, 0.7492523193359375, 0.804473876953125, 0.8596954345703125, 0.9149169921875, 0.9701385498046875, 1.025360107421875, 1.0805816650390625, 1.13580322265625, 1.1910247802734375, 1.246246337890625, 1.3014678955078125, 1.356689453125, 1.4119110107421875, 1.467132568359375, 1.5223541259765625, 1.57757568359375, 1.6327972412109375, 1.688018798828125, 1.7432403564453125, 1.7984619140625, 1.8536834716796875, 1.908905029296875, 1.9641265869140625, 2.01934814453125, 2.0745697021484375, 2.129791259765625, 2.1850128173828125, 2.240234375]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 7.0, 3.0, 6.0, 4.0, 6.0, 10.0, 15.0, 18.0, 16.0, 32.0, 55.0, 51.0, 67.0, 60.0, 87.0, 69.0, 74.0, 66.0, 75.0, 54.0, 52.0, 41.0, 36.0, 25.0, 22.0, 13.0, 13.0, 11.0, 5.0, 9.0, 7.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.095703125, -2.0403900146484375, -1.985076904296875, -1.9297637939453125, -1.87445068359375, -1.8191375732421875, -1.763824462890625, -1.7085113525390625, -1.6531982421875, -1.5978851318359375, -1.542572021484375, -1.4872589111328125, -1.43194580078125, -1.3766326904296875, -1.321319580078125, -1.2660064697265625, -1.210693359375, -1.1553802490234375, -1.100067138671875, -1.0447540283203125, -0.98944091796875, -0.9341278076171875, -0.878814697265625, -0.8235015869140625, -0.7681884765625, -0.7128753662109375, -0.657562255859375, -0.6022491455078125, -0.54693603515625, -0.4916229248046875, -0.436309814453125, -0.3809967041015625, -0.32568359375, -0.2703704833984375, -0.215057373046875, -0.1597442626953125, -0.10443115234375, -0.0491180419921875, 0.006195068359375, 0.0615081787109375, 0.1168212890625, 0.1721343994140625, 0.227447509765625, 0.2827606201171875, 0.33807373046875, 0.3933868408203125, 0.448699951171875, 0.5040130615234375, 0.559326171875, 0.6146392822265625, 0.669952392578125, 0.7252655029296875, 0.78057861328125, 0.8358917236328125, 0.891204833984375, 0.9465179443359375, 1.0018310546875, 1.0571441650390625, 1.112457275390625, 1.1677703857421875, 1.22308349609375, 1.2783966064453125, 1.333709716796875, 1.3890228271484375, 1.4443359375]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 2.0, 2.0, 1.0, 4.0, 3.0, 3.0, 16.0, 2.0, 13.0, 22.0, 13.0, 28.0, 35.0, 46.0, 94.0, 134.0, 176.0, 377.0, 642.0, 1132.0, 2330.0, 4767.0, 12747.0, 53016.0, 710364.0, 221088.0, 25985.0, 8110.0, 3493.0, 1759.0, 899.0, 505.0, 279.0, 159.0, 83.0, 79.0, 49.0, 40.0, 21.0, 13.0, 6.0, 7.0, 5.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1240234375, -1.0835723876953125, -1.043121337890625, -1.0026702880859375, -0.96221923828125, -0.9217681884765625, -0.881317138671875, -0.8408660888671875, -0.8004150390625, -0.7599639892578125, -0.719512939453125, -0.6790618896484375, -0.63861083984375, -0.5981597900390625, -0.557708740234375, -0.5172576904296875, -0.476806640625, -0.4363555908203125, -0.395904541015625, -0.3554534912109375, -0.31500244140625, -0.2745513916015625, -0.234100341796875, -0.1936492919921875, -0.1531982421875, -0.1127471923828125, -0.072296142578125, -0.0318450927734375, 0.00860595703125, 0.0490570068359375, 0.089508056640625, 0.1299591064453125, 0.17041015625, 0.2108612060546875, 0.251312255859375, 0.2917633056640625, 0.33221435546875, 0.3726654052734375, 0.413116455078125, 0.4535675048828125, 0.4940185546875, 0.5344696044921875, 0.574920654296875, 0.6153717041015625, 0.65582275390625, 0.6962738037109375, 0.736724853515625, 0.7771759033203125, 0.817626953125, 0.8580780029296875, 0.898529052734375, 0.9389801025390625, 0.97943115234375, 1.0198822021484375, 1.060333251953125, 1.1007843017578125, 1.1412353515625, 1.1816864013671875, 1.222137451171875, 1.2625885009765625, 1.30303955078125, 1.3434906005859375, 1.383941650390625, 1.4243927001953125, 1.46484375]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 5.0, 9.0, 10.0, 12.0, 9.0, 15.0, 18.0, 24.0, 32.0, 37.0, 37.0, 46.0, 49.0, 40.0, 48.0, 48.0, 53.0, 41.0, 54.0, 56.0, 52.0, 37.0, 39.0, 36.0, 24.0, 24.0, 23.0, 21.0, 18.0, 15.0, 14.0, 7.0, 15.0, 11.0, 2.0, 5.0, 3.0, 2.0, 4.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4306640625, -1.3872222900390625, -1.343780517578125, -1.3003387451171875, -1.25689697265625, -1.2134552001953125, -1.170013427734375, -1.1265716552734375, -1.0831298828125, -1.0396881103515625, -0.996246337890625, -0.9528045654296875, -0.90936279296875, -0.8659210205078125, -0.822479248046875, -0.7790374755859375, -0.735595703125, -0.6921539306640625, -0.648712158203125, -0.6052703857421875, -0.56182861328125, -0.5183868408203125, -0.474945068359375, -0.4315032958984375, -0.3880615234375, -0.3446197509765625, -0.301177978515625, -0.2577362060546875, -0.21429443359375, -0.1708526611328125, -0.127410888671875, -0.0839691162109375, -0.04052734375, 0.0029144287109375, 0.046356201171875, 0.0897979736328125, 0.13323974609375, 0.1766815185546875, 0.220123291015625, 0.2635650634765625, 0.3070068359375, 0.3504486083984375, 0.393890380859375, 0.4373321533203125, 0.48077392578125, 0.5242156982421875, 0.567657470703125, 0.6110992431640625, 0.654541015625, 0.6979827880859375, 0.741424560546875, 0.7848663330078125, 0.82830810546875, 0.8717498779296875, 0.915191650390625, 0.9586334228515625, 1.0020751953125, 1.0455169677734375, 1.088958740234375, 1.1324005126953125, 1.17584228515625, 1.2192840576171875, 1.262725830078125, 1.3061676025390625, 1.349609375]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 5.0, 9.0, 9.0, 19.0, 23.0, 32.0, 55.0, 76.0, 124.0, 200.0, 254.0, 452.0, 817.0, 1416.0, 2925.0, 7840.0, 33002.0, 701655.0, 264636.0, 23239.0, 6206.0, 2541.0, 1105.0, 679.0, 444.0, 286.0, 186.0, 123.0, 57.0, 44.0, 22.0, 16.0, 15.0, 14.0, 8.0, 8.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.448486328125, -0.4356346130371094, -0.42278289794921875, -0.4099311828613281, -0.3970794677734375, -0.3842277526855469, -0.37137603759765625, -0.3585243225097656, -0.345672607421875, -0.3328208923339844, -0.31996917724609375, -0.3071174621582031, -0.2942657470703125, -0.2814140319824219, -0.26856231689453125, -0.2557106018066406, -0.24285888671875, -0.23000717163085938, -0.21715545654296875, -0.20430374145507812, -0.1914520263671875, -0.17860031127929688, -0.16574859619140625, -0.15289688110351562, -0.140045166015625, -0.12719345092773438, -0.11434173583984375, -0.10149002075195312, -0.0886383056640625, -0.07578659057617188, -0.06293487548828125, -0.050083160400390625, -0.0372314453125, -0.024379730224609375, -0.01152801513671875, 0.001323699951171875, 0.0141754150390625, 0.027027130126953125, 0.03987884521484375, 0.052730560302734375, 0.065582275390625, 0.07843399047851562, 0.09128570556640625, 0.10413742065429688, 0.1169891357421875, 0.12984085083007812, 0.14269256591796875, 0.15554428100585938, 0.16839599609375, 0.18124771118164062, 0.19409942626953125, 0.20695114135742188, 0.2198028564453125, 0.23265457153320312, 0.24550628662109375, 0.2583580017089844, 0.271209716796875, 0.2840614318847656, 0.29691314697265625, 0.3097648620605469, 0.3226165771484375, 0.3354682922363281, 0.34832000732421875, 0.3611717224121094, 0.3740234375]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 8.0, 11.0, 18.0, 24.0, 82.0, 198.0, 423.0, 127.0, 55.0, 25.0, 11.0, 6.0, 5.0, 2.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.896257400512695e-05, -6.571691483259201e-05, -6.247125566005707e-05, -5.9225596487522125e-05, -5.597993731498718e-05, -5.273427814245224e-05, -4.94886189699173e-05, -4.6242959797382355e-05, -4.299730062484741e-05, -3.975164145231247e-05, -3.650598227977753e-05, -3.3260323107242584e-05, -3.001466393470764e-05, -2.67690047621727e-05, -2.3523345589637756e-05, -2.0277686417102814e-05, -1.703202724456787e-05, -1.3786368072032928e-05, -1.0540708899497986e-05, -7.295049726963043e-06, -4.049390554428101e-06, -8.03731381893158e-07, 2.4419277906417847e-06, 5.687586963176727e-06, 8.93324613571167e-06, 1.2178905308246613e-05, 1.5424564480781555e-05, 1.8670223653316498e-05, 2.191588282585144e-05, 2.5161541998386383e-05, 2.8407201170921326e-05, 3.165286034345627e-05, 3.489851951599121e-05, 3.8144178688526154e-05, 4.1389837861061096e-05, 4.463549703359604e-05, 4.788115620613098e-05, 5.1126815378665924e-05, 5.437247455120087e-05, 5.761813372373581e-05, 6.086379289627075e-05, 6.41094520688057e-05, 6.735511124134064e-05, 7.060077041387558e-05, 7.384642958641052e-05, 7.709208875894547e-05, 8.033774793148041e-05, 8.358340710401535e-05, 8.682906627655029e-05, 9.007472544908524e-05, 9.332038462162018e-05, 9.656604379415512e-05, 9.981170296669006e-05, 0.000103057362139225, 0.00010630302131175995, 0.00010954868048429489, 0.00011279433965682983, 0.00011603999882936478, 0.00011928565800189972, 0.00012253131717443466, 0.0001257769763469696, 0.00012902263551950455, 0.0001322682946920395, 0.00013551395386457443, 0.00013875961303710938]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 5.0, 6.0, 12.0, 6.0, 5.0, 34.0, 27.0, 37.0, 73.0, 93.0, 134.0, 193.0, 263.0, 402.0, 621.0, 1145.0, 2020.0, 3806.0, 8860.0, 30562.0, 311077.0, 627417.0, 41242.0, 10510.0, 4344.0, 2306.0, 1257.0, 701.0, 428.0, 298.0, 217.0, 148.0, 100.0, 68.0, 50.0, 30.0, 16.0, 14.0, 13.0, 6.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.385498046875, -0.37384796142578125, -0.3621978759765625, -0.35054779052734375, -0.338897705078125, -0.32724761962890625, -0.3155975341796875, -0.30394744873046875, -0.29229736328125, -0.28064727783203125, -0.2689971923828125, -0.25734710693359375, -0.245697021484375, -0.23404693603515625, -0.2223968505859375, -0.21074676513671875, -0.1990966796875, -0.18744659423828125, -0.1757965087890625, -0.16414642333984375, -0.152496337890625, -0.14084625244140625, -0.1291961669921875, -0.11754608154296875, -0.10589599609375, -0.09424591064453125, -0.0825958251953125, -0.07094573974609375, -0.059295654296875, -0.04764556884765625, -0.0359954833984375, -0.02434539794921875, -0.0126953125, -0.00104522705078125, 0.0106048583984375, 0.02225494384765625, 0.033905029296875, 0.04555511474609375, 0.0572052001953125, 0.06885528564453125, 0.08050537109375, 0.09215545654296875, 0.1038055419921875, 0.11545562744140625, 0.127105712890625, 0.13875579833984375, 0.1504058837890625, 0.16205596923828125, 0.1737060546875, 0.18535614013671875, 0.1970062255859375, 0.20865631103515625, 0.220306396484375, 0.23195648193359375, 0.2436065673828125, 0.25525665283203125, 0.26690673828125, 0.27855682373046875, 0.2902069091796875, 0.30185699462890625, 0.313507080078125, 0.32515716552734375, 0.3368072509765625, 0.34845733642578125, 0.360107421875]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 7.0, 10.0, 5.0, 20.0, 12.0, 12.0, 20.0, 22.0, 28.0, 47.0, 77.0, 79.0, 108.0, 158.0, 91.0, 65.0, 55.0, 40.0, 35.0, 22.0, 8.0, 15.0, 14.0, 10.0, 9.0, 10.0, 5.0, 1.0, 2.0, 1.0, 5.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.06842041015625, -0.06546783447265625, -0.0625152587890625, -0.05956268310546875, -0.056610107421875, -0.05365753173828125, -0.0507049560546875, -0.04775238037109375, -0.0447998046875, -0.04184722900390625, -0.0388946533203125, -0.03594207763671875, -0.032989501953125, -0.03003692626953125, -0.0270843505859375, -0.02413177490234375, -0.02117919921875, -0.01822662353515625, -0.0152740478515625, -0.01232147216796875, -0.009368896484375, -0.00641632080078125, -0.0034637451171875, -0.00051116943359375, 0.00244140625, 0.00539398193359375, 0.0083465576171875, 0.01129913330078125, 0.014251708984375, 0.01720428466796875, 0.0201568603515625, 0.02310943603515625, 0.02606201171875, 0.02901458740234375, 0.0319671630859375, 0.03491973876953125, 0.037872314453125, 0.04082489013671875, 0.0437774658203125, 0.04673004150390625, 0.0496826171875, 0.05263519287109375, 0.0555877685546875, 0.05854034423828125, 0.061492919921875, 0.06444549560546875, 0.0673980712890625, 0.07035064697265625, 0.07330322265625, 0.07625579833984375, 0.0792083740234375, 0.08216094970703125, 0.085113525390625, 0.08806610107421875, 0.0910186767578125, 0.09397125244140625, 0.096923828125, 0.09987640380859375, 0.1028289794921875, 0.10578155517578125, 0.108734130859375, 0.11168670654296875, 0.1146392822265625, 0.11759185791015625, 0.12054443359375]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 6.0, 8.0, 17.0, 34.0, 20.0, 45.0, 50.0, 79.0, 104.0, 100.0, 137.0, 103.0, 97.0, 53.0, 41.0, 31.0, 16.0, 16.0, 12.0, 7.0, 5.0, 9.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-2.9285340309143066, -2.860914945602417, -2.7932960987091064, -2.725677013397217, -2.658057928085327, -2.5904388427734375, -2.522819995880127, -2.4552009105682373, -2.3875818252563477, -2.319962739944458, -2.2523438930511475, -2.184724807739258, -2.117105722427368, -2.0494866371154785, -1.981867790222168, -1.9142487049102783, -1.8466298580169678, -1.7790108919143677, -1.711391806602478, -1.643772840499878, -1.5761537551879883, -1.5085347890853882, -1.440915822982788, -1.3732967376708984, -1.3056777715682983, -1.2380588054656982, -1.1704397201538086, -1.1028207540512085, -1.0352017879486084, -0.9675827026367188, -0.8999637365341187, -0.8323447108268738, -0.7647258043289185, -0.6971067786216736, -0.6294877529144287, -0.5618687868118286, -0.49424976110458374, -0.42663073539733887, -0.3590117394924164, -0.2913927435874939, -0.22377371788024902, -0.15615470707416534, -0.08853569626808167, -0.020916685461997986, 0.04670232534408569, 0.11432135105133057, 0.18194034695625305, 0.24955934286117554, 0.3171783685684204, 0.3847973942756653, 0.45241639018058777, 0.5200353860855103, 0.5876544117927551, 0.6552734375, 0.7228924036026001, 0.790511429309845, 0.8581304550170898, 0.9257494807243347, 0.9933685064315796, 1.0609874725341797, 1.1286065578460693, 1.1962255239486694, 1.2638444900512695, 1.3314635753631592, 1.3990825414657593]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 5.0, 4.0, 2.0, 5.0, 6.0, 9.0, 11.0, 16.0, 16.0, 11.0, 28.0, 22.0, 30.0, 19.0, 29.0, 25.0, 31.0, 26.0, 42.0, 38.0, 34.0, 38.0, 48.0, 38.0, 27.0, 38.0, 38.0, 40.0, 40.0, 36.0, 33.0, 31.0, 28.0, 20.0, 20.0, 20.0, 10.0, 16.0, 17.0, 17.0, 12.0, 8.0, 6.0, 8.0, 1.0, 4.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.734708309173584, -1.677946925163269, -1.621185541152954, -1.5644241571426392, -1.5076627731323242, -1.4509012699127197, -1.3941398859024048, -1.3373785018920898, -1.280617117881775, -1.22385573387146, -1.167094349861145, -1.11033296585083, -1.0535714626312256, -0.9968101382255554, -0.9400486946105957, -0.8832873106002808, -0.8265259265899658, -0.7697645425796509, -0.7130031585693359, -0.6562417149543762, -0.5994803309440613, -0.5427189469337463, -0.485957533121109, -0.4291961193084717, -0.37243473529815674, -0.3156733512878418, -0.25891193747520447, -0.20215053856372833, -0.1453891396522522, -0.08862775564193726, -0.03186634182929993, 0.024895071983337402, 0.0816565752029419, 0.13841797411441803, 0.19517937302589417, 0.2519407868385315, 0.30870217084884644, 0.3654635548591614, 0.4222249686717987, 0.47898638248443604, 0.535747766494751, 0.5925091505050659, 0.6492705345153809, 0.7060319781303406, 0.7627933621406555, 0.8195547461509705, 0.8763161897659302, 0.9330775737762451, 0.9898389577865601, 1.046600341796875, 1.10336172580719, 1.1601231098175049, 1.2168846130371094, 1.2736458778381348, 1.3304073810577393, 1.3871687650680542, 1.4439301490783691, 1.500691533088684, 1.557452917098999, 1.614214301109314, 1.670975685119629, 1.7277371883392334, 1.7844985723495483, 1.8412599563598633, 1.8980213403701782]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 3.0, 6.0, 6.0, 12.0, 9.0, 20.0, 25.0, 28.0, 40.0, 50.0, 70.0, 98.0, 146.0, 225.0, 361.0, 536.0, 870.0, 1553.0, 3030.0, 6471.0, 18384.0, 84824.0, 2029415.0, 1929681.0, 86393.0, 18296.0, 6571.0, 3007.0, 1627.0, 911.0, 541.0, 354.0, 232.0, 148.0, 79.0, 65.0, 66.0, 25.0, 28.0, 23.0, 15.0, 7.0, 11.0, 6.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0], "bins": [-1.7275390625, -1.6781768798828125, -1.628814697265625, -1.5794525146484375, -1.53009033203125, -1.4807281494140625, -1.431365966796875, -1.3820037841796875, -1.3326416015625, -1.2832794189453125, -1.233917236328125, -1.1845550537109375, -1.13519287109375, -1.0858306884765625, -1.036468505859375, -0.9871063232421875, -0.937744140625, -0.8883819580078125, -0.839019775390625, -0.7896575927734375, -0.74029541015625, -0.6909332275390625, -0.641571044921875, -0.5922088623046875, -0.5428466796875, -0.4934844970703125, -0.444122314453125, -0.3947601318359375, -0.34539794921875, -0.2960357666015625, -0.246673583984375, -0.1973114013671875, -0.14794921875, -0.0985870361328125, -0.049224853515625, 0.0001373291015625, 0.04949951171875, 0.0988616943359375, 0.148223876953125, 0.1975860595703125, 0.2469482421875, 0.2963104248046875, 0.345672607421875, 0.3950347900390625, 0.44439697265625, 0.4937591552734375, 0.543121337890625, 0.5924835205078125, 0.641845703125, 0.6912078857421875, 0.740570068359375, 0.7899322509765625, 0.83929443359375, 0.8886566162109375, 0.938018798828125, 0.9873809814453125, 1.0367431640625, 1.0861053466796875, 1.135467529296875, 1.1848297119140625, 1.23419189453125, 1.2835540771484375, 1.332916259765625, 1.3822784423828125, 1.431640625]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 9.0, 8.0, 10.0, 13.0, 20.0, 18.0, 23.0, 44.0, 42.0, 48.0, 53.0, 55.0, 84.0, 66.0, 70.0, 60.0, 75.0, 75.0, 40.0, 42.0, 29.0, 28.0, 28.0, 17.0, 7.0, 13.0, 7.0, 6.0, 9.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.80517578125, -0.778228759765625, -0.75128173828125, -0.724334716796875, -0.6973876953125, -0.670440673828125, -0.64349365234375, -0.616546630859375, -0.589599609375, -0.562652587890625, -0.53570556640625, -0.508758544921875, -0.4818115234375, -0.454864501953125, -0.42791748046875, -0.400970458984375, -0.3740234375, -0.347076416015625, -0.32012939453125, -0.293182373046875, -0.2662353515625, -0.239288330078125, -0.21234130859375, -0.185394287109375, -0.158447265625, -0.131500244140625, -0.10455322265625, -0.077606201171875, -0.0506591796875, -0.023712158203125, 0.00323486328125, 0.030181884765625, 0.05712890625, 0.084075927734375, 0.11102294921875, 0.137969970703125, 0.1649169921875, 0.191864013671875, 0.21881103515625, 0.245758056640625, 0.272705078125, 0.299652099609375, 0.32659912109375, 0.353546142578125, 0.3804931640625, 0.407440185546875, 0.43438720703125, 0.461334228515625, 0.48828125, 0.515228271484375, 0.54217529296875, 0.569122314453125, 0.5960693359375, 0.623016357421875, 0.64996337890625, 0.676910400390625, 0.703857421875, 0.730804443359375, 0.75775146484375, 0.784698486328125, 0.8116455078125, 0.838592529296875, 0.86553955078125, 0.892486572265625, 0.91943359375]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 2.0, 7.0, 4.0, 7.0, 7.0, 15.0, 18.0, 27.0, 46.0, 64.0, 168.0, 381.0, 1023.0, 3139.0, 11415.0, 60130.0, 3343917.0, 725429.0, 36759.0, 7995.0, 2309.0, 770.0, 308.0, 135.0, 70.0, 45.0, 25.0, 20.0, 10.0, 6.0, 9.0, 12.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.642578125, -2.556976318359375, -2.47137451171875, -2.385772705078125, -2.3001708984375, -2.214569091796875, -2.12896728515625, -2.043365478515625, -1.957763671875, -1.872161865234375, -1.78656005859375, -1.700958251953125, -1.6153564453125, -1.529754638671875, -1.44415283203125, -1.358551025390625, -1.27294921875, -1.187347412109375, -1.10174560546875, -1.016143798828125, -0.9305419921875, -0.844940185546875, -0.75933837890625, -0.673736572265625, -0.588134765625, -0.502532958984375, -0.41693115234375, -0.331329345703125, -0.2457275390625, -0.160125732421875, -0.07452392578125, 0.011077880859375, 0.0966796875, 0.182281494140625, 0.26788330078125, 0.353485107421875, 0.4390869140625, 0.524688720703125, 0.61029052734375, 0.695892333984375, 0.781494140625, 0.867095947265625, 0.95269775390625, 1.038299560546875, 1.1239013671875, 1.209503173828125, 1.29510498046875, 1.380706787109375, 1.46630859375, 1.551910400390625, 1.63751220703125, 1.723114013671875, 1.8087158203125, 1.894317626953125, 1.97991943359375, 2.065521240234375, 2.151123046875, 2.236724853515625, 2.32232666015625, 2.407928466796875, 2.4935302734375, 2.579132080078125, 2.66473388671875, 2.750335693359375, 2.8359375]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 9.0, 8.0, 8.0, 13.0, 18.0, 16.0, 14.0, 23.0, 41.0, 68.0, 65.0, 126.0, 241.0, 559.0, 1055.0, 848.0, 408.0, 203.0, 100.0, 51.0, 51.0, 40.0, 22.0, 17.0, 15.0, 12.0, 12.0, 5.0, 4.0, 6.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.61669921875, -0.5979537963867188, -0.5792083740234375, -0.5604629516601562, -0.541717529296875, -0.5229721069335938, -0.5042266845703125, -0.48548126220703125, -0.46673583984375, -0.44799041748046875, -0.4292449951171875, -0.41049957275390625, -0.391754150390625, -0.37300872802734375, -0.3542633056640625, -0.33551788330078125, -0.3167724609375, -0.29802703857421875, -0.2792816162109375, -0.26053619384765625, -0.241790771484375, -0.22304534912109375, -0.2042999267578125, -0.18555450439453125, -0.16680908203125, -0.14806365966796875, -0.1293182373046875, -0.11057281494140625, -0.091827392578125, -0.07308197021484375, -0.0543365478515625, -0.03559112548828125, -0.016845703125, 0.00189971923828125, 0.0206451416015625, 0.03939056396484375, 0.058135986328125, 0.07688140869140625, 0.0956268310546875, 0.11437225341796875, 0.13311767578125, 0.15186309814453125, 0.1706085205078125, 0.18935394287109375, 0.208099365234375, 0.22684478759765625, 0.2455902099609375, 0.26433563232421875, 0.2830810546875, 0.30182647705078125, 0.3205718994140625, 0.33931732177734375, 0.358062744140625, 0.37680816650390625, 0.3955535888671875, 0.41429901123046875, 0.43304443359375, 0.45178985595703125, 0.4705352783203125, 0.48928070068359375, 0.508026123046875, 0.5267715454101562, 0.5455169677734375, 0.5642623901367188, 0.5830078125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 7.0, 9.0, 8.0, 5.0, 6.0, 13.0, 12.0, 22.0, 27.0, 32.0, 53.0, 55.0, 76.0, 75.0, 86.0, 83.0, 82.0, 73.0, 65.0, 55.0, 31.0, 24.0, 33.0, 11.0, 16.0, 10.0, 7.0, 5.0, 7.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.1894127130508423, -1.1456818580627441, -1.1019511222839355, -1.058220386505127, -1.0144895315170288, -0.9707587361335754, -0.9270279407501221, -0.8832971453666687, -0.8395663499832153, -0.795835554599762, -0.7521047592163086, -0.7083739638328552, -0.6646431684494019, -0.6209123730659485, -0.5771815776824951, -0.5334507822990417, -0.4897199869155884, -0.445989191532135, -0.40225839614868164, -0.35852760076522827, -0.3147968053817749, -0.27106600999832153, -0.22733521461486816, -0.1836044192314148, -0.13987362384796143, -0.09614282846450806, -0.05241203308105469, -0.008681237697601318, 0.03504955768585205, 0.07878035306930542, 0.12251114845275879, 0.16624194383621216, 0.20997262001037598, 0.25370341539382935, 0.2974342107772827, 0.3411650061607361, 0.38489580154418945, 0.4286265969276428, 0.4723573923110962, 0.5160881876945496, 0.5598189830780029, 0.6035497784614563, 0.6472805738449097, 0.691011369228363, 0.7347421646118164, 0.7784729599952698, 0.8222037553787231, 0.8659345507621765, 0.9096653461456299, 0.9533961415290833, 0.9971269369125366, 1.0408577919006348, 1.0845885276794434, 1.128319263458252, 1.17205011844635, 1.2157809734344482, 1.2595117092132568, 1.3032424449920654, 1.3469732999801636, 1.3907041549682617, 1.4344348907470703, 1.478165626525879, 1.521896481513977, 1.5656273365020752, 1.6093580722808838]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 2.0, 4.0, 5.0, 6.0, 5.0, 11.0, 7.0, 6.0, 12.0, 16.0, 18.0, 26.0, 24.0, 25.0, 32.0, 36.0, 39.0, 35.0, 36.0, 44.0, 41.0, 49.0, 37.0, 46.0, 42.0, 40.0, 45.0, 38.0, 37.0, 39.0, 19.0, 26.0, 33.0, 28.0, 17.0, 15.0, 14.0, 14.0, 13.0, 9.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.0004099607467651, -0.9704493880271912, -0.9404888153076172, -0.910528302192688, -0.880567729473114, -0.85060715675354, -0.8206465840339661, -0.7906860113143921, -0.7607254981994629, -0.7307649254798889, -0.7008043527603149, -0.6708438396453857, -0.6408832669258118, -0.6109226942062378, -0.5809621214866638, -0.5510015487670898, -0.5210410356521606, -0.49108046293258667, -0.4611199200153351, -0.4311593472957611, -0.4011988043785095, -0.37123823165893555, -0.3412776589393616, -0.31131711602211, -0.2813565135002136, -0.25139594078063965, -0.22143539786338806, -0.1914748251438141, -0.1615142822265625, -0.13155370950698853, -0.10159315168857574, -0.07163259387016296, -0.04167205095291138, -0.011711491271853447, 0.018249068409204483, 0.04820962995290756, 0.07817018777132034, 0.10813075304031372, 0.1380913108587265, 0.16805186867713928, 0.19801242649555206, 0.22797298431396484, 0.2579335570335388, 0.2878940999507904, 0.3178546726703644, 0.34781521558761597, 0.37777578830718994, 0.4077363610267639, 0.4376969039440155, 0.4676574766635895, 0.49761801958084106, 0.527578592300415, 0.557539165019989, 0.587499737739563, 0.6174602508544922, 0.6474208235740662, 0.6773813962936401, 0.7073419690132141, 0.7373025417327881, 0.7672630548477173, 0.7972236275672913, 0.8271842002868652, 0.8571447730064392, 0.8871053457260132, 0.9170658588409424]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 5.0, 9.0, 14.0, 18.0, 38.0, 34.0, 59.0, 118.0, 188.0, 292.0, 630.0, 1175.0, 2387.0, 5285.0, 12928.0, 48206.0, 615524.0, 311472.0, 31541.0, 10100.0, 4330.0, 1987.0, 975.0, 524.0, 240.0, 197.0, 96.0, 71.0, 46.0, 22.0, 16.0, 12.0, 7.0, 9.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.68359375, -0.6660079956054688, -0.6484222412109375, -0.6308364868164062, -0.613250732421875, -0.5956649780273438, -0.5780792236328125, -0.5604934692382812, -0.54290771484375, -0.5253219604492188, -0.5077362060546875, -0.49015045166015625, -0.472564697265625, -0.45497894287109375, -0.4373931884765625, -0.41980743408203125, -0.4022216796875, -0.38463592529296875, -0.3670501708984375, -0.34946441650390625, -0.331878662109375, -0.31429290771484375, -0.2967071533203125, -0.27912139892578125, -0.26153564453125, -0.24394989013671875, -0.2263641357421875, -0.20877838134765625, -0.191192626953125, -0.17360687255859375, -0.1560211181640625, -0.13843536376953125, -0.120849609375, -0.10326385498046875, -0.0856781005859375, -0.06809234619140625, -0.050506591796875, -0.03292083740234375, -0.0153350830078125, 0.00225067138671875, 0.01983642578125, 0.03742218017578125, 0.0550079345703125, 0.07259368896484375, 0.090179443359375, 0.10776519775390625, 0.1253509521484375, 0.14293670654296875, 0.1605224609375, 0.17810821533203125, 0.1956939697265625, 0.21327972412109375, 0.230865478515625, 0.24845123291015625, 0.2660369873046875, 0.28362274169921875, 0.30120849609375, 0.31879425048828125, 0.3363800048828125, 0.35396575927734375, 0.371551513671875, 0.38913726806640625, 0.4067230224609375, 0.42430877685546875, 0.44189453125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 9.0, 6.0, 10.0, 5.0, 11.0, 15.0, 15.0, 34.0, 21.0, 40.0, 30.0, 37.0, 46.0, 50.0, 36.0, 57.0, 49.0, 40.0, 53.0, 48.0, 50.0, 53.0, 38.0, 36.0, 37.0, 28.0, 36.0, 22.0, 19.0, 18.0, 17.0, 12.0, 4.0, 10.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.84765625, -0.825592041015625, -0.80352783203125, -0.781463623046875, -0.7593994140625, -0.737335205078125, -0.71527099609375, -0.693206787109375, -0.671142578125, -0.649078369140625, -0.62701416015625, -0.604949951171875, -0.5828857421875, -0.560821533203125, -0.53875732421875, -0.516693115234375, -0.49462890625, -0.472564697265625, -0.45050048828125, -0.428436279296875, -0.4063720703125, -0.384307861328125, -0.36224365234375, -0.340179443359375, -0.318115234375, -0.296051025390625, -0.27398681640625, -0.251922607421875, -0.2298583984375, -0.207794189453125, -0.18572998046875, -0.163665771484375, -0.1416015625, -0.119537353515625, -0.09747314453125, -0.075408935546875, -0.0533447265625, -0.031280517578125, -0.00921630859375, 0.012847900390625, 0.034912109375, 0.056976318359375, 0.07904052734375, 0.101104736328125, 0.1231689453125, 0.145233154296875, 0.16729736328125, 0.189361572265625, 0.21142578125, 0.233489990234375, 0.25555419921875, 0.277618408203125, 0.2996826171875, 0.321746826171875, 0.34381103515625, 0.365875244140625, 0.387939453125, 0.410003662109375, 0.43206787109375, 0.454132080078125, 0.4761962890625, 0.498260498046875, 0.52032470703125, 0.542388916015625, 0.564453125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 2.0, 3.0, 6.0, 7.0, 22.0, 22.0, 46.0, 53.0, 114.0, 252.0, 520.0, 1207.0, 3482.0, 12540.0, 84895.0, 772555.0, 147641.0, 18077.0, 4414.0, 1412.0, 630.0, 290.0, 149.0, 66.0, 49.0, 37.0, 26.0, 8.0, 8.0, 4.0, 5.0, 4.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.4892578125, -0.47377777099609375, -0.4582977294921875, -0.44281768798828125, -0.427337646484375, -0.41185760498046875, -0.3963775634765625, -0.38089752197265625, -0.36541748046875, -0.34993743896484375, -0.3344573974609375, -0.31897735595703125, -0.303497314453125, -0.28801727294921875, -0.2725372314453125, -0.25705718994140625, -0.2415771484375, -0.22609710693359375, -0.2106170654296875, -0.19513702392578125, -0.179656982421875, -0.16417694091796875, -0.1486968994140625, -0.13321685791015625, -0.11773681640625, -0.10225677490234375, -0.0867767333984375, -0.07129669189453125, -0.055816650390625, -0.04033660888671875, -0.0248565673828125, -0.00937652587890625, 0.006103515625, 0.02158355712890625, 0.0370635986328125, 0.05254364013671875, 0.068023681640625, 0.08350372314453125, 0.0989837646484375, 0.11446380615234375, 0.12994384765625, 0.14542388916015625, 0.1609039306640625, 0.17638397216796875, 0.191864013671875, 0.20734405517578125, 0.2228240966796875, 0.23830413818359375, 0.2537841796875, 0.26926422119140625, 0.2847442626953125, 0.30022430419921875, 0.315704345703125, 0.33118438720703125, 0.3466644287109375, 0.36214447021484375, 0.37762451171875, 0.39310455322265625, 0.4085845947265625, 0.42406463623046875, 0.439544677734375, 0.45502471923828125, 0.4705047607421875, 0.48598480224609375, 0.50146484375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 8.0, 6.0, 6.0, 9.0, 5.0, 15.0, 7.0, 21.0, 23.0, 31.0, 37.0, 37.0, 40.0, 44.0, 47.0, 43.0, 55.0, 56.0, 59.0, 61.0, 55.0, 43.0, 37.0, 45.0, 37.0, 36.0, 29.0, 23.0, 16.0, 19.0, 11.0, 12.0, 10.0, 3.0, 3.0, 7.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6982421875, -1.643096923828125, -1.58795166015625, -1.532806396484375, -1.4776611328125, -1.422515869140625, -1.36737060546875, -1.312225341796875, -1.257080078125, -1.201934814453125, -1.14678955078125, -1.091644287109375, -1.0364990234375, -0.981353759765625, -0.92620849609375, -0.871063232421875, -0.81591796875, -0.760772705078125, -0.70562744140625, -0.650482177734375, -0.5953369140625, -0.540191650390625, -0.48504638671875, -0.429901123046875, -0.374755859375, -0.319610595703125, -0.26446533203125, -0.209320068359375, -0.1541748046875, -0.099029541015625, -0.04388427734375, 0.011260986328125, 0.06640625, 0.121551513671875, 0.17669677734375, 0.231842041015625, 0.2869873046875, 0.342132568359375, 0.39727783203125, 0.452423095703125, 0.507568359375, 0.562713623046875, 0.61785888671875, 0.673004150390625, 0.7281494140625, 0.783294677734375, 0.83843994140625, 0.893585205078125, 0.94873046875, 1.003875732421875, 1.05902099609375, 1.114166259765625, 1.1693115234375, 1.224456787109375, 1.27960205078125, 1.334747314453125, 1.389892578125, 1.445037841796875, 1.50018310546875, 1.555328369140625, 1.6104736328125, 1.665618896484375, 1.72076416015625, 1.775909423828125, 1.8310546875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 6.0, 6.0, 7.0, 5.0, 19.0, 18.0, 28.0, 39.0, 54.0, 95.0, 140.0, 238.0, 440.0, 926.0, 1989.0, 5927.0, 28599.0, 635084.0, 346664.0, 19947.0, 4819.0, 1690.0, 751.0, 378.0, 233.0, 158.0, 85.0, 49.0, 44.0, 37.0, 20.0, 13.0, 14.0, 9.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.25830078125, -0.2506828308105469, -0.24306488037109375, -0.23544692993164062, -0.2278289794921875, -0.22021102905273438, -0.21259307861328125, -0.20497512817382812, -0.197357177734375, -0.18973922729492188, -0.18212127685546875, -0.17450332641601562, -0.1668853759765625, -0.15926742553710938, -0.15164947509765625, -0.14403152465820312, -0.13641357421875, -0.12879562377929688, -0.12117767333984375, -0.11355972290039062, -0.1059417724609375, -0.09832382202148438, -0.09070587158203125, -0.08308792114257812, -0.075469970703125, -0.06785202026367188, -0.06023406982421875, -0.052616119384765625, -0.0449981689453125, -0.037380218505859375, -0.02976226806640625, -0.022144317626953125, -0.0145263671875, -0.006908416748046875, 0.00070953369140625, 0.008327484130859375, 0.0159454345703125, 0.023563385009765625, 0.03118133544921875, 0.038799285888671875, 0.046417236328125, 0.054035186767578125, 0.06165313720703125, 0.06927108764648438, 0.0768890380859375, 0.08450698852539062, 0.09212493896484375, 0.09974288940429688, 0.10736083984375, 0.11497879028320312, 0.12259674072265625, 0.13021469116210938, 0.1378326416015625, 0.14545059204101562, 0.15306854248046875, 0.16068649291992188, 0.168304443359375, 0.17592239379882812, 0.18354034423828125, 0.19115829467773438, 0.1987762451171875, 0.20639419555664062, 0.21401214599609375, 0.22163009643554688, 0.229248046875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 9.0, 14.0, 9.0, 22.0, 26.0, 44.0, 68.0, 94.0, 127.0, 185.0, 162.0, 78.0, 60.0, 38.0, 16.0, 13.0, 10.0, 7.0, 3.0, 2.0, 3.0, 2.0, 2.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.814168930053711e-05, -7.53011554479599e-05, -7.246062159538269e-05, -6.962008774280548e-05, -6.677955389022827e-05, -6.393902003765106e-05, -6.109848618507385e-05, -5.825795233249664e-05, -5.5417418479919434e-05, -5.2576884627342224e-05, -4.9736350774765015e-05, -4.6895816922187805e-05, -4.4055283069610596e-05, -4.1214749217033386e-05, -3.837421536445618e-05, -3.553368151187897e-05, -3.269314765930176e-05, -2.985261380672455e-05, -2.701207995414734e-05, -2.417154610157013e-05, -2.133101224899292e-05, -1.849047839641571e-05, -1.56499445438385e-05, -1.2809410691261292e-05, -9.968876838684082e-06, -7.1283429861068726e-06, -4.287809133529663e-06, -1.4472752809524536e-06, 1.3932585716247559e-06, 4.233792424201965e-06, 7.074326276779175e-06, 9.914860129356384e-06, 1.2755393981933594e-05, 1.5595927834510803e-05, 1.8436461687088013e-05, 2.1276995539665222e-05, 2.411752939224243e-05, 2.695806324481964e-05, 2.979859709739685e-05, 3.263913094997406e-05, 3.547966480255127e-05, 3.832019865512848e-05, 4.116073250770569e-05, 4.40012663602829e-05, 4.684180021286011e-05, 4.968233406543732e-05, 5.2522867918014526e-05, 5.5363401770591736e-05, 5.8203935623168945e-05, 6.104446947574615e-05, 6.388500332832336e-05, 6.672553718090057e-05, 6.956607103347778e-05, 7.240660488605499e-05, 7.52471387386322e-05, 7.808767259120941e-05, 8.092820644378662e-05, 8.376874029636383e-05, 8.660927414894104e-05, 8.944980800151825e-05, 9.229034185409546e-05, 9.513087570667267e-05, 9.797140955924988e-05, 0.00010081194341182709, 0.0001036524772644043]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 3.0, 5.0, 9.0, 4.0, 18.0, 22.0, 25.0, 30.0, 45.0, 65.0, 91.0, 106.0, 173.0, 222.0, 288.0, 460.0, 601.0, 946.0, 1491.0, 2508.0, 4821.0, 10367.0, 27506.0, 89970.0, 385482.0, 383153.0, 90109.0, 27786.0, 10464.0, 4547.0, 2537.0, 1430.0, 995.0, 626.0, 445.0, 294.0, 241.0, 162.0, 129.0, 95.0, 63.0, 53.0, 58.0, 29.0, 27.0, 14.0, 15.0, 8.0, 10.0, 5.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.1241455078125, -0.12026596069335938, -0.11638641357421875, -0.11250686645507812, -0.1086273193359375, -0.10474777221679688, -0.10086822509765625, -0.09698867797851562, -0.093109130859375, -0.08922958374023438, -0.08535003662109375, -0.08147048950195312, -0.0775909423828125, -0.07371139526367188, -0.06983184814453125, -0.06595230102539062, -0.06207275390625, -0.058193206787109375, -0.05431365966796875, -0.050434112548828125, -0.0465545654296875, -0.042675018310546875, -0.03879547119140625, -0.034915924072265625, -0.031036376953125, -0.027156829833984375, -0.02327728271484375, -0.019397735595703125, -0.0155181884765625, -0.011638641357421875, -0.00775909423828125, -0.003879547119140625, 0.0, 0.003879547119140625, 0.00775909423828125, 0.011638641357421875, 0.0155181884765625, 0.019397735595703125, 0.02327728271484375, 0.027156829833984375, 0.031036376953125, 0.034915924072265625, 0.03879547119140625, 0.042675018310546875, 0.0465545654296875, 0.050434112548828125, 0.05431365966796875, 0.058193206787109375, 0.06207275390625, 0.06595230102539062, 0.06983184814453125, 0.07371139526367188, 0.0775909423828125, 0.08147048950195312, 0.08535003662109375, 0.08922958374023438, 0.093109130859375, 0.09698867797851562, 0.10086822509765625, 0.10474777221679688, 0.1086273193359375, 0.11250686645507812, 0.11638641357421875, 0.12026596069335938, 0.1241455078125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 4.0, 9.0, 4.0, 12.0, 10.0, 30.0, 40.0, 52.0, 62.0, 111.0, 115.0, 126.0, 110.0, 83.0, 66.0, 53.0, 34.0, 25.0, 14.0, 10.0, 9.0, 3.0, 4.0, 3.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.048858642578125, -0.047251224517822266, -0.04564380645751953, -0.0440363883972168, -0.04242897033691406, -0.04082155227661133, -0.039214134216308594, -0.03760671615600586, -0.035999298095703125, -0.03439188003540039, -0.032784461975097656, -0.031177043914794922, -0.029569625854492188, -0.027962207794189453, -0.02635478973388672, -0.024747371673583984, -0.02313995361328125, -0.021532535552978516, -0.01992511749267578, -0.018317699432373047, -0.016710281372070312, -0.015102863311767578, -0.013495445251464844, -0.01188802719116211, -0.010280609130859375, -0.00867319107055664, -0.007065773010253906, -0.005458354949951172, -0.0038509368896484375, -0.002243518829345703, -0.0006361007690429688, 0.0009713172912597656, 0.0025787353515625, 0.004186153411865234, 0.005793571472167969, 0.007400989532470703, 0.009008407592773438, 0.010615825653076172, 0.012223243713378906, 0.01383066177368164, 0.015438079833984375, 0.01704549789428711, 0.018652915954589844, 0.020260334014892578, 0.021867752075195312, 0.023475170135498047, 0.02508258819580078, 0.026690006256103516, 0.02829742431640625, 0.029904842376708984, 0.03151226043701172, 0.03311967849731445, 0.03472709655761719, 0.03633451461791992, 0.037941932678222656, 0.03954935073852539, 0.041156768798828125, 0.04276418685913086, 0.044371604919433594, 0.04597902297973633, 0.04758644104003906, 0.0491938591003418, 0.05080127716064453, 0.052408695220947266, 0.05401611328125]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 2.0, 3.0, 5.0, 5.0, 7.0, 9.0, 8.0, 18.0, 16.0, 26.0, 25.0, 56.0, 46.0, 62.0, 72.0, 72.0, 80.0, 73.0, 74.0, 66.0, 59.0, 51.0, 40.0, 28.0, 17.0, 13.0, 18.0, 12.0, 11.0, 2.0, 4.0, 3.0, 7.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.7586199641227722, -0.7334376573562622, -0.7082552909851074, -0.6830729842185974, -0.6578906178474426, -0.6327083110809326, -0.6075259447097778, -0.5823436379432678, -0.5571613311767578, -0.5319790244102478, -0.506796658039093, -0.481614351272583, -0.4564320147037506, -0.4312496781349182, -0.4060673415660858, -0.3808850049972534, -0.355702668428421, -0.3305203318595886, -0.3053379952907562, -0.28015565872192383, -0.2549733519554138, -0.22979101538658142, -0.20460867881774902, -0.17942635715007782, -0.15424402058124542, -0.12906168401241302, -0.10387936234474182, -0.07869702577590942, -0.05351469665765762, -0.028332367539405823, -0.0031500309705734253, 0.02203229069709778, 0.047214627265930176, 0.07239695638418198, 0.09757928550243378, 0.12276162207126617, 0.14794394373893738, 0.17312628030776978, 0.19830861687660217, 0.22349093854427338, 0.24867327511310577, 0.273855596780777, 0.2990379333496094, 0.3242202699184418, 0.34940260648727417, 0.3745849132537842, 0.39976727962493896, 0.424949586391449, 0.45013192296028137, 0.47531425952911377, 0.5004965662956238, 0.5256789326667786, 0.5508612394332886, 0.5760436058044434, 0.6012259125709534, 0.6264082193374634, 0.6515905857086182, 0.6767728924751282, 0.701955258846283, 0.727137565612793, 0.7523199319839478, 0.7775022387504578, 0.8026845455169678, 0.8278669118881226, 0.8530492186546326]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 5.0, 3.0, 5.0, 6.0, 8.0, 10.0, 12.0, 14.0, 16.0, 21.0, 31.0, 26.0, 23.0, 28.0, 37.0, 44.0, 42.0, 41.0, 37.0, 55.0, 44.0, 43.0, 54.0, 47.0, 40.0, 32.0, 38.0, 34.0, 38.0, 24.0, 38.0, 24.0, 20.0, 19.0, 8.0, 14.0, 9.0, 6.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.7005771994590759, -0.6812631487846375, -0.6619490385055542, -0.6426349878311157, -0.6233208775520325, -0.604006826877594, -0.5846927165985107, -0.5653786659240723, -0.5460646152496338, -0.5267505645751953, -0.5074364542961121, -0.4881224036216736, -0.4688083231449127, -0.44949424266815186, -0.430180162191391, -0.4108660817146301, -0.39155200123786926, -0.3722379207611084, -0.35292384028434753, -0.33360975980758667, -0.3142957091331482, -0.29498162865638733, -0.27566754817962646, -0.256353497505188, -0.23703940212726593, -0.21772532165050507, -0.1984112560749054, -0.17909717559814453, -0.15978309512138367, -0.140469029545784, -0.12115494906902313, -0.10184088349342346, -0.0825268030166626, -0.06321272999048233, -0.043898653239011765, -0.0245845764875412, -0.005270503461360931, 0.014043569564819336, 0.0333576500415802, 0.05267171561717987, 0.07198579609394073, 0.091299869120121, 0.11061394214630127, 0.12992802262306213, 0.149242103099823, 0.16855616867542267, 0.18787024915218353, 0.2071843147277832, 0.22649839520454407, 0.24581247568130493, 0.2651265561580658, 0.28444063663482666, 0.30375468730926514, 0.323068767786026, 0.34238284826278687, 0.36169689893722534, 0.3810110092163086, 0.40032508969306946, 0.4196391701698303, 0.4389532208442688, 0.45826730132102966, 0.4775813817977905, 0.4968954622745514, 0.5162095427513123, 0.5355235934257507]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 6.0, 2.0, 3.0, 8.0, 6.0, 21.0, 19.0, 20.0, 31.0, 35.0, 44.0, 87.0, 109.0, 165.0, 264.0, 480.0, 756.0, 1327.0, 2248.0, 4301.0, 8302.0, 18792.0, 54336.0, 236580.0, 524740.0, 132702.0, 35209.0, 13510.0, 6345.0, 3337.0, 1881.0, 1130.0, 654.0, 379.0, 226.0, 155.0, 105.0, 72.0, 36.0, 33.0, 30.0, 23.0, 15.0, 7.0, 6.0, 5.0, 6.0, 1.0, 2.0, 4.0, 1.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.95263671875, -0.9222183227539062, -0.8917999267578125, -0.8613815307617188, -0.830963134765625, -0.8005447387695312, -0.7701263427734375, -0.7397079467773438, -0.70928955078125, -0.6788711547851562, -0.6484527587890625, -0.6180343627929688, -0.587615966796875, -0.5571975708007812, -0.5267791748046875, -0.49636077880859375, -0.4659423828125, -0.43552398681640625, -0.4051055908203125, -0.37468719482421875, -0.344268798828125, -0.31385040283203125, -0.2834320068359375, -0.25301361083984375, -0.22259521484375, -0.19217681884765625, -0.1617584228515625, -0.13134002685546875, -0.100921630859375, -0.07050323486328125, -0.0400848388671875, -0.00966644287109375, 0.020751953125, 0.05117034912109375, 0.0815887451171875, 0.11200714111328125, 0.142425537109375, 0.17284393310546875, 0.2032623291015625, 0.23368072509765625, 0.26409912109375, 0.29451751708984375, 0.3249359130859375, 0.35535430908203125, 0.385772705078125, 0.41619110107421875, 0.4466094970703125, 0.47702789306640625, 0.5074462890625, 0.5378646850585938, 0.5682830810546875, 0.5987014770507812, 0.629119873046875, 0.6595382690429688, 0.6899566650390625, 0.7203750610351562, 0.75079345703125, 0.7812118530273438, 0.8116302490234375, 0.8420486450195312, 0.872467041015625, 0.9028854370117188, 0.9333038330078125, 0.9637222290039062, 0.994140625]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 2.0, 4.0, 3.0, 8.0, 4.0, 6.0, 9.0, 15.0, 14.0, 15.0, 22.0, 19.0, 18.0, 28.0, 38.0, 29.0, 40.0, 44.0, 28.0, 48.0, 53.0, 44.0, 62.0, 53.0, 47.0, 41.0, 34.0, 34.0, 41.0, 26.0, 29.0, 28.0, 22.0, 16.0, 17.0, 13.0, 11.0, 6.0, 10.0, 4.0, 7.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.0615234375, -1.028961181640625, -0.99639892578125, -0.963836669921875, -0.9312744140625, -0.898712158203125, -0.86614990234375, -0.833587646484375, -0.801025390625, -0.768463134765625, -0.73590087890625, -0.703338623046875, -0.6707763671875, -0.638214111328125, -0.60565185546875, -0.573089599609375, -0.54052734375, -0.507965087890625, -0.47540283203125, -0.442840576171875, -0.4102783203125, -0.377716064453125, -0.34515380859375, -0.312591552734375, -0.280029296875, -0.247467041015625, -0.21490478515625, -0.182342529296875, -0.1497802734375, -0.117218017578125, -0.08465576171875, -0.052093505859375, -0.01953125, 0.013031005859375, 0.04559326171875, 0.078155517578125, 0.1107177734375, 0.143280029296875, 0.17584228515625, 0.208404541015625, 0.240966796875, 0.273529052734375, 0.30609130859375, 0.338653564453125, 0.3712158203125, 0.403778076171875, 0.43634033203125, 0.468902587890625, 0.50146484375, 0.534027099609375, 0.56658935546875, 0.599151611328125, 0.6317138671875, 0.664276123046875, 0.69683837890625, 0.729400634765625, 0.761962890625, 0.794525146484375, 0.82708740234375, 0.859649658203125, 0.8922119140625, 0.924774169921875, 0.95733642578125, 0.989898681640625, 1.0224609375]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 5.0, 8.0, 8.0, 13.0, 17.0, 17.0, 26.0, 35.0, 47.0, 68.0, 94.0, 112.0, 166.0, 259.0, 403.0, 691.0, 1244.0, 2454.0, 5443.0, 14264.0, 43643.0, 188959.0, 586459.0, 145739.0, 36216.0, 12094.0, 4857.0, 2183.0, 1147.0, 630.0, 391.0, 259.0, 178.0, 125.0, 77.0, 58.0, 39.0, 46.0, 20.0, 17.0, 11.0, 8.0, 9.0, 8.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3193359375, -1.275970458984375, -1.23260498046875, -1.189239501953125, -1.1458740234375, -1.102508544921875, -1.05914306640625, -1.015777587890625, -0.972412109375, -0.929046630859375, -0.88568115234375, -0.842315673828125, -0.7989501953125, -0.755584716796875, -0.71221923828125, -0.668853759765625, -0.62548828125, -0.582122802734375, -0.53875732421875, -0.495391845703125, -0.4520263671875, -0.408660888671875, -0.36529541015625, -0.321929931640625, -0.278564453125, -0.235198974609375, -0.19183349609375, -0.148468017578125, -0.1051025390625, -0.061737060546875, -0.01837158203125, 0.024993896484375, 0.068359375, 0.111724853515625, 0.15509033203125, 0.198455810546875, 0.2418212890625, 0.285186767578125, 0.32855224609375, 0.371917724609375, 0.415283203125, 0.458648681640625, 0.50201416015625, 0.545379638671875, 0.5887451171875, 0.632110595703125, 0.67547607421875, 0.718841552734375, 0.76220703125, 0.805572509765625, 0.84893798828125, 0.892303466796875, 0.9356689453125, 0.979034423828125, 1.02239990234375, 1.065765380859375, 1.109130859375, 1.152496337890625, 1.19586181640625, 1.239227294921875, 1.2825927734375, 1.325958251953125, 1.36932373046875, 1.412689208984375, 1.4560546875]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 0.0, 5.0, 4.0, 9.0, 6.0, 14.0, 8.0, 14.0, 15.0, 12.0, 17.0, 25.0, 31.0, 37.0, 22.0, 35.0, 42.0, 45.0, 44.0, 48.0, 40.0, 42.0, 31.0, 46.0, 44.0, 48.0, 38.0, 35.0, 38.0, 37.0, 37.0, 25.0, 15.0, 19.0, 12.0, 10.0, 8.0, 13.0, 11.0, 2.0, 6.0, 6.0, 2.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.171875, -1.13525390625, -1.0986328125, -1.06201171875, -1.025390625, -0.98876953125, -0.9521484375, -0.91552734375, -0.87890625, -0.84228515625, -0.8056640625, -0.76904296875, -0.732421875, -0.69580078125, -0.6591796875, -0.62255859375, -0.5859375, -0.54931640625, -0.5126953125, -0.47607421875, -0.439453125, -0.40283203125, -0.3662109375, -0.32958984375, -0.29296875, -0.25634765625, -0.2197265625, -0.18310546875, -0.146484375, -0.10986328125, -0.0732421875, -0.03662109375, 0.0, 0.03662109375, 0.0732421875, 0.10986328125, 0.146484375, 0.18310546875, 0.2197265625, 0.25634765625, 0.29296875, 0.32958984375, 0.3662109375, 0.40283203125, 0.439453125, 0.47607421875, 0.5126953125, 0.54931640625, 0.5859375, 0.62255859375, 0.6591796875, 0.69580078125, 0.732421875, 0.76904296875, 0.8056640625, 0.84228515625, 0.87890625, 0.91552734375, 0.9521484375, 0.98876953125, 1.025390625, 1.06201171875, 1.0986328125, 1.13525390625, 1.171875]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 7.0, 10.0, 15.0, 18.0, 25.0, 38.0, 40.0, 81.0, 83.0, 138.0, 167.0, 303.0, 472.0, 809.0, 1425.0, 2705.0, 5335.0, 11501.0, 28575.0, 89616.0, 555786.0, 255008.0, 57938.0, 20360.0, 8752.0, 4214.0, 2117.0, 1179.0, 686.0, 356.0, 238.0, 180.0, 120.0, 78.0, 47.0, 42.0, 21.0, 22.0, 14.0, 10.0, 10.0, 8.0, 5.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.18408203125, -0.17811012268066406, -0.17213821411132812, -0.1661663055419922, -0.16019439697265625, -0.1542224884033203, -0.14825057983398438, -0.14227867126464844, -0.1363067626953125, -0.13033485412597656, -0.12436294555664062, -0.11839103698730469, -0.11241912841796875, -0.10644721984863281, -0.10047531127929688, -0.09450340270996094, -0.088531494140625, -0.08255958557128906, -0.07658767700195312, -0.07061576843261719, -0.06464385986328125, -0.05867195129394531, -0.052700042724609375, -0.04672813415527344, -0.0407562255859375, -0.03478431701660156, -0.028812408447265625, -0.022840499877929688, -0.01686859130859375, -0.010896682739257812, -0.004924774169921875, 0.0010471343994140625, 0.00701904296875, 0.012990951538085938, 0.018962860107421875, 0.024934768676757812, 0.03090667724609375, 0.03687858581542969, 0.042850494384765625, 0.04882240295410156, 0.0547943115234375, 0.06076622009277344, 0.06673812866210938, 0.07271003723144531, 0.07868194580078125, 0.08465385437011719, 0.09062576293945312, 0.09659767150878906, 0.102569580078125, 0.10854148864746094, 0.11451339721679688, 0.12048530578613281, 0.12645721435546875, 0.1324291229248047, 0.13840103149414062, 0.14437294006347656, 0.1503448486328125, 0.15631675720214844, 0.16228866577148438, 0.1682605743408203, 0.17423248291015625, 0.1802043914794922, 0.18617630004882812, 0.19214820861816406, 0.1981201171875]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 8.0, 11.0, 27.0, 19.0, 28.0, 47.0, 63.0, 86.0, 239.0, 175.0, 79.0, 56.0, 49.0, 30.0, 18.0, 14.0, 15.0, 6.0, 4.0, 7.0, 3.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-5.1856040954589844e-05, -5.0487928092479706e-05, -4.911981523036957e-05, -4.775170236825943e-05, -4.638358950614929e-05, -4.5015476644039154e-05, -4.3647363781929016e-05, -4.227925091981888e-05, -4.091113805770874e-05, -3.95430251955986e-05, -3.8174912333488464e-05, -3.6806799471378326e-05, -3.543868660926819e-05, -3.407057374715805e-05, -3.270246088504791e-05, -3.1334348022937775e-05, -2.9966235160827637e-05, -2.85981222987175e-05, -2.723000943660736e-05, -2.5861896574497223e-05, -2.4493783712387085e-05, -2.3125670850276947e-05, -2.175755798816681e-05, -2.038944512605667e-05, -1.9021332263946533e-05, -1.7653219401836395e-05, -1.6285106539726257e-05, -1.491699367761612e-05, -1.3548880815505981e-05, -1.2180767953395844e-05, -1.0812655091285706e-05, -9.444542229175568e-06, -8.07642936706543e-06, -6.708316504955292e-06, -5.340203642845154e-06, -3.972090780735016e-06, -2.603977918624878e-06, -1.23586505651474e-06, 1.3224780559539795e-07, 1.5003606677055359e-06, 2.868473529815674e-06, 4.236586391925812e-06, 5.60469925403595e-06, 6.972812116146088e-06, 8.340924978256226e-06, 9.709037840366364e-06, 1.1077150702476501e-05, 1.244526356458664e-05, 1.3813376426696777e-05, 1.5181489288806915e-05, 1.6549602150917053e-05, 1.791771501302719e-05, 1.928582787513733e-05, 2.0653940737247467e-05, 2.2022053599357605e-05, 2.3390166461467743e-05, 2.475827932357788e-05, 2.612639218568802e-05, 2.7494505047798157e-05, 2.8862617909908295e-05, 3.0230730772018433e-05, 3.159884363412857e-05, 3.296695649623871e-05, 3.4335069358348846e-05, 3.5703182220458984e-05]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 8.0, 5.0, 15.0, 17.0, 24.0, 25.0, 36.0, 64.0, 88.0, 115.0, 161.0, 243.0, 370.0, 565.0, 909.0, 1498.0, 2737.0, 5152.0, 10620.0, 25096.0, 80468.0, 614696.0, 224532.0, 46868.0, 17058.0, 7766.0, 3769.0, 2189.0, 1227.0, 708.0, 451.0, 330.0, 209.0, 154.0, 120.0, 68.0, 50.0, 41.0, 28.0, 22.0, 10.0, 11.0, 7.0, 6.0, 5.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.260498046875, -0.2523040771484375, -0.244110107421875, -0.2359161376953125, -0.22772216796875, -0.2195281982421875, -0.211334228515625, -0.2031402587890625, -0.1949462890625, -0.1867523193359375, -0.178558349609375, -0.1703643798828125, -0.16217041015625, -0.1539764404296875, -0.145782470703125, -0.1375885009765625, -0.12939453125, -0.1212005615234375, -0.113006591796875, -0.1048126220703125, -0.09661865234375, -0.0884246826171875, -0.080230712890625, -0.0720367431640625, -0.0638427734375, -0.0556488037109375, -0.047454833984375, -0.0392608642578125, -0.03106689453125, -0.0228729248046875, -0.014678955078125, -0.0064849853515625, 0.001708984375, 0.0099029541015625, 0.018096923828125, 0.0262908935546875, 0.03448486328125, 0.0426788330078125, 0.050872802734375, 0.0590667724609375, 0.0672607421875, 0.0754547119140625, 0.083648681640625, 0.0918426513671875, 0.10003662109375, 0.1082305908203125, 0.116424560546875, 0.1246185302734375, 0.1328125, 0.1410064697265625, 0.149200439453125, 0.1573944091796875, 0.16558837890625, 0.1737823486328125, 0.181976318359375, 0.1901702880859375, 0.1983642578125, 0.2065582275390625, 0.214752197265625, 0.2229461669921875, 0.23114013671875, 0.2393341064453125, 0.247528076171875, 0.2557220458984375, 0.263916015625]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 10.0, 7.0, 7.0, 8.0, 5.0, 17.0, 8.0, 11.0, 23.0, 31.0, 30.0, 50.0, 67.0, 90.0, 163.0, 118.0, 98.0, 45.0, 42.0, 36.0, 18.0, 21.0, 14.0, 12.0, 10.0, 8.0, 13.0, 8.0, 2.0, 8.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.12017822265625, -0.1166372299194336, -0.11309623718261719, -0.10955524444580078, -0.10601425170898438, -0.10247325897216797, -0.09893226623535156, -0.09539127349853516, -0.09185028076171875, -0.08830928802490234, -0.08476829528808594, -0.08122730255126953, -0.07768630981445312, -0.07414531707763672, -0.07060432434082031, -0.0670633316040039, -0.0635223388671875, -0.059981346130371094, -0.05644035339355469, -0.05289936065673828, -0.049358367919921875, -0.04581737518310547, -0.04227638244628906, -0.038735389709472656, -0.03519439697265625, -0.031653404235839844, -0.028112411499023438, -0.02457141876220703, -0.021030426025390625, -0.01748943328857422, -0.013948440551757812, -0.010407447814941406, -0.006866455078125, -0.0033254623413085938, 0.0002155303955078125, 0.0037565231323242188, 0.007297515869140625, 0.010838508605957031, 0.014379501342773438, 0.017920494079589844, 0.02146148681640625, 0.025002479553222656, 0.028543472290039062, 0.03208446502685547, 0.035625457763671875, 0.03916645050048828, 0.04270744323730469, 0.046248435974121094, 0.0497894287109375, 0.053330421447753906, 0.05687141418457031, 0.06041240692138672, 0.06395339965820312, 0.06749439239501953, 0.07103538513183594, 0.07457637786865234, 0.07811737060546875, 0.08165836334228516, 0.08519935607910156, 0.08874034881591797, 0.09228134155273438, 0.09582233428955078, 0.09936332702636719, 0.1029043197631836, 0.1064453125]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 5.0, 6.0, 14.0, 22.0, 28.0, 39.0, 76.0, 111.0, 117.0, 132.0, 148.0, 110.0, 67.0, 38.0, 29.0, 19.0, 11.0, 15.0, 4.0, 7.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0309042930603027, -1.945160984992981, -1.8594176769256592, -1.7736742496490479, -1.687930941581726, -1.6021876335144043, -1.516444206237793, -1.4307008981704712, -1.3449575901031494, -1.2592142820358276, -1.1734709739685059, -1.0877275466918945, -1.0019842386245728, -0.916240930557251, -0.8304975628852844, -0.7447541952133179, -0.6590108871459961, -0.5732675790786743, -0.48752421140670776, -0.4017808735370636, -0.31603753566741943, -0.23029419779777527, -0.1445508599281311, -0.05880749225616455, 0.026935815811157227, 0.11267915368080139, 0.19842249155044556, 0.2841658294200897, 0.3699091672897339, 0.45565250515937805, 0.5413958430290222, 0.6271392107009888, 0.7128827571868896, 0.7986260652542114, 0.884369432926178, 0.9701128005981445, 1.0558561086654663, 1.141599416732788, 1.2273428440093994, 1.3130861520767212, 1.398829460144043, 1.4845727682113647, 1.5703160762786865, 1.6560595035552979, 1.7418028116226196, 1.8275461196899414, 1.9132895469665527, 1.9990328550338745, 2.0847761631011963, 2.1705195903778076, 2.25626277923584, 2.342006206512451, 2.4277496337890625, 2.5134928226470947, 2.599236249923706, 2.6849794387817383, 2.7707228660583496, 2.856466293334961, 2.942209482192993, 3.0279529094696045, 3.1136960983276367, 3.199439525604248, 3.2851829528808594, 3.3709263801574707, 3.456669569015503]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 7.0, 10.0, 5.0, 8.0, 6.0, 11.0, 17.0, 19.0, 15.0, 12.0, 16.0, 34.0, 26.0, 22.0, 26.0, 28.0, 36.0, 39.0, 40.0, 60.0, 44.0, 32.0, 45.0, 36.0, 39.0, 40.0, 28.0, 38.0, 33.0, 29.0, 31.0, 16.0, 20.0, 28.0, 16.0, 12.0, 16.0, 13.0, 10.0, 4.0, 5.0, 2.0, 6.0, 4.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.8244893550872803, -1.7670289278030396, -1.7095686197280884, -1.6521081924438477, -1.5946478843688965, -1.5371874570846558, -1.479727029800415, -1.4222667217254639, -1.3648064136505127, -1.307345986366272, -1.2498856782913208, -1.19242525100708, -1.134964942932129, -1.0775045156478882, -1.0200440883636475, -0.9625837802886963, -0.9051233530044556, -0.8476629853248596, -0.7902026176452637, -0.732742190361023, -0.6752818822860718, -0.617821455001831, -0.5603610873222351, -0.5029007196426392, -0.4454403519630432, -0.38797998428344727, -0.3305196166038513, -0.273059219121933, -0.21559885144233704, -0.1581384837627411, -0.10067808628082275, -0.04321771860122681, 0.01424252986907959, 0.07170290499925613, 0.12916328012943268, 0.18662366271018982, 0.24408403038978577, 0.3015443980693817, 0.35900479555130005, 0.416465163230896, 0.47392553091049194, 0.5313858985900879, 0.5888462662696838, 0.6463066339492798, 0.7037670612335205, 0.7612273693084717, 0.8186877965927124, 0.8761481642723083, 0.9336085319519043, 0.9910688996315002, 1.0485292673110962, 1.105989694595337, 1.163450002670288, 1.2209104299545288, 1.2783708572387695, 1.3358311653137207, 1.3932914733886719, 1.4507519006729126, 1.5082122087478638, 1.5656726360321045, 1.6231329441070557, 1.6805933713912964, 1.738053798675537, 1.7955141067504883, 1.852974534034729]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 6.0, 6.0, 3.0, 11.0, 12.0, 5.0, 19.0, 24.0, 29.0, 33.0, 38.0, 41.0, 48.0, 79.0, 77.0, 126.0, 148.0, 158.0, 225.0, 313.0, 474.0, 1032.0, 3191.0, 1040823.0, 1503.0, 585.0, 363.0, 257.0, 198.0, 154.0, 147.0, 80.0, 92.0, 62.0, 46.0, 37.0, 40.0, 23.0, 19.0, 20.0, 15.0, 9.0, 5.0, 2.0, 5.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-2.803248643875122, -2.71335506439209, -2.6234614849090576, -2.5335679054260254, -2.443674325942993, -2.353780746459961, -2.2638869285583496, -2.1739933490753174, -2.084099769592285, -1.994206190109253, -1.9043126106262207, -1.8144190311431885, -1.7245253324508667, -1.6346317529678345, -1.5447381734848022, -1.4548444747924805, -1.3649510145187378, -1.2750574350357056, -1.1851638555526733, -1.0952701568603516, -1.0053765773773193, -0.9154829978942871, -0.8255894184112549, -0.7356957793235779, -0.6458021998405457, -0.5559086203575134, -0.4660149812698364, -0.3761214017868042, -0.2862277925014496, -0.19633418321609497, -0.10644060373306274, -0.016546964645385742, 0.07334661483764648, 0.1632402241230011, 0.2531338334083557, 0.34302741289138794, 0.43292102217674255, 0.5228146314620972, 0.6127082109451294, 0.7026018500328064, 0.7924954295158386, 0.8823890089988708, 0.9722826480865479, 1.06217622756958, 1.1520698070526123, 1.2419633865356445, 1.3318569660186768, 1.4217506647109985, 1.5116442441940308, 1.601537823677063, 1.6914314031600952, 1.781325101852417, 1.8712186813354492, 1.9611122608184814, 2.0510058403015137, 2.140899419784546, 2.230792999267578, 2.3206865787506104, 2.4105801582336426, 2.500473737716675, 2.590367317199707, 2.6802611351013184, 2.7701544761657715, 2.860048294067383, 2.949941873550415]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 7.0, 5.0, 8.0, 12.0, 20.0, 36.0, 34.0, 52.0, 72.0, 104.0, 141.0, 189.0, 317.0, 541.0, 1109.0, 3470.0, 51455272.0, 5843.0, 1321.0, 668.0, 330.0, 216.0, 145.0, 102.0, 78.0, 74.0, 44.0, 40.0, 26.0, 14.0, 8.0, 13.0, 2.0, 7.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.327807426452637, -11.8970308303833, -11.466254234313965, -11.035478591918945, -10.60470199584961, -10.173925399780273, -9.743148803710938, -9.312372207641602, -8.881596565246582, -8.450819969177246, -8.02004337310791, -7.589267253875732, -7.158491134643555, -6.727714538574219, -6.296937942504883, -5.866161823272705, -5.435385227203369, -5.004608631134033, -4.5738325119018555, -4.1430559158325195, -3.712279796600342, -3.281503200531006, -2.850726842880249, -2.419950485229492, -1.9891741275787354, -1.5583977699279785, -1.1276214122772217, -0.6968449354171753, -0.26606857776641846, 0.16470789909362793, 0.5954842567443848, 1.0262606143951416, 1.4570369720458984, 1.8878133296966553, 2.318589687347412, 2.749366283416748, 3.180142402648926, 3.6109189987182617, 4.041695594787598, 4.472471714019775, 4.903247833251953, 5.334024429321289, 5.764800548553467, 6.195577144622803, 6.6263532638549805, 7.057129859924316, 7.487906455993652, 7.91868257522583, 8.349458694458008, 8.780235290527344, 9.21101188659668, 9.6417875289917, 10.072564125061035, 10.503340721130371, 10.934117317199707, 11.364892959594727, 11.795670509338379, 12.226447105407715, 12.65722370147705, 13.08799934387207, 13.518775939941406, 13.949552536010742, 14.380329132080078, 14.811105728149414, 15.241881370544434]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 7.0, 2.0, 12.0, 14.0, 21.0, 26.0, 45.0, 64.0, 85.0, 149.0, 228.0, 342.0, 473.0, 762.0, 1194.0, 1898.0, 2865.0, 4780.0, 7847.0, 13950.0, 24462.0, 46299.0, 87612.0, 169525.0, 320098.0, 567118.0, 3707758.0, 608206.0, 339730.0, 181425.0, 93769.0, 49019.0, 25884.0, 14412.0, 8160.0, 4854.0, 2985.0, 1858.0, 1228.0, 783.0, 496.0, 347.0, 241.0, 145.0, 88.0, 69.0, 43.0, 23.0, 15.0, 10.0, 6.0, 5.0, 4.0, 6.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.78759765625, -0.76263427734375, -0.7376708984375, -0.71270751953125, -0.687744140625, -0.66278076171875, -0.6378173828125, -0.61285400390625, -0.587890625, -0.56292724609375, -0.5379638671875, -0.51300048828125, -0.488037109375, -0.46307373046875, -0.4381103515625, -0.41314697265625, -0.38818359375, -0.36322021484375, -0.3382568359375, -0.31329345703125, -0.288330078125, -0.26336669921875, -0.2384033203125, -0.21343994140625, -0.1884765625, -0.16351318359375, -0.1385498046875, -0.11358642578125, -0.088623046875, -0.06365966796875, -0.0386962890625, -0.01373291015625, 0.01123046875, 0.03619384765625, 0.0611572265625, 0.08612060546875, 0.111083984375, 0.13604736328125, 0.1610107421875, 0.18597412109375, 0.2109375, 0.23590087890625, 0.2608642578125, 0.28582763671875, 0.310791015625, 0.33575439453125, 0.3607177734375, 0.38568115234375, 0.41064453125, 0.43560791015625, 0.4605712890625, 0.48553466796875, 0.510498046875, 0.53546142578125, 0.5604248046875, 0.58538818359375, 0.6103515625, 0.63531494140625, 0.6602783203125, 0.68524169921875, 0.710205078125, 0.73516845703125, 0.7601318359375, 0.78509521484375, 0.81005859375]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 6.0, 7.0, 6.0, 7.0, 9.0, 20.0, 14.0, 22.0, 21.0, 29.0, 31.0, 34.0, 34.0, 42.0, 46.0, 43.0, 49.0, 90.0, 969.0, 108.0, 54.0, 57.0, 42.0, 41.0, 44.0, 31.0, 22.0, 32.0, 20.0, 24.0, 15.0, 11.0, 6.0, 16.0, 5.0, 7.0, 2.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.390625, -9.110595703125, -8.83056640625, -8.550537109375, -8.2705078125, -7.990478515625, -7.71044921875, -7.430419921875, -7.150390625, -6.870361328125, -6.59033203125, -6.310302734375, -6.0302734375, -5.750244140625, -5.47021484375, -5.190185546875, -4.91015625, -4.630126953125, -4.35009765625, -4.070068359375, -3.7900390625, -3.510009765625, -3.22998046875, -2.949951171875, -2.669921875, -2.389892578125, -2.10986328125, -1.829833984375, -1.5498046875, -1.269775390625, -0.98974609375, -0.709716796875, -0.4296875, -0.149658203125, 0.13037109375, 0.410400390625, 0.6904296875, 0.970458984375, 1.25048828125, 1.530517578125, 1.810546875, 2.090576171875, 2.37060546875, 2.650634765625, 2.9306640625, 3.210693359375, 3.49072265625, 3.770751953125, 4.05078125, 4.330810546875, 4.61083984375, 4.890869140625, 5.1708984375, 5.450927734375, 5.73095703125, 6.010986328125, 6.291015625, 6.571044921875, 6.85107421875, 7.131103515625, 7.4111328125, 7.691162109375, 7.97119140625, 8.251220703125, 8.53125]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 6.0, 5.0, 6.0, 14.0, 21.0, 34.0, 44.0, 69.0, 118.0, 137.0, 203.0, 321.0, 456.0, 732.0, 1045.0, 1656.0, 2637.0, 4053.0, 6611.0, 10897.0, 17666.0, 30548.0, 51360.0, 89208.0, 149477.0, 243964.0, 362976.0, 608303.0, 3491047.0, 429515.0, 306232.0, 195766.0, 117228.0, 68352.0, 39872.0, 23387.0, 14168.0, 8637.0, 5303.0, 3302.0, 2136.0, 1305.0, 871.0, 578.0, 347.0, 268.0, 170.0, 125.0, 85.0, 61.0, 38.0, 26.0, 20.0, 12.0, 13.0, 7.0, 7.0, 1.0, 0.0, 2.0], "bins": [-0.4912109375, -0.4759864807128906, -0.46076202392578125, -0.4455375671386719, -0.4303131103515625, -0.4150886535644531, -0.39986419677734375, -0.3846397399902344, -0.369415283203125, -0.3541908264160156, -0.33896636962890625, -0.3237419128417969, -0.3085174560546875, -0.2932929992675781, -0.27806854248046875, -0.2628440856933594, -0.24761962890625, -0.23239517211914062, -0.21717071533203125, -0.20194625854492188, -0.1867218017578125, -0.17149734497070312, -0.15627288818359375, -0.14104843139648438, -0.125823974609375, -0.11059951782226562, -0.09537506103515625, -0.08015060424804688, -0.0649261474609375, -0.049701690673828125, -0.03447723388671875, -0.019252777099609375, -0.0040283203125, 0.011196136474609375, 0.02642059326171875, 0.041645050048828125, 0.0568695068359375, 0.07209396362304688, 0.08731842041015625, 0.10254287719726562, 0.117767333984375, 0.13299179077148438, 0.14821624755859375, 0.16344070434570312, 0.1786651611328125, 0.19388961791992188, 0.20911407470703125, 0.22433853149414062, 0.23956298828125, 0.2547874450683594, 0.27001190185546875, 0.2852363586425781, 0.3004608154296875, 0.3156852722167969, 0.33090972900390625, 0.3461341857910156, 0.361358642578125, 0.3765830993652344, 0.39180755615234375, 0.4070320129394531, 0.4222564697265625, 0.4374809265136719, 0.45270538330078125, 0.4679298400878906, 0.483154296875]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 9.0, 9.0, 12.0, 10.0, 14.0, 18.0, 25.0, 15.0, 22.0, 24.0, 33.0, 37.0, 35.0, 41.0, 36.0, 35.0, 37.0, 38.0, 422.0, 684.0, 46.0, 44.0, 38.0, 44.0, 27.0, 32.0, 31.0, 31.0, 25.0, 25.0, 30.0, 13.0, 14.0, 18.0, 9.0, 9.0, 6.0, 5.0, 6.0, 3.0, 5.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.1640625, -6.94091796875, -6.7177734375, -6.49462890625, -6.271484375, -6.04833984375, -5.8251953125, -5.60205078125, -5.37890625, -5.15576171875, -4.9326171875, -4.70947265625, -4.486328125, -4.26318359375, -4.0400390625, -3.81689453125, -3.59375, -3.37060546875, -3.1474609375, -2.92431640625, -2.701171875, -2.47802734375, -2.2548828125, -2.03173828125, -1.80859375, -1.58544921875, -1.3623046875, -1.13916015625, -0.916015625, -0.69287109375, -0.4697265625, -0.24658203125, -0.0234375, 0.19970703125, 0.4228515625, 0.64599609375, 0.869140625, 1.09228515625, 1.3154296875, 1.53857421875, 1.76171875, 1.98486328125, 2.2080078125, 2.43115234375, 2.654296875, 2.87744140625, 3.1005859375, 3.32373046875, 3.546875, 3.77001953125, 3.9931640625, 4.21630859375, 4.439453125, 4.66259765625, 4.8857421875, 5.10888671875, 5.33203125, 5.55517578125, 5.7783203125, 6.00146484375, 6.224609375, 6.44775390625, 6.6708984375, 6.89404296875, 7.1171875]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 2.0, 6.0, 15.0, 14.0, 22.0, 33.0, 42.0, 65.0, 114.0, 155.0, 223.0, 292.0, 459.0, 693.0, 1046.0, 1751.0, 2905.0, 4997.0, 8948.0, 16815.0, 33974.0, 69716.0, 159678.0, 5644188.0, 188231.0, 77260.0, 37278.0, 18605.0, 9896.0, 5532.0, 3168.0, 1852.0, 1161.0, 733.0, 493.0, 328.0, 193.0, 170.0, 109.0, 75.0, 51.0, 42.0, 42.0, 15.0, 22.0, 11.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0], "bins": [-1.63671875, -1.584869384765625, -1.53302001953125, -1.481170654296875, -1.4293212890625, -1.377471923828125, -1.32562255859375, -1.273773193359375, -1.221923828125, -1.170074462890625, -1.11822509765625, -1.066375732421875, -1.0145263671875, -0.962677001953125, -0.91082763671875, -0.858978271484375, -0.80712890625, -0.755279541015625, -0.70343017578125, -0.651580810546875, -0.5997314453125, -0.547882080078125, -0.49603271484375, -0.444183349609375, -0.392333984375, -0.340484619140625, -0.28863525390625, -0.236785888671875, -0.1849365234375, -0.133087158203125, -0.08123779296875, -0.029388427734375, 0.0224609375, 0.074310302734375, 0.12615966796875, 0.178009033203125, 0.2298583984375, 0.281707763671875, 0.33355712890625, 0.385406494140625, 0.437255859375, 0.489105224609375, 0.54095458984375, 0.592803955078125, 0.6446533203125, 0.696502685546875, 0.74835205078125, 0.800201416015625, 0.85205078125, 0.903900146484375, 0.95574951171875, 1.007598876953125, 1.0594482421875, 1.111297607421875, 1.16314697265625, 1.214996337890625, 1.266845703125, 1.318695068359375, 1.37054443359375, 1.422393798828125, 1.4742431640625, 1.526092529296875, 1.57794189453125, 1.629791259765625, 1.681640625]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 1.0, 8.0, 6.0, 12.0, 8.0, 17.0, 12.0, 12.0, 14.0, 28.0, 19.0, 37.0, 29.0, 29.0, 38.0, 44.0, 43.0, 43.0, 27.0, 60.0, 1028.0, 78.0, 42.0, 40.0, 49.0, 41.0, 42.0, 37.0, 24.0, 26.0, 24.0, 13.0, 17.0, 14.0, 9.0, 12.0, 15.0, 14.0, 0.0, 5.0, 4.0, 3.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.80078125, -7.52801513671875, -7.2552490234375, -6.98248291015625, -6.709716796875, -6.43695068359375, -6.1641845703125, -5.89141845703125, -5.61865234375, -5.34588623046875, -5.0731201171875, -4.80035400390625, -4.527587890625, -4.25482177734375, -3.9820556640625, -3.70928955078125, -3.4365234375, -3.16375732421875, -2.8909912109375, -2.61822509765625, -2.345458984375, -2.07269287109375, -1.7999267578125, -1.52716064453125, -1.25439453125, -0.98162841796875, -0.7088623046875, -0.43609619140625, -0.163330078125, 0.10943603515625, 0.3822021484375, 0.65496826171875, 0.927734375, 1.20050048828125, 1.4732666015625, 1.74603271484375, 2.018798828125, 2.29156494140625, 2.5643310546875, 2.83709716796875, 3.10986328125, 3.38262939453125, 3.6553955078125, 3.92816162109375, 4.200927734375, 4.47369384765625, 4.7464599609375, 5.01922607421875, 5.2919921875, 5.56475830078125, 5.8375244140625, 6.11029052734375, 6.383056640625, 6.65582275390625, 6.9285888671875, 7.20135498046875, 7.47412109375, 7.74688720703125, 8.0196533203125, 8.29241943359375, 8.565185546875, 8.83795166015625, 9.1107177734375, 9.38348388671875, 9.65625]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 2.0, 3.0, 8.0, 11.0, 19.0, 49.0, 100.0, 280.0, 302.0, 132.0, 49.0, 22.0, 11.0, 11.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-26.92098045349121, -25.890653610229492, -24.860328674316406, -23.830001831054688, -22.79967498779297, -21.76934814453125, -20.73902130126953, -19.708696365356445, -18.678369522094727, -17.648042678833008, -16.617717742919922, -15.587390899658203, -14.557064056396484, -13.526737213134766, -12.496411323547363, -11.466085433959961, -10.435758590698242, -9.405431747436523, -8.375105857849121, -7.3447794914245605, -6.314453125, -5.2841267585754395, -4.253800392150879, -3.2234740257263184, -2.193147659301758, -1.1628212928771973, -0.13249492645263672, 0.8978314399719238, 1.9281578063964844, 2.958484172821045, 3.9888105392456055, 5.019136905670166, 6.049465179443359, 7.07979154586792, 8.11011791229248, 9.140443801879883, 10.170770645141602, 11.20109748840332, 12.231423377990723, 13.261749267578125, 14.292076110839844, 15.322402954101562, 16.35272979736328, 17.383054733276367, 18.413381576538086, 19.443708419799805, 20.47403335571289, 21.50436019897461, 22.534687042236328, 23.565013885498047, 24.595340728759766, 25.62566566467285, 26.65599250793457, 27.68631935119629, 28.716644287109375, 29.746971130371094, 30.777297973632812, 31.80762481689453, 32.83795166015625, 33.86827850341797, 34.89860534667969, 35.92892837524414, 36.95925521850586, 37.98958206176758, 39.0199089050293]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 7.0, 9.0, 6.0, 5.0, 8.0, 11.0, 15.0, 25.0, 28.0, 36.0, 41.0, 54.0, 77.0, 95.0, 102.0, 111.0, 94.0, 63.0, 51.0, 29.0, 25.0, 19.0, 23.0, 16.0, 10.0, 10.0, 7.0, 9.0, 3.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-37.89131164550781, -36.70288848876953, -35.514469146728516, -34.326045989990234, -33.13762664794922, -31.949203491210938, -30.760780334472656, -29.572359085083008, -28.38393783569336, -27.19551658630371, -26.007095336914062, -24.81867218017578, -23.630250930786133, -22.441829681396484, -21.253406524658203, -20.064985275268555, -18.876564025878906, -17.688142776489258, -16.49972152709961, -15.311298370361328, -14.12287712097168, -12.934455871582031, -11.746033668518066, -10.557611465454102, -9.369190216064453, -8.180768966674805, -6.99234676361084, -5.803925037384033, -4.615503311157227, -3.42708158493042, -2.2386598587036133, -1.0502376556396484, 0.13818359375, 1.3266053199768066, 2.5150270462036133, 3.70344877243042, 4.891870498657227, 6.080292224884033, 7.26871395111084, 8.457136154174805, 9.645557403564453, 10.833978652954102, 12.022400856018066, 13.210823059082031, 14.39924430847168, 15.587665557861328, 16.77608871459961, 17.964509963989258, 19.152931213378906, 20.341352462768555, 21.529773712158203, 22.718196868896484, 23.906618118286133, 25.09503936767578, 26.283462524414062, 27.47188377380371, 28.66030502319336, 29.848726272583008, 31.037147521972656, 32.22557067871094, 33.41399383544922, 34.602413177490234, 35.790836334228516, 36.97925567626953, 38.16767883300781]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 6.0, 4.0, 3.0, 2.0, 7.0, 9.0, 6.0, 7.0, 12.0, 17.0, 30.0, 45.0, 47.0, 92.0, 141.0, 225.0, 363.0, 612.0, 983.0, 1657.0, 3410.0, 7133.0, 22565.0, 639471.0, 3477702.0, 24569.0, 7503.0, 3331.0, 1713.0, 1010.0, 578.0, 343.0, 216.0, 146.0, 97.0, 59.0, 45.0, 40.0, 27.0, 15.0, 16.0, 12.0, 2.0, 5.0, 5.0, 3.0, 3.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.143798828125, -0.13866806030273438, -0.13353729248046875, -0.12840652465820312, -0.1232757568359375, -0.11814498901367188, -0.11301422119140625, -0.10788345336914062, -0.102752685546875, -0.09762191772460938, -0.09249114990234375, -0.08736038208007812, -0.0822296142578125, -0.07709884643554688, -0.07196807861328125, -0.06683731079101562, -0.06170654296875, -0.056575775146484375, -0.05144500732421875, -0.046314239501953125, -0.0411834716796875, -0.036052703857421875, -0.03092193603515625, -0.025791168212890625, -0.020660400390625, -0.015529632568359375, -0.01039886474609375, -0.005268096923828125, -0.0001373291015625, 0.004993438720703125, 0.01012420654296875, 0.015254974365234375, 0.0203857421875, 0.025516510009765625, 0.03064727783203125, 0.035778045654296875, 0.0409088134765625, 0.046039581298828125, 0.05117034912109375, 0.056301116943359375, 0.061431884765625, 0.06656265258789062, 0.07169342041015625, 0.07682418823242188, 0.0819549560546875, 0.08708572387695312, 0.09221649169921875, 0.09734725952148438, 0.10247802734375, 0.10760879516601562, 0.11273956298828125, 0.11787033081054688, 0.1230010986328125, 0.12813186645507812, 0.13326263427734375, 0.13839340209960938, 0.143524169921875, 0.14865493774414062, 0.15378570556640625, 0.15891647338867188, 0.1640472412109375, 0.16917800903320312, 0.17430877685546875, 0.17943954467773438, 0.1845703125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 2.0, 2.0, 3.0, 5.0, 5.0, 4.0, 5.0, 5.0, 3.0, 11.0, 3.0, 13.0, 11.0, 14.0, 20.0, 43.0, 555.0, 142.0, 43.0, 13.0, 6.0, 12.0, 10.0, 13.0, 8.0, 8.0, 7.0, 7.0, 5.0, 2.0, 1.0, 4.0, 5.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06463623046875, -0.06247138977050781, -0.060306549072265625, -0.05814170837402344, -0.05597686767578125, -0.05381202697753906, -0.051647186279296875, -0.04948234558105469, -0.0473175048828125, -0.04515266418457031, -0.042987823486328125, -0.04082298278808594, -0.03865814208984375, -0.03649330139160156, -0.034328460693359375, -0.03216361999511719, -0.029998779296875, -0.027833938598632812, -0.025669097900390625, -0.023504257202148438, -0.02133941650390625, -0.019174575805664062, -0.017009735107421875, -0.014844894409179688, -0.0126800537109375, -0.010515213012695312, -0.008350372314453125, -0.0061855316162109375, -0.00402069091796875, -0.0018558502197265625, 0.000308990478515625, 0.0024738311767578125, 0.004638671875, 0.0068035125732421875, 0.008968353271484375, 0.011133193969726562, 0.01329803466796875, 0.015462875366210938, 0.017627716064453125, 0.019792556762695312, 0.0219573974609375, 0.024122238159179688, 0.026287078857421875, 0.028451919555664062, 0.03061676025390625, 0.03278160095214844, 0.034946441650390625, 0.03711128234863281, 0.039276123046875, 0.04144096374511719, 0.043605804443359375, 0.04577064514160156, 0.04793548583984375, 0.05010032653808594, 0.052265167236328125, 0.05443000793457031, 0.0565948486328125, 0.05875968933105469, 0.060924530029296875, 0.06308937072753906, 0.06525421142578125, 0.06741905212402344, 0.06958389282226562, 0.07174873352050781, 0.07391357421875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 3.0, 5.0, 8.0, 7.0, 7.0, 12.0, 19.0, 37.0, 61.0, 162.0, 385.0, 898.0, 2628.0, 10303.0, 76534.0, 3835437.0, 243155.0, 18806.0, 4011.0, 1144.0, 384.0, 117.0, 54.0, 44.0, 14.0, 14.0, 6.0, 5.0, 5.0, 4.0, 1.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.256103515625, -0.2487201690673828, -0.24133682250976562, -0.23395347595214844, -0.22657012939453125, -0.21918678283691406, -0.21180343627929688, -0.2044200897216797, -0.1970367431640625, -0.1896533966064453, -0.18227005004882812, -0.17488670349121094, -0.16750335693359375, -0.16012001037597656, -0.15273666381835938, -0.1453533172607422, -0.137969970703125, -0.1305866241455078, -0.12320327758789062, -0.11581993103027344, -0.10843658447265625, -0.10105323791503906, -0.09366989135742188, -0.08628654479980469, -0.0789031982421875, -0.07151985168457031, -0.06413650512695312, -0.05675315856933594, -0.04936981201171875, -0.04198646545410156, -0.034603118896484375, -0.027219772338867188, -0.01983642578125, -0.012453079223632812, -0.005069732666015625, 0.0023136138916015625, 0.00969696044921875, 0.017080307006835938, 0.024463653564453125, 0.03184700012207031, 0.0392303466796875, 0.04661369323730469, 0.053997039794921875, 0.06138038635253906, 0.06876373291015625, 0.07614707946777344, 0.08353042602539062, 0.09091377258300781, 0.098297119140625, 0.10568046569824219, 0.11306381225585938, 0.12044715881347656, 0.12783050537109375, 0.13521385192871094, 0.14259719848632812, 0.1499805450439453, 0.1573638916015625, 0.1647472381591797, 0.17213058471679688, 0.17951393127441406, 0.18689727783203125, 0.19428062438964844, 0.20166397094726562, 0.2090473175048828, 0.2164306640625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 2.0, 2.0, 11.0, 13.0, 15.0, 16.0, 17.0, 31.0, 37.0, 64.0, 95.0, 190.0, 497.0, 1629.0, 848.0, 237.0, 131.0, 66.0, 42.0, 26.0, 25.0, 18.0, 14.0, 14.0, 5.0, 6.0, 3.0, 6.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08892822265625, -0.0864400863647461, -0.08395195007324219, -0.08146381378173828, -0.07897567749023438, -0.07648754119873047, -0.07399940490722656, -0.07151126861572266, -0.06902313232421875, -0.06653499603271484, -0.06404685974121094, -0.06155872344970703, -0.059070587158203125, -0.05658245086669922, -0.05409431457519531, -0.051606178283691406, -0.0491180419921875, -0.046629905700683594, -0.04414176940917969, -0.04165363311767578, -0.039165496826171875, -0.03667736053466797, -0.03418922424316406, -0.031701087951660156, -0.02921295166015625, -0.026724815368652344, -0.024236679077148438, -0.02174854278564453, -0.019260406494140625, -0.01677227020263672, -0.014284133911132812, -0.011795997619628906, -0.009307861328125, -0.006819725036621094, -0.0043315887451171875, -0.0018434524536132812, 0.000644683837890625, 0.0031328201293945312, 0.0056209564208984375, 0.008109092712402344, 0.01059722900390625, 0.013085365295410156, 0.015573501586914062, 0.01806163787841797, 0.020549774169921875, 0.02303791046142578, 0.025526046752929688, 0.028014183044433594, 0.0305023193359375, 0.032990455627441406, 0.03547859191894531, 0.03796672821044922, 0.040454864501953125, 0.04294300079345703, 0.04543113708496094, 0.047919273376464844, 0.05040740966796875, 0.052895545959472656, 0.05538368225097656, 0.05787181854248047, 0.060359954833984375, 0.06284809112548828, 0.06533622741699219, 0.0678243637084961, 0.0703125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 7.0, 1.0, 9.0, 45.0, 321.0, 552.0, 60.0, 10.0, 4.0, 1.0, 1.0], "bins": [-2.028738260269165, -1.9939026832580566, -1.9590669870376587, -1.9242314100265503, -1.8893957138061523, -1.854560136795044, -1.819724440574646, -1.7848888635635376, -1.7500531673431396, -1.7152175903320312, -1.6803818941116333, -1.645546317100525, -1.610710620880127, -1.5758750438690186, -1.5410393476486206, -1.5062037706375122, -1.4713681936264038, -1.4365326166152954, -1.4016969203948975, -1.366861343383789, -1.3320256471633911, -1.2971900701522827, -1.2623543739318848, -1.2275187969207764, -1.192683219909668, -1.1578476428985596, -1.1230119466781616, -1.0881763696670532, -1.0533406734466553, -1.0185050964355469, -0.9836694598197937, -0.9488338232040405, -0.9139982461929321, -0.879162609577179, -0.8443269729614258, -0.8094913363456726, -0.7746556997299194, -0.739820122718811, -0.7049844861030579, -0.6701488494873047, -0.6353132128715515, -0.6004775762557983, -0.5656419396400452, -0.530806303024292, -0.4959706962108612, -0.46113505959510803, -0.42629945278167725, -0.3914638161659241, -0.3566281795501709, -0.3217925429344177, -0.28695690631866455, -0.25212129950523376, -0.2172856628894806, -0.18245002627372742, -0.14761440455913544, -0.11277878284454346, -0.07794314622879028, -0.043107517063617706, -0.00827188789844513, 0.026563741266727448, 0.061399370431900024, 0.0962350070476532, 0.13107062876224518, 0.16590625047683716, 0.20074188709259033]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 4.0, 5.0, 8.0, 6.0, 11.0, 17.0, 16.0, 26.0, 26.0, 26.0, 45.0, 45.0, 48.0, 42.0, 51.0, 70.0, 57.0, 59.0, 61.0, 59.0, 54.0, 42.0, 36.0, 40.0, 29.0, 30.0, 25.0, 10.0, 14.0, 15.0, 8.0, 4.0, 6.0, 2.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2548907995223999, -0.2457183450460434, -0.2365458905696869, -0.22737343609333038, -0.21820098161697388, -0.20902852714061737, -0.19985607266426086, -0.19068363308906555, -0.18151116371154785, -0.17233870923519135, -0.16316625475883484, -0.15399380028247833, -0.14482134580612183, -0.13564889132976532, -0.1264764368534088, -0.1173039898276329, -0.108131542801857, -0.09895908832550049, -0.08978663384914398, -0.08061417937278748, -0.07144172489643097, -0.06226927414536476, -0.05309682339429855, -0.04392436891794205, -0.03475191444158554, -0.025579459965229034, -0.016407007351517677, -0.00723455473780632, 0.0019378997385501862, 0.011110354214906693, 0.0202828049659729, 0.029455259442329407, 0.03862771391868591, 0.04780016839504242, 0.056972622871398926, 0.06614507734775543, 0.07531753182411194, 0.08448998630046844, 0.09366243332624435, 0.10283488780260086, 0.11200734227895737, 0.12117979675531387, 0.13035224378108978, 0.1395246982574463, 0.1486971527338028, 0.1578696072101593, 0.1670420616865158, 0.17621451616287231, 0.18538697063922882, 0.19455942511558533, 0.20373187959194183, 0.21290433406829834, 0.22207678854465485, 0.23124924302101135, 0.24042168259620667, 0.24959415197372437, 0.2587665915489197, 0.267939031124115, 0.2771115005016327, 0.286283940076828, 0.2954564094543457, 0.304628849029541, 0.3138013184070587, 0.32297375798225403, 0.33214622735977173]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 4.0, 2.0, 8.0, 14.0, 22.0, 20.0, 24.0, 31.0, 71.0, 85.0, 132.0, 152.0, 246.0, 378.0, 480.0, 699.0, 1135.0, 1628.0, 2450.0, 3811.0, 6190.0, 10296.0, 19216.0, 44230.0, 804667.0, 90915.0, 26485.0, 13639.0, 7797.0, 4742.0, 2901.0, 1959.0, 1311.0, 845.0, 605.0, 397.0, 284.0, 201.0, 143.0, 91.0, 70.0, 51.0, 51.0, 19.0, 18.0, 12.0, 10.0, 8.0, 9.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.2327880859375, -0.2254505157470703, -0.21811294555664062, -0.21077537536621094, -0.20343780517578125, -0.19610023498535156, -0.18876266479492188, -0.1814250946044922, -0.1740875244140625, -0.1667499542236328, -0.15941238403320312, -0.15207481384277344, -0.14473724365234375, -0.13739967346191406, -0.13006210327148438, -0.12272453308105469, -0.115386962890625, -0.10804939270019531, -0.10071182250976562, -0.09337425231933594, -0.08603668212890625, -0.07869911193847656, -0.07136154174804688, -0.06402397155761719, -0.0566864013671875, -0.04934883117675781, -0.042011260986328125, -0.03467369079589844, -0.02733612060546875, -0.019998550415039062, -0.012660980224609375, -0.0053234100341796875, 0.00201416015625, 0.009351730346679688, 0.016689300537109375, 0.024026870727539062, 0.03136444091796875, 0.03870201110839844, 0.046039581298828125, 0.05337715148925781, 0.0607147216796875, 0.06805229187011719, 0.07538986206054688, 0.08272743225097656, 0.09006500244140625, 0.09740257263183594, 0.10474014282226562, 0.11207771301269531, 0.119415283203125, 0.1267528533935547, 0.13409042358398438, 0.14142799377441406, 0.14876556396484375, 0.15610313415527344, 0.16344070434570312, 0.1707782745361328, 0.1781158447265625, 0.1854534149169922, 0.19279098510742188, 0.20012855529785156, 0.20746612548828125, 0.21480369567871094, 0.22214126586914062, 0.2294788360595703, 0.23681640625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 1.0, 3.0, 8.0, 4.0, 4.0, 7.0, 2.0, 5.0, 12.0, 11.0, 14.0, 14.0, 23.0, 53.0, 437.0, 243.0, 40.0, 19.0, 8.0, 11.0, 14.0, 9.0, 10.0, 5.0, 6.0, 7.0, 6.0, 4.0, 4.0, 4.0, 0.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06396484375, -0.06182289123535156, -0.059680938720703125, -0.05753898620605469, -0.05539703369140625, -0.05325508117675781, -0.051113128662109375, -0.04897117614746094, -0.0468292236328125, -0.04468727111816406, -0.042545318603515625, -0.04040336608886719, -0.03826141357421875, -0.03611946105957031, -0.033977508544921875, -0.03183555603027344, -0.029693603515625, -0.027551651000976562, -0.025409698486328125, -0.023267745971679688, -0.02112579345703125, -0.018983840942382812, -0.016841888427734375, -0.014699935913085938, -0.0125579833984375, -0.010416030883789062, -0.008274078369140625, -0.0061321258544921875, -0.00399017333984375, -0.0018482208251953125, 0.000293731689453125, 0.0024356842041015625, 0.00457763671875, 0.0067195892333984375, 0.008861541748046875, 0.011003494262695312, 0.01314544677734375, 0.015287399291992188, 0.017429351806640625, 0.019571304321289062, 0.0217132568359375, 0.023855209350585938, 0.025997161865234375, 0.028139114379882812, 0.03028106689453125, 0.03242301940917969, 0.034564971923828125, 0.03670692443847656, 0.038848876953125, 0.04099082946777344, 0.043132781982421875, 0.04527473449707031, 0.04741668701171875, 0.04955863952636719, 0.051700592041015625, 0.05384254455566406, 0.0559844970703125, 0.05812644958496094, 0.060268402099609375, 0.06241035461425781, 0.06455230712890625, 0.06669425964355469, 0.06883621215820312, 0.07097816467285156, 0.0731201171875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 10.0, 8.0, 16.0, 15.0, 21.0, 20.0, 36.0, 45.0, 70.0, 61.0, 95.0, 132.0, 206.0, 371.0, 728.0, 1555.0, 3538.0, 8115.0, 23018.0, 79520.0, 406666.0, 407787.0, 78802.0, 23000.0, 8146.0, 3308.0, 1481.0, 715.0, 353.0, 203.0, 139.0, 83.0, 63.0, 51.0, 42.0, 42.0, 19.0, 26.0, 15.0, 9.0, 8.0, 10.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.160888671875, -0.15586090087890625, -0.1508331298828125, -0.14580535888671875, -0.140777587890625, -0.13574981689453125, -0.1307220458984375, -0.12569427490234375, -0.12066650390625, -0.11563873291015625, -0.1106109619140625, -0.10558319091796875, -0.100555419921875, -0.09552764892578125, -0.0904998779296875, -0.08547210693359375, -0.0804443359375, -0.07541656494140625, -0.0703887939453125, -0.06536102294921875, -0.060333251953125, -0.05530548095703125, -0.0502777099609375, -0.04524993896484375, -0.04022216796875, -0.03519439697265625, -0.0301666259765625, -0.02513885498046875, -0.020111083984375, -0.01508331298828125, -0.0100555419921875, -0.00502777099609375, 0.0, 0.00502777099609375, 0.0100555419921875, 0.01508331298828125, 0.020111083984375, 0.02513885498046875, 0.0301666259765625, 0.03519439697265625, 0.04022216796875, 0.04524993896484375, 0.0502777099609375, 0.05530548095703125, 0.060333251953125, 0.06536102294921875, 0.0703887939453125, 0.07541656494140625, 0.0804443359375, 0.08547210693359375, 0.0904998779296875, 0.09552764892578125, 0.100555419921875, 0.10558319091796875, 0.1106109619140625, 0.11563873291015625, 0.12066650390625, 0.12569427490234375, 0.1307220458984375, 0.13574981689453125, 0.140777587890625, 0.14580535888671875, 0.1508331298828125, 0.15586090087890625, 0.160888671875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 2.0, 3.0, 7.0, 7.0, 7.0, 10.0, 17.0, 15.0, 10.0, 7.0, 26.0, 31.0, 35.0, 21.0, 45.0, 46.0, 42.0, 38.0, 47.0, 46.0, 42.0, 50.0, 47.0, 47.0, 57.0, 39.0, 31.0, 41.0, 20.0, 26.0, 31.0, 18.0, 12.0, 17.0, 20.0, 11.0, 6.0, 6.0, 4.0, 6.0, 5.0, 4.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2490234375, -0.24152374267578125, -0.2340240478515625, -0.22652435302734375, -0.219024658203125, -0.21152496337890625, -0.2040252685546875, -0.19652557373046875, -0.18902587890625, -0.18152618408203125, -0.1740264892578125, -0.16652679443359375, -0.159027099609375, -0.15152740478515625, -0.1440277099609375, -0.13652801513671875, -0.1290283203125, -0.12152862548828125, -0.1140289306640625, -0.10652923583984375, -0.099029541015625, -0.09152984619140625, -0.0840301513671875, -0.07653045654296875, -0.06903076171875, -0.06153106689453125, -0.0540313720703125, -0.04653167724609375, -0.039031982421875, -0.03153228759765625, -0.0240325927734375, -0.01653289794921875, -0.009033203125, -0.00153350830078125, 0.0059661865234375, 0.01346588134765625, 0.020965576171875, 0.02846527099609375, 0.0359649658203125, 0.04346466064453125, 0.05096435546875, 0.05846405029296875, 0.0659637451171875, 0.07346343994140625, 0.080963134765625, 0.08846282958984375, 0.0959625244140625, 0.10346221923828125, 0.1109619140625, 0.11846160888671875, 0.1259613037109375, 0.13346099853515625, 0.140960693359375, 0.14846038818359375, 0.1559600830078125, 0.16345977783203125, 0.17095947265625, 0.17845916748046875, 0.1859588623046875, 0.19345855712890625, 0.200958251953125, 0.20845794677734375, 0.2159576416015625, 0.22345733642578125, 0.23095703125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 2.0, 2.0, 3.0, 9.0, 12.0, 21.0, 22.0, 39.0, 63.0, 113.0, 167.0, 318.0, 604.0, 1379.0, 3385.0, 10342.0, 47908.0, 487145.0, 437328.0, 44059.0, 9766.0, 3245.0, 1310.0, 565.0, 299.0, 178.0, 93.0, 70.0, 34.0, 17.0, 13.0, 9.0, 11.0, 7.0, 6.0, 8.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.086669921875, -0.08395957946777344, -0.08124923706054688, -0.07853889465332031, -0.07582855224609375, -0.07311820983886719, -0.07040786743164062, -0.06769752502441406, -0.0649871826171875, -0.06227684020996094, -0.059566497802734375, -0.05685615539550781, -0.05414581298828125, -0.05143547058105469, -0.048725128173828125, -0.04601478576660156, -0.043304443359375, -0.04059410095214844, -0.037883758544921875, -0.03517341613769531, -0.03246307373046875, -0.029752731323242188, -0.027042388916015625, -0.024332046508789062, -0.0216217041015625, -0.018911361694335938, -0.016201019287109375, -0.013490676879882812, -0.01078033447265625, -0.008069992065429688, -0.005359649658203125, -0.0026493072509765625, 6.103515625e-05, 0.0027713775634765625, 0.005481719970703125, 0.008192062377929688, 0.01090240478515625, 0.013612747192382812, 0.016323089599609375, 0.019033432006835938, 0.0217437744140625, 0.024454116821289062, 0.027164459228515625, 0.029874801635742188, 0.03258514404296875, 0.03529548645019531, 0.038005828857421875, 0.04071617126464844, 0.043426513671875, 0.04613685607910156, 0.048847198486328125, 0.05155754089355469, 0.05426788330078125, 0.05697822570800781, 0.059688568115234375, 0.06239891052246094, 0.0651092529296875, 0.06781959533691406, 0.07052993774414062, 0.07324028015136719, 0.07595062255859375, 0.07866096496582031, 0.08137130737304688, 0.08408164978027344, 0.0867919921875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 4.0, 5.0, 6.0, 6.0, 7.0, 11.0, 6.0, 15.0, 11.0, 14.0, 16.0, 22.0, 29.0, 35.0, 38.0, 65.0, 58.0, 63.0, 63.0, 71.0, 64.0, 57.0, 57.0, 44.0, 28.0, 41.0, 31.0, 30.0, 14.0, 18.0, 13.0, 16.0, 10.0, 6.0, 9.0, 6.0, 6.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.430511474609375e-05, -1.3804063200950623e-05, -1.3303011655807495e-05, -1.2801960110664368e-05, -1.230090856552124e-05, -1.1799857020378113e-05, -1.1298805475234985e-05, -1.0797753930091858e-05, -1.029670238494873e-05, -9.795650839805603e-06, -9.294599294662476e-06, -8.793547749519348e-06, -8.29249620437622e-06, -7.791444659233093e-06, -7.290393114089966e-06, -6.789341568946838e-06, -6.288290023803711e-06, -5.7872384786605835e-06, -5.286186933517456e-06, -4.785135388374329e-06, -4.284083843231201e-06, -3.7830322980880737e-06, -3.2819807529449463e-06, -2.780929207801819e-06, -2.2798776626586914e-06, -1.778826117515564e-06, -1.2777745723724365e-06, -7.767230272293091e-07, -2.7567148208618164e-07, 2.253800630569458e-07, 7.264316082000732e-07, 1.2274831533432007e-06, 1.7285346984863281e-06, 2.2295862436294556e-06, 2.730637788772583e-06, 3.2316893339157104e-06, 3.732740879058838e-06, 4.233792424201965e-06, 4.734843969345093e-06, 5.23589551448822e-06, 5.736947059631348e-06, 6.237998604774475e-06, 6.7390501499176025e-06, 7.24010169506073e-06, 7.741153240203857e-06, 8.242204785346985e-06, 8.743256330490112e-06, 9.24430787563324e-06, 9.745359420776367e-06, 1.0246410965919495e-05, 1.0747462511062622e-05, 1.124851405620575e-05, 1.1749565601348877e-05, 1.2250617146492004e-05, 1.2751668691635132e-05, 1.325272023677826e-05, 1.3753771781921387e-05, 1.4254823327064514e-05, 1.4755874872207642e-05, 1.5256926417350769e-05, 1.5757977962493896e-05, 1.6259029507637024e-05, 1.676008105278015e-05, 1.726113259792328e-05, 1.7762184143066406e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 5.0, 8.0, 9.0, 13.0, 17.0, 20.0, 59.0, 90.0, 138.0, 240.0, 602.0, 1592.0, 4777.0, 21573.0, 178881.0, 719144.0, 101171.0, 14390.0, 3657.0, 1199.0, 471.0, 224.0, 115.0, 66.0, 40.0, 16.0, 12.0, 14.0, 6.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09033203125, -0.08754253387451172, -0.08475303649902344, -0.08196353912353516, -0.07917404174804688, -0.0763845443725586, -0.07359504699707031, -0.07080554962158203, -0.06801605224609375, -0.06522655487060547, -0.06243705749511719, -0.059647560119628906, -0.056858062744140625, -0.054068565368652344, -0.05127906799316406, -0.04848957061767578, -0.0457000732421875, -0.04291057586669922, -0.04012107849121094, -0.037331581115722656, -0.034542083740234375, -0.031752586364746094, -0.028963088989257812, -0.02617359161376953, -0.02338409423828125, -0.02059459686279297, -0.017805099487304688, -0.015015602111816406, -0.012226104736328125, -0.009436607360839844, -0.0066471099853515625, -0.0038576126098632812, -0.001068115234375, 0.0017213821411132812, 0.0045108795166015625, 0.007300376892089844, 0.010089874267578125, 0.012879371643066406, 0.015668869018554688, 0.01845836639404297, 0.02124786376953125, 0.02403736114501953, 0.026826858520507812, 0.029616355895996094, 0.032405853271484375, 0.035195350646972656, 0.03798484802246094, 0.04077434539794922, 0.0435638427734375, 0.04635334014892578, 0.04914283752441406, 0.051932334899902344, 0.054721832275390625, 0.057511329650878906, 0.06030082702636719, 0.06309032440185547, 0.06587982177734375, 0.06866931915283203, 0.07145881652832031, 0.0742483139038086, 0.07703781127929688, 0.07982730865478516, 0.08261680603027344, 0.08540630340576172, 0.08819580078125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 3.0, 6.0, 6.0, 7.0, 14.0, 25.0, 24.0, 28.0, 31.0, 37.0, 56.0, 64.0, 73.0, 70.0, 80.0, 90.0, 87.0, 66.0, 52.0, 40.0, 39.0, 32.0, 24.0, 10.0, 10.0, 8.0, 4.0, 7.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06884765625, -0.06633663177490234, -0.06382560729980469, -0.06131458282470703, -0.058803558349609375, -0.05629253387451172, -0.05378150939941406, -0.051270484924316406, -0.04875946044921875, -0.046248435974121094, -0.04373741149902344, -0.04122638702392578, -0.038715362548828125, -0.03620433807373047, -0.03369331359863281, -0.031182289123535156, -0.0286712646484375, -0.026160240173339844, -0.023649215698242188, -0.02113819122314453, -0.018627166748046875, -0.01611614227294922, -0.013605117797851562, -0.011094093322753906, -0.00858306884765625, -0.006072044372558594, -0.0035610198974609375, -0.0010499954223632812, 0.001461029052734375, 0.003972053527832031, 0.0064830780029296875, 0.008994102478027344, 0.011505126953125, 0.014016151428222656, 0.016527175903320312, 0.01903820037841797, 0.021549224853515625, 0.02406024932861328, 0.026571273803710938, 0.029082298278808594, 0.03159332275390625, 0.034104347229003906, 0.03661537170410156, 0.03912639617919922, 0.041637420654296875, 0.04414844512939453, 0.04665946960449219, 0.049170494079589844, 0.0516815185546875, 0.054192543029785156, 0.05670356750488281, 0.05921459197998047, 0.061725616455078125, 0.06423664093017578, 0.06674766540527344, 0.0692586898803711, 0.07176971435546875, 0.0742807388305664, 0.07679176330566406, 0.07930278778076172, 0.08181381225585938, 0.08432483673095703, 0.08683586120605469, 0.08934688568115234, 0.09185791015625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [3.0, 4.0, 15.0, 35.0, 177.0, 576.0, 146.0, 40.0, 11.0, 2.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6978521943092346, -0.5693410038948059, -0.4408298134803772, -0.3123186230659485, -0.18380743265151978, -0.055296242237091064, 0.07321494817733765, 0.20172613859176636, 0.33023732900619507, 0.4587485194206238, 0.5872597098350525, 0.7157709002494812, 0.8442820906639099, 0.9727932810783386, 1.101304531097412, 1.2298157215118408, 1.3583269119262695, 1.4868381023406982, 1.615349292755127, 1.7438604831695557, 1.8723716735839844, 2.000882863998413, 2.129394054412842, 2.2579052448272705, 2.386416435241699, 2.514927625656128, 2.6434388160705566, 2.7719500064849854, 2.900461196899414, 3.0289723873138428, 3.1574835777282715, 3.2859947681427, 3.414505958557129, 3.5430171489715576, 3.6715283393859863, 3.800039529800415, 3.9285507202148438, 4.057062149047852, 4.185573101043701, 4.314084053039551, 4.442595481872559, 4.571106910705566, 4.699617862701416, 4.828128814697266, 4.956640243530273, 5.085151672363281, 5.213662624359131, 5.3421735763549805, 5.470685005187988, 5.599196434020996, 5.727707386016846, 5.856218338012695, 5.984729766845703, 6.113241195678711, 6.2417521476745605, 6.37026309967041, 6.498774528503418, 6.627285957336426, 6.755796909332275, 6.884307861328125, 7.012819290161133, 7.141330718994141, 7.26984167098999, 7.39835262298584, 7.526864051818848]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 6.0, 2.0, 5.0, 7.0, 2.0, 5.0, 3.0, 7.0, 9.0, 13.0, 20.0, 34.0, 51.0, 79.0, 108.0, 133.0, 140.0, 118.0, 83.0, 58.0, 39.0, 12.0, 16.0, 13.0, 6.0, 4.0, 7.0, 2.0, 8.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.230095386505127, -4.105755805969238, -3.9814162254333496, -3.857076644897461, -3.7327370643615723, -3.6083974838256836, -3.484057903289795, -3.3597183227539062, -3.2353787422180176, -3.111039161682129, -2.9866995811462402, -2.8623600006103516, -2.738020420074463, -2.613680839538574, -2.4893412590026855, -2.365001678466797, -2.240662097930908, -2.1163225173950195, -1.9919829368591309, -1.8676433563232422, -1.7433037757873535, -1.6189641952514648, -1.4946246147155762, -1.3702850341796875, -1.245945692062378, -1.1216061115264893, -0.9972665309906006, -0.8729269504547119, -0.7485873699188232, -0.6242478489875793, -0.4999082684516907, -0.375568687915802, -0.25122904777526855, -0.12688946723937988, -0.002549901604652405, 0.12178966403007507, 0.24612924456596375, 0.37046879529953003, 0.4948083758354187, 0.6191479563713074, 0.743487536907196, 0.8678271174430847, 0.9921666979789734, 1.1165062189102173, 1.240845799446106, 1.3651853799819946, 1.4895249605178833, 1.613864541053772, 1.7382041215896606, 1.8625437021255493, 1.986883282661438, 2.111222743988037, 2.235562324523926, 2.3599019050598145, 2.484241485595703, 2.608581066131592, 2.7329206466674805, 2.857260227203369, 2.981599807739258, 3.1059393882751465, 3.230278968811035, 3.354618549346924, 3.4789581298828125, 3.603297710418701, 3.72763729095459]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 4.0, 5.0, 6.0, 3.0, 7.0, 10.0, 14.0, 20.0, 24.0, 43.0, 60.0, 74.0, 98.0, 136.0, 218.0, 298.0, 432.0, 654.0, 968.0, 1613.0, 2574.0, 4730.0, 10664.0, 32215.0, 807588.0, 3277268.0, 32567.0, 10307.0, 4837.0, 2609.0, 1473.0, 936.0, 576.0, 404.0, 269.0, 174.0, 114.0, 81.0, 60.0, 42.0, 38.0, 28.0, 7.0, 12.0, 6.0, 8.0, 4.0, 5.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.431640625, -0.41815948486328125, -0.4046783447265625, -0.39119720458984375, -0.377716064453125, -0.36423492431640625, -0.3507537841796875, -0.33727264404296875, -0.32379150390625, -0.31031036376953125, -0.2968292236328125, -0.28334808349609375, -0.269866943359375, -0.25638580322265625, -0.2429046630859375, -0.22942352294921875, -0.2159423828125, -0.20246124267578125, -0.1889801025390625, -0.17549896240234375, -0.162017822265625, -0.14853668212890625, -0.1350555419921875, -0.12157440185546875, -0.10809326171875, -0.09461212158203125, -0.0811309814453125, -0.06764984130859375, -0.054168701171875, -0.04068756103515625, -0.0272064208984375, -0.01372528076171875, -0.000244140625, 0.01323699951171875, 0.0267181396484375, 0.04019927978515625, 0.053680419921875, 0.06716156005859375, 0.0806427001953125, 0.09412384033203125, 0.10760498046875, 0.12108612060546875, 0.1345672607421875, 0.14804840087890625, 0.161529541015625, 0.17501068115234375, 0.1884918212890625, 0.20197296142578125, 0.2154541015625, 0.22893524169921875, 0.2424163818359375, 0.25589752197265625, 0.269378662109375, 0.28285980224609375, 0.2963409423828125, 0.30982208251953125, 0.32330322265625, 0.33678436279296875, 0.3502655029296875, 0.36374664306640625, 0.377227783203125, 0.39070892333984375, 0.4041900634765625, 0.41767120361328125, 0.43115234375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 4.0, 4.0, 4.0, 6.0, 3.0, 8.0, 6.0, 8.0, 16.0, 20.0, 19.0, 39.0, 123.0, 374.0, 197.0, 60.0, 19.0, 13.0, 16.0, 9.0, 8.0, 12.0, 6.0, 3.0, 7.0, 2.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0684814453125, -0.06637763977050781, -0.06427383422851562, -0.06217002868652344, -0.06006622314453125, -0.05796241760253906, -0.055858612060546875, -0.05375480651855469, -0.0516510009765625, -0.04954719543457031, -0.047443389892578125, -0.04533958435058594, -0.04323577880859375, -0.04113197326660156, -0.039028167724609375, -0.03692436218261719, -0.034820556640625, -0.03271675109863281, -0.030612945556640625, -0.028509140014648438, -0.02640533447265625, -0.024301528930664062, -0.022197723388671875, -0.020093917846679688, -0.0179901123046875, -0.015886306762695312, -0.013782501220703125, -0.011678695678710938, -0.00957489013671875, -0.0074710845947265625, -0.005367279052734375, -0.0032634735107421875, -0.00115966796875, 0.0009441375732421875, 0.003047943115234375, 0.0051517486572265625, 0.00725555419921875, 0.009359359741210938, 0.011463165283203125, 0.013566970825195312, 0.0156707763671875, 0.017774581909179688, 0.019878387451171875, 0.021982192993164062, 0.02408599853515625, 0.026189804077148438, 0.028293609619140625, 0.030397415161132812, 0.032501220703125, 0.03460502624511719, 0.036708831787109375, 0.03881263732910156, 0.04091644287109375, 0.04302024841308594, 0.045124053955078125, 0.04722785949707031, 0.0493316650390625, 0.05143547058105469, 0.053539276123046875, 0.05564308166503906, 0.05774688720703125, 0.05985069274902344, 0.061954498291015625, 0.06405830383300781, 0.066162109375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 3.0, 8.0, 8.0, 8.0, 21.0, 21.0, 42.0, 82.0, 141.0, 343.0, 895.0, 3087.0, 15300.0, 168753.0, 3893035.0, 96939.0, 11388.0, 2675.0, 832.0, 351.0, 153.0, 74.0, 32.0, 25.0, 22.0, 12.0, 9.0, 3.0, 5.0, 1.0, 2.0, 3.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.380859375, -0.36525726318359375, -0.3496551513671875, -0.33405303955078125, -0.318450927734375, -0.30284881591796875, -0.2872467041015625, -0.27164459228515625, -0.25604248046875, -0.24044036865234375, -0.2248382568359375, -0.20923614501953125, -0.193634033203125, -0.17803192138671875, -0.1624298095703125, -0.14682769775390625, -0.1312255859375, -0.11562347412109375, -0.1000213623046875, -0.08441925048828125, -0.068817138671875, -0.05321502685546875, -0.0376129150390625, -0.02201080322265625, -0.00640869140625, 0.00919342041015625, 0.0247955322265625, 0.04039764404296875, 0.055999755859375, 0.07160186767578125, 0.0872039794921875, 0.10280609130859375, 0.118408203125, 0.13401031494140625, 0.1496124267578125, 0.16521453857421875, 0.180816650390625, 0.19641876220703125, 0.2120208740234375, 0.22762298583984375, 0.24322509765625, 0.25882720947265625, 0.2744293212890625, 0.29003143310546875, 0.305633544921875, 0.32123565673828125, 0.3368377685546875, 0.35243988037109375, 0.3680419921875, 0.38364410400390625, 0.3992462158203125, 0.41484832763671875, 0.430450439453125, 0.44605255126953125, 0.4616546630859375, 0.47725677490234375, 0.49285888671875, 0.5084609985351562, 0.5240631103515625, 0.5396652221679688, 0.555267333984375, 0.5708694458007812, 0.5864715576171875, 0.6020736694335938, 0.61767578125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 9.0, 3.0, 4.0, 4.0, 7.0, 7.0, 10.0, 17.0, 11.0, 23.0, 30.0, 43.0, 69.0, 93.0, 196.0, 368.0, 2101.0, 524.0, 192.0, 102.0, 72.0, 50.0, 30.0, 27.0, 18.0, 17.0, 13.0, 7.0, 8.0, 4.0, 3.0, 5.0, 4.0, 0.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.050872802734375, -0.04871988296508789, -0.04656696319580078, -0.04441404342651367, -0.04226112365722656, -0.04010820388793945, -0.037955284118652344, -0.035802364349365234, -0.033649444580078125, -0.031496524810791016, -0.029343605041503906, -0.027190685272216797, -0.025037765502929688, -0.022884845733642578, -0.02073192596435547, -0.01857900619506836, -0.01642608642578125, -0.01427316665649414, -0.012120246887207031, -0.009967327117919922, -0.007814407348632812, -0.005661487579345703, -0.0035085678100585938, -0.0013556480407714844, 0.000797271728515625, 0.0029501914978027344, 0.005103111267089844, 0.007256031036376953, 0.009408950805664062, 0.011561870574951172, 0.013714790344238281, 0.01586771011352539, 0.0180206298828125, 0.02017354965209961, 0.02232646942138672, 0.024479389190673828, 0.026632308959960938, 0.028785228729248047, 0.030938148498535156, 0.033091068267822266, 0.035243988037109375, 0.037396907806396484, 0.039549827575683594, 0.0417027473449707, 0.04385566711425781, 0.04600858688354492, 0.04816150665283203, 0.05031442642211914, 0.05246734619140625, 0.05462026596069336, 0.05677318572998047, 0.05892610549926758, 0.06107902526855469, 0.0632319450378418, 0.0653848648071289, 0.06753778457641602, 0.06969070434570312, 0.07184362411499023, 0.07399654388427734, 0.07614946365356445, 0.07830238342285156, 0.08045530319213867, 0.08260822296142578, 0.08476114273071289, 0.0869140625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 30.0, 603.0, 342.0, 17.0, 8.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39007556438446045, -0.3403872549533844, -0.29069894552230835, -0.2410106658935547, -0.19132235646247864, -0.1416340470314026, -0.09194576740264893, -0.042257457971572876, 0.007430851459503174, 0.05711915343999863, 0.10680745542049408, 0.15649574995040894, 0.20618405938148499, 0.25587236881256104, 0.3055606484413147, 0.35524895787239075, 0.4049372673034668, 0.45462557673454285, 0.5043138861656189, 0.5540021657943726, 0.603690505027771, 0.6533787846565247, 0.7030670642852783, 0.7527554035186768, 0.8024436831474304, 0.8521319627761841, 0.9018203020095825, 0.9515085816383362, 1.0011968612670898, 1.0508852005004883, 1.1005735397338867, 1.1502617597579956, 1.1999499797821045, 1.249638319015503, 1.2993265390396118, 1.3490148782730103, 1.3987032175064087, 1.4483914375305176, 1.498079776763916, 1.5477681159973145, 1.597456455230713, 1.6471447944641113, 1.6968330144882202, 1.7465213537216187, 1.796209692955017, 1.845897912979126, 1.8955862522125244, 1.9452745914459229, 1.9949628114700317, 2.0446510314941406, 2.094339370727539, 2.1440277099609375, 2.193716049194336, 2.2434043884277344, 2.293092727661133, 2.342780828475952, 2.3924691677093506, 2.442157506942749, 2.4918458461761475, 2.541533946990967, 2.5912222862243652, 2.6409106254577637, 2.690598964691162, 2.7402873039245605, 2.789975643157959]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 6.0, 2.0, 10.0, 7.0, 13.0, 14.0, 30.0, 34.0, 28.0, 34.0, 50.0, 57.0, 66.0, 74.0, 75.0, 74.0, 61.0, 78.0, 56.0, 40.0, 48.0, 36.0, 21.0, 23.0, 19.0, 12.0, 9.0, 7.0, 3.0, 6.0, 6.0, 4.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37470340728759766, -0.3640134930610657, -0.3533235788345337, -0.3426336646080017, -0.3319437801837921, -0.32125386595726013, -0.31056395173072815, -0.29987403750419617, -0.2891841530799866, -0.2784942388534546, -0.2678043246269226, -0.2571144104003906, -0.24642452597618103, -0.23573461174964905, -0.22504469752311707, -0.21435478329658508, -0.2036648690700531, -0.19297495484352112, -0.18228505551815033, -0.17159514129161835, -0.16090524196624756, -0.15021532773971558, -0.1395254135131836, -0.1288354992866516, -0.11814559996128082, -0.10745569318532944, -0.09676578640937805, -0.08607587218284607, -0.07538596540689468, -0.0646960586309433, -0.054006144404411316, -0.04331623762845993, -0.032626330852508545, -0.02193642221391201, -0.011246513575315475, -0.0005566030740737915, 0.010133303701877594, 0.02082321047782898, 0.03151312470436096, 0.04220303148031235, 0.05289293825626373, 0.06358284503221512, 0.0742727518081665, 0.08496266603469849, 0.09565257281064987, 0.10634247958660126, 0.11703239381313324, 0.12772229313850403, 0.138412207365036, 0.149102121591568, 0.15979202091693878, 0.17048193514347076, 0.18117183446884155, 0.19186174869537354, 0.20255166292190552, 0.2132415771484375, 0.2239314764738083, 0.23462139070034027, 0.24531129002571106, 0.25600120425224304, 0.266691118478775, 0.2773810029029846, 0.2880709171295166, 0.2987608313560486, 0.30945074558258057]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 6.0, 7.0, 9.0, 16.0, 24.0, 25.0, 47.0, 65.0, 85.0, 149.0, 251.0, 384.0, 681.0, 1264.0, 2439.0, 5247.0, 13232.0, 45199.0, 799595.0, 140698.0, 23171.0, 8301.0, 3567.0, 1829.0, 913.0, 494.0, 285.0, 207.0, 117.0, 76.0, 56.0, 38.0, 16.0, 23.0, 11.0, 8.0, 6.0, 5.0, 1.0, 7.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.392578125, -0.3802146911621094, -0.36785125732421875, -0.3554878234863281, -0.3431243896484375, -0.3307609558105469, -0.31839752197265625, -0.3060340881347656, -0.293670654296875, -0.2813072204589844, -0.26894378662109375, -0.2565803527832031, -0.2442169189453125, -0.23185348510742188, -0.21949005126953125, -0.20712661743164062, -0.19476318359375, -0.18239974975585938, -0.17003631591796875, -0.15767288208007812, -0.1453094482421875, -0.13294601440429688, -0.12058258056640625, -0.10821914672851562, -0.095855712890625, -0.08349227905273438, -0.07112884521484375, -0.058765411376953125, -0.0464019775390625, -0.034038543701171875, -0.02167510986328125, -0.009311676025390625, 0.0030517578125, 0.015415191650390625, 0.02777862548828125, 0.040142059326171875, 0.0525054931640625, 0.06486892700195312, 0.07723236083984375, 0.08959579467773438, 0.101959228515625, 0.11432266235351562, 0.12668609619140625, 0.13904953002929688, 0.1514129638671875, 0.16377639770507812, 0.17613983154296875, 0.18850326538085938, 0.20086669921875, 0.21323013305664062, 0.22559356689453125, 0.23795700073242188, 0.2503204345703125, 0.2626838684082031, 0.27504730224609375, 0.2874107360839844, 0.299774169921875, 0.3121376037597656, 0.32450103759765625, 0.3368644714355469, 0.3492279052734375, 0.3615913391113281, 0.37395477294921875, 0.3863182067871094, 0.398681640625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 7.0, 6.0, 7.0, 3.0, 9.0, 10.0, 12.0, 12.0, 23.0, 41.0, 110.0, 268.0, 245.0, 98.0, 51.0, 19.0, 15.0, 11.0, 13.0, 11.0, 7.0, 4.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06549072265625, -0.06343650817871094, -0.061382293701171875, -0.05932807922363281, -0.05727386474609375, -0.05521965026855469, -0.053165435791015625, -0.05111122131347656, -0.0490570068359375, -0.04700279235839844, -0.044948577880859375, -0.04289436340332031, -0.04084014892578125, -0.03878593444824219, -0.036731719970703125, -0.03467750549316406, -0.032623291015625, -0.030569076538085938, -0.028514862060546875, -0.026460647583007812, -0.02440643310546875, -0.022352218627929688, -0.020298004150390625, -0.018243789672851562, -0.0161895751953125, -0.014135360717773438, -0.012081146240234375, -0.010026931762695312, -0.00797271728515625, -0.0059185028076171875, -0.003864288330078125, -0.0018100738525390625, 0.000244140625, 0.0022983551025390625, 0.004352569580078125, 0.0064067840576171875, 0.00846099853515625, 0.010515213012695312, 0.012569427490234375, 0.014623641967773438, 0.0166778564453125, 0.018732070922851562, 0.020786285400390625, 0.022840499877929688, 0.02489471435546875, 0.026948928833007812, 0.029003143310546875, 0.031057357788085938, 0.033111572265625, 0.03516578674316406, 0.037220001220703125, 0.03927421569824219, 0.04132843017578125, 0.04338264465332031, 0.045436859130859375, 0.04749107360839844, 0.0495452880859375, 0.05159950256347656, 0.053653717041015625, 0.05570793151855469, 0.05776214599609375, 0.05981636047363281, 0.061870574951171875, 0.06392478942871094, 0.06597900390625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 2.0, 4.0, 6.0, 8.0, 7.0, 13.0, 17.0, 14.0, 32.0, 31.0, 49.0, 73.0, 141.0, 217.0, 500.0, 1278.0, 3590.0, 12762.0, 65192.0, 573668.0, 336304.0, 41212.0, 8938.0, 2550.0, 954.0, 436.0, 223.0, 87.0, 54.0, 57.0, 34.0, 25.0, 15.0, 20.0, 12.0, 6.0, 6.0, 8.0, 7.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.2415771484375, -0.23399734497070312, -0.22641754150390625, -0.21883773803710938, -0.2112579345703125, -0.20367813110351562, -0.19609832763671875, -0.18851852416992188, -0.180938720703125, -0.17335891723632812, -0.16577911376953125, -0.15819931030273438, -0.1506195068359375, -0.14303970336914062, -0.13545989990234375, -0.12788009643554688, -0.12030029296875, -0.11272048950195312, -0.10514068603515625, -0.09756088256835938, -0.0899810791015625, -0.08240127563476562, -0.07482147216796875, -0.06724166870117188, -0.059661865234375, -0.052082061767578125, -0.04450225830078125, -0.036922454833984375, -0.0293426513671875, -0.021762847900390625, -0.01418304443359375, -0.006603240966796875, 0.0009765625, 0.008556365966796875, 0.01613616943359375, 0.023715972900390625, 0.0312957763671875, 0.038875579833984375, 0.04645538330078125, 0.054035186767578125, 0.061614990234375, 0.06919479370117188, 0.07677459716796875, 0.08435440063476562, 0.0919342041015625, 0.09951400756835938, 0.10709381103515625, 0.11467361450195312, 0.12225341796875, 0.12983322143554688, 0.13741302490234375, 0.14499282836914062, 0.1525726318359375, 0.16015243530273438, 0.16773223876953125, 0.17531204223632812, 0.182891845703125, 0.19047164916992188, 0.19805145263671875, 0.20563125610351562, 0.2132110595703125, 0.22079086303710938, 0.22837066650390625, 0.23595046997070312, 0.2435302734375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 5.0, 4.0, 10.0, 13.0, 13.0, 13.0, 14.0, 22.0, 21.0, 19.0, 30.0, 31.0, 35.0, 31.0, 37.0, 50.0, 54.0, 60.0, 50.0, 51.0, 50.0, 56.0, 38.0, 41.0, 29.0, 41.0, 22.0, 16.0, 28.0, 25.0, 21.0, 9.0, 18.0, 12.0, 9.0, 7.0, 7.0, 7.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.15234375, -0.14720726013183594, -0.14207077026367188, -0.1369342803955078, -0.13179779052734375, -0.1266613006591797, -0.12152481079101562, -0.11638832092285156, -0.1112518310546875, -0.10611534118652344, -0.10097885131835938, -0.09584236145019531, -0.09070587158203125, -0.08556938171386719, -0.08043289184570312, -0.07529640197753906, -0.070159912109375, -0.06502342224121094, -0.059886932373046875, -0.05475044250488281, -0.04961395263671875, -0.04447746276855469, -0.039340972900390625, -0.03420448303222656, -0.0290679931640625, -0.023931503295898438, -0.018795013427734375, -0.013658523559570312, -0.00852203369140625, -0.0033855438232421875, 0.001750946044921875, 0.0068874359130859375, 0.01202392578125, 0.017160415649414062, 0.022296905517578125, 0.027433395385742188, 0.03256988525390625, 0.03770637512207031, 0.042842864990234375, 0.04797935485839844, 0.0531158447265625, 0.05825233459472656, 0.06338882446289062, 0.06852531433105469, 0.07366180419921875, 0.07879829406738281, 0.08393478393554688, 0.08907127380371094, 0.094207763671875, 0.09934425354003906, 0.10448074340820312, 0.10961723327636719, 0.11475372314453125, 0.11989021301269531, 0.12502670288085938, 0.13016319274902344, 0.1352996826171875, 0.14043617248535156, 0.14557266235351562, 0.1507091522216797, 0.15584564208984375, 0.1609821319580078, 0.16611862182617188, 0.17125511169433594, 0.1763916015625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 4.0, 6.0, 12.0, 14.0, 9.0, 27.0, 64.0, 90.0, 133.0, 276.0, 630.0, 1937.0, 10080.0, 291906.0, 721612.0, 17500.0, 2706.0, 840.0, 325.0, 172.0, 89.0, 47.0, 28.0, 18.0, 13.0, 7.0, 6.0, 2.0, 4.0, 1.0, 3.0, 2.0, 1.0], "bins": [-0.52294921875, -0.5113582611083984, -0.4997673034667969, -0.4881763458251953, -0.47658538818359375, -0.4649944305419922, -0.4534034729003906, -0.44181251525878906, -0.4302215576171875, -0.41863059997558594, -0.4070396423339844, -0.3954486846923828, -0.38385772705078125, -0.3722667694091797, -0.3606758117675781, -0.34908485412597656, -0.337493896484375, -0.32590293884277344, -0.3143119812011719, -0.3027210235595703, -0.29113006591796875, -0.2795391082763672, -0.2679481506347656, -0.25635719299316406, -0.2447662353515625, -0.23317527770996094, -0.22158432006835938, -0.2099933624267578, -0.19840240478515625, -0.1868114471435547, -0.17522048950195312, -0.16362953186035156, -0.15203857421875, -0.14044761657714844, -0.12885665893554688, -0.11726570129394531, -0.10567474365234375, -0.09408378601074219, -0.08249282836914062, -0.07090187072753906, -0.0593109130859375, -0.04771995544433594, -0.036128997802734375, -0.024538040161132812, -0.01294708251953125, -0.0013561248779296875, 0.010234832763671875, 0.021825790405273438, 0.033416748046875, 0.04500770568847656, 0.056598663330078125, 0.06818962097167969, 0.07978057861328125, 0.09137153625488281, 0.10296249389648438, 0.11455345153808594, 0.1261444091796875, 0.13773536682128906, 0.14932632446289062, 0.1609172821044922, 0.17250823974609375, 0.1840991973876953, 0.19569015502929688, 0.20728111267089844, 0.2188720703125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 5.0, 8.0, 11.0, 9.0, 5.0, 11.0, 20.0, 27.0, 47.0, 46.0, 53.0, 77.0, 96.0, 84.0, 100.0, 95.0, 66.0, 64.0, 42.0, 42.0, 30.0, 11.0, 14.0, 6.0, 15.0, 6.0, 3.0, 1.0, 5.0, 7.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.546476364135742e-05, -3.448314964771271e-05, -3.350153565406799e-05, -3.251992166042328e-05, -3.1538307666778564e-05, -3.055669367313385e-05, -2.9575079679489136e-05, -2.859346568584442e-05, -2.7611851692199707e-05, -2.6630237698554993e-05, -2.564862370491028e-05, -2.4667009711265564e-05, -2.368539571762085e-05, -2.2703781723976135e-05, -2.172216773033142e-05, -2.0740553736686707e-05, -1.9758939743041992e-05, -1.8777325749397278e-05, -1.7795711755752563e-05, -1.681409776210785e-05, -1.5832483768463135e-05, -1.485086977481842e-05, -1.3869255781173706e-05, -1.2887641787528992e-05, -1.1906027793884277e-05, -1.0924413800239563e-05, -9.942799806594849e-06, -8.961185812950134e-06, -7.97957181930542e-06, -6.9979578256607056e-06, -6.016343832015991e-06, -5.034729838371277e-06, -4.0531158447265625e-06, -3.071501851081848e-06, -2.089887857437134e-06, -1.1082738637924194e-06, -1.2665987014770508e-07, 8.549541234970093e-07, 1.8365681171417236e-06, 2.818182110786438e-06, 3.7997961044311523e-06, 4.781410098075867e-06, 5.763024091720581e-06, 6.744638085365295e-06, 7.72625207901001e-06, 8.707866072654724e-06, 9.689480066299438e-06, 1.0671094059944153e-05, 1.1652708053588867e-05, 1.2634322047233582e-05, 1.3615936040878296e-05, 1.459755003452301e-05, 1.5579164028167725e-05, 1.656077802181244e-05, 1.7542392015457153e-05, 1.8524006009101868e-05, 1.9505620002746582e-05, 2.0487233996391296e-05, 2.146884799003601e-05, 2.2450461983680725e-05, 2.343207597732544e-05, 2.4413689970970154e-05, 2.5395303964614868e-05, 2.6376917958259583e-05, 2.7358531951904297e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 14.0, 13.0, 16.0, 32.0, 50.0, 97.0, 211.0, 401.0, 990.0, 3615.0, 21476.0, 489862.0, 504561.0, 21887.0, 3615.0, 985.0, 329.0, 167.0, 77.0, 58.0, 41.0, 15.0, 7.0, 5.0, 6.0, 3.0, 6.0, 2.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.355224609375, -0.3465614318847656, -0.33789825439453125, -0.3292350769042969, -0.3205718994140625, -0.3119087219238281, -0.30324554443359375, -0.2945823669433594, -0.285919189453125, -0.2772560119628906, -0.26859283447265625, -0.2599296569824219, -0.2512664794921875, -0.24260330200195312, -0.23394012451171875, -0.22527694702148438, -0.21661376953125, -0.20795059204101562, -0.19928741455078125, -0.19062423706054688, -0.1819610595703125, -0.17329788208007812, -0.16463470458984375, -0.15597152709960938, -0.147308349609375, -0.13864517211914062, -0.12998199462890625, -0.12131881713867188, -0.1126556396484375, -0.10399246215820312, -0.09532928466796875, -0.08666610717773438, -0.0780029296875, -0.06933975219726562, -0.06067657470703125, -0.052013397216796875, -0.0433502197265625, -0.034687042236328125, -0.02602386474609375, -0.017360687255859375, -0.008697509765625, -3.4332275390625e-05, 0.00862884521484375, 0.017292022705078125, 0.0259552001953125, 0.034618377685546875, 0.04328155517578125, 0.051944732666015625, 0.06060791015625, 0.06927108764648438, 0.07793426513671875, 0.08659744262695312, 0.0952606201171875, 0.10392379760742188, 0.11258697509765625, 0.12125015258789062, 0.129913330078125, 0.13857650756835938, 0.14723968505859375, 0.15590286254882812, 0.1645660400390625, 0.17322921752929688, 0.18189239501953125, 0.19055557250976562, 0.19921875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 0.0, 4.0, 5.0, 6.0, 3.0, 14.0, 18.0, 40.0, 36.0, 44.0, 89.0, 136.0, 168.0, 161.0, 102.0, 62.0, 35.0, 15.0, 22.0, 14.0, 12.0, 10.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2457275390625, -0.2398223876953125, -0.233917236328125, -0.2280120849609375, -0.22210693359375, -0.2162017822265625, -0.210296630859375, -0.2043914794921875, -0.198486328125, -0.1925811767578125, -0.186676025390625, -0.1807708740234375, -0.17486572265625, -0.1689605712890625, -0.163055419921875, -0.1571502685546875, -0.1512451171875, -0.1453399658203125, -0.139434814453125, -0.1335296630859375, -0.12762451171875, -0.1217193603515625, -0.115814208984375, -0.1099090576171875, -0.10400390625, -0.0980987548828125, -0.092193603515625, -0.0862884521484375, -0.08038330078125, -0.0744781494140625, -0.068572998046875, -0.0626678466796875, -0.0567626953125, -0.0508575439453125, -0.044952392578125, -0.0390472412109375, -0.03314208984375, -0.0272369384765625, -0.021331787109375, -0.0154266357421875, -0.009521484375, -0.0036163330078125, 0.002288818359375, 0.0081939697265625, 0.01409912109375, 0.0200042724609375, 0.025909423828125, 0.0318145751953125, 0.0377197265625, 0.0436248779296875, 0.049530029296875, 0.0554351806640625, 0.06134033203125, 0.0672454833984375, 0.073150634765625, 0.0790557861328125, 0.0849609375, 0.0908660888671875, 0.096771240234375, 0.1026763916015625, 0.10858154296875, 0.1144866943359375, 0.120391845703125, 0.1262969970703125, 0.1322021484375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 8.0, 12.0, 91.0, 746.0, 134.0, 17.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4037139415740967, -2.2271244525909424, -2.050535202026367, -1.873945713043213, -1.6973564624786377, -1.5207669734954834, -1.3441776037216187, -1.167588233947754, -0.9909988641738892, -0.8144094944000244, -0.6378201246261597, -0.46123069524765015, -0.2846413254737854, -0.10805195569992065, 0.06853747367858887, 0.2451268434524536, 0.42171621322631836, 0.5983055830001831, 0.7748949527740479, 0.9514843821525574, 1.1280736923217773, 1.3046631813049316, 1.4812525510787964, 1.6578419208526611, 1.8344312906265259, 2.0110206604003906, 2.187610149383545, 2.36419939994812, 2.5407888889312744, 2.7173781394958496, 2.893967628479004, 3.070557117462158, 3.2471461296081543, 3.4237356185913086, 3.600324869155884, 3.776914358139038, 3.9535036087036133, 4.130093097686768, 4.306682586669922, 4.483271598815918, 4.659861087799072, 4.836450576782227, 5.013040065765381, 5.189629077911377, 5.366218566894531, 5.5428080558776855, 5.71939754486084, 5.895986557006836, 6.072576522827148, 6.249166011810303, 6.425755500793457, 6.602344512939453, 6.778934001922607, 6.955523490905762, 7.132112979888916, 7.30870246887207, 7.485291481018066, 7.661880970001221, 7.838470458984375, 8.015059471130371, 8.191649436950684, 8.36823844909668, 8.544827461242676, 8.721417427062988, 8.898006439208984]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 7.0, 4.0, 3.0, 8.0, 11.0, 16.0, 19.0, 21.0, 25.0, 34.0, 74.0, 62.0, 83.0, 97.0, 102.0, 69.0, 86.0, 73.0, 57.0, 34.0, 31.0, 26.0, 18.0, 15.0, 6.0, 4.0, 3.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.964937448501587, -1.9055211544036865, -1.8461049795150757, -1.7866886854171753, -1.7272725105285645, -1.667856216430664, -1.6084399223327637, -1.5490236282348633, -1.4896074533462524, -1.430191159248352, -1.3707749843597412, -1.3113586902618408, -1.2519423961639404, -1.1925262212753296, -1.1331099271774292, -1.0736937522888184, -1.014277458190918, -0.9548612236976624, -0.8954449892044067, -0.8360286951065063, -0.7766124606132507, -0.7171962261199951, -0.6577799320220947, -0.5983636975288391, -0.5389474630355835, -0.4795312285423279, -0.4201149642467499, -0.3606986999511719, -0.30128246545791626, -0.24186623096466064, -0.18244996666908264, -0.12303370237350464, -0.06361734867095947, -0.004201099276542664, 0.055215150117874146, 0.11463139951229095, 0.17404764890670776, 0.23346388339996338, 0.2928801476955414, 0.3522964119911194, 0.411712646484375, 0.4711288809776306, 0.5305451154708862, 0.5899614095687866, 0.6493776440620422, 0.7087938785552979, 0.7682101726531982, 0.8276264071464539, 0.8870426416397095, 0.9464588761329651, 1.0058751106262207, 1.065291404724121, 1.1247076988220215, 1.1841238737106323, 1.2435401678085327, 1.3029563426971436, 1.362372636795044, 1.4217889308929443, 1.4812051057815552, 1.5406213998794556, 1.6000375747680664, 1.6594538688659668, 1.7188701629638672, 1.7782864570617676, 1.8377026319503784]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 1.0, 6.0, 6.0, 2.0, 3.0, 3.0, 13.0, 10.0, 15.0, 14.0, 22.0, 24.0, 29.0, 41.0, 69.0, 72.0, 89.0, 139.0, 188.0, 222.0, 370.0, 515.0, 814.0, 1201.0, 1973.0, 3632.0, 8720.0, 36898.0, 3933959.0, 175413.0, 17911.0, 5356.0, 2506.0, 1422.0, 880.0, 569.0, 404.0, 261.0, 174.0, 112.0, 69.0, 42.0, 32.0, 24.0, 14.0, 8.0, 9.0, 7.0, 5.0, 7.0, 1.0, 6.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.6591796875, -0.6384353637695312, -0.6176910400390625, -0.5969467163085938, -0.576202392578125, -0.5554580688476562, -0.5347137451171875, -0.5139694213867188, -0.49322509765625, -0.47248077392578125, -0.4517364501953125, -0.43099212646484375, -0.410247802734375, -0.38950347900390625, -0.3687591552734375, -0.34801483154296875, -0.3272705078125, -0.30652618408203125, -0.2857818603515625, -0.26503753662109375, -0.244293212890625, -0.22354888916015625, -0.2028045654296875, -0.18206024169921875, -0.16131591796875, -0.14057159423828125, -0.1198272705078125, -0.09908294677734375, -0.078338623046875, -0.05759429931640625, -0.0368499755859375, -0.01610565185546875, 0.004638671875, 0.02538299560546875, 0.0461273193359375, 0.06687164306640625, 0.087615966796875, 0.10836029052734375, 0.1291046142578125, 0.14984893798828125, 0.17059326171875, 0.19133758544921875, 0.2120819091796875, 0.23282623291015625, 0.253570556640625, 0.27431488037109375, 0.2950592041015625, 0.31580352783203125, 0.3365478515625, 0.35729217529296875, 0.3780364990234375, 0.39878082275390625, 0.419525146484375, 0.44026947021484375, 0.4610137939453125, 0.48175811767578125, 0.50250244140625, 0.5232467651367188, 0.5439910888671875, 0.5647354125976562, 0.585479736328125, 0.6062240600585938, 0.6269683837890625, 0.6477127075195312, 0.66845703125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 8.0, 10.0, 6.0, 12.0, 7.0, 15.0, 26.0, 65.0, 121.0, 238.0, 220.0, 122.0, 57.0, 22.0, 8.0, 12.0, 10.0, 10.0, 8.0, 6.0, 2.0, 2.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0694580078125, -0.0672750473022461, -0.06509208679199219, -0.06290912628173828, -0.060726165771484375, -0.05854320526123047, -0.05636024475097656, -0.054177284240722656, -0.05199432373046875, -0.049811363220214844, -0.04762840270996094, -0.04544544219970703, -0.043262481689453125, -0.04107952117919922, -0.03889656066894531, -0.036713600158691406, -0.0345306396484375, -0.032347679138183594, -0.030164718627929688, -0.02798175811767578, -0.025798797607421875, -0.02361583709716797, -0.021432876586914062, -0.019249916076660156, -0.01706695556640625, -0.014883995056152344, -0.012701034545898438, -0.010518074035644531, -0.008335113525390625, -0.006152153015136719, -0.0039691925048828125, -0.0017862319946289062, 0.000396728515625, 0.0025796890258789062, 0.0047626495361328125, 0.006945610046386719, 0.009128570556640625, 0.011311531066894531, 0.013494491577148438, 0.015677452087402344, 0.01786041259765625, 0.020043373107910156, 0.022226333618164062, 0.02440929412841797, 0.026592254638671875, 0.02877521514892578, 0.030958175659179688, 0.033141136169433594, 0.0353240966796875, 0.037507057189941406, 0.03969001770019531, 0.04187297821044922, 0.044055938720703125, 0.04623889923095703, 0.04842185974121094, 0.050604820251464844, 0.05278778076171875, 0.054970741271972656, 0.05715370178222656, 0.05933666229248047, 0.061519622802734375, 0.06370258331298828, 0.06588554382324219, 0.0680685043334961, 0.07025146484375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 5.0, 2.0, 5.0, 8.0, 8.0, 7.0, 7.0, 12.0, 15.0, 27.0, 47.0, 66.0, 139.0, 328.0, 1158.0, 4772.0, 29905.0, 3692246.0, 443837.0, 17197.0, 3117.0, 854.0, 256.0, 92.0, 47.0, 38.0, 15.0, 13.0, 15.0, 11.0, 9.0, 8.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.71435546875, -0.6919403076171875, -0.669525146484375, -0.6471099853515625, -0.62469482421875, -0.6022796630859375, -0.579864501953125, -0.5574493408203125, -0.5350341796875, -0.5126190185546875, -0.490203857421875, -0.4677886962890625, -0.44537353515625, -0.4229583740234375, -0.400543212890625, -0.3781280517578125, -0.355712890625, -0.3332977294921875, -0.310882568359375, -0.2884674072265625, -0.26605224609375, -0.2436370849609375, -0.221221923828125, -0.1988067626953125, -0.1763916015625, -0.1539764404296875, -0.131561279296875, -0.1091461181640625, -0.08673095703125, -0.0643157958984375, -0.041900634765625, -0.0194854736328125, 0.0029296875, 0.0253448486328125, 0.047760009765625, 0.0701751708984375, 0.09259033203125, 0.1150054931640625, 0.137420654296875, 0.1598358154296875, 0.1822509765625, 0.2046661376953125, 0.227081298828125, 0.2494964599609375, 0.27191162109375, 0.2943267822265625, 0.316741943359375, 0.3391571044921875, 0.361572265625, 0.3839874267578125, 0.406402587890625, 0.4288177490234375, 0.45123291015625, 0.4736480712890625, 0.496063232421875, 0.5184783935546875, 0.5408935546875, 0.5633087158203125, 0.585723876953125, 0.6081390380859375, 0.63055419921875, 0.6529693603515625, 0.675384521484375, 0.6977996826171875, 0.72021484375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 6.0, 5.0, 6.0, 11.0, 8.0, 8.0, 16.0, 37.0, 68.0, 114.0, 218.0, 710.0, 2140.0, 334.0, 159.0, 84.0, 40.0, 27.0, 21.0, 17.0, 5.0, 9.0, 6.0, 2.0, 2.0, 5.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08087158203125, -0.07810592651367188, -0.07534027099609375, -0.07257461547851562, -0.0698089599609375, -0.06704330444335938, -0.06427764892578125, -0.061511993408203125, -0.058746337890625, -0.055980682373046875, -0.05321502685546875, -0.050449371337890625, -0.0476837158203125, -0.044918060302734375, -0.04215240478515625, -0.039386749267578125, -0.03662109375, -0.033855438232421875, -0.03108978271484375, -0.028324127197265625, -0.0255584716796875, -0.022792816162109375, -0.02002716064453125, -0.017261505126953125, -0.014495849609375, -0.011730194091796875, -0.00896453857421875, -0.006198883056640625, -0.0034332275390625, -0.000667572021484375, 0.00209808349609375, 0.004863739013671875, 0.00762939453125, 0.010395050048828125, 0.01316070556640625, 0.015926361083984375, 0.0186920166015625, 0.021457672119140625, 0.02422332763671875, 0.026988983154296875, 0.029754638671875, 0.032520294189453125, 0.03528594970703125, 0.038051605224609375, 0.0408172607421875, 0.043582916259765625, 0.04634857177734375, 0.049114227294921875, 0.0518798828125, 0.054645538330078125, 0.05741119384765625, 0.060176849365234375, 0.0629425048828125, 0.06570816040039062, 0.06847381591796875, 0.07123947143554688, 0.074005126953125, 0.07677078247070312, 0.07953643798828125, 0.08230209350585938, 0.0850677490234375, 0.08783340454101562, 0.09059906005859375, 0.09336471557617188, 0.09613037109375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 1.0, 3.0, 8.0, 14.0, 39.0, 84.0, 236.0, 267.0, 204.0, 89.0, 35.0, 13.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25120946764945984, -0.23506291210651398, -0.21891635656356812, -0.20276981592178345, -0.1866232454776764, -0.17047670483589172, -0.15433014929294586, -0.13818359375, -0.12203703820705414, -0.10589048266410828, -0.08974392712116241, -0.07359737902879715, -0.05745082348585129, -0.041304267942905426, -0.02515771985054016, -0.0090111643075943, 0.0071353912353515625, 0.023281944915652275, 0.03942849859595299, 0.05557505041360855, 0.07172160595655441, 0.08786816149950027, 0.10401470959186554, 0.1201612651348114, 0.13630782067775726, 0.15245437622070312, 0.168600931763649, 0.18474748730659485, 0.20089402794837952, 0.21704059839248657, 0.23318713903427124, 0.2493336945772171, 0.26548027992248535, 0.28162682056427, 0.2977733910083771, 0.31391993165016174, 0.3300665020942688, 0.34621304273605347, 0.36235958337783813, 0.3785061538219452, 0.39465272426605225, 0.4107992649078369, 0.42694583535194397, 0.44309237599372864, 0.4592389464378357, 0.47538548707962036, 0.49153202772140503, 0.5076786279678345, 0.5238251686096191, 0.5399717092514038, 0.5561182498931885, 0.5722648501396179, 0.5884113907814026, 0.6045579314231873, 0.6207044720649719, 0.6368510723114014, 0.6529975533485413, 0.6691440939903259, 0.6852906346321106, 0.70143723487854, 0.7175837755203247, 0.7337303161621094, 0.749876856803894, 0.7660233974456787, 0.7821699976921082]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 6.0, 11.0, 13.0, 11.0, 21.0, 24.0, 27.0, 41.0, 50.0, 44.0, 79.0, 77.0, 78.0, 74.0, 64.0, 73.0, 66.0, 54.0, 50.0, 35.0, 29.0, 23.0, 8.0, 6.0, 9.0, 13.0, 2.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.3986917734146118, -0.3883019685745239, -0.37791216373443604, -0.36752235889434814, -0.35713255405426025, -0.34674274921417236, -0.3363529443740845, -0.3259631097316742, -0.3155733048915863, -0.3051835000514984, -0.2947936952114105, -0.28440389037132263, -0.27401408553123474, -0.26362425088882446, -0.2532344460487366, -0.24284464120864868, -0.23245485126972198, -0.2220650464296341, -0.2116752415895462, -0.20128542184829712, -0.19089561700820923, -0.18050581216812134, -0.17011600732803345, -0.15972620248794556, -0.14933639764785767, -0.13894659280776978, -0.12855678796768188, -0.1181669756770134, -0.10777716338634491, -0.09738735854625702, -0.08699755370616913, -0.07660774141550064, -0.06621792912483215, -0.055828120559453964, -0.045438311994075775, -0.035048507153987885, -0.024658698588609695, -0.014268890023231506, -0.0038790851831436157, 0.006510727107524872, 0.016900531947612762, 0.02729034051299095, 0.03768014907836914, 0.04806995391845703, 0.05845976248383522, 0.06884957104921341, 0.0792393758893013, 0.08962918817996979, 0.10001899302005768, 0.11040879786014557, 0.12079861015081406, 0.13118842244148254, 0.14157822728157043, 0.15196803212165833, 0.16235783696174622, 0.1727476418018341, 0.183137446641922, 0.1935272514820099, 0.20391705632209778, 0.21430686116218567, 0.22469668090343475, 0.23508648574352264, 0.24547629058361053, 0.2558661103248596, 0.2662559151649475]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 10.0, 9.0, 15.0, 13.0, 21.0, 38.0, 44.0, 76.0, 109.0, 142.0, 272.0, 503.0, 801.0, 1654.0, 3404.0, 9290.0, 32667.0, 444039.0, 504265.0, 34259.0, 9567.0, 3617.0, 1622.0, 818.0, 495.0, 276.0, 176.0, 107.0, 66.0, 41.0, 42.0, 26.0, 19.0, 15.0, 13.0, 11.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.4345703125, -0.41959381103515625, -0.4046173095703125, -0.38964080810546875, -0.374664306640625, -0.35968780517578125, -0.3447113037109375, -0.32973480224609375, -0.31475830078125, -0.29978179931640625, -0.2848052978515625, -0.26982879638671875, -0.254852294921875, -0.23987579345703125, -0.2248992919921875, -0.20992279052734375, -0.1949462890625, -0.17996978759765625, -0.1649932861328125, -0.15001678466796875, -0.135040283203125, -0.12006378173828125, -0.1050872802734375, -0.09011077880859375, -0.07513427734375, -0.06015777587890625, -0.0451812744140625, -0.03020477294921875, -0.015228271484375, -0.00025177001953125, 0.0147247314453125, 0.02970123291015625, 0.044677734375, 0.05965423583984375, 0.0746307373046875, 0.08960723876953125, 0.104583740234375, 0.11956024169921875, 0.1345367431640625, 0.14951324462890625, 0.16448974609375, 0.17946624755859375, 0.1944427490234375, 0.20941925048828125, 0.224395751953125, 0.23937225341796875, 0.2543487548828125, 0.26932525634765625, 0.2843017578125, 0.29927825927734375, 0.3142547607421875, 0.32923126220703125, 0.344207763671875, 0.35918426513671875, 0.3741607666015625, 0.38913726806640625, 0.40411376953125, 0.41909027099609375, 0.4340667724609375, 0.44904327392578125, 0.464019775390625, 0.47899627685546875, 0.4939727783203125, 0.5089492797851562, 0.52392578125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 9.0, 6.0, 8.0, 15.0, 12.0, 22.0, 55.0, 108.0, 187.0, 218.0, 162.0, 71.0, 43.0, 14.0, 20.0, 13.0, 11.0, 7.0, 5.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07061767578125, -0.06855344772338867, -0.06648921966552734, -0.06442499160766602, -0.06236076354980469, -0.06029653549194336, -0.05823230743408203, -0.0561680793762207, -0.054103851318359375, -0.05203962326049805, -0.04997539520263672, -0.04791116714477539, -0.04584693908691406, -0.043782711029052734, -0.041718482971191406, -0.03965425491333008, -0.03759002685546875, -0.03552579879760742, -0.033461570739746094, -0.031397342681884766, -0.029333114624023438, -0.02726888656616211, -0.02520465850830078, -0.023140430450439453, -0.021076202392578125, -0.019011974334716797, -0.01694774627685547, -0.01488351821899414, -0.012819290161132812, -0.010755062103271484, -0.008690834045410156, -0.006626605987548828, -0.0045623779296875, -0.002498149871826172, -0.00043392181396484375, 0.0016303062438964844, 0.0036945343017578125, 0.005758762359619141, 0.007822990417480469, 0.009887218475341797, 0.011951446533203125, 0.014015674591064453, 0.01607990264892578, 0.01814413070678711, 0.020208358764648438, 0.022272586822509766, 0.024336814880371094, 0.026401042938232422, 0.02846527099609375, 0.030529499053955078, 0.032593727111816406, 0.034657955169677734, 0.03672218322753906, 0.03878641128540039, 0.04085063934326172, 0.04291486740112305, 0.044979095458984375, 0.0470433235168457, 0.04910755157470703, 0.05117177963256836, 0.05323600769042969, 0.055300235748291016, 0.057364463806152344, 0.05942869186401367, 0.061492919921875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 5.0, 1.0, 4.0, 6.0, 5.0, 9.0, 13.0, 10.0, 21.0, 19.0, 35.0, 48.0, 72.0, 110.0, 175.0, 299.0, 597.0, 1414.0, 5209.0, 34093.0, 492698.0, 473079.0, 32940.0, 4905.0, 1372.0, 607.0, 296.0, 162.0, 95.0, 71.0, 47.0, 30.0, 21.0, 20.0, 17.0, 10.0, 7.0, 10.0, 7.0, 3.0, 9.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.51806640625, -0.5032615661621094, -0.48845672607421875, -0.4736518859863281, -0.4588470458984375, -0.4440422058105469, -0.42923736572265625, -0.4144325256347656, -0.399627685546875, -0.3848228454589844, -0.37001800537109375, -0.3552131652832031, -0.3404083251953125, -0.3256034851074219, -0.31079864501953125, -0.2959938049316406, -0.28118896484375, -0.2663841247558594, -0.25157928466796875, -0.23677444458007812, -0.2219696044921875, -0.20716476440429688, -0.19235992431640625, -0.17755508422851562, -0.162750244140625, -0.14794540405273438, -0.13314056396484375, -0.11833572387695312, -0.1035308837890625, -0.08872604370117188, -0.07392120361328125, -0.059116363525390625, -0.0443115234375, -0.029506683349609375, -0.01470184326171875, 0.000102996826171875, 0.0149078369140625, 0.029712677001953125, 0.04451751708984375, 0.059322357177734375, 0.074127197265625, 0.08893203735351562, 0.10373687744140625, 0.11854171752929688, 0.1333465576171875, 0.14815139770507812, 0.16295623779296875, 0.17776107788085938, 0.19256591796875, 0.20737075805664062, 0.22217559814453125, 0.23698043823242188, 0.2517852783203125, 0.2665901184082031, 0.28139495849609375, 0.2961997985839844, 0.311004638671875, 0.3258094787597656, 0.34061431884765625, 0.3554191589355469, 0.3702239990234375, 0.3850288391113281, 0.39983367919921875, 0.4146385192871094, 0.429443359375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 0.0, 5.0, 4.0, 6.0, 7.0, 6.0, 9.0, 16.0, 13.0, 13.0, 30.0, 26.0, 20.0, 30.0, 38.0, 36.0, 29.0, 36.0, 47.0, 50.0, 54.0, 50.0, 35.0, 42.0, 56.0, 40.0, 34.0, 32.0, 42.0, 25.0, 28.0, 21.0, 16.0, 16.0, 19.0, 10.0, 17.0, 6.0, 5.0, 10.0, 6.0, 7.0, 5.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0], "bins": [-0.193603515625, -0.18836593627929688, -0.18312835693359375, -0.17789077758789062, -0.1726531982421875, -0.16741561889648438, -0.16217803955078125, -0.15694046020507812, -0.151702880859375, -0.14646530151367188, -0.14122772216796875, -0.13599014282226562, -0.1307525634765625, -0.12551498413085938, -0.12027740478515625, -0.11503982543945312, -0.10980224609375, -0.10456466674804688, -0.09932708740234375, -0.09408950805664062, -0.0888519287109375, -0.08361434936523438, -0.07837677001953125, -0.07313919067382812, -0.067901611328125, -0.06266403198242188, -0.05742645263671875, -0.052188873291015625, -0.0469512939453125, -0.041713714599609375, -0.03647613525390625, -0.031238555908203125, -0.0260009765625, -0.020763397216796875, -0.01552581787109375, -0.010288238525390625, -0.0050506591796875, 0.000186920166015625, 0.00542449951171875, 0.010662078857421875, 0.015899658203125, 0.021137237548828125, 0.02637481689453125, 0.031612396240234375, 0.0368499755859375, 0.042087554931640625, 0.04732513427734375, 0.052562713623046875, 0.05780029296875, 0.06303787231445312, 0.06827545166015625, 0.07351303100585938, 0.0787506103515625, 0.08398818969726562, 0.08922576904296875, 0.09446334838867188, 0.099700927734375, 0.10493850708007812, 0.11017608642578125, 0.11541366577148438, 0.1206512451171875, 0.12588882446289062, 0.13112640380859375, 0.13636398315429688, 0.1416015625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 4.0, 3.0, 8.0, 7.0, 11.0, 25.0, 31.0, 48.0, 79.0, 141.0, 222.0, 464.0, 984.0, 2176.0, 5498.0, 16982.0, 64715.0, 321303.0, 490534.0, 106177.0, 25782.0, 7963.0, 2917.0, 1247.0, 571.0, 260.0, 148.0, 82.0, 52.0, 45.0, 30.0, 13.0, 9.0, 11.0, 4.0, 9.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.143798828125, -0.1393280029296875, -0.134857177734375, -0.1303863525390625, -0.12591552734375, -0.1214447021484375, -0.116973876953125, -0.1125030517578125, -0.1080322265625, -0.1035614013671875, -0.099090576171875, -0.0946197509765625, -0.09014892578125, -0.0856781005859375, -0.081207275390625, -0.0767364501953125, -0.072265625, -0.0677947998046875, -0.063323974609375, -0.0588531494140625, -0.05438232421875, -0.0499114990234375, -0.045440673828125, -0.0409698486328125, -0.0364990234375, -0.0320281982421875, -0.027557373046875, -0.0230865478515625, -0.01861572265625, -0.0141448974609375, -0.009674072265625, -0.0052032470703125, -0.000732421875, 0.0037384033203125, 0.008209228515625, 0.0126800537109375, 0.01715087890625, 0.0216217041015625, 0.026092529296875, 0.0305633544921875, 0.0350341796875, 0.0395050048828125, 0.043975830078125, 0.0484466552734375, 0.05291748046875, 0.0573883056640625, 0.061859130859375, 0.0663299560546875, 0.07080078125, 0.0752716064453125, 0.079742431640625, 0.0842132568359375, 0.08868408203125, 0.0931549072265625, 0.097625732421875, 0.1020965576171875, 0.1065673828125, 0.1110382080078125, 0.115509033203125, 0.1199798583984375, 0.12445068359375, 0.1289215087890625, 0.133392333984375, 0.1378631591796875, 0.142333984375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 5.0, 5.0, 7.0, 11.0, 13.0, 4.0, 18.0, 15.0, 11.0, 23.0, 21.0, 24.0, 28.0, 46.0, 51.0, 53.0, 44.0, 49.0, 61.0, 45.0, 49.0, 62.0, 54.0, 39.0, 28.0, 44.0, 37.0, 30.0, 29.0, 22.0, 20.0, 13.0, 9.0, 9.0, 7.0, 6.0, 5.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.24249267578125e-05, -3.15103679895401e-05, -3.05958092212677e-05, -2.96812504529953e-05, -2.87666916847229e-05, -2.78521329164505e-05, -2.69375741481781e-05, -2.60230153799057e-05, -2.51084566116333e-05, -2.41938978433609e-05, -2.32793390750885e-05, -2.23647803068161e-05, -2.14502215385437e-05, -2.05356627702713e-05, -1.96211040019989e-05, -1.87065452337265e-05, -1.77919864654541e-05, -1.68774276971817e-05, -1.5962868928909302e-05, -1.5048310160636902e-05, -1.4133751392364502e-05, -1.3219192624092102e-05, -1.2304633855819702e-05, -1.1390075087547302e-05, -1.0475516319274902e-05, -9.560957551002502e-06, -8.646398782730103e-06, -7.731840014457703e-06, -6.817281246185303e-06, -5.902722477912903e-06, -4.988163709640503e-06, -4.073604941368103e-06, -3.159046173095703e-06, -2.2444874048233032e-06, -1.3299286365509033e-06, -4.153698682785034e-07, 4.991888999938965e-07, 1.4137476682662964e-06, 2.3283064365386963e-06, 3.242865204811096e-06, 4.157423973083496e-06, 5.071982741355896e-06, 5.986541509628296e-06, 6.901100277900696e-06, 7.815659046173096e-06, 8.730217814445496e-06, 9.644776582717896e-06, 1.0559335350990295e-05, 1.1473894119262695e-05, 1.2388452887535095e-05, 1.3303011655807495e-05, 1.4217570424079895e-05, 1.5132129192352295e-05, 1.6046687960624695e-05, 1.6961246728897095e-05, 1.7875805497169495e-05, 1.8790364265441895e-05, 1.9704923033714294e-05, 2.0619481801986694e-05, 2.1534040570259094e-05, 2.2448599338531494e-05, 2.3363158106803894e-05, 2.4277716875076294e-05, 2.5192275643348694e-05, 2.6106834411621094e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 3.0, 6.0, 5.0, 6.0, 5.0, 12.0, 18.0, 12.0, 31.0, 43.0, 67.0, 97.0, 201.0, 401.0, 990.0, 3451.0, 20010.0, 250674.0, 702202.0, 60061.0, 7279.0, 1725.0, 604.0, 253.0, 149.0, 79.0, 48.0, 42.0, 14.0, 12.0, 13.0, 12.0, 5.0, 11.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23291015625, -0.22545433044433594, -0.21799850463867188, -0.2105426788330078, -0.20308685302734375, -0.1956310272216797, -0.18817520141601562, -0.18071937561035156, -0.1732635498046875, -0.16580772399902344, -0.15835189819335938, -0.1508960723876953, -0.14344024658203125, -0.1359844207763672, -0.12852859497070312, -0.12107276916503906, -0.113616943359375, -0.10616111755371094, -0.09870529174804688, -0.09124946594238281, -0.08379364013671875, -0.07633781433105469, -0.06888198852539062, -0.06142616271972656, -0.0539703369140625, -0.04651451110839844, -0.039058685302734375, -0.03160285949707031, -0.02414703369140625, -0.016691207885742188, -0.009235382080078125, -0.0017795562744140625, 0.00567626953125, 0.013132095336914062, 0.020587921142578125, 0.028043746948242188, 0.03549957275390625, 0.04295539855957031, 0.050411224365234375, 0.05786705017089844, 0.0653228759765625, 0.07277870178222656, 0.08023452758789062, 0.08769035339355469, 0.09514617919921875, 0.10260200500488281, 0.11005783081054688, 0.11751365661621094, 0.124969482421875, 0.13242530822753906, 0.13988113403320312, 0.1473369598388672, 0.15479278564453125, 0.1622486114501953, 0.16970443725585938, 0.17716026306152344, 0.1846160888671875, 0.19207191467285156, 0.19952774047851562, 0.2069835662841797, 0.21443939208984375, 0.2218952178955078, 0.22935104370117188, 0.23680686950683594, 0.2442626953125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 1.0, 1.0, 3.0, 8.0, 7.0, 4.0, 11.0, 12.0, 9.0, 11.0, 11.0, 15.0, 28.0, 29.0, 37.0, 42.0, 45.0, 52.0, 67.0, 67.0, 81.0, 84.0, 65.0, 52.0, 53.0, 37.0, 30.0, 28.0, 21.0, 18.0, 17.0, 12.0, 8.0, 9.0, 7.0, 7.0, 4.0, 1.0, 3.0, 4.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.07537841796875, -0.07311534881591797, -0.07085227966308594, -0.0685892105102539, -0.06632614135742188, -0.06406307220458984, -0.06180000305175781, -0.05953693389892578, -0.05727386474609375, -0.05501079559326172, -0.05274772644042969, -0.050484657287597656, -0.048221588134765625, -0.045958518981933594, -0.04369544982910156, -0.04143238067626953, -0.0391693115234375, -0.03690624237060547, -0.03464317321777344, -0.032380104064941406, -0.030117034912109375, -0.027853965759277344, -0.025590896606445312, -0.02332782745361328, -0.02106475830078125, -0.01880168914794922, -0.016538619995117188, -0.014275550842285156, -0.012012481689453125, -0.009749412536621094, -0.0074863433837890625, -0.005223274230957031, -0.002960205078125, -0.0006971359252929688, 0.0015659332275390625, 0.0038290023803710938, 0.006092071533203125, 0.008355140686035156, 0.010618209838867188, 0.012881278991699219, 0.01514434814453125, 0.01740741729736328, 0.019670486450195312, 0.021933555603027344, 0.024196624755859375, 0.026459693908691406, 0.028722763061523438, 0.03098583221435547, 0.0332489013671875, 0.03551197052001953, 0.03777503967285156, 0.040038108825683594, 0.042301177978515625, 0.044564247131347656, 0.04682731628417969, 0.04909038543701172, 0.05135345458984375, 0.05361652374267578, 0.05587959289550781, 0.058142662048339844, 0.060405731201171875, 0.0626688003540039, 0.06493186950683594, 0.06719493865966797, 0.0694580078125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 4.0, 23.0, 119.0, 474.0, 302.0, 56.0, 21.0, 7.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.012691020965576, -1.855126142501831, -1.697561264038086, -1.5399965047836304, -1.3824316263198853, -1.2248667478561401, -1.0673019886016846, -0.9097371101379395, -0.7521722316741943, -0.5946073532104492, -0.4370425343513489, -0.27947768568992615, -0.12191283702850342, 0.0356520414352417, 0.19321686029434204, 0.3507816791534424, 0.5083465576171875, 0.6659114360809326, 0.823476254940033, 0.9810410737991333, 1.1386059522628784, 1.2961708307266235, 1.453735589981079, 1.6113004684448242, 1.7688653469085693, 1.9264302253723145, 2.0839951038360596, 2.2415599822998047, 2.3991246223449707, 2.556689739227295, 2.714254379272461, 2.871819257736206, 3.029383659362793, 3.186948537826538, 3.344513416290283, 3.5020782947540283, 3.6596431732177734, 3.8172078132629395, 3.9747726917266846, 4.13233757019043, 4.289902687072754, 4.44746732711792, 4.605032444000244, 4.76259708404541, 4.920162200927734, 5.0777268409729, 5.235291957855225, 5.392856597900391, 5.550421237945557, 5.707985877990723, 5.865550994873047, 6.023115634918213, 6.180680751800537, 6.338245391845703, 6.495810508728027, 6.653375148773193, 6.810939788818359, 6.968504428863525, 7.12606954574585, 7.283634185791016, 7.44119930267334, 7.598763942718506, 7.75632905960083, 7.913893699645996, 8.07145881652832]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 4.0, 3.0, 5.0, 8.0, 11.0, 10.0, 20.0, 25.0, 24.0, 32.0, 40.0, 44.0, 38.0, 61.0, 67.0, 57.0, 66.0, 72.0, 51.0, 80.0, 42.0, 35.0, 40.0, 42.0, 33.0, 22.0, 17.0, 11.0, 12.0, 9.0, 7.0, 9.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.9406133890151978, -1.8857911825180054, -1.8309688568115234, -1.776146650314331, -1.7213244438171387, -1.6665022373199463, -1.611680030822754, -1.556857705116272, -1.5020354986190796, -1.4472132921218872, -1.3923909664154053, -1.337568759918213, -1.2827465534210205, -1.2279243469238281, -1.1731021404266357, -1.1182798147201538, -1.0634576082229614, -1.008635401725769, -0.9538131356239319, -0.8989908695220947, -0.8441686630249023, -0.78934645652771, -0.7345241904258728, -0.6797019243240356, -0.6248797178268433, -0.5700575113296509, -0.5152352452278137, -0.46041300892829895, -0.4055907726287842, -0.3507685363292694, -0.29594630002975464, -0.24112406373023987, -0.18630194664001465, -0.13147971034049988, -0.07665747404098511, -0.021835237741470337, 0.032986998558044434, 0.0878092348575592, 0.14263147115707397, 0.19745370745658875, 0.2522759437561035, 0.3070981800556183, 0.36192041635513306, 0.4167426526546478, 0.4715648889541626, 0.526387095451355, 0.5812093615531921, 0.6360316276550293, 0.6908538341522217, 0.7456760406494141, 0.8004983067512512, 0.8553205728530884, 0.9101427793502808, 0.9649649858474731, 1.019787311553955, 1.0746095180511475, 1.1294317245483398, 1.1842539310455322, 1.2390761375427246, 1.2938984632492065, 1.348720669746399, 1.4035428762435913, 1.4583652019500732, 1.5131874084472656, 1.568009614944458]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 5.0, 2.0, 11.0, 15.0, 23.0, 38.0, 86.0, 164.0, 377.0, 1260.0, 9295.0, 4110605.0, 69112.0, 2482.0, 483.0, 155.0, 87.0, 26.0, 20.0, 12.0, 9.0, 5.0, 9.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5185546875, -1.467529296875, -1.41650390625, -1.365478515625, -1.314453125, -1.263427734375, -1.21240234375, -1.161376953125, -1.1103515625, -1.059326171875, -1.00830078125, -0.957275390625, -0.90625, -0.855224609375, -0.80419921875, -0.753173828125, -0.7021484375, -0.651123046875, -0.60009765625, -0.549072265625, -0.498046875, -0.447021484375, -0.39599609375, -0.344970703125, -0.2939453125, -0.242919921875, -0.19189453125, -0.140869140625, -0.08984375, -0.038818359375, 0.01220703125, 0.063232421875, 0.1142578125, 0.165283203125, 0.21630859375, 0.267333984375, 0.318359375, 0.369384765625, 0.42041015625, 0.471435546875, 0.5224609375, 0.573486328125, 0.62451171875, 0.675537109375, 0.7265625, 0.777587890625, 0.82861328125, 0.879638671875, 0.9306640625, 0.981689453125, 1.03271484375, 1.083740234375, 1.134765625, 1.185791015625, 1.23681640625, 1.287841796875, 1.3388671875, 1.389892578125, 1.44091796875, 1.491943359375, 1.54296875, 1.593994140625, 1.64501953125, 1.696044921875, 1.7470703125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 1.0, 5.0, 2.0, 8.0, 10.0, 9.0, 17.0, 42.0, 42.0, 83.0, 132.0, 182.0, 155.0, 121.0, 61.0, 47.0, 29.0, 19.0, 10.0, 6.0, 9.0, 2.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.068603515625, -0.06628894805908203, -0.06397438049316406, -0.061659812927246094, -0.059345245361328125, -0.057030677795410156, -0.05471611022949219, -0.05240154266357422, -0.05008697509765625, -0.04777240753173828, -0.04545783996582031, -0.043143272399902344, -0.040828704833984375, -0.038514137268066406, -0.03619956970214844, -0.03388500213623047, -0.0315704345703125, -0.02925586700439453, -0.026941299438476562, -0.024626731872558594, -0.022312164306640625, -0.019997596740722656, -0.017683029174804688, -0.015368461608886719, -0.01305389404296875, -0.010739326477050781, -0.008424758911132812, -0.006110191345214844, -0.003795623779296875, -0.0014810562133789062, 0.0008335113525390625, 0.0031480789184570312, 0.005462646484375, 0.007777214050292969, 0.010091781616210938, 0.012406349182128906, 0.014720916748046875, 0.017035484313964844, 0.019350051879882812, 0.02166461944580078, 0.02397918701171875, 0.02629375457763672, 0.028608322143554688, 0.030922889709472656, 0.033237457275390625, 0.035552024841308594, 0.03786659240722656, 0.04018115997314453, 0.0424957275390625, 0.04481029510498047, 0.04712486267089844, 0.049439430236816406, 0.051753997802734375, 0.054068565368652344, 0.05638313293457031, 0.05869770050048828, 0.06101226806640625, 0.06332683563232422, 0.06564140319824219, 0.06795597076416016, 0.07027053833007812, 0.0725851058959961, 0.07489967346191406, 0.07721424102783203, 0.07952880859375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 10.0, 8.0, 9.0, 30.0, 43.0, 85.0, 162.0, 320.0, 780.0, 2637.0, 11211.0, 80389.0, 3740875.0, 323037.0, 26662.0, 5431.0, 1479.0, 529.0, 239.0, 119.0, 68.0, 49.0, 29.0, 23.0, 17.0, 12.0, 10.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.447998046875, -0.4329261779785156, -0.41785430908203125, -0.4027824401855469, -0.3877105712890625, -0.3726387023925781, -0.35756683349609375, -0.3424949645996094, -0.327423095703125, -0.3123512268066406, -0.29727935791015625, -0.2822074890136719, -0.2671356201171875, -0.2520637512207031, -0.23699188232421875, -0.22192001342773438, -0.20684814453125, -0.19177627563476562, -0.17670440673828125, -0.16163253784179688, -0.1465606689453125, -0.13148880004882812, -0.11641693115234375, -0.10134506225585938, -0.086273193359375, -0.07120132446289062, -0.05612945556640625, -0.041057586669921875, -0.0259857177734375, -0.010913848876953125, 0.00415802001953125, 0.019229888916015625, 0.0343017578125, 0.049373626708984375, 0.06444549560546875, 0.07951736450195312, 0.0945892333984375, 0.10966110229492188, 0.12473297119140625, 0.13980484008789062, 0.154876708984375, 0.16994857788085938, 0.18502044677734375, 0.20009231567382812, 0.2151641845703125, 0.23023605346679688, 0.24530792236328125, 0.2603797912597656, 0.27545166015625, 0.2905235290527344, 0.30559539794921875, 0.3206672668457031, 0.3357391357421875, 0.3508110046386719, 0.36588287353515625, 0.3809547424316406, 0.396026611328125, 0.4110984802246094, 0.42617034912109375, 0.4412422180175781, 0.4563140869140625, 0.4713859558105469, 0.48645782470703125, 0.5015296936035156, 0.5166015625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 4.0, 6.0, 10.0, 6.0, 14.0, 16.0, 22.0, 31.0, 42.0, 76.0, 84.0, 156.0, 327.0, 1228.0, 1235.0, 294.0, 156.0, 89.0, 65.0, 48.0, 28.0, 25.0, 20.0, 19.0, 15.0, 12.0, 8.0, 6.0, 10.0, 5.0, 4.0, 6.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.07440185546875, -0.07221412658691406, -0.07002639770507812, -0.06783866882324219, -0.06565093994140625, -0.06346321105957031, -0.061275482177734375, -0.05908775329589844, -0.0569000244140625, -0.05471229553222656, -0.052524566650390625, -0.05033683776855469, -0.04814910888671875, -0.04596138000488281, -0.043773651123046875, -0.04158592224121094, -0.039398193359375, -0.03721046447753906, -0.035022735595703125, -0.03283500671386719, -0.03064727783203125, -0.028459548950195312, -0.026271820068359375, -0.024084091186523438, -0.0218963623046875, -0.019708633422851562, -0.017520904541015625, -0.015333175659179688, -0.01314544677734375, -0.010957717895507812, -0.008769989013671875, -0.0065822601318359375, -0.00439453125, -0.0022068023681640625, -1.9073486328125e-05, 0.0021686553955078125, 0.00435638427734375, 0.0065441131591796875, 0.008731842041015625, 0.010919570922851562, 0.0131072998046875, 0.015295028686523438, 0.017482757568359375, 0.019670486450195312, 0.02185821533203125, 0.024045944213867188, 0.026233673095703125, 0.028421401977539062, 0.030609130859375, 0.03279685974121094, 0.034984588623046875, 0.03717231750488281, 0.03936004638671875, 0.04154777526855469, 0.043735504150390625, 0.04592323303222656, 0.0481109619140625, 0.05029869079589844, 0.052486419677734375, 0.05467414855957031, 0.05686187744140625, 0.05904960632324219, 0.061237335205078125, 0.06342506408691406, 0.06561279296875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 5.0, 13.0, 68.0, 322.0, 442.0, 134.0, 23.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2751205265522003, -0.23692554235458374, -0.19873055815696716, -0.1605355590581894, -0.12234057486057281, -0.08414559066295624, -0.04595059156417847, -0.00775560736656189, 0.030439376831054688, 0.06863436102867126, 0.10682935267686844, 0.1450243443250656, 0.1832193285226822, 0.22141431272029877, 0.25960931181907654, 0.2978042960166931, 0.3359992802143097, 0.37419426441192627, 0.41238924860954285, 0.4505842328071594, 0.4887792468070984, 0.5269742012023926, 0.5651692152023315, 0.6033642292022705, 0.6415591835975647, 0.6797541975975037, 0.7179491519927979, 0.7561441659927368, 0.794339120388031, 0.83253413438797, 0.8707290887832642, 0.9089241027832031, 0.9471191167831421, 0.985314130783081, 1.02350914478302, 1.0617040395736694, 1.0998990535736084, 1.1380940675735474, 1.1762890815734863, 1.2144839763641357, 1.2526789903640747, 1.2908740043640137, 1.3290690183639526, 1.367263913154602, 1.405458927154541, 1.44365394115448, 1.481848955154419, 1.5200438499450684, 1.5582389831542969, 1.5964339971542358, 1.6346290111541748, 1.6728239059448242, 1.7110189199447632, 1.7492139339447021, 1.7874089479446411, 1.82560396194458, 1.8637988567352295, 1.9019938707351685, 1.9401888847351074, 1.9783837795257568, 2.0165789127349854, 2.0547738075256348, 2.092968702316284, 2.1311638355255127, 2.169358730316162]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 3.0, 1.0, 4.0, 6.0, 13.0, 10.0, 6.0, 17.0, 18.0, 16.0, 19.0, 26.0, 28.0, 26.0, 28.0, 38.0, 32.0, 39.0, 43.0, 42.0, 49.0, 47.0, 43.0, 34.0, 50.0, 39.0, 28.0, 39.0, 29.0, 21.0, 26.0, 30.0, 28.0, 21.0, 23.0, 12.0, 9.0, 16.0, 10.0, 14.0, 8.0, 6.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.21693402528762817, -0.20960736274719238, -0.2022807002067566, -0.1949540376663208, -0.187627375125885, -0.18030071258544922, -0.17297405004501343, -0.16564738750457764, -0.15832072496414185, -0.15099406242370605, -0.14366739988327026, -0.13634073734283447, -0.12901407480239868, -0.12168741226196289, -0.1143607497215271, -0.10703408718109131, -0.09970742464065552, -0.09238076210021973, -0.08505409955978394, -0.07772743701934814, -0.07040077447891235, -0.06307411193847656, -0.05574744939804077, -0.04842078685760498, -0.04109412431716919, -0.0337674617767334, -0.026440799236297607, -0.019114136695861816, -0.011787474155426025, -0.004460811614990234, 0.0028658509254455566, 0.010192513465881348, 0.01751917600631714, 0.02484583854675293, 0.03217250108718872, 0.03949916362762451, 0.0468258261680603, 0.054152488708496094, 0.061479151248931885, 0.06880581378936768, 0.07613247632980347, 0.08345913887023926, 0.09078580141067505, 0.09811246395111084, 0.10543912649154663, 0.11276578903198242, 0.12009245157241821, 0.127419114112854, 0.1347457766532898, 0.14207243919372559, 0.14939910173416138, 0.15672576427459717, 0.16405242681503296, 0.17137908935546875, 0.17870575189590454, 0.18603241443634033, 0.19335907697677612, 0.20068573951721191, 0.2080124020576477, 0.2153390645980835, 0.2226657271385193, 0.22999238967895508, 0.23731905221939087, 0.24464571475982666, 0.25197237730026245]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 4.0, 6.0, 3.0, 9.0, 9.0, 6.0, 17.0, 17.0, 25.0, 32.0, 57.0, 61.0, 111.0, 150.0, 213.0, 356.0, 571.0, 1154.0, 2165.0, 4723.0, 13110.0, 52276.0, 385229.0, 495137.0, 66677.0, 15653.0, 5542.0, 2386.0, 1141.0, 640.0, 383.0, 215.0, 154.0, 97.0, 66.0, 44.0, 32.0, 25.0, 15.0, 12.0, 6.0, 5.0, 12.0, 5.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.339111328125, -0.3285369873046875, -0.317962646484375, -0.3073883056640625, -0.29681396484375, -0.2862396240234375, -0.275665283203125, -0.2650909423828125, -0.2545166015625, -0.2439422607421875, -0.233367919921875, -0.2227935791015625, -0.21221923828125, -0.2016448974609375, -0.191070556640625, -0.1804962158203125, -0.169921875, -0.1593475341796875, -0.148773193359375, -0.1381988525390625, -0.12762451171875, -0.1170501708984375, -0.106475830078125, -0.0959014892578125, -0.0853271484375, -0.0747528076171875, -0.064178466796875, -0.0536041259765625, -0.04302978515625, -0.0324554443359375, -0.021881103515625, -0.0113067626953125, -0.000732421875, 0.0098419189453125, 0.020416259765625, 0.0309906005859375, 0.04156494140625, 0.0521392822265625, 0.062713623046875, 0.0732879638671875, 0.0838623046875, 0.0944366455078125, 0.105010986328125, 0.1155853271484375, 0.12615966796875, 0.1367340087890625, 0.147308349609375, 0.1578826904296875, 0.16845703125, 0.1790313720703125, 0.189605712890625, 0.2001800537109375, 0.21075439453125, 0.2213287353515625, 0.231903076171875, 0.2424774169921875, 0.2530517578125, 0.2636260986328125, 0.274200439453125, 0.2847747802734375, 0.29534912109375, 0.3059234619140625, 0.316497802734375, 0.3270721435546875, 0.337646484375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 4.0, 1.0, 5.0, 3.0, 7.0, 6.0, 9.0, 22.0, 29.0, 51.0, 81.0, 131.0, 140.0, 147.0, 122.0, 75.0, 71.0, 36.0, 23.0, 18.0, 7.0, 6.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07244873046875, -0.07018089294433594, -0.06791305541992188, -0.06564521789550781, -0.06337738037109375, -0.06110954284667969, -0.058841705322265625, -0.05657386779785156, -0.0543060302734375, -0.05203819274902344, -0.049770355224609375, -0.04750251770019531, -0.04523468017578125, -0.04296684265136719, -0.040699005126953125, -0.03843116760253906, -0.036163330078125, -0.03389549255371094, -0.031627655029296875, -0.029359817504882812, -0.02709197998046875, -0.024824142456054688, -0.022556304931640625, -0.020288467407226562, -0.0180206298828125, -0.015752792358398438, -0.013484954833984375, -0.011217117309570312, -0.00894927978515625, -0.0066814422607421875, -0.004413604736328125, -0.0021457672119140625, 0.0001220703125, 0.0023899078369140625, 0.004657745361328125, 0.0069255828857421875, 0.00919342041015625, 0.011461257934570312, 0.013729095458984375, 0.015996932983398438, 0.0182647705078125, 0.020532608032226562, 0.022800445556640625, 0.025068283081054688, 0.02733612060546875, 0.029603958129882812, 0.031871795654296875, 0.03413963317871094, 0.036407470703125, 0.03867530822753906, 0.040943145751953125, 0.04321098327636719, 0.04547882080078125, 0.04774665832519531, 0.050014495849609375, 0.05228233337402344, 0.0545501708984375, 0.05681800842285156, 0.059085845947265625, 0.06135368347167969, 0.06362152099609375, 0.06588935852050781, 0.06815719604492188, 0.07042503356933594, 0.07269287109375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 2.0, 5.0, 2.0, 2.0, 8.0, 4.0, 8.0, 7.0, 7.0, 14.0, 15.0, 26.0, 24.0, 37.0, 51.0, 90.0, 122.0, 218.0, 337.0, 650.0, 1420.0, 4443.0, 21404.0, 171660.0, 708476.0, 117052.0, 16297.0, 3491.0, 1174.0, 589.0, 302.0, 214.0, 119.0, 90.0, 47.0, 40.0, 26.0, 19.0, 10.0, 12.0, 12.0, 4.0, 5.0, 8.0, 8.0, 4.0, 1.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.3681640625, -0.354736328125, -0.34130859375, -0.327880859375, -0.314453125, -0.301025390625, -0.28759765625, -0.274169921875, -0.2607421875, -0.247314453125, -0.23388671875, -0.220458984375, -0.20703125, -0.193603515625, -0.18017578125, -0.166748046875, -0.1533203125, -0.139892578125, -0.12646484375, -0.113037109375, -0.099609375, -0.086181640625, -0.07275390625, -0.059326171875, -0.0458984375, -0.032470703125, -0.01904296875, -0.005615234375, 0.0078125, 0.021240234375, 0.03466796875, 0.048095703125, 0.0615234375, 0.074951171875, 0.08837890625, 0.101806640625, 0.115234375, 0.128662109375, 0.14208984375, 0.155517578125, 0.1689453125, 0.182373046875, 0.19580078125, 0.209228515625, 0.22265625, 0.236083984375, 0.24951171875, 0.262939453125, 0.2763671875, 0.289794921875, 0.30322265625, 0.316650390625, 0.330078125, 0.343505859375, 0.35693359375, 0.370361328125, 0.3837890625, 0.397216796875, 0.41064453125, 0.424072265625, 0.4375, 0.450927734375, 0.46435546875, 0.477783203125, 0.4912109375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 11.0, 13.0, 6.0, 6.0, 9.0, 16.0, 15.0, 19.0, 26.0, 34.0, 31.0, 34.0, 36.0, 39.0, 44.0, 44.0, 51.0, 59.0, 61.0, 47.0, 52.0, 57.0, 45.0, 36.0, 26.0, 38.0, 20.0, 21.0, 16.0, 12.0, 20.0, 13.0, 8.0, 10.0, 7.0, 9.0, 5.0, 4.0, 4.0, 3.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2279052734375, -0.22083282470703125, -0.2137603759765625, -0.20668792724609375, -0.199615478515625, -0.19254302978515625, -0.1854705810546875, -0.17839813232421875, -0.17132568359375, -0.16425323486328125, -0.1571807861328125, -0.15010833740234375, -0.143035888671875, -0.13596343994140625, -0.1288909912109375, -0.12181854248046875, -0.11474609375, -0.10767364501953125, -0.1006011962890625, -0.09352874755859375, -0.086456298828125, -0.07938385009765625, -0.0723114013671875, -0.06523895263671875, -0.05816650390625, -0.05109405517578125, -0.0440216064453125, -0.03694915771484375, -0.029876708984375, -0.02280426025390625, -0.0157318115234375, -0.00865936279296875, -0.0015869140625, 0.00548553466796875, 0.0125579833984375, 0.01963043212890625, 0.026702880859375, 0.03377532958984375, 0.0408477783203125, 0.04792022705078125, 0.05499267578125, 0.06206512451171875, 0.0691375732421875, 0.07621002197265625, 0.083282470703125, 0.09035491943359375, 0.0974273681640625, 0.10449981689453125, 0.111572265625, 0.11864471435546875, 0.1257171630859375, 0.13278961181640625, 0.139862060546875, 0.14693450927734375, 0.1540069580078125, 0.16107940673828125, 0.16815185546875, 0.17522430419921875, 0.1822967529296875, 0.18936920166015625, 0.196441650390625, 0.20351409912109375, 0.2105865478515625, 0.21765899658203125, 0.2247314453125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 7.0, 5.0, 11.0, 17.0, 20.0, 27.0, 47.0, 55.0, 92.0, 133.0, 265.0, 435.0, 791.0, 1402.0, 2868.0, 6339.0, 14871.0, 44134.0, 197044.0, 583623.0, 138573.0, 34778.0, 12472.0, 5219.0, 2467.0, 1274.0, 635.0, 376.0, 205.0, 133.0, 80.0, 58.0, 33.0, 21.0, 15.0, 10.0, 7.0, 1.0, 8.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1424560546875, -0.13743972778320312, -0.13242340087890625, -0.12740707397460938, -0.1223907470703125, -0.11737442016601562, -0.11235809326171875, -0.10734176635742188, -0.102325439453125, -0.09730911254882812, -0.09229278564453125, -0.08727645874023438, -0.0822601318359375, -0.07724380493164062, -0.07222747802734375, -0.06721115112304688, -0.06219482421875, -0.057178497314453125, -0.05216217041015625, -0.047145843505859375, -0.0421295166015625, -0.037113189697265625, -0.03209686279296875, -0.027080535888671875, -0.022064208984375, -0.017047882080078125, -0.01203155517578125, -0.007015228271484375, -0.0019989013671875, 0.003017425537109375, 0.00803375244140625, 0.013050079345703125, 0.01806640625, 0.023082733154296875, 0.02809906005859375, 0.033115386962890625, 0.0381317138671875, 0.043148040771484375, 0.04816436767578125, 0.053180694580078125, 0.058197021484375, 0.06321334838867188, 0.06822967529296875, 0.07324600219726562, 0.0782623291015625, 0.08327865600585938, 0.08829498291015625, 0.09331130981445312, 0.09832763671875, 0.10334396362304688, 0.10836029052734375, 0.11337661743164062, 0.1183929443359375, 0.12340927124023438, 0.12842559814453125, 0.13344192504882812, 0.138458251953125, 0.14347457885742188, 0.14849090576171875, 0.15350723266601562, 0.1585235595703125, 0.16353988647460938, 0.16855621337890625, 0.17357254028320312, 0.1785888671875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 3.0, 6.0, 8.0, 13.0, 21.0, 30.0, 45.0, 43.0, 47.0, 66.0, 75.0, 90.0, 93.0, 105.0, 87.0, 73.0, 60.0, 37.0, 27.0, 21.0, 14.0, 8.0, 9.0, 8.0, 0.0, 2.0, 3.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.297494888305664e-05, -4.1513703763484955e-05, -4.005245864391327e-05, -3.859121352434158e-05, -3.71299684047699e-05, -3.566872328519821e-05, -3.4207478165626526e-05, -3.274623304605484e-05, -3.1284987926483154e-05, -2.982374280691147e-05, -2.8362497687339783e-05, -2.6901252567768097e-05, -2.544000744819641e-05, -2.3978762328624725e-05, -2.251751720905304e-05, -2.1056272089481354e-05, -1.9595026969909668e-05, -1.8133781850337982e-05, -1.6672536730766296e-05, -1.521129161119461e-05, -1.3750046491622925e-05, -1.2288801372051239e-05, -1.0827556252479553e-05, -9.366311132907867e-06, -7.905066013336182e-06, -6.443820893764496e-06, -4.98257577419281e-06, -3.5213306546211243e-06, -2.0600855350494385e-06, -5.988404154777527e-07, 8.624047040939331e-07, 2.323649823665619e-06, 3.7848949432373047e-06, 5.2461400628089905e-06, 6.707385182380676e-06, 8.168630301952362e-06, 9.629875421524048e-06, 1.1091120541095734e-05, 1.255236566066742e-05, 1.4013610780239105e-05, 1.547485589981079e-05, 1.6936101019382477e-05, 1.8397346138954163e-05, 1.985859125852585e-05, 2.1319836378097534e-05, 2.278108149766922e-05, 2.4242326617240906e-05, 2.570357173681259e-05, 2.7164816856384277e-05, 2.8626061975955963e-05, 3.008730709552765e-05, 3.1548552215099335e-05, 3.300979733467102e-05, 3.4471042454242706e-05, 3.593228757381439e-05, 3.739353269338608e-05, 3.8854777812957764e-05, 4.031602293252945e-05, 4.1777268052101135e-05, 4.323851317167282e-05, 4.469975829124451e-05, 4.616100341081619e-05, 4.762224853038788e-05, 4.9083493649959564e-05, 5.054473876953125e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 3.0, 7.0, 8.0, 10.0, 14.0, 21.0, 24.0, 49.0, 85.0, 162.0, 376.0, 1036.0, 3798.0, 28192.0, 801304.0, 198810.0, 11333.0, 2145.0, 641.0, 261.0, 108.0, 66.0, 31.0, 21.0, 12.0, 13.0, 7.0, 4.0, 2.0, 7.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4443359375, -0.43119049072265625, -0.4180450439453125, -0.40489959716796875, -0.391754150390625, -0.37860870361328125, -0.3654632568359375, -0.35231781005859375, -0.33917236328125, -0.32602691650390625, -0.3128814697265625, -0.29973602294921875, -0.286590576171875, -0.27344512939453125, -0.2602996826171875, -0.24715423583984375, -0.2340087890625, -0.22086334228515625, -0.2077178955078125, -0.19457244873046875, -0.181427001953125, -0.16828155517578125, -0.1551361083984375, -0.14199066162109375, -0.12884521484375, -0.11569976806640625, -0.1025543212890625, -0.08940887451171875, -0.076263427734375, -0.06311798095703125, -0.0499725341796875, -0.03682708740234375, -0.023681640625, -0.01053619384765625, 0.0026092529296875, 0.01575469970703125, 0.028900146484375, 0.04204559326171875, 0.0551910400390625, 0.06833648681640625, 0.08148193359375, 0.09462738037109375, 0.1077728271484375, 0.12091827392578125, 0.134063720703125, 0.14720916748046875, 0.1603546142578125, 0.17350006103515625, 0.1866455078125, 0.19979095458984375, 0.2129364013671875, 0.22608184814453125, 0.239227294921875, 0.25237274169921875, 0.2655181884765625, 0.27866363525390625, 0.29180908203125, 0.30495452880859375, 0.3180999755859375, 0.33124542236328125, 0.344390869140625, 0.35753631591796875, 0.3706817626953125, 0.38382720947265625, 0.39697265625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 4.0, 3.0, 7.0, 7.0, 11.0, 9.0, 9.0, 12.0, 15.0, 29.0, 32.0, 51.0, 71.0, 77.0, 111.0, 151.0, 128.0, 79.0, 57.0, 31.0, 27.0, 18.0, 21.0, 11.0, 6.0, 6.0, 6.0, 3.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1651611328125, -0.16032028198242188, -0.15547943115234375, -0.15063858032226562, -0.1457977294921875, -0.14095687866210938, -0.13611602783203125, -0.13127517700195312, -0.126434326171875, -0.12159347534179688, -0.11675262451171875, -0.11191177368164062, -0.1070709228515625, -0.10223007202148438, -0.09738922119140625, -0.09254837036132812, -0.08770751953125, -0.08286666870117188, -0.07802581787109375, -0.07318496704101562, -0.0683441162109375, -0.06350326538085938, -0.05866241455078125, -0.053821563720703125, -0.048980712890625, -0.044139862060546875, -0.03929901123046875, -0.034458160400390625, -0.0296173095703125, -0.024776458740234375, -0.01993560791015625, -0.015094757080078125, -0.01025390625, -0.005413055419921875, -0.00057220458984375, 0.004268646240234375, 0.0091094970703125, 0.013950347900390625, 0.01879119873046875, 0.023632049560546875, 0.028472900390625, 0.033313751220703125, 0.03815460205078125, 0.042995452880859375, 0.0478363037109375, 0.052677154541015625, 0.05751800537109375, 0.062358856201171875, 0.06719970703125, 0.07204055786132812, 0.07688140869140625, 0.08172225952148438, 0.0865631103515625, 0.09140396118164062, 0.09624481201171875, 0.10108566284179688, 0.105926513671875, 0.11076736450195312, 0.11560821533203125, 0.12044906616210938, 0.1252899169921875, 0.13013076782226562, 0.13497161865234375, 0.13981246948242188, 0.1446533203125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 14.0, 86.0, 442.0, 394.0, 58.0, 13.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3341137170791626, -1.1095914840698242, -0.8850691914558411, -0.6605468988418579, -0.43602466583251953, -0.21150243282318115, 0.013019919395446777, 0.23754215240478516, 0.46206438541412354, 0.6865866184234619, 0.9111089110374451, 1.1356312036514282, 1.3601534366607666, 1.584675669670105, 1.809198021888733, 2.0337202548980713, 2.258242607116699, 2.482764959335327, 2.707287073135376, 2.931809425354004, 3.1563315391540527, 3.3808538913726807, 3.6053762435913086, 3.8298983573913574, 4.054420471191406, 4.278942584991455, 4.503465175628662, 4.727987289428711, 4.95250940322876, 5.177031517028809, 5.401554107666016, 5.6260762214660645, 5.850598335266113, 6.075120449066162, 6.299643039703369, 6.524165153503418, 6.748687267303467, 6.973209381103516, 7.197731971740723, 7.4222540855407715, 7.64677619934082, 7.871298313140869, 8.095820426940918, 8.320343017578125, 8.544865608215332, 8.769387245178223, 8.99390983581543, 9.218432426452637, 9.442955017089844, 9.66747760772705, 9.891999244689941, 10.116521835327148, 10.341044425964355, 10.565566062927246, 10.790088653564453, 11.01461124420166, 11.23913288116455, 11.463655471801758, 11.688177108764648, 11.912699699401855, 12.137222290039062, 12.361743927001953, 12.58626651763916, 12.810789108276367, 13.035310745239258]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 5.0, 9.0, 3.0, 7.0, 8.0, 9.0, 17.0, 20.0, 15.0, 16.0, 31.0, 27.0, 28.0, 34.0, 35.0, 29.0, 43.0, 31.0, 39.0, 42.0, 59.0, 40.0, 50.0, 44.0, 29.0, 45.0, 35.0, 38.0, 26.0, 36.0, 23.0, 18.0, 19.0, 15.0, 18.0, 15.0, 10.0, 9.0, 8.0, 6.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2969822883605957, -1.2545192241668701, -1.2120561599731445, -1.1695929765701294, -1.1271299123764038, -1.0846668481826782, -1.042203664779663, -0.9997406005859375, -0.9572775363922119, -0.9148144721984863, -0.872351348400116, -0.8298882246017456, -0.78742516040802, -0.7449620962142944, -0.7024989724159241, -0.6600358486175537, -0.6175727844238281, -0.5751097202301025, -0.5326465964317322, -0.4901835024356842, -0.44772040843963623, -0.40525731444358826, -0.3627942204475403, -0.3203311264514923, -0.27786803245544434, -0.23540493845939636, -0.1929418444633484, -0.15047875046730042, -0.10801565647125244, -0.06555256247520447, -0.023089468479156494, 0.01937362551689148, 0.061836838722229004, 0.10429993271827698, 0.14676302671432495, 0.18922612071037292, 0.2316892147064209, 0.27415230870246887, 0.31661540269851685, 0.3590784966945648, 0.4015415906906128, 0.44400468468666077, 0.48646777868270874, 0.5289309024810791, 0.5713939666748047, 0.6138570308685303, 0.6563201546669006, 0.698783278465271, 0.7412463426589966, 0.7837094068527222, 0.8261725306510925, 0.8686356544494629, 0.9110987186431885, 0.9535617828369141, 0.9960249066352844, 1.0384880304336548, 1.0809510946273804, 1.123414158821106, 1.165877342224121, 1.2083404064178467, 1.2508034706115723, 1.2932665348052979, 1.3357295989990234, 1.3781927824020386, 1.4206558465957642]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 6.0, 6.0, 3.0, 8.0, 12.0, 13.0, 20.0, 33.0, 50.0, 61.0, 122.0, 242.0, 437.0, 953.0, 2437.0, 8017.0, 58453.0, 3979016.0, 127187.0, 12173.0, 2938.0, 1036.0, 509.0, 212.0, 137.0, 81.0, 47.0, 23.0, 16.0, 12.0, 4.0, 4.0, 1.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5166015625, -0.49973297119140625, -0.4828643798828125, -0.46599578857421875, -0.449127197265625, -0.43225860595703125, -0.4153900146484375, -0.39852142333984375, -0.38165283203125, -0.36478424072265625, -0.3479156494140625, -0.33104705810546875, -0.314178466796875, -0.29730987548828125, -0.2804412841796875, -0.26357269287109375, -0.2467041015625, -0.22983551025390625, -0.2129669189453125, -0.19609832763671875, -0.179229736328125, -0.16236114501953125, -0.1454925537109375, -0.12862396240234375, -0.11175537109375, -0.09488677978515625, -0.0780181884765625, -0.06114959716796875, -0.044281005859375, -0.02741241455078125, -0.0105438232421875, 0.00632476806640625, 0.023193359375, 0.04006195068359375, 0.0569305419921875, 0.07379913330078125, 0.090667724609375, 0.10753631591796875, 0.1244049072265625, 0.14127349853515625, 0.15814208984375, 0.17501068115234375, 0.1918792724609375, 0.20874786376953125, 0.225616455078125, 0.24248504638671875, 0.2593536376953125, 0.27622222900390625, 0.2930908203125, 0.30995941162109375, 0.3268280029296875, 0.34369659423828125, 0.360565185546875, 0.37743377685546875, 0.3943023681640625, 0.41117095947265625, 0.42803955078125, 0.44490814208984375, 0.4617767333984375, 0.47864532470703125, 0.495513916015625, 0.5123825073242188, 0.5292510986328125, 0.5461196899414062, 0.56298828125]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 5.0, 4.0, 10.0, 6.0, 15.0, 22.0, 24.0, 52.0, 76.0, 93.0, 118.0, 109.0, 94.0, 96.0, 74.0, 69.0, 42.0, 39.0, 11.0, 11.0, 12.0, 10.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07122802734375, -0.06891059875488281, -0.06659317016601562, -0.06427574157714844, -0.06195831298828125, -0.05964088439941406, -0.057323455810546875, -0.05500602722167969, -0.0526885986328125, -0.05037117004394531, -0.048053741455078125, -0.04573631286621094, -0.04341888427734375, -0.04110145568847656, -0.038784027099609375, -0.03646659851074219, -0.034149169921875, -0.03183174133300781, -0.029514312744140625, -0.027196884155273438, -0.02487945556640625, -0.022562026977539062, -0.020244598388671875, -0.017927169799804688, -0.0156097412109375, -0.013292312622070312, -0.010974884033203125, -0.008657455444335938, -0.00634002685546875, -0.0040225982666015625, -0.001705169677734375, 0.0006122589111328125, 0.0029296875, 0.0052471160888671875, 0.007564544677734375, 0.009881973266601562, 0.01219940185546875, 0.014516830444335938, 0.016834259033203125, 0.019151687622070312, 0.0214691162109375, 0.023786544799804688, 0.026103973388671875, 0.028421401977539062, 0.03073883056640625, 0.03305625915527344, 0.035373687744140625, 0.03769111633300781, 0.040008544921875, 0.04232597351074219, 0.044643402099609375, 0.04696083068847656, 0.04927825927734375, 0.05159568786621094, 0.053913116455078125, 0.05623054504394531, 0.0585479736328125, 0.06086540222167969, 0.06318283081054688, 0.06550025939941406, 0.06781768798828125, 0.07013511657714844, 0.07245254516601562, 0.07476997375488281, 0.07708740234375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 6.0, 4.0, 4.0, 7.0, 6.0, 6.0, 13.0, 26.0, 42.0, 75.0, 154.0, 294.0, 583.0, 1470.0, 3704.0, 11461.0, 49159.0, 605717.0, 3405345.0, 90489.0, 16936.0, 5258.0, 1930.0, 814.0, 377.0, 192.0, 89.0, 30.0, 22.0, 20.0, 8.0, 9.0, 12.0, 8.0, 5.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.329833984375, -0.3195762634277344, -0.30931854248046875, -0.2990608215332031, -0.2888031005859375, -0.2785453796386719, -0.26828765869140625, -0.2580299377441406, -0.247772216796875, -0.23751449584960938, -0.22725677490234375, -0.21699905395507812, -0.2067413330078125, -0.19648361206054688, -0.18622589111328125, -0.17596817016601562, -0.16571044921875, -0.15545272827148438, -0.14519500732421875, -0.13493728637695312, -0.1246795654296875, -0.11442184448242188, -0.10416412353515625, -0.09390640258789062, -0.083648681640625, -0.07339096069335938, -0.06313323974609375, -0.052875518798828125, -0.0426177978515625, -0.032360076904296875, -0.02210235595703125, -0.011844635009765625, -0.0015869140625, 0.008670806884765625, 0.01892852783203125, 0.029186248779296875, 0.0394439697265625, 0.049701690673828125, 0.05995941162109375, 0.07021713256835938, 0.080474853515625, 0.09073257446289062, 0.10099029541015625, 0.11124801635742188, 0.1215057373046875, 0.13176345825195312, 0.14202117919921875, 0.15227890014648438, 0.16253662109375, 0.17279434204101562, 0.18305206298828125, 0.19330978393554688, 0.2035675048828125, 0.21382522583007812, 0.22408294677734375, 0.23434066772460938, 0.244598388671875, 0.2548561096191406, 0.26511383056640625, 0.2753715515136719, 0.2856292724609375, 0.2958869934082031, 0.30614471435546875, 0.3164024353027344, 0.32666015625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 7.0, 7.0, 4.0, 7.0, 4.0, 7.0, 16.0, 20.0, 30.0, 30.0, 47.0, 91.0, 158.0, 325.0, 1703.0, 913.0, 289.0, 117.0, 95.0, 61.0, 37.0, 28.0, 21.0, 12.0, 7.0, 11.0, 7.0, 4.0, 3.0, 4.0, 3.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.067138671875, -0.06473255157470703, -0.06232643127441406, -0.059920310974121094, -0.057514190673828125, -0.055108070373535156, -0.05270195007324219, -0.05029582977294922, -0.04788970947265625, -0.04548358917236328, -0.04307746887207031, -0.040671348571777344, -0.038265228271484375, -0.035859107971191406, -0.03345298767089844, -0.03104686737060547, -0.0286407470703125, -0.02623462677001953, -0.023828506469726562, -0.021422386169433594, -0.019016265869140625, -0.016610145568847656, -0.014204025268554688, -0.011797904968261719, -0.00939178466796875, -0.006985664367675781, -0.0045795440673828125, -0.0021734237670898438, 0.000232696533203125, 0.0026388168334960938, 0.0050449371337890625, 0.007451057434082031, 0.009857177734375, 0.012263298034667969, 0.014669418334960938, 0.017075538635253906, 0.019481658935546875, 0.021887779235839844, 0.024293899536132812, 0.02670001983642578, 0.02910614013671875, 0.03151226043701172, 0.03391838073730469, 0.036324501037597656, 0.038730621337890625, 0.041136741638183594, 0.04354286193847656, 0.04594898223876953, 0.0483551025390625, 0.05076122283935547, 0.05316734313964844, 0.055573463439941406, 0.057979583740234375, 0.060385704040527344, 0.06279182434082031, 0.06519794464111328, 0.06760406494140625, 0.07001018524169922, 0.07241630554199219, 0.07482242584228516, 0.07722854614257812, 0.0796346664428711, 0.08204078674316406, 0.08444690704345703, 0.08685302734375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 8.0, 19.0, 154.0, 569.0, 229.0, 32.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7553646564483643, -2.6998515129089355, -2.644338369369507, -2.588825225830078, -2.5333120822906494, -2.4777989387512207, -2.422285795211792, -2.3667726516723633, -2.3112595081329346, -2.255746364593506, -2.200233221054077, -2.1447200775146484, -2.0892069339752197, -2.033693790435791, -1.9781806468963623, -1.9226675033569336, -1.8671542406082153, -1.8116410970687866, -1.756127953529358, -1.7006148099899292, -1.6451016664505005, -1.5895885229110718, -1.5340752601623535, -1.4785621166229248, -1.423048973083496, -1.3675358295440674, -1.3120226860046387, -1.25650954246521, -1.2009963989257812, -1.1454832553863525, -1.0899701118469238, -1.0344569683074951, -0.9789438247680664, -0.9234306812286377, -0.867917537689209, -0.8124043941497803, -0.7568912506103516, -0.7013781070709229, -0.6458649039268494, -0.5903517603874207, -0.5348386168479919, -0.47932547330856323, -0.4238123297691345, -0.3682991564273834, -0.3127860128879547, -0.257272869348526, -0.2017596960067749, -0.1462465524673462, -0.09073340892791748, -0.03522025793790817, 0.020292893052101135, 0.07580605149269104, 0.13131919503211975, 0.18683233857154846, 0.24234551191329956, 0.29785865545272827, 0.353371798992157, 0.4088849425315857, 0.4643980860710144, 0.5199112892150879, 0.5754244327545166, 0.6309375762939453, 0.686450719833374, 0.7419638633728027, 0.7974770069122314]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 7.0, 7.0, 6.0, 9.0, 8.0, 14.0, 16.0, 21.0, 32.0, 28.0, 15.0, 34.0, 36.0, 48.0, 39.0, 24.0, 42.0, 32.0, 58.0, 42.0, 34.0, 51.0, 45.0, 45.0, 39.0, 31.0, 29.0, 29.0, 27.0, 23.0, 18.0, 18.0, 14.0, 16.0, 12.0, 9.0, 11.0, 8.0, 9.0, 4.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.2598996162414551, -0.2520107626914978, -0.24412190914154053, -0.23623305559158325, -0.22834420204162598, -0.2204553484916687, -0.21256649494171143, -0.20467764139175415, -0.19678878784179688, -0.1888999342918396, -0.18101108074188232, -0.17312222719192505, -0.16523337364196777, -0.1573445200920105, -0.14945566654205322, -0.14156681299209595, -0.13367794454097748, -0.1257890909910202, -0.11790023744106293, -0.11001138389110565, -0.10212253034114838, -0.0942336767911911, -0.08634481579065323, -0.07845596224069595, -0.07056710869073868, -0.0626782551407814, -0.05478940159082413, -0.04690054431557655, -0.03901169076561928, -0.031122837215662003, -0.02323397994041443, -0.015345126390457153, -0.007456272840499878, 0.0004325816407799721, 0.008321436122059822, 0.016210291534662247, 0.024099145084619522, 0.0319879986345768, 0.03987685590982437, 0.04776570945978165, 0.05565456300973892, 0.0635434165596962, 0.07143227010965347, 0.07932113111019135, 0.08720998466014862, 0.0950988382101059, 0.10298769176006317, 0.11087654531002045, 0.11876539885997772, 0.126654252409935, 0.13454310595989227, 0.14243195950984955, 0.15032081305980682, 0.1582096666097641, 0.16609853506088257, 0.17398738861083984, 0.18187624216079712, 0.1897650957107544, 0.19765394926071167, 0.20554280281066895, 0.21343165636062622, 0.2213205099105835, 0.22920936346054077, 0.23709821701049805, 0.24498707056045532]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 11.0, 8.0, 9.0, 17.0, 22.0, 32.0, 31.0, 56.0, 74.0, 106.0, 129.0, 182.0, 225.0, 324.0, 579.0, 869.0, 1458.0, 2628.0, 5153.0, 11095.0, 25648.0, 66025.0, 193083.0, 409245.0, 208730.0, 71008.0, 27548.0, 11653.0, 5515.0, 2819.0, 1518.0, 897.0, 575.0, 365.0, 256.0, 171.0, 130.0, 106.0, 62.0, 45.0, 38.0, 28.0, 29.0, 17.0, 13.0, 10.0, 4.0, 3.0, 7.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.189453125, -0.18396759033203125, -0.1784820556640625, -0.17299652099609375, -0.167510986328125, -0.16202545166015625, -0.1565399169921875, -0.15105438232421875, -0.14556884765625, -0.14008331298828125, -0.1345977783203125, -0.12911224365234375, -0.123626708984375, -0.11814117431640625, -0.1126556396484375, -0.10717010498046875, -0.1016845703125, -0.09619903564453125, -0.0907135009765625, -0.08522796630859375, -0.079742431640625, -0.07425689697265625, -0.0687713623046875, -0.06328582763671875, -0.05780029296875, -0.05231475830078125, -0.0468292236328125, -0.04134368896484375, -0.035858154296875, -0.03037261962890625, -0.0248870849609375, -0.01940155029296875, -0.013916015625, -0.00843048095703125, -0.0029449462890625, 0.00254058837890625, 0.008026123046875, 0.01351165771484375, 0.0189971923828125, 0.02448272705078125, 0.02996826171875, 0.03545379638671875, 0.0409393310546875, 0.04642486572265625, 0.051910400390625, 0.05739593505859375, 0.0628814697265625, 0.06836700439453125, 0.0738525390625, 0.07933807373046875, 0.0848236083984375, 0.09030914306640625, 0.095794677734375, 0.10128021240234375, 0.1067657470703125, 0.11225128173828125, 0.11773681640625, 0.12322235107421875, 0.1287078857421875, 0.13419342041015625, 0.139678955078125, 0.14516448974609375, 0.1506500244140625, 0.15613555908203125, 0.16162109375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 9.0, 16.0, 21.0, 19.0, 39.0, 59.0, 65.0, 76.0, 103.0, 102.0, 103.0, 86.0, 89.0, 59.0, 57.0, 29.0, 12.0, 13.0, 14.0, 6.0, 8.0, 6.0, 1.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07379150390625, -0.07160377502441406, -0.06941604614257812, -0.06722831726074219, -0.06504058837890625, -0.06285285949707031, -0.060665130615234375, -0.05847740173339844, -0.0562896728515625, -0.05410194396972656, -0.051914215087890625, -0.04972648620605469, -0.04753875732421875, -0.04535102844238281, -0.043163299560546875, -0.04097557067871094, -0.038787841796875, -0.03660011291503906, -0.034412384033203125, -0.03222465515136719, -0.03003692626953125, -0.027849197387695312, -0.025661468505859375, -0.023473739624023438, -0.0212860107421875, -0.019098281860351562, -0.016910552978515625, -0.014722824096679688, -0.01253509521484375, -0.010347366333007812, -0.008159637451171875, -0.0059719085693359375, -0.0037841796875, -0.0015964508056640625, 0.000591278076171875, 0.0027790069580078125, 0.00496673583984375, 0.0071544647216796875, 0.009342193603515625, 0.011529922485351562, 0.0137176513671875, 0.015905380249023438, 0.018093109130859375, 0.020280838012695312, 0.02246856689453125, 0.024656295776367188, 0.026844024658203125, 0.029031753540039062, 0.031219482421875, 0.03340721130371094, 0.035594940185546875, 0.03778266906738281, 0.03997039794921875, 0.04215812683105469, 0.044345855712890625, 0.04653358459472656, 0.0487213134765625, 0.05090904235839844, 0.053096771240234375, 0.05528450012207031, 0.05747222900390625, 0.05965995788574219, 0.061847686767578125, 0.06403541564941406, 0.06622314453125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 9.0, 12.0, 18.0, 28.0, 30.0, 61.0, 84.0, 122.0, 228.0, 410.0, 805.0, 2125.0, 8448.0, 64309.0, 685742.0, 257273.0, 22138.0, 4105.0, 1251.0, 585.0, 313.0, 169.0, 96.0, 62.0, 39.0, 33.0, 18.0, 14.0, 10.0, 6.0, 0.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.356689453125, -0.3442878723144531, -0.33188629150390625, -0.3194847106933594, -0.3070831298828125, -0.2946815490722656, -0.28227996826171875, -0.2698783874511719, -0.257476806640625, -0.24507522583007812, -0.23267364501953125, -0.22027206420898438, -0.2078704833984375, -0.19546890258789062, -0.18306732177734375, -0.17066574096679688, -0.15826416015625, -0.14586257934570312, -0.13346099853515625, -0.12105941772460938, -0.1086578369140625, -0.09625625610351562, -0.08385467529296875, -0.07145309448242188, -0.059051513671875, -0.046649932861328125, -0.03424835205078125, -0.021846771240234375, -0.0094451904296875, 0.002956390380859375, 0.01535797119140625, 0.027759552001953125, 0.0401611328125, 0.052562713623046875, 0.06496429443359375, 0.07736587524414062, 0.0897674560546875, 0.10216903686523438, 0.11457061767578125, 0.12697219848632812, 0.139373779296875, 0.15177536010742188, 0.16417694091796875, 0.17657852172851562, 0.1889801025390625, 0.20138168334960938, 0.21378326416015625, 0.22618484497070312, 0.23858642578125, 0.2509880065917969, 0.26338958740234375, 0.2757911682128906, 0.2881927490234375, 0.3005943298339844, 0.31299591064453125, 0.3253974914550781, 0.337799072265625, 0.3502006530761719, 0.36260223388671875, 0.3750038146972656, 0.3874053955078125, 0.3998069763183594, 0.41220855712890625, 0.4246101379394531, 0.43701171875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 6.0, 8.0, 10.0, 7.0, 10.0, 23.0, 28.0, 41.0, 50.0, 38.0, 53.0, 55.0, 60.0, 72.0, 76.0, 77.0, 64.0, 75.0, 48.0, 43.0, 30.0, 32.0, 33.0, 15.0, 8.0, 13.0, 10.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2469482421875, -0.2376537322998047, -0.22835922241210938, -0.21906471252441406, -0.20977020263671875, -0.20047569274902344, -0.19118118286132812, -0.1818866729736328, -0.1725921630859375, -0.1632976531982422, -0.15400314331054688, -0.14470863342285156, -0.13541412353515625, -0.12611961364746094, -0.11682510375976562, -0.10753059387207031, -0.098236083984375, -0.08894157409667969, -0.07964706420898438, -0.07035255432128906, -0.06105804443359375, -0.05176353454589844, -0.042469024658203125, -0.03317451477050781, -0.0238800048828125, -0.014585494995117188, -0.005290985107421875, 0.0040035247802734375, 0.01329803466796875, 0.022592544555664062, 0.031887054443359375, 0.04118156433105469, 0.05047607421875, 0.05977058410644531, 0.06906509399414062, 0.07835960388183594, 0.08765411376953125, 0.09694862365722656, 0.10624313354492188, 0.11553764343261719, 0.1248321533203125, 0.1341266632080078, 0.14342117309570312, 0.15271568298339844, 0.16201019287109375, 0.17130470275878906, 0.18059921264648438, 0.1898937225341797, 0.199188232421875, 0.2084827423095703, 0.21777725219726562, 0.22707176208496094, 0.23636627197265625, 0.24566078186035156, 0.2549552917480469, 0.2642498016357422, 0.2735443115234375, 0.2828388214111328, 0.2921333312988281, 0.30142784118652344, 0.31072235107421875, 0.32001686096191406, 0.3293113708496094, 0.3386058807373047, 0.347900390625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 6.0, 8.0, 6.0, 17.0, 10.0, 23.0, 23.0, 36.0, 57.0, 76.0, 97.0, 189.0, 300.0, 536.0, 1075.0, 1975.0, 4657.0, 12494.0, 47591.0, 345682.0, 537505.0, 68983.0, 16321.0, 5626.0, 2496.0, 1201.0, 627.0, 335.0, 198.0, 117.0, 96.0, 67.0, 37.0, 21.0, 17.0, 16.0, 10.0, 9.0, 4.0, 12.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.1746826171875, -0.17009925842285156, -0.16551589965820312, -0.1609325408935547, -0.15634918212890625, -0.1517658233642578, -0.14718246459960938, -0.14259910583496094, -0.1380157470703125, -0.13343238830566406, -0.12884902954101562, -0.12426567077636719, -0.11968231201171875, -0.11509895324707031, -0.11051559448242188, -0.10593223571777344, -0.101348876953125, -0.09676551818847656, -0.09218215942382812, -0.08759880065917969, -0.08301544189453125, -0.07843208312988281, -0.07384872436523438, -0.06926536560058594, -0.0646820068359375, -0.06009864807128906, -0.055515289306640625, -0.05093193054199219, -0.04634857177734375, -0.04176521301269531, -0.037181854248046875, -0.03259849548339844, -0.02801513671875, -0.023431777954101562, -0.018848419189453125, -0.014265060424804688, -0.00968170166015625, -0.0050983428955078125, -0.000514984130859375, 0.0040683746337890625, 0.0086517333984375, 0.013235092163085938, 0.017818450927734375, 0.022401809692382812, 0.02698516845703125, 0.03156852722167969, 0.036151885986328125, 0.04073524475097656, 0.045318603515625, 0.04990196228027344, 0.054485321044921875, 0.05906867980957031, 0.06365203857421875, 0.06823539733886719, 0.07281875610351562, 0.07740211486816406, 0.0819854736328125, 0.08656883239746094, 0.09115219116210938, 0.09573554992675781, 0.10031890869140625, 0.10490226745605469, 0.10948562622070312, 0.11406898498535156, 0.11865234375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 7.0, 7.0, 5.0, 11.0, 13.0, 14.0, 13.0, 29.0, 33.0, 44.0, 55.0, 71.0, 82.0, 84.0, 82.0, 93.0, 66.0, 74.0, 50.0, 42.0, 31.0, 13.0, 26.0, 17.0, 10.0, 8.0, 10.0, 3.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.9114227294921875e-05, -4.783552139997482e-05, -4.655681550502777e-05, -4.527810961008072e-05, -4.399940371513367e-05, -4.2720697820186615e-05, -4.144199192523956e-05, -4.016328603029251e-05, -3.888458013534546e-05, -3.760587424039841e-05, -3.6327168345451355e-05, -3.50484624505043e-05, -3.376975655555725e-05, -3.24910506606102e-05, -3.121234476566315e-05, -2.9933638870716095e-05, -2.8654932975769043e-05, -2.737622708082199e-05, -2.609752118587494e-05, -2.4818815290927887e-05, -2.3540109395980835e-05, -2.2261403501033783e-05, -2.098269760608673e-05, -1.970399171113968e-05, -1.8425285816192627e-05, -1.7146579921245575e-05, -1.5867874026298523e-05, -1.4589168131351471e-05, -1.3310462236404419e-05, -1.2031756341457367e-05, -1.0753050446510315e-05, -9.474344551563263e-06, -8.195638656616211e-06, -6.916932761669159e-06, -5.638226866722107e-06, -4.359520971775055e-06, -3.080815076828003e-06, -1.802109181880951e-06, -5.234032869338989e-07, 7.553026080131531e-07, 2.034008502960205e-06, 3.312714397907257e-06, 4.591420292854309e-06, 5.870126187801361e-06, 7.148832082748413e-06, 8.427537977695465e-06, 9.706243872642517e-06, 1.0984949767589569e-05, 1.2263655662536621e-05, 1.3542361557483673e-05, 1.4821067452430725e-05, 1.6099773347377777e-05, 1.737847924232483e-05, 1.865718513727188e-05, 1.9935891032218933e-05, 2.1214596927165985e-05, 2.2493302822113037e-05, 2.377200871706009e-05, 2.505071461200714e-05, 2.6329420506954193e-05, 2.7608126401901245e-05, 2.8886832296848297e-05, 3.016553819179535e-05, 3.14442440867424e-05, 3.272294998168945e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 7.0, 9.0, 14.0, 13.0, 21.0, 27.0, 74.0, 108.0, 172.0, 354.0, 691.0, 1867.0, 6039.0, 29380.0, 381784.0, 577290.0, 39444.0, 7369.0, 2154.0, 862.0, 381.0, 206.0, 98.0, 72.0, 38.0, 28.0, 13.0, 8.0, 10.0, 5.0, 3.0, 4.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.217529296875, -0.21114540100097656, -0.20476150512695312, -0.1983776092529297, -0.19199371337890625, -0.1856098175048828, -0.17922592163085938, -0.17284202575683594, -0.1664581298828125, -0.16007423400878906, -0.15369033813476562, -0.1473064422607422, -0.14092254638671875, -0.1345386505126953, -0.12815475463867188, -0.12177085876464844, -0.115386962890625, -0.10900306701660156, -0.10261917114257812, -0.09623527526855469, -0.08985137939453125, -0.08346748352050781, -0.07708358764648438, -0.07069969177246094, -0.0643157958984375, -0.05793190002441406, -0.051548004150390625, -0.04516410827636719, -0.03878021240234375, -0.03239631652832031, -0.026012420654296875, -0.019628524780273438, -0.01324462890625, -0.0068607330322265625, -0.000476837158203125, 0.0059070587158203125, 0.01229095458984375, 0.018674850463867188, 0.025058746337890625, 0.03144264221191406, 0.0378265380859375, 0.04421043395996094, 0.050594329833984375, 0.05697822570800781, 0.06336212158203125, 0.06974601745605469, 0.07612991333007812, 0.08251380920410156, 0.088897705078125, 0.09528160095214844, 0.10166549682617188, 0.10804939270019531, 0.11443328857421875, 0.12081718444824219, 0.12720108032226562, 0.13358497619628906, 0.1399688720703125, 0.14635276794433594, 0.15273666381835938, 0.1591205596923828, 0.16550445556640625, 0.1718883514404297, 0.17827224731445312, 0.18465614318847656, 0.1910400390625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 7.0, 4.0, 4.0, 2.0, 4.0, 3.0, 11.0, 6.0, 6.0, 6.0, 16.0, 14.0, 26.0, 26.0, 26.0, 45.0, 80.0, 80.0, 105.0, 95.0, 110.0, 78.0, 59.0, 41.0, 40.0, 18.0, 27.0, 16.0, 8.0, 6.0, 10.0, 5.0, 2.0, 4.0, 3.0, 3.0, 3.0, 0.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0831298828125, -0.08046150207519531, -0.07779312133789062, -0.07512474060058594, -0.07245635986328125, -0.06978797912597656, -0.06711959838867188, -0.06445121765136719, -0.0617828369140625, -0.05911445617675781, -0.056446075439453125, -0.05377769470214844, -0.05110931396484375, -0.04844093322753906, -0.045772552490234375, -0.04310417175292969, -0.040435791015625, -0.03776741027832031, -0.035099029541015625, -0.03243064880371094, -0.02976226806640625, -0.027093887329101562, -0.024425506591796875, -0.021757125854492188, -0.0190887451171875, -0.016420364379882812, -0.013751983642578125, -0.011083602905273438, -0.00841522216796875, -0.0057468414306640625, -0.003078460693359375, -0.0004100799560546875, 0.00225830078125, 0.0049266815185546875, 0.007595062255859375, 0.010263442993164062, 0.01293182373046875, 0.015600204467773438, 0.018268585205078125, 0.020936965942382812, 0.0236053466796875, 0.026273727416992188, 0.028942108154296875, 0.03161048889160156, 0.03427886962890625, 0.03694725036621094, 0.039615631103515625, 0.04228401184082031, 0.044952392578125, 0.04762077331542969, 0.050289154052734375, 0.05295753479003906, 0.05562591552734375, 0.05829429626464844, 0.060962677001953125, 0.06363105773925781, 0.0662994384765625, 0.06896781921386719, 0.07163619995117188, 0.07430458068847656, 0.07697296142578125, 0.07964134216308594, 0.08230972290039062, 0.08497810363769531, 0.087646484375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 8.0, 3.0, 10.0, 19.0, 25.0, 53.0, 89.0, 139.0, 149.0, 151.0, 129.0, 86.0, 63.0, 31.0, 21.0, 7.0, 9.0, 4.0, 2.0, 4.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.450547218322754, -1.4065881967544556, -1.3626291751861572, -1.3186701536178589, -1.2747111320495605, -1.2307521104812622, -1.1867930889129639, -1.1428340673446655, -1.0988750457763672, -1.0549160242080688, -1.0109570026397705, -0.9669979810714722, -0.9230389595031738, -0.8790799379348755, -0.8351209163665771, -0.7911618947982788, -0.7472028136253357, -0.7032437920570374, -0.659284770488739, -0.6153257489204407, -0.5713667273521423, -0.527407705783844, -0.48344865441322327, -0.4394896328449249, -0.3955306112766266, -0.35157158970832825, -0.3076125681400299, -0.2636535167694092, -0.21969451010227203, -0.1757354885339737, -0.13177645206451416, -0.08781743049621582, -0.04385840892791748, 0.00010061636567115784, 0.044059641659259796, 0.08801867067813873, 0.13197769224643707, 0.1759367138147354, 0.21989575028419495, 0.2638547718524933, 0.3078137934207916, 0.35177281498908997, 0.3957318365573883, 0.43969088792800903, 0.4836499094963074, 0.5276089310646057, 0.571567952632904, 0.6155269742012024, 0.6594859957695007, 0.7034450173377991, 0.7474040389060974, 0.7913630604743958, 0.8353220820426941, 0.8792811036109924, 0.9232401847839355, 0.9671992063522339, 1.0111582279205322, 1.0551172494888306, 1.099076271057129, 1.1430352926254272, 1.1869943141937256, 1.230953335762024, 1.2749123573303223, 1.3188713788986206, 1.362830400466919]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 4.0, 6.0, 10.0, 14.0, 12.0, 14.0, 16.0, 22.0, 20.0, 21.0, 26.0, 29.0, 39.0, 32.0, 31.0, 39.0, 33.0, 40.0, 32.0, 44.0, 50.0, 38.0, 43.0, 41.0, 38.0, 42.0, 31.0, 33.0, 36.0, 18.0, 12.0, 20.0, 22.0, 13.0, 15.0, 12.0, 9.0, 14.0, 5.0, 6.0, 5.0, 3.0, 5.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0191164016723633, -0.9862051010131836, -0.9532938599586487, -0.9203826189041138, -0.8874713182449341, -0.8545600175857544, -0.8216487765312195, -0.7887375354766846, -0.7558262348175049, -0.7229149341583252, -0.6900036931037903, -0.6570924520492554, -0.6241811513900757, -0.591269850730896, -0.5583586096763611, -0.5254473686218262, -0.4925360679626465, -0.4596247971057892, -0.4267135262489319, -0.3938022553920746, -0.3608909845352173, -0.32797971367836, -0.2950684428215027, -0.2621571719646454, -0.22924590110778809, -0.1963346302509308, -0.1634233593940735, -0.1305120885372162, -0.09760081768035889, -0.06468954682350159, -0.03177827596664429, 0.0011329948902130127, 0.03404414653778076, 0.06695541739463806, 0.09986668825149536, 0.13277795910835266, 0.16568922996520996, 0.19860050082206726, 0.23151177167892456, 0.26442304253578186, 0.29733431339263916, 0.33024558424949646, 0.36315685510635376, 0.39606812596321106, 0.42897939682006836, 0.46189066767692566, 0.49480193853378296, 0.5277131795883179, 0.5606244802474976, 0.5935357809066772, 0.6264470219612122, 0.6593582630157471, 0.6922695636749268, 0.7251808643341064, 0.7580921053886414, 0.7910033464431763, 0.823914647102356, 0.8568259477615356, 0.8897371888160706, 0.9226484298706055, 0.9555597305297852, 0.9884710311889648, 1.0213823318481445, 1.0542935132980347, 1.0872048139572144]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 7.0, 2.0, 14.0, 7.0, 12.0, 19.0, 26.0, 47.0, 67.0, 153.0, 239.0, 531.0, 1253.0, 3712.0, 18489.0, 440281.0, 3693445.0, 28827.0, 4653.0, 1349.0, 563.0, 260.0, 135.0, 61.0, 50.0, 28.0, 20.0, 12.0, 9.0, 4.0, 7.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.494873046875, -0.4799232482910156, -0.46497344970703125, -0.4500236511230469, -0.4350738525390625, -0.4201240539550781, -0.40517425537109375, -0.3902244567871094, -0.375274658203125, -0.3603248596191406, -0.34537506103515625, -0.3304252624511719, -0.3154754638671875, -0.3005256652832031, -0.28557586669921875, -0.2706260681152344, -0.25567626953125, -0.24072647094726562, -0.22577667236328125, -0.21082687377929688, -0.1958770751953125, -0.18092727661132812, -0.16597747802734375, -0.15102767944335938, -0.136077880859375, -0.12112808227539062, -0.10617828369140625, -0.09122848510742188, -0.0762786865234375, -0.061328887939453125, -0.04637908935546875, -0.031429290771484375, -0.0164794921875, -0.001529693603515625, 0.01342010498046875, 0.028369903564453125, 0.0433197021484375, 0.058269500732421875, 0.07321929931640625, 0.08816909790039062, 0.103118896484375, 0.11806869506835938, 0.13301849365234375, 0.14796829223632812, 0.1629180908203125, 0.17786788940429688, 0.19281768798828125, 0.20776748657226562, 0.22271728515625, 0.23766708374023438, 0.25261688232421875, 0.2675666809082031, 0.2825164794921875, 0.2974662780761719, 0.31241607666015625, 0.3273658752441406, 0.342315673828125, 0.3572654724121094, 0.37221527099609375, 0.3871650695800781, 0.4021148681640625, 0.4170646667480469, 0.43201446533203125, 0.4469642639160156, 0.4619140625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 10.0, 11.0, 11.0, 12.0, 27.0, 37.0, 55.0, 52.0, 71.0, 80.0, 78.0, 86.0, 96.0, 76.0, 81.0, 57.0, 50.0, 37.0, 21.0, 16.0, 11.0, 4.0, 9.0, 9.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0693359375, -0.0672616958618164, -0.06518745422363281, -0.06311321258544922, -0.061038970947265625, -0.05896472930908203, -0.05689048767089844, -0.054816246032714844, -0.05274200439453125, -0.050667762756347656, -0.04859352111816406, -0.04651927947998047, -0.044445037841796875, -0.04237079620361328, -0.04029655456542969, -0.038222312927246094, -0.0361480712890625, -0.034073829650878906, -0.03199958801269531, -0.02992534637451172, -0.027851104736328125, -0.02577686309814453, -0.023702621459960938, -0.021628379821777344, -0.01955413818359375, -0.017479896545410156, -0.015405654907226562, -0.013331413269042969, -0.011257171630859375, -0.009182929992675781, -0.0071086883544921875, -0.005034446716308594, -0.002960205078125, -0.0008859634399414062, 0.0011882781982421875, 0.0032625198364257812, 0.005336761474609375, 0.007411003112792969, 0.009485244750976562, 0.011559486389160156, 0.01363372802734375, 0.015707969665527344, 0.017782211303710938, 0.01985645294189453, 0.021930694580078125, 0.02400493621826172, 0.026079177856445312, 0.028153419494628906, 0.0302276611328125, 0.032301902770996094, 0.03437614440917969, 0.03645038604736328, 0.038524627685546875, 0.04059886932373047, 0.04267311096191406, 0.044747352600097656, 0.04682159423828125, 0.048895835876464844, 0.05097007751464844, 0.05304431915283203, 0.055118560791015625, 0.05719280242919922, 0.05926704406738281, 0.061341285705566406, 0.06341552734375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 7.0, 8.0, 11.0, 16.0, 40.0, 64.0, 153.0, 397.0, 1304.0, 5820.0, 45254.0, 3848256.0, 275038.0, 14260.0, 2510.0, 686.0, 240.0, 97.0, 58.0, 28.0, 14.0, 7.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.409912109375, -0.3933601379394531, -0.37680816650390625, -0.3602561950683594, -0.3437042236328125, -0.3271522521972656, -0.31060028076171875, -0.2940483093261719, -0.277496337890625, -0.2609443664550781, -0.24439239501953125, -0.22784042358398438, -0.2112884521484375, -0.19473648071289062, -0.17818450927734375, -0.16163253784179688, -0.14508056640625, -0.12852859497070312, -0.11197662353515625, -0.09542465209960938, -0.0788726806640625, -0.062320709228515625, -0.04576873779296875, -0.029216766357421875, -0.012664794921875, 0.003887176513671875, 0.02043914794921875, 0.036991119384765625, 0.0535430908203125, 0.07009506225585938, 0.08664703369140625, 0.10319900512695312, 0.1197509765625, 0.13630294799804688, 0.15285491943359375, 0.16940689086914062, 0.1859588623046875, 0.20251083374023438, 0.21906280517578125, 0.23561477661132812, 0.252166748046875, 0.2687187194824219, 0.28527069091796875, 0.3018226623535156, 0.3183746337890625, 0.3349266052246094, 0.35147857666015625, 0.3680305480957031, 0.38458251953125, 0.4011344909667969, 0.41768646240234375, 0.4342384338378906, 0.4507904052734375, 0.4673423767089844, 0.48389434814453125, 0.5004463195800781, 0.516998291015625, 0.5335502624511719, 0.5501022338867188, 0.5666542053222656, 0.5832061767578125, 0.5997581481933594, 0.6163101196289062, 0.6328620910644531, 0.6494140625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 5.0, 8.0, 10.0, 14.0, 8.0, 21.0, 30.0, 32.0, 66.0, 124.0, 187.0, 609.0, 2155.0, 382.0, 169.0, 88.0, 59.0, 39.0, 18.0, 17.0, 7.0, 3.0, 4.0, 6.0, 4.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.078857421875, -0.0759744644165039, -0.07309150695800781, -0.07020854949951172, -0.06732559204101562, -0.06444263458251953, -0.06155967712402344, -0.058676719665527344, -0.05579376220703125, -0.052910804748535156, -0.05002784729003906, -0.04714488983154297, -0.044261932373046875, -0.04137897491455078, -0.03849601745605469, -0.035613059997558594, -0.0327301025390625, -0.029847145080566406, -0.026964187622070312, -0.02408123016357422, -0.021198272705078125, -0.01831531524658203, -0.015432357788085938, -0.012549400329589844, -0.00966644287109375, -0.006783485412597656, -0.0039005279541015625, -0.0010175704956054688, 0.001865386962890625, 0.004748344421386719, 0.0076313018798828125, 0.010514259338378906, 0.013397216796875, 0.016280174255371094, 0.019163131713867188, 0.02204608917236328, 0.024929046630859375, 0.02781200408935547, 0.030694961547851562, 0.033577919006347656, 0.03646087646484375, 0.039343833923339844, 0.04222679138183594, 0.04510974884033203, 0.047992706298828125, 0.05087566375732422, 0.05375862121582031, 0.056641578674316406, 0.0595245361328125, 0.062407493591308594, 0.06529045104980469, 0.06817340850830078, 0.07105636596679688, 0.07393932342529297, 0.07682228088378906, 0.07970523834228516, 0.08258819580078125, 0.08547115325927734, 0.08835411071777344, 0.09123706817626953, 0.09412002563476562, 0.09700298309326172, 0.09988594055175781, 0.1027688980102539, 0.10565185546875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 6.0, 46.0, 115.0, 291.0, 356.0, 141.0, 35.0, 12.0, 6.0, 0.0, 1.0, 2.0], "bins": [-1.8550047874450684, -1.8219696283340454, -1.788934588432312, -1.755899429321289, -1.7228642702102661, -1.6898291110992432, -1.6567940711975098, -1.6237589120864868, -1.5907237529754639, -1.557688593864441, -1.5246535539627075, -1.4916183948516846, -1.4585832357406616, -1.4255480766296387, -1.3925130367279053, -1.3594778776168823, -1.3264427185058594, -1.2934075593948364, -1.260372519493103, -1.22733736038208, -1.1943022012710571, -1.1612670421600342, -1.1282320022583008, -1.0951968431472778, -1.0621618032455444, -1.0291266441345215, -0.9960915446281433, -0.9630564451217651, -0.9300212860107422, -0.896986186504364, -0.8639510869979858, -0.8309159278869629, -0.7978808283805847, -0.7648457288742065, -0.7318105697631836, -0.6987754702568054, -0.6657403111457825, -0.6327052116394043, -0.5996700525283813, -0.5666349530220032, -0.533599853515625, -0.5005647540092468, -0.4675295948982239, -0.4344944953918457, -0.40145933628082275, -0.3684242367744446, -0.335389107465744, -0.30235397815704346, -0.2693188190460205, -0.23628368973731995, -0.20324856042861938, -0.17021344602108002, -0.13717831671237946, -0.1041431874036789, -0.07110807299613953, -0.038072943687438965, -0.005037814378738403, 0.02799731120467186, 0.06103243678808212, 0.09406755864620209, 0.12710268795490265, 0.1601378172636032, 0.19317293167114258, 0.22620806097984314, 0.2592431902885437]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 6.0, 9.0, 10.0, 8.0, 25.0, 13.0, 16.0, 19.0, 29.0, 20.0, 27.0, 46.0, 33.0, 35.0, 51.0, 46.0, 46.0, 52.0, 52.0, 57.0, 50.0, 44.0, 45.0, 31.0, 37.0, 33.0, 29.0, 20.0, 19.0, 16.0, 14.0, 11.0, 10.0, 10.0, 5.0, 3.0, 3.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2625809907913208, -0.25440624356269836, -0.24623146653175354, -0.2380567193031311, -0.22988195717334747, -0.22170719504356384, -0.2135324329137802, -0.20535767078399658, -0.19718292355537415, -0.18900816142559052, -0.18083339929580688, -0.17265865206718445, -0.16448388993740082, -0.1563091278076172, -0.14813436567783356, -0.13995960354804993, -0.1317848414182663, -0.12361007928848267, -0.11543532460927963, -0.107260562479496, -0.09908580780029297, -0.09091104567050934, -0.08273628354072571, -0.07456152141094208, -0.06638676673173904, -0.05821200832724571, -0.05003724992275238, -0.04186248779296875, -0.03368772938847542, -0.025512970983982086, -0.017338208854198456, -0.009163450449705124, -0.000988692045211792, 0.0071860672906041145, 0.015360826626420021, 0.023535586893558502, 0.031710345298051834, 0.039885103702545166, 0.048059865832328796, 0.05623462423682213, 0.06440938264131546, 0.07258414477109909, 0.08075889945030212, 0.08893366158008575, 0.09710842370986938, 0.10528317838907242, 0.11345794051885605, 0.12163269519805908, 0.1298074573278427, 0.13798221945762634, 0.14615698158740997, 0.1543317437171936, 0.16250649094581604, 0.17068125307559967, 0.1788560152053833, 0.18703077733516693, 0.19520553946495056, 0.2033803015947342, 0.21155506372451782, 0.21972981095314026, 0.2279045730829239, 0.23607933521270752, 0.24425409734249115, 0.2524288594722748, 0.2606036067008972]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 4.0, 12.0, 12.0, 11.0, 31.0, 37.0, 67.0, 126.0, 191.0, 358.0, 620.0, 1297.0, 3346.0, 9480.0, 33091.0, 156531.0, 555692.0, 223254.0, 45103.0, 12038.0, 3908.0, 1608.0, 755.0, 384.0, 229.0, 145.0, 87.0, 46.0, 30.0, 26.0, 13.0, 14.0, 2.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27197265625, -0.26387977600097656, -0.2557868957519531, -0.2476940155029297, -0.23960113525390625, -0.2315082550048828, -0.22341537475585938, -0.21532249450683594, -0.2072296142578125, -0.19913673400878906, -0.19104385375976562, -0.1829509735107422, -0.17485809326171875, -0.1667652130126953, -0.15867233276367188, -0.15057945251464844, -0.142486572265625, -0.13439369201660156, -0.12630081176757812, -0.11820793151855469, -0.11011505126953125, -0.10202217102050781, -0.09392929077148438, -0.08583641052246094, -0.0777435302734375, -0.06965065002441406, -0.061557769775390625, -0.05346488952636719, -0.04537200927734375, -0.03727912902832031, -0.029186248779296875, -0.021093368530273438, -0.01300048828125, -0.0049076080322265625, 0.003185272216796875, 0.011278152465820312, 0.01937103271484375, 0.027463912963867188, 0.035556793212890625, 0.04364967346191406, 0.0517425537109375, 0.05983543395996094, 0.06792831420898438, 0.07602119445800781, 0.08411407470703125, 0.09220695495605469, 0.10029983520507812, 0.10839271545410156, 0.116485595703125, 0.12457847595214844, 0.13267135620117188, 0.1407642364501953, 0.14885711669921875, 0.1569499969482422, 0.16504287719726562, 0.17313575744628906, 0.1812286376953125, 0.18932151794433594, 0.19741439819335938, 0.2055072784423828, 0.21360015869140625, 0.2216930389404297, 0.22978591918945312, 0.23787879943847656, 0.2459716796875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 4.0, 5.0, 9.0, 17.0, 14.0, 22.0, 32.0, 48.0, 56.0, 58.0, 68.0, 77.0, 67.0, 80.0, 95.0, 67.0, 73.0, 63.0, 37.0, 42.0, 23.0, 9.0, 9.0, 10.0, 8.0, 7.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.07159423828125, -0.06954240798950195, -0.0674905776977539, -0.06543874740600586, -0.06338691711425781, -0.061335086822509766, -0.05928325653076172, -0.05723142623901367, -0.055179595947265625, -0.05312776565551758, -0.05107593536376953, -0.049024105072021484, -0.04697227478027344, -0.04492044448852539, -0.042868614196777344, -0.0408167839050293, -0.03876495361328125, -0.0367131233215332, -0.034661293029785156, -0.03260946273803711, -0.030557632446289062, -0.028505802154541016, -0.02645397186279297, -0.024402141571044922, -0.022350311279296875, -0.020298480987548828, -0.01824665069580078, -0.016194820404052734, -0.014142990112304688, -0.01209115982055664, -0.010039329528808594, -0.007987499237060547, -0.0059356689453125, -0.003883838653564453, -0.0018320083618164062, 0.00021982192993164062, 0.0022716522216796875, 0.004323482513427734, 0.006375312805175781, 0.008427143096923828, 0.010478973388671875, 0.012530803680419922, 0.014582633972167969, 0.016634464263916016, 0.018686294555664062, 0.02073812484741211, 0.022789955139160156, 0.024841785430908203, 0.02689361572265625, 0.028945446014404297, 0.030997276306152344, 0.03304910659790039, 0.03510093688964844, 0.037152767181396484, 0.03920459747314453, 0.04125642776489258, 0.043308258056640625, 0.04536008834838867, 0.04741191864013672, 0.049463748931884766, 0.05151557922363281, 0.05356740951538086, 0.055619239807128906, 0.05767107009887695, 0.059722900390625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 4.0, 2.0, 0.0, 3.0, 5.0, 7.0, 6.0, 13.0, 16.0, 18.0, 29.0, 55.0, 52.0, 99.0, 155.0, 259.0, 563.0, 1263.0, 3984.0, 21539.0, 239689.0, 691469.0, 76038.0, 9291.0, 2200.0, 842.0, 395.0, 194.0, 124.0, 71.0, 50.0, 35.0, 26.0, 14.0, 17.0, 12.0, 8.0, 4.0, 3.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.305908203125, -0.2946929931640625, -0.283477783203125, -0.2722625732421875, -0.26104736328125, -0.2498321533203125, -0.238616943359375, -0.2274017333984375, -0.2161865234375, -0.2049713134765625, -0.193756103515625, -0.1825408935546875, -0.17132568359375, -0.1601104736328125, -0.148895263671875, -0.1376800537109375, -0.12646484375, -0.1152496337890625, -0.104034423828125, -0.0928192138671875, -0.08160400390625, -0.0703887939453125, -0.059173583984375, -0.0479583740234375, -0.0367431640625, -0.0255279541015625, -0.014312744140625, -0.0030975341796875, 0.00811767578125, 0.0193328857421875, 0.030548095703125, 0.0417633056640625, 0.052978515625, 0.0641937255859375, 0.075408935546875, 0.0866241455078125, 0.09783935546875, 0.1090545654296875, 0.120269775390625, 0.1314849853515625, 0.1427001953125, 0.1539154052734375, 0.165130615234375, 0.1763458251953125, 0.18756103515625, 0.1987762451171875, 0.209991455078125, 0.2212066650390625, 0.232421875, 0.2436370849609375, 0.254852294921875, 0.2660675048828125, 0.27728271484375, 0.2884979248046875, 0.299713134765625, 0.3109283447265625, 0.3221435546875, 0.3333587646484375, 0.344573974609375, 0.3557891845703125, 0.36700439453125, 0.3782196044921875, 0.389434814453125, 0.4006500244140625, 0.411865234375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 6.0, 1.0, 0.0, 4.0, 4.0, 9.0, 9.0, 11.0, 7.0, 15.0, 21.0, 17.0, 25.0, 30.0, 37.0, 30.0, 45.0, 48.0, 48.0, 51.0, 45.0, 51.0, 49.0, 42.0, 44.0, 53.0, 42.0, 45.0, 36.0, 38.0, 19.0, 23.0, 18.0, 24.0, 18.0, 15.0, 4.0, 9.0, 6.0, 3.0, 4.0, 5.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18701171875, -0.18027687072753906, -0.17354202270507812, -0.1668071746826172, -0.16007232666015625, -0.1533374786376953, -0.14660263061523438, -0.13986778259277344, -0.1331329345703125, -0.12639808654785156, -0.11966323852539062, -0.11292839050292969, -0.10619354248046875, -0.09945869445800781, -0.09272384643554688, -0.08598899841308594, -0.079254150390625, -0.07251930236816406, -0.06578445434570312, -0.05904960632324219, -0.05231475830078125, -0.04557991027832031, -0.038845062255859375, -0.03211021423339844, -0.0253753662109375, -0.018640518188476562, -0.011905670166015625, -0.0051708221435546875, 0.00156402587890625, 0.008298873901367188, 0.015033721923828125, 0.021768569946289062, 0.02850341796875, 0.03523826599121094, 0.041973114013671875, 0.04870796203613281, 0.05544281005859375, 0.06217765808105469, 0.06891250610351562, 0.07564735412597656, 0.0823822021484375, 0.08911705017089844, 0.09585189819335938, 0.10258674621582031, 0.10932159423828125, 0.11605644226074219, 0.12279129028320312, 0.12952613830566406, 0.136260986328125, 0.14299583435058594, 0.14973068237304688, 0.1564655303955078, 0.16320037841796875, 0.1699352264404297, 0.17667007446289062, 0.18340492248535156, 0.1901397705078125, 0.19687461853027344, 0.20360946655273438, 0.2103443145751953, 0.21707916259765625, 0.2238140106201172, 0.23054885864257812, 0.23728370666503906, 0.2440185546875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 3.0, 3.0, 4.0, 5.0, 13.0, 11.0, 23.0, 28.0, 47.0, 86.0, 113.0, 192.0, 351.0, 598.0, 1073.0, 2314.0, 5140.0, 13962.0, 48854.0, 276784.0, 557283.0, 102850.0, 23993.0, 8082.0, 3337.0, 1540.0, 758.0, 441.0, 259.0, 160.0, 96.0, 49.0, 30.0, 21.0, 23.0, 11.0, 10.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.11199951171875, -0.1084136962890625, -0.104827880859375, -0.1012420654296875, -0.09765625, -0.0940704345703125, -0.090484619140625, -0.0868988037109375, -0.08331298828125, -0.0797271728515625, -0.076141357421875, -0.0725555419921875, -0.0689697265625, -0.0653839111328125, -0.061798095703125, -0.0582122802734375, -0.05462646484375, -0.0510406494140625, -0.047454833984375, -0.0438690185546875, -0.040283203125, -0.0366973876953125, -0.033111572265625, -0.0295257568359375, -0.02593994140625, -0.0223541259765625, -0.018768310546875, -0.0151824951171875, -0.0115966796875, -0.0080108642578125, -0.004425048828125, -0.0008392333984375, 0.00274658203125, 0.0063323974609375, 0.009918212890625, 0.0135040283203125, 0.01708984375, 0.0206756591796875, 0.024261474609375, 0.0278472900390625, 0.03143310546875, 0.0350189208984375, 0.038604736328125, 0.0421905517578125, 0.0457763671875, 0.0493621826171875, 0.052947998046875, 0.0565338134765625, 0.06011962890625, 0.0637054443359375, 0.067291259765625, 0.0708770751953125, 0.074462890625, 0.0780487060546875, 0.081634521484375, 0.0852203369140625, 0.08880615234375, 0.0923919677734375, 0.095977783203125, 0.0995635986328125, 0.1031494140625, 0.1067352294921875, 0.110321044921875, 0.1139068603515625, 0.11749267578125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 7.0, 10.0, 17.0, 30.0, 47.0, 83.0, 108.0, 141.0, 163.0, 116.0, 101.0, 60.0, 43.0, 30.0, 23.0, 9.0, 13.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.073713302612305e-05, -5.8677978813648224e-05, -5.66188246011734e-05, -5.455967038869858e-05, -5.2500516176223755e-05, -5.044136196374893e-05, -4.838220775127411e-05, -4.6323053538799286e-05, -4.426389932632446e-05, -4.220474511384964e-05, -4.014559090137482e-05, -3.8086436688899994e-05, -3.602728247642517e-05, -3.396812826395035e-05, -3.1908974051475525e-05, -2.9849819839000702e-05, -2.779066562652588e-05, -2.5731511414051056e-05, -2.3672357201576233e-05, -2.161320298910141e-05, -1.9554048776626587e-05, -1.7494894564151764e-05, -1.543574035167694e-05, -1.3376586139202118e-05, -1.1317431926727295e-05, -9.258277714252472e-06, -7.199123501777649e-06, -5.139969289302826e-06, -3.080815076828003e-06, -1.02166086435318e-06, 1.037493348121643e-06, 3.096647560596466e-06, 5.155801773071289e-06, 7.214955985546112e-06, 9.274110198020935e-06, 1.1333264410495758e-05, 1.3392418622970581e-05, 1.5451572835445404e-05, 1.7510727047920227e-05, 1.956988126039505e-05, 2.1629035472869873e-05, 2.3688189685344696e-05, 2.574734389781952e-05, 2.7806498110294342e-05, 2.9865652322769165e-05, 3.192480653524399e-05, 3.398396074771881e-05, 3.6043114960193634e-05, 3.810226917266846e-05, 4.016142338514328e-05, 4.22205775976181e-05, 4.4279731810092926e-05, 4.633888602256775e-05, 4.839804023504257e-05, 5.0457194447517395e-05, 5.251634865999222e-05, 5.457550287246704e-05, 5.6634657084941864e-05, 5.869381129741669e-05, 6.075296550989151e-05, 6.281211972236633e-05, 6.487127393484116e-05, 6.693042814731598e-05, 6.89895823597908e-05, 7.104873657226562e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 6.0, 2.0, 3.0, 5.0, 15.0, 12.0, 24.0, 46.0, 61.0, 147.0, 304.0, 876.0, 3620.0, 32883.0, 789359.0, 207528.0, 10901.0, 1779.0, 560.0, 202.0, 92.0, 54.0, 30.0, 21.0, 7.0, 5.0, 10.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.236572265625, -0.22888565063476562, -0.22119903564453125, -0.21351242065429688, -0.2058258056640625, -0.19813919067382812, -0.19045257568359375, -0.18276596069335938, -0.175079345703125, -0.16739273071289062, -0.15970611572265625, -0.15201950073242188, -0.1443328857421875, -0.13664627075195312, -0.12895965576171875, -0.12127304077148438, -0.11358642578125, -0.10589981079101562, -0.09821319580078125, -0.09052658081054688, -0.0828399658203125, -0.07515335083007812, -0.06746673583984375, -0.059780120849609375, -0.052093505859375, -0.044406890869140625, -0.03672027587890625, -0.029033660888671875, -0.0213470458984375, -0.013660430908203125, -0.00597381591796875, 0.001712799072265625, 0.0093994140625, 0.017086029052734375, 0.02477264404296875, 0.032459259033203125, 0.0401458740234375, 0.047832489013671875, 0.05551910400390625, 0.06320571899414062, 0.070892333984375, 0.07857894897460938, 0.08626556396484375, 0.09395217895507812, 0.1016387939453125, 0.10932540893554688, 0.11701202392578125, 0.12469863891601562, 0.13238525390625, 0.14007186889648438, 0.14775848388671875, 0.15544509887695312, 0.1631317138671875, 0.17081832885742188, 0.17850494384765625, 0.18619155883789062, 0.193878173828125, 0.20156478881835938, 0.20925140380859375, 0.21693801879882812, 0.2246246337890625, 0.23231124877929688, 0.23999786376953125, 0.24768447875976562, 0.25537109375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 5.0, 6.0, 14.0, 17.0, 14.0, 34.0, 30.0, 42.0, 76.0, 86.0, 96.0, 105.0, 116.0, 90.0, 66.0, 50.0, 52.0, 27.0, 28.0, 17.0, 7.0, 10.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10528564453125, -0.10187721252441406, -0.09846878051757812, -0.09506034851074219, -0.09165191650390625, -0.08824348449707031, -0.08483505249023438, -0.08142662048339844, -0.0780181884765625, -0.07460975646972656, -0.07120132446289062, -0.06779289245605469, -0.06438446044921875, -0.06097602844238281, -0.057567596435546875, -0.05415916442871094, -0.050750732421875, -0.04734230041503906, -0.043933868408203125, -0.04052543640136719, -0.03711700439453125, -0.03370857238769531, -0.030300140380859375, -0.026891708374023438, -0.0234832763671875, -0.020074844360351562, -0.016666412353515625, -0.013257980346679688, -0.00984954833984375, -0.0064411163330078125, -0.003032684326171875, 0.0003757476806640625, 0.0037841796875, 0.0071926116943359375, 0.010601043701171875, 0.014009475708007812, 0.01741790771484375, 0.020826339721679688, 0.024234771728515625, 0.027643203735351562, 0.0310516357421875, 0.03446006774902344, 0.037868499755859375, 0.04127693176269531, 0.04468536376953125, 0.04809379577636719, 0.051502227783203125, 0.05491065979003906, 0.058319091796875, 0.06172752380371094, 0.06513595581054688, 0.06854438781738281, 0.07195281982421875, 0.07536125183105469, 0.07876968383789062, 0.08217811584472656, 0.0855865478515625, 0.08899497985839844, 0.09240341186523438, 0.09581184387207031, 0.09922027587890625, 0.10262870788574219, 0.10603713989257812, 0.10944557189941406, 0.11285400390625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 10.0, 49.0, 188.0, 385.0, 270.0, 84.0, 19.0, 8.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1447193622589111, -1.0274990797042847, -0.9102786779403687, -0.7930583953857422, -0.675838053226471, -0.5586177110671997, -0.44139742851257324, -0.324177086353302, -0.20695674419403076, -0.08973641693592072, 0.02748391032218933, 0.14470422267913818, 0.2619245648384094, 0.37914490699768066, 0.49636518955230713, 0.6135855317115784, 0.7308058738708496, 0.8480262160301208, 0.9652465581893921, 1.0824668407440186, 1.1996872425079346, 1.316907525062561, 1.4341278076171875, 1.5513482093811035, 1.66856849193573, 1.7857887744903564, 1.9030091762542725, 2.0202293395996094, 2.1374497413635254, 2.2546701431274414, 2.3718905448913574, 2.4891107082366943, 2.6063313484191895, 2.7235517501831055, 2.8407719135284424, 2.9579923152923584, 3.0752127170562744, 3.1924328804016113, 3.3096532821655273, 3.4268736839294434, 3.5440940856933594, 3.6613144874572754, 3.7785346508026123, 3.8957550525665283, 4.012975215911865, 4.130195617675781, 4.247416019439697, 4.364636421203613, 4.481856346130371, 4.599076747894287, 4.716297149658203, 4.833517074584961, 4.950737476348877, 5.067957878112793, 5.185178279876709, 5.302398681640625, 5.419619083404541, 5.536839485168457, 5.654059886932373, 5.771280288696289, 5.888500213623047, 6.005720615386963, 6.122941017150879, 6.240161418914795, 6.357381820678711]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 1.0, 7.0, 6.0, 6.0, 13.0, 14.0, 16.0, 21.0, 20.0, 19.0, 29.0, 28.0, 29.0, 36.0, 42.0, 34.0, 40.0, 58.0, 58.0, 49.0, 44.0, 42.0, 42.0, 42.0, 35.0, 38.0, 29.0, 40.0, 27.0, 22.0, 30.0, 17.0, 13.0, 7.0, 7.0, 9.0, 11.0, 4.0, 4.0, 6.0, 1.0, 2.0, 3.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.1114375591278076, -1.0776102542877197, -1.0437829494476318, -1.009955644607544, -0.976128339767456, -0.9423010349273682, -0.9084737300872803, -0.8746464252471924, -0.8408191204071045, -0.8069918155670166, -0.7731645107269287, -0.7393372058868408, -0.7055099010467529, -0.671682596206665, -0.6378552913665771, -0.6040279865264893, -0.5702007412910461, -0.5363734364509583, -0.5025461316108704, -0.46871882677078247, -0.4348915219306946, -0.4010642170906067, -0.3672369420528412, -0.3334096372127533, -0.2995823323726654, -0.2657550275325775, -0.23192772269248962, -0.19810043275356293, -0.16427312791347504, -0.13044582307338715, -0.09661853313446045, -0.06279122829437256, -0.028963923454284668, 0.004863377660512924, 0.038690678775310516, 0.07251797616481781, 0.1063452810049057, 0.1401725858449936, 0.1739998757839203, 0.20782718062400818, 0.24165448546409607, 0.27548179030418396, 0.30930909514427185, 0.34313637018203735, 0.37696367502212524, 0.41079097986221313, 0.444618284702301, 0.4784455895423889, 0.5122728943824768, 0.5461001992225647, 0.5799275040626526, 0.6137548089027405, 0.6475821137428284, 0.6814094185829163, 0.7152366638183594, 0.7490639686584473, 0.7828912734985352, 0.816718578338623, 0.8505458831787109, 0.8843731880187988, 0.9182004928588867, 0.9520277976989746, 0.9858551025390625, 1.0196824073791504, 1.0535097122192383]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 6.0, 1.0, 1.0, 5.0, 4.0, 7.0, 4.0, 4.0, 10.0, 17.0, 12.0, 25.0, 37.0, 40.0, 72.0, 115.0, 157.0, 285.0, 493.0, 860.0, 1689.0, 3745.0, 9583.0, 30725.0, 157313.0, 3653209.0, 272545.0, 42615.0, 12082.0, 4505.0, 1967.0, 944.0, 490.0, 246.0, 178.0, 99.0, 62.0, 33.0, 30.0, 20.0, 18.0, 11.0, 5.0, 9.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25048828125, -0.24280738830566406, -0.23512649536132812, -0.2274456024169922, -0.21976470947265625, -0.2120838165283203, -0.20440292358398438, -0.19672203063964844, -0.1890411376953125, -0.18136024475097656, -0.17367935180664062, -0.1659984588623047, -0.15831756591796875, -0.1506366729736328, -0.14295578002929688, -0.13527488708496094, -0.127593994140625, -0.11991310119628906, -0.11223220825195312, -0.10455131530761719, -0.09687042236328125, -0.08918952941894531, -0.08150863647460938, -0.07382774353027344, -0.0661468505859375, -0.05846595764160156, -0.050785064697265625, -0.04310417175292969, -0.03542327880859375, -0.027742385864257812, -0.020061492919921875, -0.012380599975585938, -0.00469970703125, 0.0029811859130859375, 0.010662078857421875, 0.018342971801757812, 0.02602386474609375, 0.03370475769042969, 0.041385650634765625, 0.04906654357910156, 0.0567474365234375, 0.06442832946777344, 0.07210922241210938, 0.07979011535644531, 0.08747100830078125, 0.09515190124511719, 0.10283279418945312, 0.11051368713378906, 0.118194580078125, 0.12587547302246094, 0.13355636596679688, 0.1412372589111328, 0.14891815185546875, 0.1565990447998047, 0.16427993774414062, 0.17196083068847656, 0.1796417236328125, 0.18732261657714844, 0.19500350952148438, 0.2026844024658203, 0.21036529541015625, 0.2180461883544922, 0.22572708129882812, 0.23340797424316406, 0.2410888671875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 10.0, 11.0, 8.0, 18.0, 18.0, 23.0, 40.0, 40.0, 66.0, 69.0, 57.0, 65.0, 64.0, 74.0, 70.0, 65.0, 63.0, 55.0, 48.0, 49.0, 24.0, 15.0, 12.0, 12.0, 10.0, 10.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0616455078125, -0.059771060943603516, -0.05789661407470703, -0.05602216720581055, -0.05414772033691406, -0.05227327346801758, -0.050398826599121094, -0.04852437973022461, -0.046649932861328125, -0.04477548599243164, -0.042901039123535156, -0.04102659225463867, -0.03915214538574219, -0.0372776985168457, -0.03540325164794922, -0.033528804779052734, -0.03165435791015625, -0.029779911041259766, -0.02790546417236328, -0.026031017303466797, -0.024156570434570312, -0.022282123565673828, -0.020407676696777344, -0.01853322982788086, -0.016658782958984375, -0.01478433609008789, -0.012909889221191406, -0.011035442352294922, -0.009160995483398438, -0.007286548614501953, -0.005412101745605469, -0.0035376548767089844, -0.0016632080078125, 0.00021123886108398438, 0.0020856857299804688, 0.003960132598876953, 0.0058345794677734375, 0.007709026336669922, 0.009583473205566406, 0.01145792007446289, 0.013332366943359375, 0.01520681381225586, 0.017081260681152344, 0.018955707550048828, 0.020830154418945312, 0.022704601287841797, 0.02457904815673828, 0.026453495025634766, 0.02832794189453125, 0.030202388763427734, 0.03207683563232422, 0.0339512825012207, 0.03582572937011719, 0.03770017623901367, 0.039574623107910156, 0.04144906997680664, 0.043323516845703125, 0.04519796371459961, 0.047072410583496094, 0.04894685745239258, 0.05082130432128906, 0.05269575119018555, 0.05457019805908203, 0.056444644927978516, 0.058319091796875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 6.0, 11.0, 12.0, 7.0, 16.0, 21.0, 69.0, 101.0, 185.0, 486.0, 1645.0, 7485.0, 58951.0, 3463896.0, 625782.0, 29355.0, 4460.0, 1117.0, 323.0, 152.0, 71.0, 35.0, 27.0, 21.0, 10.0, 6.0, 9.0, 6.0, 4.0, 3.0, 0.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33349609375, -0.3215217590332031, -0.30954742431640625, -0.2975730895996094, -0.2855987548828125, -0.2736244201660156, -0.26165008544921875, -0.24967575073242188, -0.237701416015625, -0.22572708129882812, -0.21375274658203125, -0.20177841186523438, -0.1898040771484375, -0.17782974243164062, -0.16585540771484375, -0.15388107299804688, -0.14190673828125, -0.12993240356445312, -0.11795806884765625, -0.10598373413085938, -0.0940093994140625, -0.08203506469726562, -0.07006072998046875, -0.058086395263671875, -0.046112060546875, -0.034137725830078125, -0.02216339111328125, -0.010189056396484375, 0.0017852783203125, 0.013759613037109375, 0.02573394775390625, 0.037708282470703125, 0.0496826171875, 0.061656951904296875, 0.07363128662109375, 0.08560562133789062, 0.0975799560546875, 0.10955429077148438, 0.12152862548828125, 0.13350296020507812, 0.145477294921875, 0.15745162963867188, 0.16942596435546875, 0.18140029907226562, 0.1933746337890625, 0.20534896850585938, 0.21732330322265625, 0.22929763793945312, 0.24127197265625, 0.2532463073730469, 0.26522064208984375, 0.2771949768066406, 0.2891693115234375, 0.3011436462402344, 0.31311798095703125, 0.3250923156738281, 0.337066650390625, 0.3490409851074219, 0.36101531982421875, 0.3729896545410156, 0.3849639892578125, 0.3969383239746094, 0.40891265869140625, 0.4208869934082031, 0.432861328125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 9.0, 12.0, 14.0, 20.0, 34.0, 44.0, 61.0, 124.0, 184.0, 441.0, 1699.0, 745.0, 279.0, 158.0, 77.0, 51.0, 37.0, 18.0, 14.0, 9.0, 10.0, 8.0, 10.0, 6.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.1416015625, -0.13812732696533203, -0.13465309143066406, -0.1311788558959961, -0.12770462036132812, -0.12423038482666016, -0.12075614929199219, -0.11728191375732422, -0.11380767822265625, -0.11033344268798828, -0.10685920715332031, -0.10338497161865234, -0.09991073608398438, -0.0964365005493164, -0.09296226501464844, -0.08948802947998047, -0.0860137939453125, -0.08253955841064453, -0.07906532287597656, -0.0755910873413086, -0.07211685180664062, -0.06864261627197266, -0.06516838073730469, -0.06169414520263672, -0.05821990966796875, -0.05474567413330078, -0.05127143859863281, -0.047797203063964844, -0.044322967529296875, -0.040848731994628906, -0.03737449645996094, -0.03390026092529297, -0.030426025390625, -0.02695178985595703, -0.023477554321289062, -0.020003318786621094, -0.016529083251953125, -0.013054847717285156, -0.009580612182617188, -0.006106376647949219, -0.00263214111328125, 0.0008420944213867188, 0.0043163299560546875, 0.007790565490722656, 0.011264801025390625, 0.014739036560058594, 0.018213272094726562, 0.02168750762939453, 0.0251617431640625, 0.02863597869873047, 0.03211021423339844, 0.035584449768066406, 0.039058685302734375, 0.042532920837402344, 0.04600715637207031, 0.04948139190673828, 0.05295562744140625, 0.05642986297607422, 0.05990409851074219, 0.06337833404541016, 0.06685256958007812, 0.0703268051147461, 0.07380104064941406, 0.07727527618408203, 0.08074951171875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 8.0, 17.0, 44.0, 64.0, 101.0, 151.0, 154.0, 160.0, 132.0, 83.0, 44.0, 21.0, 11.0, 5.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.9112545847892761, -0.8900306224822998, -0.8688066601753235, -0.8475827574729919, -0.8263587951660156, -0.8051348328590393, -0.783910870552063, -0.7626869678497314, -0.7414630055427551, -0.7202390432357788, -0.6990150809288025, -0.677791178226471, -0.6565672159194946, -0.6353432536125183, -0.614119291305542, -0.5928953886032104, -0.5716713666915894, -0.550447404384613, -0.5292234420776367, -0.5079995393753052, -0.48677557706832886, -0.46555161476135254, -0.4443276524543762, -0.4231037199497223, -0.40187978744506836, -0.38065582513809204, -0.3594318926334381, -0.3382079303264618, -0.31698399782180786, -0.29576003551483154, -0.2745360732078552, -0.2533121407032013, -0.23208820819854736, -0.21086426079273224, -0.18964031338691711, -0.1684163510799408, -0.14719241857528687, -0.12596845626831055, -0.10474450886249542, -0.0835205614566803, -0.06229661405086517, -0.04107266664505005, -0.019848715513944626, 0.0013752356171607971, 0.02259918302297592, 0.043823130428791046, 0.06504708528518677, 0.08627103269100189, 0.10749498009681702, 0.12871892750263214, 0.14994287490844727, 0.17116683721542358, 0.19239076972007751, 0.21361473202705383, 0.23483867943286896, 0.2560626268386841, 0.2772865891456604, 0.2985105514526367, 0.31973448395729065, 0.34095844626426697, 0.3621823787689209, 0.3834063410758972, 0.40463030338287354, 0.42585423588752747, 0.4470781683921814]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 3.0, 11.0, 6.0, 6.0, 14.0, 10.0, 13.0, 14.0, 26.0, 29.0, 25.0, 41.0, 19.0, 27.0, 47.0, 32.0, 45.0, 45.0, 52.0, 41.0, 47.0, 51.0, 29.0, 53.0, 33.0, 35.0, 36.0, 31.0, 27.0, 19.0, 24.0, 25.0, 27.0, 11.0, 11.0, 7.0, 8.0, 5.0, 4.0, 2.0, 2.0, 5.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27719610929489136, -0.26700854301452637, -0.25682100653648376, -0.24663344025611877, -0.23644588887691498, -0.22625833749771118, -0.21607078611850739, -0.2058832347393036, -0.1956956684589386, -0.1855081170797348, -0.175320565700531, -0.16513299942016602, -0.15494544804096222, -0.14475789666175842, -0.13457034528255463, -0.12438278645277023, -0.11419524252414703, -0.10400769114494324, -0.09382013231515884, -0.08363258093595505, -0.07344502210617065, -0.06325747072696686, -0.05306991934776306, -0.04288236051797867, -0.03269480913877487, -0.022507254034280777, -0.012319700792431831, -0.0021321475505828857, 0.008055407553911209, 0.018242962658405304, 0.0284305140376091, 0.038618072867393494, 0.04880562424659729, 0.058993179351091385, 0.06918073445558548, 0.07936828583478928, 0.08955584466457367, 0.09974339604377747, 0.10993094742298126, 0.12011850625276566, 0.13030606508255005, 0.14049361646175385, 0.15068116784095764, 0.16086873412132263, 0.17105628550052643, 0.18124383687973022, 0.19143138825893402, 0.20161893963813782, 0.2118064910173416, 0.2219940423965454, 0.2321815937757492, 0.242369145154953, 0.252556711435318, 0.2627442479133606, 0.2729318141937256, 0.2831193804740906, 0.2933069169521332, 0.30349448323249817, 0.31368201971054077, 0.32386958599090576, 0.33405712246894836, 0.34424468874931335, 0.35443222522735596, 0.36461979150772095, 0.37480735778808594]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 6.0, 14.0, 8.0, 11.0, 15.0, 28.0, 45.0, 71.0, 141.0, 236.0, 436.0, 850.0, 1739.0, 4264.0, 11946.0, 40904.0, 163083.0, 580005.0, 179512.0, 44124.0, 12952.0, 4453.0, 1820.0, 865.0, 461.0, 227.0, 126.0, 74.0, 48.0, 31.0, 19.0, 14.0, 15.0, 6.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2890625, -0.28069114685058594, -0.2723197937011719, -0.2639484405517578, -0.25557708740234375, -0.2472057342529297, -0.23883438110351562, -0.23046302795410156, -0.2220916748046875, -0.21372032165527344, -0.20534896850585938, -0.1969776153564453, -0.18860626220703125, -0.1802349090576172, -0.17186355590820312, -0.16349220275878906, -0.155120849609375, -0.14674949645996094, -0.13837814331054688, -0.1300067901611328, -0.12163543701171875, -0.11326408386230469, -0.10489273071289062, -0.09652137756347656, -0.0881500244140625, -0.07977867126464844, -0.07140731811523438, -0.06303596496582031, -0.05466461181640625, -0.04629325866699219, -0.037921905517578125, -0.029550552368164062, -0.02117919921875, -0.012807846069335938, -0.004436492919921875, 0.0039348602294921875, 0.01230621337890625, 0.020677566528320312, 0.029048919677734375, 0.03742027282714844, 0.0457916259765625, 0.05416297912597656, 0.06253433227539062, 0.07090568542480469, 0.07927703857421875, 0.08764839172363281, 0.09601974487304688, 0.10439109802246094, 0.112762451171875, 0.12113380432128906, 0.12950515747070312, 0.1378765106201172, 0.14624786376953125, 0.1546192169189453, 0.16299057006835938, 0.17136192321777344, 0.1797332763671875, 0.18810462951660156, 0.19647598266601562, 0.2048473358154297, 0.21321868896484375, 0.2215900421142578, 0.22996139526367188, 0.23833274841308594, 0.2467041015625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 4.0, 6.0, 5.0, 17.0, 20.0, 16.0, 32.0, 46.0, 39.0, 55.0, 66.0, 75.0, 83.0, 65.0, 73.0, 71.0, 66.0, 70.0, 56.0, 37.0, 21.0, 26.0, 21.0, 8.0, 11.0, 4.0, 7.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.058685302734375, -0.05675458908081055, -0.054823875427246094, -0.05289316177368164, -0.05096244812011719, -0.049031734466552734, -0.04710102081298828, -0.04517030715942383, -0.043239593505859375, -0.04130887985229492, -0.03937816619873047, -0.037447452545166016, -0.03551673889160156, -0.03358602523803711, -0.031655311584472656, -0.029724597930908203, -0.02779388427734375, -0.025863170623779297, -0.023932456970214844, -0.02200174331665039, -0.020071029663085938, -0.018140316009521484, -0.01620960235595703, -0.014278888702392578, -0.012348175048828125, -0.010417461395263672, -0.008486747741699219, -0.006556034088134766, -0.0046253204345703125, -0.0026946067810058594, -0.0007638931274414062, 0.0011668205261230469, 0.0030975341796875, 0.005028247833251953, 0.006958961486816406, 0.00888967514038086, 0.010820388793945312, 0.012751102447509766, 0.014681816101074219, 0.016612529754638672, 0.018543243408203125, 0.020473957061767578, 0.02240467071533203, 0.024335384368896484, 0.026266098022460938, 0.02819681167602539, 0.030127525329589844, 0.0320582389831543, 0.03398895263671875, 0.0359196662902832, 0.037850379943847656, 0.03978109359741211, 0.04171180725097656, 0.043642520904541016, 0.04557323455810547, 0.04750394821166992, 0.049434661865234375, 0.05136537551879883, 0.05329608917236328, 0.055226802825927734, 0.05715751647949219, 0.05908823013305664, 0.061018943786621094, 0.06294965744018555, 0.06488037109375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 5.0, 5.0, 10.0, 17.0, 24.0, 33.0, 41.0, 68.0, 108.0, 166.0, 332.0, 702.0, 1580.0, 4837.0, 22859.0, 173923.0, 720651.0, 101464.0, 15456.0, 3722.0, 1265.0, 533.0, 290.0, 182.0, 103.0, 57.0, 42.0, 25.0, 12.0, 7.0, 13.0, 7.0, 6.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.378173828125, -0.36748504638671875, -0.3567962646484375, -0.34610748291015625, -0.335418701171875, -0.32472991943359375, -0.3140411376953125, -0.30335235595703125, -0.29266357421875, -0.28197479248046875, -0.2712860107421875, -0.26059722900390625, -0.249908447265625, -0.23921966552734375, -0.2285308837890625, -0.21784210205078125, -0.2071533203125, -0.19646453857421875, -0.1857757568359375, -0.17508697509765625, -0.164398193359375, -0.15370941162109375, -0.1430206298828125, -0.13233184814453125, -0.12164306640625, -0.11095428466796875, -0.1002655029296875, -0.08957672119140625, -0.078887939453125, -0.06819915771484375, -0.0575103759765625, -0.04682159423828125, -0.0361328125, -0.02544403076171875, -0.0147552490234375, -0.00406646728515625, 0.006622314453125, 0.01731109619140625, 0.0279998779296875, 0.03868865966796875, 0.04937744140625, 0.06006622314453125, 0.0707550048828125, 0.08144378662109375, 0.092132568359375, 0.10282135009765625, 0.1135101318359375, 0.12419891357421875, 0.1348876953125, 0.14557647705078125, 0.1562652587890625, 0.16695404052734375, 0.177642822265625, 0.18833160400390625, 0.1990203857421875, 0.20970916748046875, 0.22039794921875, 0.23108673095703125, 0.2417755126953125, 0.25246429443359375, 0.263153076171875, 0.27384185791015625, 0.2845306396484375, 0.29521942138671875, 0.305908203125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 8.0, 8.0, 8.0, 7.0, 12.0, 18.0, 22.0, 26.0, 25.0, 30.0, 29.0, 42.0, 45.0, 45.0, 46.0, 50.0, 66.0, 65.0, 54.0, 53.0, 55.0, 45.0, 39.0, 30.0, 30.0, 25.0, 28.0, 17.0, 22.0, 12.0, 11.0, 11.0, 7.0, 5.0, 1.0, 6.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2491455078125, -0.24191856384277344, -0.23469161987304688, -0.2274646759033203, -0.22023773193359375, -0.2130107879638672, -0.20578384399414062, -0.19855690002441406, -0.1913299560546875, -0.18410301208496094, -0.17687606811523438, -0.1696491241455078, -0.16242218017578125, -0.1551952362060547, -0.14796829223632812, -0.14074134826660156, -0.133514404296875, -0.12628746032714844, -0.11906051635742188, -0.11183357238769531, -0.10460662841796875, -0.09737968444824219, -0.09015274047851562, -0.08292579650878906, -0.0756988525390625, -0.06847190856933594, -0.061244964599609375, -0.05401802062988281, -0.04679107666015625, -0.03956413269042969, -0.032337188720703125, -0.025110244750976562, -0.01788330078125, -0.010656356811523438, -0.003429412841796875, 0.0037975311279296875, 0.01102447509765625, 0.018251419067382812, 0.025478363037109375, 0.03270530700683594, 0.0399322509765625, 0.04715919494628906, 0.054386138916015625, 0.06161308288574219, 0.06884002685546875, 0.07606697082519531, 0.08329391479492188, 0.09052085876464844, 0.097747802734375, 0.10497474670410156, 0.11220169067382812, 0.11942863464355469, 0.12665557861328125, 0.1338825225830078, 0.14110946655273438, 0.14833641052246094, 0.1555633544921875, 0.16279029846191406, 0.17001724243164062, 0.1772441864013672, 0.18447113037109375, 0.1916980743408203, 0.19892501831054688, 0.20615196228027344, 0.21337890625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 1.0, 1.0, 5.0, 8.0, 10.0, 5.0, 16.0, 12.0, 33.0, 45.0, 65.0, 120.0, 224.0, 364.0, 616.0, 1260.0, 2518.0, 6015.0, 17809.0, 83403.0, 744466.0, 152019.0, 25216.0, 7768.0, 3122.0, 1580.0, 783.0, 430.0, 232.0, 138.0, 87.0, 59.0, 35.0, 23.0, 22.0, 12.0, 7.0, 7.0, 4.0, 1.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.2413330078125, -0.23393821716308594, -0.22654342651367188, -0.2191486358642578, -0.21175384521484375, -0.2043590545654297, -0.19696426391601562, -0.18956947326660156, -0.1821746826171875, -0.17477989196777344, -0.16738510131835938, -0.1599903106689453, -0.15259552001953125, -0.1452007293701172, -0.13780593872070312, -0.13041114807128906, -0.123016357421875, -0.11562156677246094, -0.10822677612304688, -0.10083198547363281, -0.09343719482421875, -0.08604240417480469, -0.07864761352539062, -0.07125282287597656, -0.0638580322265625, -0.05646324157714844, -0.049068450927734375, -0.04167366027832031, -0.03427886962890625, -0.026884078979492188, -0.019489288330078125, -0.012094497680664062, -0.00469970703125, 0.0026950836181640625, 0.010089874267578125, 0.017484664916992188, 0.02487945556640625, 0.03227424621582031, 0.039669036865234375, 0.04706382751464844, 0.0544586181640625, 0.06185340881347656, 0.06924819946289062, 0.07664299011230469, 0.08403778076171875, 0.09143257141113281, 0.09882736206054688, 0.10622215270996094, 0.113616943359375, 0.12101173400878906, 0.12840652465820312, 0.1358013153076172, 0.14319610595703125, 0.1505908966064453, 0.15798568725585938, 0.16538047790527344, 0.1727752685546875, 0.18017005920410156, 0.18756484985351562, 0.1949596405029297, 0.20235443115234375, 0.2097492218017578, 0.21714401245117188, 0.22453880310058594, 0.23193359375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 11.0, 7.0, 8.0, 15.0, 21.0, 28.0, 29.0, 56.0, 63.0, 104.0, 87.0, 106.0, 120.0, 102.0, 70.0, 46.0, 46.0, 24.0, 19.0, 15.0, 9.0, 7.0, 1.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3451786041259766e-05, -4.1754916310310364e-05, -4.005804657936096e-05, -3.836117684841156e-05, -3.666430711746216e-05, -3.4967437386512756e-05, -3.3270567655563354e-05, -3.157369792461395e-05, -2.987682819366455e-05, -2.817995846271515e-05, -2.6483088731765747e-05, -2.4786219000816345e-05, -2.3089349269866943e-05, -2.139247953891754e-05, -1.969560980796814e-05, -1.7998740077018738e-05, -1.6301870346069336e-05, -1.4605000615119934e-05, -1.2908130884170532e-05, -1.121126115322113e-05, -9.514391422271729e-06, -7.817521691322327e-06, -6.120651960372925e-06, -4.423782229423523e-06, -2.726912498474121e-06, -1.0300427675247192e-06, 6.668269634246826e-07, 2.3636966943740845e-06, 4.060566425323486e-06, 5.757436156272888e-06, 7.45430588722229e-06, 9.151175618171692e-06, 1.0848045349121094e-05, 1.2544915080070496e-05, 1.4241784811019897e-05, 1.59386545419693e-05, 1.76355242729187e-05, 1.9332394003868103e-05, 2.1029263734817505e-05, 2.2726133465766907e-05, 2.442300319671631e-05, 2.611987292766571e-05, 2.7816742658615112e-05, 2.9513612389564514e-05, 3.1210482120513916e-05, 3.290735185146332e-05, 3.460422158241272e-05, 3.630109131336212e-05, 3.7997961044311523e-05, 3.9694830775260925e-05, 4.139170050621033e-05, 4.308857023715973e-05, 4.478543996810913e-05, 4.648230969905853e-05, 4.8179179430007935e-05, 4.9876049160957336e-05, 5.157291889190674e-05, 5.326978862285614e-05, 5.496665835380554e-05, 5.6663528084754944e-05, 5.8360397815704346e-05, 6.005726754665375e-05, 6.175413727760315e-05, 6.345100700855255e-05, 6.514787673950195e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 10.0, 12.0, 19.0, 31.0, 53.0, 101.0, 222.0, 491.0, 1307.0, 5123.0, 46469.0, 931137.0, 55520.0, 5735.0, 1356.0, 493.0, 233.0, 114.0, 54.0, 30.0, 12.0, 16.0, 7.0, 0.0, 5.0, 0.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.45703125, -0.442535400390625, -0.42803955078125, -0.413543701171875, -0.3990478515625, -0.384552001953125, -0.37005615234375, -0.355560302734375, -0.341064453125, -0.326568603515625, -0.31207275390625, -0.297576904296875, -0.2830810546875, -0.268585205078125, -0.25408935546875, -0.239593505859375, -0.22509765625, -0.210601806640625, -0.19610595703125, -0.181610107421875, -0.1671142578125, -0.152618408203125, -0.13812255859375, -0.123626708984375, -0.109130859375, -0.094635009765625, -0.08013916015625, -0.065643310546875, -0.0511474609375, -0.036651611328125, -0.02215576171875, -0.007659912109375, 0.0068359375, 0.021331787109375, 0.03582763671875, 0.050323486328125, 0.0648193359375, 0.079315185546875, 0.09381103515625, 0.108306884765625, 0.122802734375, 0.137298583984375, 0.15179443359375, 0.166290283203125, 0.1807861328125, 0.195281982421875, 0.20977783203125, 0.224273681640625, 0.23876953125, 0.253265380859375, 0.26776123046875, 0.282257080078125, 0.2967529296875, 0.311248779296875, 0.32574462890625, 0.340240478515625, 0.354736328125, 0.369232177734375, 0.38372802734375, 0.398223876953125, 0.4127197265625, 0.427215576171875, 0.44171142578125, 0.456207275390625, 0.470703125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 6.0, 5.0, 9.0, 7.0, 16.0, 23.0, 33.0, 33.0, 91.0, 163.0, 224.0, 182.0, 83.0, 39.0, 29.0, 14.0, 17.0, 7.0, 8.0, 7.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.23779296875, -0.23044395446777344, -0.22309494018554688, -0.2157459259033203, -0.20839691162109375, -0.2010478973388672, -0.19369888305664062, -0.18634986877441406, -0.1790008544921875, -0.17165184020996094, -0.16430282592773438, -0.1569538116455078, -0.14960479736328125, -0.1422557830810547, -0.13490676879882812, -0.12755775451660156, -0.120208740234375, -0.11285972595214844, -0.10551071166992188, -0.09816169738769531, -0.09081268310546875, -0.08346366882324219, -0.07611465454101562, -0.06876564025878906, -0.0614166259765625, -0.05406761169433594, -0.046718597412109375, -0.03936958312988281, -0.03202056884765625, -0.024671554565429688, -0.017322540283203125, -0.009973526000976562, -0.00262451171875, 0.0047245025634765625, 0.012073516845703125, 0.019422531127929688, 0.02677154541015625, 0.03412055969238281, 0.041469573974609375, 0.04881858825683594, 0.0561676025390625, 0.06351661682128906, 0.07086563110351562, 0.07821464538574219, 0.08556365966796875, 0.09291267395019531, 0.10026168823242188, 0.10761070251464844, 0.114959716796875, 0.12230873107910156, 0.12965774536132812, 0.1370067596435547, 0.14435577392578125, 0.1517047882080078, 0.15905380249023438, 0.16640281677246094, 0.1737518310546875, 0.18110084533691406, 0.18844985961914062, 0.1957988739013672, 0.20314788818359375, 0.2104969024658203, 0.21784591674804688, 0.22519493103027344, 0.2325439453125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 15.0, 70.0, 262.0, 377.0, 207.0, 54.0, 15.0, 4.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4786880016326904, -1.3231526613235474, -1.1676174402236938, -1.0120820999145508, -0.8565468192100525, -0.7010115385055542, -0.5454761981964111, -0.3899409770965576, -0.23440563678741455, -0.07887034118175507, 0.07666495442390442, 0.2322002649307251, 0.3877355456352234, 0.5432708263397217, 0.6988061666488647, 0.8543413877487183, 1.0098767280578613, 1.1654120683670044, 1.320947289466858, 1.476482629776001, 1.6320178508758545, 1.7875531911849976, 1.9430885314941406, 2.098623752593994, 2.2541589736938477, 2.409694194793701, 2.565229654312134, 2.7207648754119873, 2.876300096511841, 3.0318355560302734, 3.187370777130127, 3.3429059982299805, 3.498441219329834, 3.6539764404296875, 3.80951189994812, 3.9650471210479736, 4.120582580566406, 4.27611780166626, 4.431653022766113, 4.587188243865967, 4.74272346496582, 4.898258686065674, 5.053793907165527, 5.209329605102539, 5.364864826202393, 5.520400047302246, 5.6759352684021, 5.831470489501953, 5.987006187438965, 6.142541408538818, 6.298076629638672, 6.453612327575684, 6.609147548675537, 6.764682769775391, 6.920217990875244, 7.075753211975098, 7.231288433074951, 7.386823654174805, 7.542358875274658, 7.697894096374512, 7.853429794311523, 8.008964538574219, 8.16450023651123, 8.320035934448242, 8.475570678710938]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 6.0, 2.0, 4.0, 6.0, 3.0, 9.0, 8.0, 12.0, 11.0, 14.0, 24.0, 19.0, 22.0, 24.0, 13.0, 21.0, 20.0, 37.0, 26.0, 41.0, 35.0, 37.0, 48.0, 41.0, 38.0, 40.0, 35.0, 42.0, 41.0, 42.0, 23.0, 26.0, 21.0, 31.0, 29.0, 34.0, 8.0, 18.0, 11.0, 15.0, 15.0, 9.0, 11.0, 6.0, 9.0, 6.0, 5.0, 3.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.0830885171890259, -1.0505239963531494, -1.0179593563079834, -0.9853948354721069, -0.9528303146362305, -0.920265793800354, -0.8877012133598328, -0.8551366329193115, -0.8225721120834351, -0.7900075912475586, -0.7574430108070374, -0.7248784303665161, -0.6923139095306396, -0.6597493886947632, -0.6271848082542419, -0.5946202278137207, -0.5620557069778442, -0.5294911861419678, -0.49692660570144653, -0.4643620550632477, -0.43179750442504883, -0.39923295378685, -0.3666684031486511, -0.33410385251045227, -0.3015393018722534, -0.26897475123405457, -0.2364102005958557, -0.20384564995765686, -0.171281099319458, -0.13871654868125916, -0.1061519980430603, -0.07358744740486145, -0.04102301597595215, -0.008458465337753296, 0.024106085300445557, 0.05667063593864441, 0.08923518657684326, 0.12179973721504211, 0.15436428785324097, 0.18692883849143982, 0.21949338912963867, 0.2520579397678375, 0.2846224904060364, 0.31718704104423523, 0.3497515916824341, 0.38231614232063293, 0.4148806929588318, 0.44744524359703064, 0.4800097942352295, 0.512574315071106, 0.5451388955116272, 0.5777034759521484, 0.6102679967880249, 0.6428325176239014, 0.6753970980644226, 0.7079616785049438, 0.7405261993408203, 0.7730907201766968, 0.805655300617218, 0.8382198810577393, 0.8707844018936157, 0.9033489227294922, 0.9359135031700134, 0.9684780836105347, 1.0010426044464111]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 16.0, 10.0, 19.0, 27.0, 37.0, 47.0, 89.0, 132.0, 227.0, 413.0, 744.0, 1411.0, 2945.0, 7122.0, 20595.0, 81087.0, 3133046.0, 851121.0, 65734.0, 17679.0, 6376.0, 2665.0, 1330.0, 604.0, 324.0, 177.0, 89.0, 84.0, 42.0, 39.0, 20.0, 8.0, 4.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2548828125, -0.24714279174804688, -0.23940277099609375, -0.23166275024414062, -0.2239227294921875, -0.21618270874023438, -0.20844268798828125, -0.20070266723632812, -0.192962646484375, -0.18522262573242188, -0.17748260498046875, -0.16974258422851562, -0.1620025634765625, -0.15426254272460938, -0.14652252197265625, -0.13878250122070312, -0.13104248046875, -0.12330245971679688, -0.11556243896484375, -0.10782241821289062, -0.1000823974609375, -0.09234237670898438, -0.08460235595703125, -0.07686233520507812, -0.069122314453125, -0.061382293701171875, -0.05364227294921875, -0.045902252197265625, -0.0381622314453125, -0.030422210693359375, -0.02268218994140625, -0.014942169189453125, -0.0072021484375, 0.000537872314453125, 0.00827789306640625, 0.016017913818359375, 0.0237579345703125, 0.031497955322265625, 0.03923797607421875, 0.046977996826171875, 0.054718017578125, 0.062458038330078125, 0.07019805908203125, 0.07793807983398438, 0.0856781005859375, 0.09341812133789062, 0.10115814208984375, 0.10889816284179688, 0.11663818359375, 0.12437820434570312, 0.13211822509765625, 0.13985824584960938, 0.1475982666015625, 0.15533828735351562, 0.16307830810546875, 0.17081832885742188, 0.178558349609375, 0.18629837036132812, 0.19403839111328125, 0.20177841186523438, 0.2095184326171875, 0.21725845336914062, 0.22499847412109375, 0.23273849487304688, 0.240478515625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 7.0, 3.0, 9.0, 14.0, 11.0, 24.0, 30.0, 26.0, 25.0, 42.0, 61.0, 64.0, 65.0, 65.0, 59.0, 56.0, 52.0, 65.0, 75.0, 38.0, 42.0, 41.0, 41.0, 23.0, 16.0, 10.0, 11.0, 4.0, 7.0, 7.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0625, -0.06059408187866211, -0.05868816375732422, -0.05678224563598633, -0.05487632751464844, -0.05297040939331055, -0.051064491271972656, -0.049158573150634766, -0.047252655029296875, -0.045346736907958984, -0.043440818786621094, -0.0415349006652832, -0.03962898254394531, -0.03772306442260742, -0.03581714630126953, -0.03391122817993164, -0.03200531005859375, -0.03009939193725586, -0.02819347381591797, -0.026287555694580078, -0.024381637573242188, -0.022475719451904297, -0.020569801330566406, -0.018663883209228516, -0.016757965087890625, -0.014852046966552734, -0.012946128845214844, -0.011040210723876953, -0.009134292602539062, -0.007228374481201172, -0.005322456359863281, -0.0034165382385253906, -0.0015106201171875, 0.0003952980041503906, 0.0023012161254882812, 0.004207134246826172, 0.0061130523681640625, 0.008018970489501953, 0.009924888610839844, 0.011830806732177734, 0.013736724853515625, 0.015642642974853516, 0.017548561096191406, 0.019454479217529297, 0.021360397338867188, 0.023266315460205078, 0.02517223358154297, 0.02707815170288086, 0.02898406982421875, 0.03088998794555664, 0.03279590606689453, 0.03470182418823242, 0.03660774230957031, 0.0385136604309082, 0.040419578552246094, 0.042325496673583984, 0.044231414794921875, 0.046137332916259766, 0.048043251037597656, 0.04994916915893555, 0.05185508728027344, 0.05376100540161133, 0.05566692352294922, 0.05757284164428711, 0.059478759765625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 8.0, 3.0, 7.0, 9.0, 18.0, 15.0, 36.0, 60.0, 85.0, 186.0, 353.0, 669.0, 1488.0, 3589.0, 9920.0, 34471.0, 219669.0, 3698399.0, 178694.0, 30853.0, 9491.0, 3480.0, 1394.0, 652.0, 340.0, 159.0, 97.0, 52.0, 32.0, 21.0, 20.0, 12.0, 3.0, 6.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36181640625, -0.3510017395019531, -0.34018707275390625, -0.3293724060058594, -0.3185577392578125, -0.3077430725097656, -0.29692840576171875, -0.2861137390136719, -0.275299072265625, -0.2644844055175781, -0.25366973876953125, -0.24285507202148438, -0.2320404052734375, -0.22122573852539062, -0.21041107177734375, -0.19959640502929688, -0.18878173828125, -0.17796707153320312, -0.16715240478515625, -0.15633773803710938, -0.1455230712890625, -0.13470840454101562, -0.12389373779296875, -0.11307907104492188, -0.102264404296875, -0.09144973754882812, -0.08063507080078125, -0.06982040405273438, -0.0590057373046875, -0.048191070556640625, -0.03737640380859375, -0.026561737060546875, -0.0157470703125, -0.004932403564453125, 0.00588226318359375, 0.016696929931640625, 0.0275115966796875, 0.038326263427734375, 0.04914093017578125, 0.059955596923828125, 0.070770263671875, 0.08158493041992188, 0.09239959716796875, 0.10321426391601562, 0.1140289306640625, 0.12484359741210938, 0.13565826416015625, 0.14647293090820312, 0.15728759765625, 0.16810226440429688, 0.17891693115234375, 0.18973159790039062, 0.2005462646484375, 0.21136093139648438, 0.22217559814453125, 0.23299026489257812, 0.243804931640625, 0.2546195983886719, 0.26543426513671875, 0.2762489318847656, 0.2870635986328125, 0.2978782653808594, 0.30869293212890625, 0.3195075988769531, 0.330322265625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 6.0, 6.0, 4.0, 14.0, 6.0, 16.0, 18.0, 31.0, 56.0, 82.0, 128.0, 301.0, 1533.0, 1168.0, 290.0, 141.0, 82.0, 43.0, 36.0, 23.0, 21.0, 21.0, 11.0, 15.0, 10.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1251220703125, -0.12143707275390625, -0.1177520751953125, -0.11406707763671875, -0.110382080078125, -0.10669708251953125, -0.1030120849609375, -0.09932708740234375, -0.09564208984375, -0.09195709228515625, -0.0882720947265625, -0.08458709716796875, -0.080902099609375, -0.07721710205078125, -0.0735321044921875, -0.06984710693359375, -0.066162109375, -0.06247711181640625, -0.0587921142578125, -0.05510711669921875, -0.051422119140625, -0.04773712158203125, -0.0440521240234375, -0.04036712646484375, -0.03668212890625, -0.03299713134765625, -0.0293121337890625, -0.02562713623046875, -0.021942138671875, -0.01825714111328125, -0.0145721435546875, -0.01088714599609375, -0.0072021484375, -0.00351715087890625, 0.0001678466796875, 0.00385284423828125, 0.007537841796875, 0.01122283935546875, 0.0149078369140625, 0.01859283447265625, 0.02227783203125, 0.02596282958984375, 0.0296478271484375, 0.03333282470703125, 0.037017822265625, 0.04070281982421875, 0.0443878173828125, 0.04807281494140625, 0.0517578125, 0.05544281005859375, 0.0591278076171875, 0.06281280517578125, 0.066497802734375, 0.07018280029296875, 0.0738677978515625, 0.07755279541015625, 0.08123779296875, 0.08492279052734375, 0.0886077880859375, 0.09229278564453125, 0.095977783203125, 0.09966278076171875, 0.1033477783203125, 0.10703277587890625, 0.1107177734375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 10.0, 18.0, 33.0, 85.0, 160.0, 197.0, 215.0, 144.0, 82.0, 35.0, 15.0, 8.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5483378171920776, -0.5134613513946533, -0.4785849153995514, -0.4437084496021271, -0.40883201360702515, -0.37395554780960083, -0.3390790820121765, -0.3042026162147522, -0.26932618021965027, -0.23444972932338715, -0.19957327842712402, -0.1646968126296997, -0.12982036173343658, -0.09494391083717346, -0.060067445039749146, -0.025190994143486023, 0.0096854567527771, 0.04456191137433052, 0.07943836599588394, 0.11431482434272766, 0.14919127523899078, 0.1840677261352539, 0.21894419193267822, 0.25382065773010254, 0.28869709372520447, 0.3235735595226288, 0.3584499955177307, 0.39332646131515503, 0.42820292711257935, 0.4630793631076813, 0.4979558289051056, 0.5328322649002075, 0.5677087306976318, 0.6025851964950562, 0.6374616622924805, 0.6723381280899048, 0.7072145342826843, 0.7420910000801086, 0.776967465877533, 0.8118439316749573, 0.8467203378677368, 0.8815968036651611, 0.9164732694625854, 0.9513497352600098, 0.9862261414527893, 1.0211026668548584, 1.0559790134429932, 1.0908554792404175, 1.1257319450378418, 1.1606084108352661, 1.1954848766326904, 1.2303613424301147, 1.265237808227539, 1.3001141548156738, 1.3349907398223877, 1.3698670864105225, 1.4047436714172363, 1.4396201372146606, 1.474496603012085, 1.5093730688095093, 1.5442495346069336, 1.5791258811950684, 1.6140024662017822, 1.648878812789917, 1.6837552785873413]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 1.0, 3.0, 4.0, 11.0, 5.0, 9.0, 10.0, 14.0, 18.0, 26.0, 32.0, 32.0, 22.0, 34.0, 33.0, 33.0, 45.0, 47.0, 51.0, 39.0, 37.0, 47.0, 31.0, 56.0, 38.0, 40.0, 39.0, 34.0, 32.0, 28.0, 22.0, 21.0, 18.0, 21.0, 11.0, 14.0, 10.0, 8.0, 5.0, 8.0, 5.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.37145864963531494, -0.3599833846092224, -0.3485080897808075, -0.33703282475471497, -0.32555752992630005, -0.3140822649002075, -0.302606999874115, -0.2911317050457001, -0.27965644001960754, -0.268181174993515, -0.2567058801651001, -0.24523061513900757, -0.23375533521175385, -0.22228005528450012, -0.2108047753572464, -0.19932949542999268, -0.18785421550273895, -0.17637893557548523, -0.1649036556482315, -0.15342837572097778, -0.14195311069488525, -0.13047783076763153, -0.11900255084037781, -0.10752727836370468, -0.09605199843645096, -0.08457671850919724, -0.07310144603252411, -0.061626166105270386, -0.05015088990330696, -0.038675613701343536, -0.027200333774089813, -0.015725061297416687, -0.004249781370162964, 0.007225495763123035, 0.018700772896409035, 0.03017605096101761, 0.04165132716298103, 0.05312660336494446, 0.06460188329219818, 0.07607715576887131, 0.08755243569612503, 0.09902771562337875, 0.11050298810005188, 0.1219782680273056, 0.13345354795455933, 0.14492881298065186, 0.15640410780906677, 0.1678793728351593, 0.17935465276241302, 0.19082993268966675, 0.20230521261692047, 0.2137804925441742, 0.22525575757026672, 0.23673103749752045, 0.24820631742477417, 0.2596815824508667, 0.2711568772792816, 0.28263214230537415, 0.29410743713378906, 0.3055827021598816, 0.3170579969882965, 0.32853326201438904, 0.34000855684280396, 0.3514838218688965, 0.362959086894989]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 10.0, 11.0, 25.0, 32.0, 40.0, 66.0, 96.0, 165.0, 260.0, 465.0, 746.0, 1374.0, 2547.0, 5176.0, 11158.0, 25411.0, 65155.0, 189160.0, 443216.0, 189920.0, 65793.0, 25719.0, 10900.0, 5176.0, 2557.0, 1403.0, 776.0, 435.0, 261.0, 180.0, 101.0, 81.0, 45.0, 40.0, 27.0, 8.0, 8.0, 8.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2462158203125, -0.23928070068359375, -0.2323455810546875, -0.22541046142578125, -0.218475341796875, -0.21154022216796875, -0.2046051025390625, -0.19766998291015625, -0.19073486328125, -0.18379974365234375, -0.1768646240234375, -0.16992950439453125, -0.162994384765625, -0.15605926513671875, -0.1491241455078125, -0.14218902587890625, -0.13525390625, -0.12831878662109375, -0.1213836669921875, -0.11444854736328125, -0.107513427734375, -0.10057830810546875, -0.0936431884765625, -0.08670806884765625, -0.07977294921875, -0.07283782958984375, -0.0659027099609375, -0.05896759033203125, -0.052032470703125, -0.04509735107421875, -0.0381622314453125, -0.03122711181640625, -0.0242919921875, -0.01735687255859375, -0.0104217529296875, -0.00348663330078125, 0.003448486328125, 0.01038360595703125, 0.0173187255859375, 0.02425384521484375, 0.03118896484375, 0.03812408447265625, 0.0450592041015625, 0.05199432373046875, 0.058929443359375, 0.06586456298828125, 0.0727996826171875, 0.07973480224609375, 0.086669921875, 0.09360504150390625, 0.1005401611328125, 0.10747528076171875, 0.114410400390625, 0.12134552001953125, 0.1282806396484375, 0.13521575927734375, 0.14215087890625, 0.14908599853515625, 0.1560211181640625, 0.16295623779296875, 0.169891357421875, 0.17682647705078125, 0.1837615966796875, 0.19069671630859375, 0.1976318359375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 5.0, 7.0, 7.0, 7.0, 8.0, 16.0, 16.0, 23.0, 21.0, 21.0, 31.0, 39.0, 58.0, 46.0, 63.0, 60.0, 59.0, 57.0, 46.0, 50.0, 49.0, 61.0, 46.0, 48.0, 31.0, 30.0, 23.0, 18.0, 11.0, 11.0, 12.0, 7.0, 7.0, 4.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.062255859375, -0.060442447662353516, -0.05862903594970703, -0.05681562423706055, -0.05500221252441406, -0.05318880081176758, -0.051375389099121094, -0.04956197738647461, -0.047748565673828125, -0.04593515396118164, -0.044121742248535156, -0.04230833053588867, -0.04049491882324219, -0.0386815071105957, -0.03686809539794922, -0.035054683685302734, -0.03324127197265625, -0.031427860260009766, -0.02961444854736328, -0.027801036834716797, -0.025987625122070312, -0.024174213409423828, -0.022360801696777344, -0.02054738998413086, -0.018733978271484375, -0.01692056655883789, -0.015107154846191406, -0.013293743133544922, -0.011480331420898438, -0.009666919708251953, -0.007853507995605469, -0.006040096282958984, -0.0042266845703125, -0.0024132728576660156, -0.0005998611450195312, 0.0012135505676269531, 0.0030269622802734375, 0.004840373992919922, 0.006653785705566406, 0.00846719741821289, 0.010280609130859375, 0.01209402084350586, 0.013907432556152344, 0.015720844268798828, 0.017534255981445312, 0.019347667694091797, 0.02116107940673828, 0.022974491119384766, 0.02478790283203125, 0.026601314544677734, 0.02841472625732422, 0.030228137969970703, 0.03204154968261719, 0.03385496139526367, 0.035668373107910156, 0.03748178482055664, 0.039295196533203125, 0.04110860824584961, 0.042922019958496094, 0.04473543167114258, 0.04654884338378906, 0.04836225509643555, 0.05017566680908203, 0.051989078521728516, 0.053802490234375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 9.0, 5.0, 24.0, 41.0, 51.0, 98.0, 196.0, 311.0, 630.0, 1662.0, 5582.0, 37622.0, 536430.0, 427184.0, 31050.0, 4848.0, 1455.0, 589.0, 317.0, 179.0, 105.0, 61.0, 35.0, 30.0, 14.0, 9.0, 10.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.59326171875, -0.5784149169921875, -0.563568115234375, -0.5487213134765625, -0.53387451171875, -0.5190277099609375, -0.504180908203125, -0.4893341064453125, -0.4744873046875, -0.4596405029296875, -0.444793701171875, -0.4299468994140625, -0.41510009765625, -0.4002532958984375, -0.385406494140625, -0.3705596923828125, -0.355712890625, -0.3408660888671875, -0.326019287109375, -0.3111724853515625, -0.29632568359375, -0.2814788818359375, -0.266632080078125, -0.2517852783203125, -0.2369384765625, -0.2220916748046875, -0.207244873046875, -0.1923980712890625, -0.17755126953125, -0.1627044677734375, -0.147857666015625, -0.1330108642578125, -0.1181640625, -0.1033172607421875, -0.088470458984375, -0.0736236572265625, -0.05877685546875, -0.0439300537109375, -0.029083251953125, -0.0142364501953125, 0.0006103515625, 0.0154571533203125, 0.030303955078125, 0.0451507568359375, 0.05999755859375, 0.0748443603515625, 0.089691162109375, 0.1045379638671875, 0.119384765625, 0.1342315673828125, 0.149078369140625, 0.1639251708984375, 0.17877197265625, 0.1936187744140625, 0.208465576171875, 0.2233123779296875, 0.2381591796875, 0.2530059814453125, 0.267852783203125, 0.2826995849609375, 0.29754638671875, 0.3123931884765625, 0.327239990234375, 0.3420867919921875, 0.35693359375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 13.0, 13.0, 18.0, 18.0, 21.0, 24.0, 33.0, 40.0, 41.0, 62.0, 53.0, 68.0, 64.0, 78.0, 73.0, 62.0, 63.0, 61.0, 36.0, 32.0, 24.0, 27.0, 22.0, 13.0, 17.0, 8.0, 1.0, 6.0, 2.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39111328125, -0.38060760498046875, -0.3701019287109375, -0.35959625244140625, -0.349090576171875, -0.33858489990234375, -0.3280792236328125, -0.31757354736328125, -0.30706787109375, -0.29656219482421875, -0.2860565185546875, -0.27555084228515625, -0.265045166015625, -0.25453948974609375, -0.2440338134765625, -0.23352813720703125, -0.2230224609375, -0.21251678466796875, -0.2020111083984375, -0.19150543212890625, -0.180999755859375, -0.17049407958984375, -0.1599884033203125, -0.14948272705078125, -0.13897705078125, -0.12847137451171875, -0.1179656982421875, -0.10746002197265625, -0.096954345703125, -0.08644866943359375, -0.0759429931640625, -0.06543731689453125, -0.054931640625, -0.04442596435546875, -0.0339202880859375, -0.02341461181640625, -0.012908935546875, -0.00240325927734375, 0.0081024169921875, 0.01860809326171875, 0.02911376953125, 0.03961944580078125, 0.0501251220703125, 0.06063079833984375, 0.071136474609375, 0.08164215087890625, 0.0921478271484375, 0.10265350341796875, 0.1131591796875, 0.12366485595703125, 0.1341705322265625, 0.14467620849609375, 0.155181884765625, 0.16568756103515625, 0.1761932373046875, 0.18669891357421875, 0.19720458984375, 0.20771026611328125, 0.2182159423828125, 0.22872161865234375, 0.239227294921875, 0.24973297119140625, 0.2602386474609375, 0.27074432373046875, 0.28125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 4.0, 12.0, 9.0, 19.0, 16.0, 27.0, 46.0, 53.0, 86.0, 157.0, 222.0, 376.0, 645.0, 1117.0, 2098.0, 4073.0, 8570.0, 20785.0, 59727.0, 255209.0, 528501.0, 108666.0, 33256.0, 12731.0, 5771.0, 2797.0, 1462.0, 790.0, 459.0, 299.0, 186.0, 125.0, 72.0, 56.0, 41.0, 26.0, 15.0, 19.0, 8.0, 10.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1690673828125, -0.16365432739257812, -0.15824127197265625, -0.15282821655273438, -0.1474151611328125, -0.14200210571289062, -0.13658905029296875, -0.13117599487304688, -0.125762939453125, -0.12034988403320312, -0.11493682861328125, -0.10952377319335938, -0.1041107177734375, -0.09869766235351562, -0.09328460693359375, -0.08787155151367188, -0.08245849609375, -0.07704544067382812, -0.07163238525390625, -0.06621932983398438, -0.0608062744140625, -0.055393218994140625, -0.04998016357421875, -0.044567108154296875, -0.039154052734375, -0.033740997314453125, -0.02832794189453125, -0.022914886474609375, -0.0175018310546875, -0.012088775634765625, -0.00667572021484375, -0.001262664794921875, 0.004150390625, 0.009563446044921875, 0.01497650146484375, 0.020389556884765625, 0.0258026123046875, 0.031215667724609375, 0.03662872314453125, 0.042041778564453125, 0.047454833984375, 0.052867889404296875, 0.05828094482421875, 0.06369400024414062, 0.0691070556640625, 0.07452011108398438, 0.07993316650390625, 0.08534622192382812, 0.09075927734375, 0.09617233276367188, 0.10158538818359375, 0.10699844360351562, 0.1124114990234375, 0.11782455444335938, 0.12323760986328125, 0.12865066528320312, 0.134063720703125, 0.13947677612304688, 0.14488983154296875, 0.15030288696289062, 0.1557159423828125, 0.16112899780273438, 0.16654205322265625, 0.17195510864257812, 0.1773681640625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 2.0, 3.0, 3.0, 4.0, 8.0, 9.0, 11.0, 14.0, 14.0, 15.0, 34.0, 27.0, 37.0, 45.0, 65.0, 89.0, 78.0, 93.0, 73.0, 81.0, 57.0, 46.0, 45.0, 38.0, 29.0, 16.0, 17.0, 8.0, 8.0, 5.0, 4.0, 8.0, 4.0, 1.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.6253204345703125e-05, -4.484318196773529e-05, -4.3433159589767456e-05, -4.202313721179962e-05, -4.061311483383179e-05, -3.920309245586395e-05, -3.779307007789612e-05, -3.6383047699928284e-05, -3.497302532196045e-05, -3.3563002943992615e-05, -3.215298056602478e-05, -3.0742958188056946e-05, -2.933293581008911e-05, -2.7922913432121277e-05, -2.6512891054153442e-05, -2.5102868676185608e-05, -2.3692846298217773e-05, -2.228282392024994e-05, -2.0872801542282104e-05, -1.946277916431427e-05, -1.8052756786346436e-05, -1.66427344083786e-05, -1.5232712030410767e-05, -1.3822689652442932e-05, -1.2412667274475098e-05, -1.1002644896507263e-05, -9.592622518539429e-06, -8.182600140571594e-06, -6.77257776260376e-06, -5.362555384635925e-06, -3.952533006668091e-06, -2.5425106287002563e-06, -1.1324882507324219e-06, 2.775341272354126e-07, 1.687556505203247e-06, 3.0975788831710815e-06, 4.507601261138916e-06, 5.9176236391067505e-06, 7.327646017074585e-06, 8.73766839504242e-06, 1.0147690773010254e-05, 1.1557713150978088e-05, 1.2967735528945923e-05, 1.4377757906913757e-05, 1.5787780284881592e-05, 1.7197802662849426e-05, 1.860782504081726e-05, 2.0017847418785095e-05, 2.142786979675293e-05, 2.2837892174720764e-05, 2.42479145526886e-05, 2.5657936930656433e-05, 2.7067959308624268e-05, 2.8477981686592102e-05, 2.9888004064559937e-05, 3.129802644252777e-05, 3.2708048820495605e-05, 3.411807119846344e-05, 3.5528093576431274e-05, 3.693811595439911e-05, 3.834813833236694e-05, 3.975816071033478e-05, 4.116818308830261e-05, 4.257820546627045e-05, 4.398822784423828e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 6.0, 10.0, 15.0, 12.0, 33.0, 45.0, 69.0, 128.0, 247.0, 538.0, 1144.0, 3510.0, 13660.0, 82022.0, 768987.0, 149718.0, 20816.0, 4770.0, 1505.0, 628.0, 300.0, 164.0, 78.0, 66.0, 39.0, 16.0, 7.0, 2.0, 5.0, 1.0, 4.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.279296875, -0.26918792724609375, -0.2590789794921875, -0.24897003173828125, -0.238861083984375, -0.22875213623046875, -0.2186431884765625, -0.20853424072265625, -0.19842529296875, -0.18831634521484375, -0.1782073974609375, -0.16809844970703125, -0.157989501953125, -0.14788055419921875, -0.1377716064453125, -0.12766265869140625, -0.1175537109375, -0.10744476318359375, -0.0973358154296875, -0.08722686767578125, -0.077117919921875, -0.06700897216796875, -0.0569000244140625, -0.04679107666015625, -0.03668212890625, -0.02657318115234375, -0.0164642333984375, -0.00635528564453125, 0.003753662109375, 0.01386260986328125, 0.0239715576171875, 0.03408050537109375, 0.044189453125, 0.05429840087890625, 0.0644073486328125, 0.07451629638671875, 0.084625244140625, 0.09473419189453125, 0.1048431396484375, 0.11495208740234375, 0.12506103515625, 0.13516998291015625, 0.1452789306640625, 0.15538787841796875, 0.165496826171875, 0.17560577392578125, 0.1857147216796875, 0.19582366943359375, 0.2059326171875, 0.21604156494140625, 0.2261505126953125, 0.23625946044921875, 0.246368408203125, 0.25647735595703125, 0.2665863037109375, 0.27669525146484375, 0.28680419921875, 0.29691314697265625, 0.3070220947265625, 0.31713104248046875, 0.327239990234375, 0.33734893798828125, 0.3474578857421875, 0.35756683349609375, 0.36767578125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 5.0, 4.0, 4.0, 5.0, 8.0, 3.0, 9.0, 13.0, 10.0, 8.0, 24.0, 10.0, 26.0, 30.0, 54.0, 66.0, 107.0, 130.0, 111.0, 79.0, 67.0, 45.0, 39.0, 26.0, 20.0, 16.0, 11.0, 14.0, 12.0, 11.0, 10.0, 5.0, 0.0, 2.0, 8.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.142822265625, -0.13818931579589844, -0.13355636596679688, -0.1289234161376953, -0.12429046630859375, -0.11965751647949219, -0.11502456665039062, -0.11039161682128906, -0.1057586669921875, -0.10112571716308594, -0.09649276733398438, -0.09185981750488281, -0.08722686767578125, -0.08259391784667969, -0.07796096801757812, -0.07332801818847656, -0.068695068359375, -0.06406211853027344, -0.059429168701171875, -0.05479621887207031, -0.05016326904296875, -0.04553031921386719, -0.040897369384765625, -0.03626441955566406, -0.0316314697265625, -0.026998519897460938, -0.022365570068359375, -0.017732620239257812, -0.01309967041015625, -0.008466720581054688, -0.003833770751953125, 0.0007991790771484375, 0.00543212890625, 0.010065078735351562, 0.014698028564453125, 0.019330978393554688, 0.02396392822265625, 0.028596878051757812, 0.033229827880859375, 0.03786277770996094, 0.0424957275390625, 0.04712867736816406, 0.051761627197265625, 0.05639457702636719, 0.06102752685546875, 0.06566047668457031, 0.07029342651367188, 0.07492637634277344, 0.079559326171875, 0.08419227600097656, 0.08882522583007812, 0.09345817565917969, 0.09809112548828125, 0.10272407531738281, 0.10735702514648438, 0.11198997497558594, 0.1166229248046875, 0.12125587463378906, 0.12588882446289062, 0.1305217742919922, 0.13515472412109375, 0.1397876739501953, 0.14442062377929688, 0.14905357360839844, 0.1536865234375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 11.0, 16.0, 19.0, 47.0, 67.0, 85.0, 139.0, 140.0, 141.0, 116.0, 93.0, 46.0, 38.0, 21.0, 8.0, 9.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.738926649093628, -1.6743013858795166, -1.6096762418746948, -1.5450509786605835, -1.4804257154464722, -1.4158005714416504, -1.351175308227539, -1.2865500450134277, -1.2219247817993164, -1.157299518585205, -1.0926743745803833, -1.028049111366272, -0.9634238481521606, -0.8987986445426941, -0.8341734409332275, -0.7695481777191162, -0.7049230337142944, -0.6402978301048279, -0.5756725668907166, -0.51104736328125, -0.44642212986946106, -0.3817968964576721, -0.31717169284820557, -0.2525464594364166, -0.18792122602462769, -0.12329600006341934, -0.058670774102211, 0.005954444408416748, 0.07057967782020569, 0.13520491123199463, 0.19983011484146118, 0.2644553482532501, 0.32908058166503906, 0.393705815076828, 0.45833104848861694, 0.5229562520980835, 0.5875815153121948, 0.6522067189216614, 0.7168319225311279, 0.7814571857452393, 0.8460823893547058, 0.9107075929641724, 0.9753328561782837, 1.0399580001831055, 1.1045832633972168, 1.1692085266113281, 1.2338337898254395, 1.2984589338302612, 1.3630841970443726, 1.4277094602584839, 1.4923346042633057, 1.556959867477417, 1.6215851306915283, 1.6862103939056396, 1.7508355379104614, 1.8154608011245728, 1.8800859451293945, 1.9447112083435059, 2.009336471557617, 2.0739617347717285, 2.1385867595672607, 2.203212022781372, 2.2678372859954834, 2.3324625492095947, 2.397087812423706]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 4.0, 3.0, 10.0, 7.0, 7.0, 10.0, 11.0, 19.0, 21.0, 21.0, 19.0, 27.0, 24.0, 49.0, 41.0, 50.0, 40.0, 56.0, 54.0, 48.0, 52.0, 44.0, 37.0, 58.0, 32.0, 49.0, 36.0, 35.0, 26.0, 23.0, 18.0, 20.0, 14.0, 6.0, 4.0, 4.0, 9.0, 5.0, 5.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.6430422067642212, -1.598127841949463, -1.5532134771347046, -1.5082991123199463, -1.4633848667144775, -1.4184705018997192, -1.373556137084961, -1.3286417722702026, -1.2837274074554443, -1.238813042640686, -1.1938986778259277, -1.1489843130111694, -1.1040699481964111, -1.0591557025909424, -1.014241337776184, -0.9693269729614258, -0.9244126081466675, -0.8794982433319092, -0.8345838785171509, -0.7896695733070374, -0.744755208492279, -0.6998408436775208, -0.6549265384674072, -0.6100121736526489, -0.5650978088378906, -0.5201834440231323, -0.4752691090106964, -0.4303547739982605, -0.3854404091835022, -0.3405260443687439, -0.295611709356308, -0.25069737434387207, -0.20578312873840332, -0.1608687788248062, -0.1159544289112091, -0.071040078997612, -0.026125729084014893, 0.018788620829582214, 0.06370297074317932, 0.10861730575561523, 0.15353167057037354, 0.19844602048397064, 0.24336037039756775, 0.28827470541000366, 0.33318907022476196, 0.37810343503952026, 0.4230177700519562, 0.4679321050643921, 0.5128464698791504, 0.5577608346939087, 0.602675199508667, 0.6475895047187805, 0.6925038695335388, 0.7374182343482971, 0.7823325395584106, 0.827246904373169, 0.8721612691879272, 0.9170756340026855, 0.9619899988174438, 1.0069043636322021, 1.051818609237671, 1.0967329740524292, 1.1416473388671875, 1.1865617036819458, 1.231476068496704]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 3.0, 9.0, 10.0, 11.0, 15.0, 23.0, 35.0, 49.0, 84.0, 128.0, 211.0, 324.0, 555.0, 1033.0, 1958.0, 4029.0, 9137.0, 25165.0, 91019.0, 2496218.0, 1437920.0, 85717.0, 23669.0, 8874.0, 3799.0, 1866.0, 978.0, 557.0, 303.0, 182.0, 125.0, 81.0, 58.0, 36.0, 31.0, 19.0, 15.0, 13.0, 5.0, 6.0, 7.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2452392578125, -0.2370586395263672, -0.22887802124023438, -0.22069740295410156, -0.21251678466796875, -0.20433616638183594, -0.19615554809570312, -0.1879749298095703, -0.1797943115234375, -0.1716136932373047, -0.16343307495117188, -0.15525245666503906, -0.14707183837890625, -0.13889122009277344, -0.13071060180664062, -0.12252998352050781, -0.114349365234375, -0.10616874694824219, -0.09798812866210938, -0.08980751037597656, -0.08162689208984375, -0.07344627380371094, -0.06526565551757812, -0.05708503723144531, -0.0489044189453125, -0.04072380065917969, -0.032543182373046875, -0.024362564086914062, -0.01618194580078125, -0.008001327514648438, 0.000179290771484375, 0.008359909057617188, 0.01654052734375, 0.024721145629882812, 0.032901763916015625, 0.04108238220214844, 0.04926300048828125, 0.05744361877441406, 0.06562423706054688, 0.07380485534667969, 0.0819854736328125, 0.09016609191894531, 0.09834671020507812, 0.10652732849121094, 0.11470794677734375, 0.12288856506347656, 0.13106918334960938, 0.1392498016357422, 0.147430419921875, 0.1556110382080078, 0.16379165649414062, 0.17197227478027344, 0.18015289306640625, 0.18833351135253906, 0.19651412963867188, 0.2046947479248047, 0.2128753662109375, 0.2210559844970703, 0.22923660278320312, 0.23741722106933594, 0.24559783935546875, 0.25377845764160156, 0.2619590759277344, 0.2701396942138672, 0.2783203125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 10.0, 17.0, 14.0, 18.0, 22.0, 24.0, 25.0, 32.0, 49.0, 47.0, 54.0, 55.0, 77.0, 58.0, 63.0, 68.0, 60.0, 53.0, 58.0, 46.0, 29.0, 25.0, 29.0, 21.0, 13.0, 7.0, 7.0, 3.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06298828125, -0.06085777282714844, -0.058727264404296875, -0.05659675598144531, -0.05446624755859375, -0.05233573913574219, -0.050205230712890625, -0.04807472229003906, -0.0459442138671875, -0.04381370544433594, -0.041683197021484375, -0.03955268859863281, -0.03742218017578125, -0.03529167175292969, -0.033161163330078125, -0.031030654907226562, -0.028900146484375, -0.026769638061523438, -0.024639129638671875, -0.022508621215820312, -0.02037811279296875, -0.018247604370117188, -0.016117095947265625, -0.013986587524414062, -0.0118560791015625, -0.009725570678710938, -0.007595062255859375, -0.0054645538330078125, -0.00333404541015625, -0.0012035369873046875, 0.000926971435546875, 0.0030574798583984375, 0.00518798828125, 0.0073184967041015625, 0.009449005126953125, 0.011579513549804688, 0.01371002197265625, 0.015840530395507812, 0.017971038818359375, 0.020101547241210938, 0.0222320556640625, 0.024362564086914062, 0.026493072509765625, 0.028623580932617188, 0.03075408935546875, 0.03288459777832031, 0.035015106201171875, 0.03714561462402344, 0.039276123046875, 0.04140663146972656, 0.043537139892578125, 0.04566764831542969, 0.04779815673828125, 0.04992866516113281, 0.052059173583984375, 0.05418968200683594, 0.0563201904296875, 0.05845069885253906, 0.060581207275390625, 0.06271171569824219, 0.06484222412109375, 0.06697273254394531, 0.06910324096679688, 0.07123374938964844, 0.0733642578125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 4.0, 6.0, 16.0, 11.0, 17.0, 36.0, 46.0, 66.0, 86.0, 183.0, 391.0, 783.0, 1946.0, 5259.0, 16393.0, 67744.0, 599282.0, 3329645.0, 131783.0, 27636.0, 8037.0, 2818.0, 1079.0, 431.0, 225.0, 139.0, 71.0, 46.0, 35.0, 24.0, 10.0, 11.0, 6.0, 5.0, 8.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.430908203125, -0.41991424560546875, -0.4089202880859375, -0.39792633056640625, -0.386932373046875, -0.37593841552734375, -0.3649444580078125, -0.35395050048828125, -0.34295654296875, -0.33196258544921875, -0.3209686279296875, -0.30997467041015625, -0.298980712890625, -0.28798675537109375, -0.2769927978515625, -0.26599884033203125, -0.2550048828125, -0.24401092529296875, -0.2330169677734375, -0.22202301025390625, -0.211029052734375, -0.20003509521484375, -0.1890411376953125, -0.17804718017578125, -0.16705322265625, -0.15605926513671875, -0.1450653076171875, -0.13407135009765625, -0.123077392578125, -0.11208343505859375, -0.1010894775390625, -0.09009552001953125, -0.0791015625, -0.06810760498046875, -0.0571136474609375, -0.04611968994140625, -0.035125732421875, -0.02413177490234375, -0.0131378173828125, -0.00214385986328125, 0.00885009765625, 0.01984405517578125, 0.0308380126953125, 0.04183197021484375, 0.052825927734375, 0.06381988525390625, 0.0748138427734375, 0.08580780029296875, 0.0968017578125, 0.10779571533203125, 0.1187896728515625, 0.12978363037109375, 0.140777587890625, 0.15177154541015625, 0.1627655029296875, 0.17375946044921875, 0.18475341796875, 0.19574737548828125, 0.2067413330078125, 0.21773529052734375, 0.228729248046875, 0.23972320556640625, 0.2507171630859375, 0.26171112060546875, 0.272705078125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 6.0, 2.0, 4.0, 8.0, 6.0, 10.0, 15.0, 14.0, 34.0, 38.0, 72.0, 102.0, 163.0, 369.0, 1721.0, 845.0, 288.0, 114.0, 88.0, 58.0, 34.0, 21.0, 25.0, 16.0, 10.0, 7.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2093505859375, -0.20434284210205078, -0.19933509826660156, -0.19432735443115234, -0.18931961059570312, -0.1843118667602539, -0.1793041229248047, -0.17429637908935547, -0.16928863525390625, -0.16428089141845703, -0.1592731475830078, -0.1542654037475586, -0.14925765991210938, -0.14424991607666016, -0.13924217224121094, -0.13423442840576172, -0.1292266845703125, -0.12421894073486328, -0.11921119689941406, -0.11420345306396484, -0.10919570922851562, -0.1041879653930664, -0.09918022155761719, -0.09417247772216797, -0.08916473388671875, -0.08415699005126953, -0.07914924621582031, -0.0741415023803711, -0.06913375854492188, -0.06412601470947266, -0.05911827087402344, -0.05411052703857422, -0.049102783203125, -0.04409503936767578, -0.03908729553222656, -0.034079551696777344, -0.029071807861328125, -0.024064064025878906, -0.019056320190429688, -0.014048576354980469, -0.00904083251953125, -0.004033088684082031, 0.0009746551513671875, 0.005982398986816406, 0.010990142822265625, 0.015997886657714844, 0.021005630493164062, 0.02601337432861328, 0.0310211181640625, 0.03602886199951172, 0.04103660583496094, 0.046044349670410156, 0.051052093505859375, 0.056059837341308594, 0.06106758117675781, 0.06607532501220703, 0.07108306884765625, 0.07609081268310547, 0.08109855651855469, 0.0861063003540039, 0.09111404418945312, 0.09612178802490234, 0.10112953186035156, 0.10613727569580078, 0.11114501953125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 4.0, 11.0, 16.0, 55.0, 148.0, 283.0, 251.0, 156.0, 54.0, 23.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.73797869682312, -2.681168556213379, -2.6243584156036377, -2.5675482749938965, -2.5107381343841553, -2.453927993774414, -2.397117853164673, -2.3403077125549316, -2.2834973335266113, -2.22668719291687, -2.169877052307129, -2.1130669116973877, -2.0562567710876465, -1.9994466304779053, -1.9426363706588745, -1.8858262300491333, -1.8290162086486816, -1.7722060680389404, -1.7153959274291992, -1.658585786819458, -1.6017756462097168, -1.5449655055999756, -1.4881552457809448, -1.4313451051712036, -1.3745349645614624, -1.3177248239517212, -1.26091468334198, -1.2041045427322388, -1.147294282913208, -1.0904841423034668, -1.0336740016937256, -0.9768638610839844, -0.9200537800788879, -0.8632436394691467, -0.8064334392547607, -0.7496232986450195, -0.6928131580352783, -0.6360030174255371, -0.5791928768157959, -0.5223826766014099, -0.4655725359916687, -0.4087623953819275, -0.3519522249698639, -0.2951420545578003, -0.23833191394805908, -0.18152177333831787, -0.12471160292625427, -0.06790143251419067, -0.011091291904449463, 0.04571886360645294, 0.10252901911735535, 0.15933917462825775, 0.21614933013916016, 0.27295947074890137, 0.32976964116096497, 0.38657981157302856, 0.4433899521827698, 0.500200092792511, 0.557010293006897, 0.6138204336166382, 0.6706305742263794, 0.7274407148361206, 0.7842508554458618, 0.8410610556602478, 0.897871196269989]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 4.0, 6.0, 9.0, 16.0, 22.0, 33.0, 42.0, 41.0, 54.0, 58.0, 70.0, 70.0, 65.0, 64.0, 68.0, 63.0, 59.0, 56.0, 48.0, 42.0, 24.0, 31.0, 28.0, 11.0, 11.0, 4.0, 7.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8174375295639038, -0.7941892743110657, -0.7709410190582275, -0.7476927042007446, -0.7244444489479065, -0.7011961936950684, -0.6779479384422302, -0.6546996831893921, -0.6314513683319092, -0.608203113079071, -0.5849548578262329, -0.56170654296875, -0.5384582877159119, -0.5152100324630737, -0.4919617772102356, -0.46871352195739746, -0.4454652667045593, -0.4222170114517212, -0.39896872639656067, -0.37572047114372253, -0.352472186088562, -0.3292239308357239, -0.30597567558288574, -0.2827274203300476, -0.2594791352748871, -0.23623086512088776, -0.21298259496688843, -0.1897343397140503, -0.16648606956005096, -0.14323779940605164, -0.1199895441532135, -0.09674127399921417, -0.07349306344985962, -0.05024479702115059, -0.02699653059244156, -0.003748267889022827, 0.0195000022649765, 0.04274827241897583, 0.06599652767181396, 0.0892447978258133, 0.11249306797981262, 0.13574133813381195, 0.15898960828781128, 0.18223786354064941, 0.20548613369464874, 0.22873440384864807, 0.2519826591014862, 0.27523094415664673, 0.29847919940948486, 0.321727454662323, 0.3449757397174835, 0.36822399497032166, 0.3914722800254822, 0.4147205352783203, 0.43796879053115845, 0.4612170457839966, 0.4844653308391571, 0.5077136158943176, 0.5309618711471558, 0.5542101263999939, 0.577458381652832, 0.6007066965103149, 0.6239548921585083, 0.6472032070159912, 0.6704514622688293]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 6.0, 6.0, 7.0, 15.0, 31.0, 27.0, 56.0, 90.0, 114.0, 163.0, 292.0, 446.0, 800.0, 1294.0, 2353.0, 4379.0, 8584.0, 17701.0, 38781.0, 102292.0, 524241.0, 233138.0, 61435.0, 26391.0, 12223.0, 6098.0, 3234.0, 1790.0, 987.0, 567.0, 361.0, 246.0, 124.0, 84.0, 63.0, 51.0, 34.0, 19.0, 5.0, 12.0, 5.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.220458984375, -0.21329116821289062, -0.20612335205078125, -0.19895553588867188, -0.1917877197265625, -0.18461990356445312, -0.17745208740234375, -0.17028427124023438, -0.163116455078125, -0.15594863891601562, -0.14878082275390625, -0.14161300659179688, -0.1344451904296875, -0.12727737426757812, -0.12010955810546875, -0.11294174194335938, -0.10577392578125, -0.09860610961914062, -0.09143829345703125, -0.08427047729492188, -0.0771026611328125, -0.06993484497070312, -0.06276702880859375, -0.055599212646484375, -0.048431396484375, -0.041263580322265625, -0.03409576416015625, -0.026927947998046875, -0.0197601318359375, -0.012592315673828125, -0.00542449951171875, 0.001743316650390625, 0.0089111328125, 0.016078948974609375, 0.02324676513671875, 0.030414581298828125, 0.0375823974609375, 0.044750213623046875, 0.05191802978515625, 0.059085845947265625, 0.066253662109375, 0.07342147827148438, 0.08058929443359375, 0.08775711059570312, 0.0949249267578125, 0.10209274291992188, 0.10926055908203125, 0.11642837524414062, 0.12359619140625, 0.13076400756835938, 0.13793182373046875, 0.14509963989257812, 0.1522674560546875, 0.15943527221679688, 0.16660308837890625, 0.17377090454101562, 0.180938720703125, 0.18810653686523438, 0.19527435302734375, 0.20244216918945312, 0.2096099853515625, 0.21677780151367188, 0.22394561767578125, 0.23111343383789062, 0.23828125]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 3.0, 2.0, 4.0, 1.0, 5.0, 5.0, 8.0, 6.0, 16.0, 10.0, 23.0, 14.0, 19.0, 25.0, 32.0, 27.0, 31.0, 34.0, 41.0, 50.0, 42.0, 46.0, 47.0, 66.0, 43.0, 39.0, 53.0, 45.0, 40.0, 49.0, 35.0, 26.0, 30.0, 17.0, 13.0, 15.0, 10.0, 10.0, 7.0, 6.0, 2.0, 2.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.056243896484375, -0.0545191764831543, -0.052794456481933594, -0.05106973648071289, -0.04934501647949219, -0.047620296478271484, -0.04589557647705078, -0.04417085647583008, -0.042446136474609375, -0.04072141647338867, -0.03899669647216797, -0.037271976470947266, -0.03554725646972656, -0.03382253646850586, -0.032097816467285156, -0.030373096466064453, -0.02864837646484375, -0.026923656463623047, -0.025198936462402344, -0.02347421646118164, -0.021749496459960938, -0.020024776458740234, -0.01830005645751953, -0.016575336456298828, -0.014850616455078125, -0.013125896453857422, -0.011401176452636719, -0.009676456451416016, -0.007951736450195312, -0.006227016448974609, -0.004502296447753906, -0.002777576446533203, -0.0010528564453125, 0.0006718635559082031, 0.0023965835571289062, 0.004121303558349609, 0.0058460235595703125, 0.007570743560791016, 0.009295463562011719, 0.011020183563232422, 0.012744903564453125, 0.014469623565673828, 0.01619434356689453, 0.017919063568115234, 0.019643783569335938, 0.02136850357055664, 0.023093223571777344, 0.024817943572998047, 0.02654266357421875, 0.028267383575439453, 0.029992103576660156, 0.03171682357788086, 0.03344154357910156, 0.035166263580322266, 0.03689098358154297, 0.03861570358276367, 0.040340423583984375, 0.04206514358520508, 0.04378986358642578, 0.045514583587646484, 0.04723930358886719, 0.04896402359008789, 0.050688743591308594, 0.0524134635925293, 0.05413818359375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 5.0, 8.0, 9.0, 16.0, 18.0, 43.0, 58.0, 92.0, 173.0, 344.0, 617.0, 1440.0, 5368.0, 30667.0, 480709.0, 489801.0, 30995.0, 5350.0, 1374.0, 688.0, 322.0, 183.0, 127.0, 57.0, 32.0, 23.0, 17.0, 13.0, 5.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52685546875, -0.5108909606933594, -0.49492645263671875, -0.4789619445800781, -0.4629974365234375, -0.4470329284667969, -0.43106842041015625, -0.4151039123535156, -0.399139404296875, -0.3831748962402344, -0.36721038818359375, -0.3512458801269531, -0.3352813720703125, -0.3193168640136719, -0.30335235595703125, -0.2873878479003906, -0.27142333984375, -0.2554588317871094, -0.23949432373046875, -0.22352981567382812, -0.2075653076171875, -0.19160079956054688, -0.17563629150390625, -0.15967178344726562, -0.143707275390625, -0.12774276733398438, -0.11177825927734375, -0.09581375122070312, -0.0798492431640625, -0.06388473510742188, -0.04792022705078125, -0.031955718994140625, -0.0159912109375, -2.6702880859375e-05, 0.01593780517578125, 0.031902313232421875, 0.0478668212890625, 0.06383132934570312, 0.07979583740234375, 0.09576034545898438, 0.111724853515625, 0.12768936157226562, 0.14365386962890625, 0.15961837768554688, 0.1755828857421875, 0.19154739379882812, 0.20751190185546875, 0.22347640991210938, 0.23944091796875, 0.2554054260253906, 0.27136993408203125, 0.2873344421386719, 0.3032989501953125, 0.3192634582519531, 0.33522796630859375, 0.3511924743652344, 0.367156982421875, 0.3831214904785156, 0.39908599853515625, 0.4150505065917969, 0.4310150146484375, 0.4469795227050781, 0.46294403076171875, 0.4789085388183594, 0.494873046875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 8.0, 5.0, 5.0, 7.0, 14.0, 18.0, 18.0, 21.0, 26.0, 41.0, 62.0, 56.0, 74.0, 70.0, 70.0, 79.0, 72.0, 72.0, 52.0, 66.0, 40.0, 30.0, 23.0, 17.0, 16.0, 12.0, 11.0, 10.0, 7.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.423828125, -0.4123382568359375, -0.400848388671875, -0.3893585205078125, -0.37786865234375, -0.3663787841796875, -0.354888916015625, -0.3433990478515625, -0.3319091796875, -0.3204193115234375, -0.308929443359375, -0.2974395751953125, -0.28594970703125, -0.2744598388671875, -0.262969970703125, -0.2514801025390625, -0.239990234375, -0.2285003662109375, -0.217010498046875, -0.2055206298828125, -0.19403076171875, -0.1825408935546875, -0.171051025390625, -0.1595611572265625, -0.1480712890625, -0.1365814208984375, -0.125091552734375, -0.1136016845703125, -0.10211181640625, -0.0906219482421875, -0.079132080078125, -0.0676422119140625, -0.05615234375, -0.0446624755859375, -0.033172607421875, -0.0216827392578125, -0.01019287109375, 0.0012969970703125, 0.012786865234375, 0.0242767333984375, 0.0357666015625, 0.0472564697265625, 0.058746337890625, 0.0702362060546875, 0.08172607421875, 0.0932159423828125, 0.104705810546875, 0.1161956787109375, 0.127685546875, 0.1391754150390625, 0.150665283203125, 0.1621551513671875, 0.17364501953125, 0.1851348876953125, 0.196624755859375, 0.2081146240234375, 0.2196044921875, 0.2310943603515625, 0.242584228515625, 0.2540740966796875, 0.26556396484375, 0.2770538330078125, 0.288543701171875, 0.3000335693359375, 0.3115234375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 9.0, 10.0, 17.0, 16.0, 30.0, 69.0, 111.0, 163.0, 339.0, 757.0, 1920.0, 5371.0, 19654.0, 590198.0, 403358.0, 18164.0, 5005.0, 1809.0, 732.0, 351.0, 190.0, 109.0, 59.0, 26.0, 43.0, 15.0, 6.0, 2.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.52001953125, -0.5047149658203125, -0.489410400390625, -0.4741058349609375, -0.45880126953125, -0.4434967041015625, -0.428192138671875, -0.4128875732421875, -0.3975830078125, -0.3822784423828125, -0.366973876953125, -0.3516693115234375, -0.33636474609375, -0.3210601806640625, -0.305755615234375, -0.2904510498046875, -0.275146484375, -0.2598419189453125, -0.244537353515625, -0.2292327880859375, -0.21392822265625, -0.1986236572265625, -0.183319091796875, -0.1680145263671875, -0.1527099609375, -0.1374053955078125, -0.122100830078125, -0.1067962646484375, -0.09149169921875, -0.0761871337890625, -0.060882568359375, -0.0455780029296875, -0.0302734375, -0.0149688720703125, 0.000335693359375, 0.0156402587890625, 0.03094482421875, 0.0462493896484375, 0.061553955078125, 0.0768585205078125, 0.0921630859375, 0.1074676513671875, 0.122772216796875, 0.1380767822265625, 0.15338134765625, 0.1686859130859375, 0.183990478515625, 0.1992950439453125, 0.214599609375, 0.2299041748046875, 0.245208740234375, 0.2605133056640625, 0.27581787109375, 0.2911224365234375, 0.306427001953125, 0.3217315673828125, 0.3370361328125, 0.3523406982421875, 0.367645263671875, 0.3829498291015625, 0.39825439453125, 0.4135589599609375, 0.428863525390625, 0.4441680908203125, 0.45947265625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 3.0, 1.0, 2.0, 5.0, 2.0, 11.0, 18.0, 31.0, 61.0, 117.0, 218.0, 213.0, 148.0, 73.0, 43.0, 21.0, 13.0, 11.0, 9.0, 9.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.161233901977539e-05, -8.811336010694504e-05, -8.461438119411469e-05, -8.111540228128433e-05, -7.761642336845398e-05, -7.411744445562363e-05, -7.061846554279327e-05, -6.711948662996292e-05, -6.362050771713257e-05, -6.0121528804302216e-05, -5.662254989147186e-05, -5.312357097864151e-05, -4.962459206581116e-05, -4.6125613152980804e-05, -4.262663424015045e-05, -3.91276553273201e-05, -3.5628676414489746e-05, -3.212969750165939e-05, -2.863071858882904e-05, -2.5131739675998688e-05, -2.1632760763168335e-05, -1.8133781850337982e-05, -1.463480293750763e-05, -1.1135824024677277e-05, -7.636845111846924e-06, -4.137866199016571e-06, -6.388872861862183e-07, 2.8600916266441345e-06, 6.359070539474487e-06, 9.85804945230484e-06, 1.3357028365135193e-05, 1.6856007277965546e-05, 2.03549861907959e-05, 2.385396510362625e-05, 2.7352944016456604e-05, 3.085192292928696e-05, 3.435090184211731e-05, 3.784988075494766e-05, 4.1348859667778015e-05, 4.484783858060837e-05, 4.834681749343872e-05, 5.1845796406269073e-05, 5.5344775319099426e-05, 5.884375423192978e-05, 6.234273314476013e-05, 6.584171205759048e-05, 6.934069097042084e-05, 7.283966988325119e-05, 7.633864879608154e-05, 7.98376277089119e-05, 8.333660662174225e-05, 8.68355855345726e-05, 9.033456444740295e-05, 9.383354336023331e-05, 9.733252227306366e-05, 0.00010083150118589401, 0.00010433048009872437, 0.00010782945901155472, 0.00011132843792438507, 0.00011482741683721542, 0.00011832639575004578, 0.00012182537466287613, 0.00012532435357570648, 0.00012882333248853683, 0.0001323223114013672]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 1.0, 8.0, 7.0, 11.0, 12.0, 27.0, 27.0, 58.0, 71.0, 127.0, 223.0, 419.0, 795.0, 1909.0, 5176.0, 17029.0, 225274.0, 764033.0, 22752.0, 6262.0, 2294.0, 945.0, 447.0, 261.0, 135.0, 86.0, 45.0, 33.0, 25.0, 24.0, 7.0, 8.0, 5.0, 5.0, 6.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.5693359375, -0.5543899536132812, -0.5394439697265625, -0.5244979858398438, -0.509552001953125, -0.49460601806640625, -0.4796600341796875, -0.46471405029296875, -0.44976806640625, -0.43482208251953125, -0.4198760986328125, -0.40493011474609375, -0.389984130859375, -0.37503814697265625, -0.3600921630859375, -0.34514617919921875, -0.3302001953125, -0.31525421142578125, -0.3003082275390625, -0.28536224365234375, -0.270416259765625, -0.25547027587890625, -0.2405242919921875, -0.22557830810546875, -0.21063232421875, -0.19568634033203125, -0.1807403564453125, -0.16579437255859375, -0.150848388671875, -0.13590240478515625, -0.1209564208984375, -0.10601043701171875, -0.091064453125, -0.07611846923828125, -0.0611724853515625, -0.04622650146484375, -0.031280517578125, -0.01633453369140625, -0.0013885498046875, 0.01355743408203125, 0.02850341796875, 0.04344940185546875, 0.0583953857421875, 0.07334136962890625, 0.088287353515625, 0.10323333740234375, 0.1181793212890625, 0.13312530517578125, 0.1480712890625, 0.16301727294921875, 0.1779632568359375, 0.19290924072265625, 0.207855224609375, 0.22280120849609375, 0.2377471923828125, 0.25269317626953125, 0.26763916015625, 0.28258514404296875, 0.2975311279296875, 0.31247711181640625, 0.327423095703125, 0.34236907958984375, 0.3573150634765625, 0.37226104736328125, 0.38720703125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 6.0, 4.0, 3.0, 11.0, 11.0, 14.0, 21.0, 27.0, 49.0, 122.0, 444.0, 139.0, 54.0, 38.0, 18.0, 12.0, 6.0, 8.0, 8.0, 6.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4052734375, -0.3944816589355469, -0.38368988037109375, -0.3728981018066406, -0.3621063232421875, -0.3513145446777344, -0.34052276611328125, -0.3297309875488281, -0.318939208984375, -0.3081474304199219, -0.29735565185546875, -0.2865638732910156, -0.2757720947265625, -0.2649803161621094, -0.25418853759765625, -0.24339675903320312, -0.23260498046875, -0.22181320190429688, -0.21102142333984375, -0.20022964477539062, -0.1894378662109375, -0.17864608764648438, -0.16785430908203125, -0.15706253051757812, -0.146270751953125, -0.13547897338867188, -0.12468719482421875, -0.11389541625976562, -0.1031036376953125, -0.09231185913085938, -0.08152008056640625, -0.07072830200195312, -0.0599365234375, -0.049144744873046875, -0.03835296630859375, -0.027561187744140625, -0.0167694091796875, -0.005977630615234375, 0.00481414794921875, 0.015605926513671875, 0.026397705078125, 0.037189483642578125, 0.04798126220703125, 0.058773040771484375, 0.0695648193359375, 0.08035659790039062, 0.09114837646484375, 0.10194015502929688, 0.11273193359375, 0.12352371215820312, 0.13431549072265625, 0.14510726928710938, 0.1558990478515625, 0.16669082641601562, 0.17748260498046875, 0.18827438354492188, 0.199066162109375, 0.20985794067382812, 0.22064971923828125, 0.23144149780273438, 0.2422332763671875, 0.2530250549316406, 0.26381683349609375, 0.2746086120605469, 0.285400390625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 14.0, 23.0, 79.0, 121.0, 255.0, 217.0, 168.0, 77.0, 29.0, 10.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.621408939361572, -5.481589317321777, -5.341769695281982, -5.201949596405029, -5.062129974365234, -4.9223103523254395, -4.7824907302856445, -4.64267110824585, -4.502851486206055, -4.36303186416626, -4.223212242126465, -4.083392143249512, -3.943572521209717, -3.803752899169922, -3.663933277130127, -3.524113655090332, -3.384293556213379, -3.244473934173584, -3.10465407371521, -2.964834451675415, -2.825014591217041, -2.685194969177246, -2.545375347137451, -2.4055557250976562, -2.2657358646392822, -2.1259162425994873, -1.9860963821411133, -1.8462767601013184, -1.7064570188522339, -1.5666372776031494, -1.4268176555633545, -1.28699791431427, -1.1471786499023438, -1.0073589086532593, -0.8675392270088196, -0.7277195453643799, -0.5878998041152954, -0.44808006286621094, -0.30826038122177124, -0.16844069957733154, -0.02862095832824707, 0.11119875311851501, 0.2510184645652771, 0.3908381760120392, 0.5306578874588013, 0.6704776287078857, 0.8102973103523254, 0.9501169919967651, 1.0899367332458496, 1.229756474494934, 1.3695762157440186, 1.5093958377838135, 1.649215579032898, 1.7890353202819824, 1.9288549423217773, 2.0686745643615723, 2.2084944248199463, 2.348314046859741, 2.4881339073181152, 2.62795352935791, 2.767773151397705, 2.907593011856079, 3.047412633895874, 3.187232494354248, 3.327052116394043]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 6.0, 1.0, 7.0, 6.0, 12.0, 6.0, 8.0, 15.0, 15.0, 16.0, 20.0, 27.0, 21.0, 21.0, 27.0, 40.0, 28.0, 38.0, 39.0, 46.0, 48.0, 29.0, 50.0, 38.0, 37.0, 33.0, 38.0, 35.0, 39.0, 36.0, 34.0, 31.0, 15.0, 23.0, 9.0, 17.0, 13.0, 13.0, 23.0, 10.0, 5.0, 11.0, 3.0, 4.0, 4.0, 2.0, 2.0, 2.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.2642617225646973, -1.2237061262130737, -1.1831506490707397, -1.1425950527191162, -1.1020395755767822, -1.0614839792251587, -1.0209285020828247, -0.9803729057312012, -0.9398173689842224, -0.8992618322372437, -0.8587062954902649, -0.8181507587432861, -0.7775951623916626, -0.7370396852493286, -0.6964840888977051, -0.6559285521507263, -0.6153730154037476, -0.5748174786567688, -0.53426194190979, -0.4937063753604889, -0.45315083861351013, -0.41259530186653137, -0.3720397353172302, -0.33148419857025146, -0.2909286618232727, -0.25037312507629395, -0.209817573428154, -0.16926202178001404, -0.12870648503303528, -0.08815094828605652, -0.047595396637916565, -0.007039844989776611, 0.03351569175720215, 0.0740712359547615, 0.11462678015232086, 0.15518233180046082, 0.19573786854743958, 0.23629340529441833, 0.2768489718437195, 0.31740450859069824, 0.357960045337677, 0.39851558208465576, 0.4390711188316345, 0.47962668538093567, 0.5201822519302368, 0.5607377290725708, 0.6012933254241943, 0.6418488621711731, 0.6824043989181519, 0.7229599356651306, 0.7635154724121094, 0.8040710091590881, 0.8446265459060669, 0.8851821422576904, 0.9257376790046692, 0.966293215751648, 1.0068488121032715, 1.047404408454895, 1.087959885597229, 1.1285154819488525, 1.1690709590911865, 1.20962655544281, 1.250182032585144, 1.2907376289367676, 1.3312931060791016]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 9.0, 13.0, 9.0, 11.0, 14.0, 17.0, 27.0, 42.0, 51.0, 59.0, 96.0, 115.0, 210.0, 371.0, 546.0, 843.0, 1457.0, 2537.0, 4800.0, 10310.0, 24374.0, 75655.0, 810517.0, 3114533.0, 94877.0, 28500.0, 11608.0, 5564.0, 2919.0, 1621.0, 947.0, 556.0, 371.0, 229.0, 151.0, 100.0, 60.0, 35.0, 40.0, 21.0, 29.0, 10.0, 8.0, 9.0, 5.0, 7.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.279541015625, -0.2715721130371094, -0.26360321044921875, -0.2556343078613281, -0.2476654052734375, -0.23969650268554688, -0.23172760009765625, -0.22375869750976562, -0.215789794921875, -0.20782089233398438, -0.19985198974609375, -0.19188308715820312, -0.1839141845703125, -0.17594528198242188, -0.16797637939453125, -0.16000747680664062, -0.15203857421875, -0.14406967163085938, -0.13610076904296875, -0.12813186645507812, -0.1201629638671875, -0.11219406127929688, -0.10422515869140625, -0.09625625610351562, -0.088287353515625, -0.08031845092773438, -0.07234954833984375, -0.06438064575195312, -0.0564117431640625, -0.048442840576171875, -0.04047393798828125, -0.032505035400390625, -0.0245361328125, -0.016567230224609375, -0.00859832763671875, -0.000629425048828125, 0.0073394775390625, 0.015308380126953125, 0.02327728271484375, 0.031246185302734375, 0.039215087890625, 0.047183990478515625, 0.05515289306640625, 0.06312179565429688, 0.0710906982421875, 0.07905960083007812, 0.08702850341796875, 0.09499740600585938, 0.10296630859375, 0.11093521118164062, 0.11890411376953125, 0.12687301635742188, 0.1348419189453125, 0.14281082153320312, 0.15077972412109375, 0.15874862670898438, 0.166717529296875, 0.17468643188476562, 0.18265533447265625, 0.19062423706054688, 0.1985931396484375, 0.20656204223632812, 0.21453094482421875, 0.22249984741210938, 0.23046875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 4.0, 2.0, 2.0, 4.0, 5.0, 10.0, 9.0, 8.0, 17.0, 17.0, 20.0, 16.0, 26.0, 28.0, 34.0, 44.0, 41.0, 39.0, 48.0, 52.0, 47.0, 46.0, 32.0, 51.0, 39.0, 58.0, 45.0, 40.0, 32.0, 31.0, 31.0, 36.0, 22.0, 13.0, 14.0, 6.0, 10.0, 7.0, 8.0, 1.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06640625, -0.06442022323608398, -0.06243419647216797, -0.06044816970825195, -0.05846214294433594, -0.05647611618041992, -0.054490089416503906, -0.05250406265258789, -0.050518035888671875, -0.04853200912475586, -0.046545982360839844, -0.04455995559692383, -0.04257392883300781, -0.0405879020690918, -0.03860187530517578, -0.036615848541259766, -0.03462982177734375, -0.032643795013427734, -0.03065776824951172, -0.028671741485595703, -0.026685714721679688, -0.024699687957763672, -0.022713661193847656, -0.02072763442993164, -0.018741607666015625, -0.01675558090209961, -0.014769554138183594, -0.012783527374267578, -0.010797500610351562, -0.008811473846435547, -0.006825447082519531, -0.004839420318603516, -0.0028533935546875, -0.0008673667907714844, 0.0011186599731445312, 0.003104686737060547, 0.0050907135009765625, 0.007076740264892578, 0.009062767028808594, 0.01104879379272461, 0.013034820556640625, 0.01502084732055664, 0.017006874084472656, 0.018992900848388672, 0.020978927612304688, 0.022964954376220703, 0.02495098114013672, 0.026937007904052734, 0.02892303466796875, 0.030909061431884766, 0.03289508819580078, 0.0348811149597168, 0.03686714172363281, 0.03885316848754883, 0.040839195251464844, 0.04282522201538086, 0.044811248779296875, 0.04679727554321289, 0.048783302307128906, 0.05076932907104492, 0.05275535583496094, 0.05474138259887695, 0.05672740936279297, 0.058713436126708984, 0.060699462890625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 6.0, 2.0, 5.0, 7.0, 7.0, 9.0, 12.0, 22.0, 32.0, 45.0, 76.0, 103.0, 125.0, 232.0, 357.0, 616.0, 1223.0, 2294.0, 5417.0, 14938.0, 51274.0, 342935.0, 3589827.0, 137256.0, 30023.0, 9574.0, 3787.0, 1772.0, 947.0, 523.0, 303.0, 177.0, 112.0, 71.0, 62.0, 34.0, 19.0, 12.0, 18.0, 11.0, 9.0, 7.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.457275390625, -0.44467926025390625, -0.4320831298828125, -0.41948699951171875, -0.406890869140625, -0.39429473876953125, -0.3816986083984375, -0.36910247802734375, -0.35650634765625, -0.34391021728515625, -0.3313140869140625, -0.31871795654296875, -0.306121826171875, -0.29352569580078125, -0.2809295654296875, -0.26833343505859375, -0.2557373046875, -0.24314117431640625, -0.2305450439453125, -0.21794891357421875, -0.205352783203125, -0.19275665283203125, -0.1801605224609375, -0.16756439208984375, -0.15496826171875, -0.14237213134765625, -0.1297760009765625, -0.11717987060546875, -0.104583740234375, -0.09198760986328125, -0.0793914794921875, -0.06679534912109375, -0.05419921875, -0.04160308837890625, -0.0290069580078125, -0.01641082763671875, -0.003814697265625, 0.00878143310546875, 0.0213775634765625, 0.03397369384765625, 0.04656982421875, 0.05916595458984375, 0.0717620849609375, 0.08435821533203125, 0.096954345703125, 0.10955047607421875, 0.1221466064453125, 0.13474273681640625, 0.1473388671875, 0.15993499755859375, 0.1725311279296875, 0.18512725830078125, 0.197723388671875, 0.21031951904296875, 0.2229156494140625, 0.23551177978515625, 0.24810791015625, 0.26070404052734375, 0.2733001708984375, 0.28589630126953125, 0.298492431640625, 0.31108856201171875, 0.3236846923828125, 0.33628082275390625, 0.348876953125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 10.0, 4.0, 10.0, 14.0, 30.0, 33.0, 60.0, 84.0, 154.0, 580.0, 2321.0, 381.0, 153.0, 82.0, 50.0, 36.0, 21.0, 21.0, 4.0, 6.0, 4.0, 4.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2244873046875, -0.21848106384277344, -0.21247482299804688, -0.2064685821533203, -0.20046234130859375, -0.1944561004638672, -0.18844985961914062, -0.18244361877441406, -0.1764373779296875, -0.17043113708496094, -0.16442489624023438, -0.1584186553955078, -0.15241241455078125, -0.1464061737060547, -0.14039993286132812, -0.13439369201660156, -0.128387451171875, -0.12238121032714844, -0.11637496948242188, -0.11036872863769531, -0.10436248779296875, -0.09835624694824219, -0.09235000610351562, -0.08634376525878906, -0.0803375244140625, -0.07433128356933594, -0.06832504272460938, -0.06231880187988281, -0.05631256103515625, -0.05030632019042969, -0.044300079345703125, -0.03829383850097656, -0.03228759765625, -0.026281356811523438, -0.020275115966796875, -0.014268875122070312, -0.00826263427734375, -0.0022563934326171875, 0.003749847412109375, 0.009756088256835938, 0.0157623291015625, 0.021768569946289062, 0.027774810791015625, 0.03378105163574219, 0.03978729248046875, 0.04579353332519531, 0.051799774169921875, 0.05780601501464844, 0.063812255859375, 0.06981849670410156, 0.07582473754882812, 0.08183097839355469, 0.08783721923828125, 0.09384346008300781, 0.09984970092773438, 0.10585594177246094, 0.1118621826171875, 0.11786842346191406, 0.12387466430664062, 0.1298809051513672, 0.13588714599609375, 0.1418933868408203, 0.14789962768554688, 0.15390586853027344, 0.159912109375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 7.0, 10.0, 11.0, 14.0, 36.0, 42.0, 56.0, 113.0, 103.0, 129.0, 110.0, 125.0, 96.0, 51.0, 40.0, 18.0, 26.0, 7.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0710904598236084, -1.042158603668213, -1.0132266283035278, -0.9842947125434875, -0.9553627967834473, -0.9264309406280518, -0.8974990248680115, -0.8685671091079712, -0.8396351933479309, -0.8107032775878906, -0.7817713618278503, -0.7528394460678101, -0.7239075899124146, -0.6949756145477295, -0.666043758392334, -0.6371118426322937, -0.6081799268722534, -0.5792480111122131, -0.5503160953521729, -0.5213841795921326, -0.4924522936344147, -0.4635203778743744, -0.4345884919166565, -0.4056565761566162, -0.3767246603965759, -0.34779274463653564, -0.31886082887649536, -0.28992894291877747, -0.2609970271587372, -0.2320651113986969, -0.2031332105398178, -0.17420130968093872, -0.14526933431625366, -0.11633742600679398, -0.08740551769733429, -0.0584736093878746, -0.029541701078414917, -0.0006097853183746338, 0.028322115540504456, 0.057254016399383545, 0.08618593215942383, 0.11511784046888351, 0.1440497487783432, 0.1729816496372223, 0.20191356539726257, 0.23084548115730286, 0.25977736711502075, 0.28870928287506104, 0.3176411986351013, 0.3465731143951416, 0.3755050301551819, 0.4044369161128998, 0.43336883187294006, 0.46230074763298035, 0.49123263359069824, 0.5201645493507385, 0.5490964651107788, 0.5780283808708191, 0.6069602966308594, 0.6358922123908997, 0.6648241281509399, 0.6937559843063354, 0.7226879000663757, 0.751619815826416, 0.7805517315864563]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 7.0, 6.0, 7.0, 9.0, 10.0, 12.0, 10.0, 14.0, 29.0, 23.0, 24.0, 20.0, 27.0, 30.0, 29.0, 30.0, 30.0, 34.0, 28.0, 40.0, 38.0, 44.0, 40.0, 30.0, 45.0, 34.0, 35.0, 26.0, 25.0, 30.0, 25.0, 26.0, 15.0, 25.0, 19.0, 28.0, 19.0, 18.0, 11.0, 8.0, 10.0, 7.0, 8.0, 7.0, 4.0, 0.0, 0.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.42418307065963745, -0.41092607378959656, -0.3976690471172333, -0.3844120502471924, -0.3711550533771515, -0.3578980267047882, -0.3446410298347473, -0.33138400316238403, -0.31812700629234314, -0.30487000942230225, -0.29161298274993896, -0.27835598587989807, -0.2650989890098572, -0.2518419623374939, -0.238584965467453, -0.22532795369625092, -0.21207095682621002, -0.19881394505500793, -0.18555694818496704, -0.17229993641376495, -0.15904292464256287, -0.14578592777252197, -0.13252891600131989, -0.1192719042301178, -0.10601489990949631, -0.09275789558887482, -0.07950088381767273, -0.06624387949705124, -0.05298687145113945, -0.03972986340522766, -0.02647285908460617, -0.013215847313404083, 4.1157007217407227e-05, 0.013298164121806622, 0.026555171236395836, 0.039812177419662476, 0.053069185465574265, 0.06632619351148605, 0.07958319783210754, 0.09284020960330963, 0.10609721392393112, 0.11935421824455261, 0.1326112300157547, 0.1458682417869568, 0.15912523865699768, 0.17238225042819977, 0.18563926219940186, 0.19889625906944275, 0.21215327084064484, 0.22541028261184692, 0.23866727948188782, 0.2519242763519287, 0.265181303024292, 0.2784382998943329, 0.2916952967643738, 0.30495232343673706, 0.31820932030677795, 0.33146631717681885, 0.34472334384918213, 0.357980340719223, 0.3712373375892639, 0.3844943642616272, 0.3977513611316681, 0.411008358001709, 0.42426538467407227]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 2.0, 9.0, 11.0, 10.0, 12.0, 15.0, 14.0, 27.0, 44.0, 60.0, 94.0, 135.0, 212.0, 372.0, 598.0, 994.0, 1760.0, 3241.0, 6365.0, 12656.0, 26285.0, 61200.0, 219200.0, 493876.0, 134307.0, 45022.0, 20501.0, 10103.0, 5020.0, 2801.0, 1449.0, 767.0, 505.0, 293.0, 196.0, 113.0, 95.0, 55.0, 45.0, 23.0, 24.0, 16.0, 12.0, 11.0, 3.0, 2.0, 1.0, 1.0, 3.0], "bins": [-0.23486328125, -0.22873687744140625, -0.2226104736328125, -0.21648406982421875, -0.210357666015625, -0.20423126220703125, -0.1981048583984375, -0.19197845458984375, -0.18585205078125, -0.17972564697265625, -0.1735992431640625, -0.16747283935546875, -0.161346435546875, -0.15522003173828125, -0.1490936279296875, -0.14296722412109375, -0.1368408203125, -0.13071441650390625, -0.1245880126953125, -0.11846160888671875, -0.112335205078125, -0.10620880126953125, -0.1000823974609375, -0.09395599365234375, -0.08782958984375, -0.08170318603515625, -0.0755767822265625, -0.06945037841796875, -0.063323974609375, -0.05719757080078125, -0.0510711669921875, -0.04494476318359375, -0.038818359375, -0.03269195556640625, -0.0265655517578125, -0.02043914794921875, -0.014312744140625, -0.00818634033203125, -0.0020599365234375, 0.00406646728515625, 0.01019287109375, 0.01631927490234375, 0.0224456787109375, 0.02857208251953125, 0.034698486328125, 0.04082489013671875, 0.0469512939453125, 0.05307769775390625, 0.0592041015625, 0.06533050537109375, 0.0714569091796875, 0.07758331298828125, 0.083709716796875, 0.08983612060546875, 0.0959625244140625, 0.10208892822265625, 0.10821533203125, 0.11434173583984375, 0.1204681396484375, 0.12659454345703125, 0.132720947265625, 0.13884735107421875, 0.1449737548828125, 0.15110015869140625, 0.1572265625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 4.0, 3.0, 7.0, 3.0, 9.0, 8.0, 14.0, 19.0, 15.0, 26.0, 25.0, 31.0, 35.0, 39.0, 31.0, 46.0, 45.0, 50.0, 47.0, 61.0, 50.0, 49.0, 41.0, 42.0, 51.0, 38.0, 47.0, 31.0, 33.0, 18.0, 31.0, 11.0, 9.0, 13.0, 6.0, 5.0, 5.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08038330078125, -0.07811260223388672, -0.07584190368652344, -0.07357120513916016, -0.07130050659179688, -0.0690298080444336, -0.06675910949707031, -0.06448841094970703, -0.06221771240234375, -0.05994701385498047, -0.05767631530761719, -0.055405616760253906, -0.053134918212890625, -0.050864219665527344, -0.04859352111816406, -0.04632282257080078, -0.0440521240234375, -0.04178142547607422, -0.03951072692871094, -0.037240028381347656, -0.034969329833984375, -0.032698631286621094, -0.030427932739257812, -0.02815723419189453, -0.02588653564453125, -0.02361583709716797, -0.021345138549804688, -0.019074440002441406, -0.016803741455078125, -0.014533042907714844, -0.012262344360351562, -0.009991645812988281, -0.007720947265625, -0.005450248718261719, -0.0031795501708984375, -0.0009088516235351562, 0.001361846923828125, 0.0036325454711914062, 0.0059032440185546875, 0.008173942565917969, 0.01044464111328125, 0.012715339660644531, 0.014986038208007812, 0.017256736755371094, 0.019527435302734375, 0.021798133850097656, 0.024068832397460938, 0.02633953094482422, 0.0286102294921875, 0.03088092803955078, 0.03315162658691406, 0.035422325134277344, 0.037693023681640625, 0.039963722229003906, 0.04223442077636719, 0.04450511932373047, 0.04677581787109375, 0.04904651641845703, 0.05131721496582031, 0.053587913513183594, 0.055858612060546875, 0.058129310607910156, 0.06040000915527344, 0.06267070770263672, 0.06494140625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 6.0, 5.0, 5.0, 12.0, 17.0, 24.0, 28.0, 57.0, 78.0, 202.0, 301.0, 608.0, 1536.0, 4370.0, 13719.0, 53823.0, 783424.0, 152811.0, 25639.0, 7392.0, 2545.0, 980.0, 439.0, 221.0, 117.0, 65.0, 41.0, 23.0, 29.0, 15.0, 10.0, 3.0, 7.0, 6.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.54345703125, -0.5273513793945312, -0.5112457275390625, -0.49514007568359375, -0.479034423828125, -0.46292877197265625, -0.4468231201171875, -0.43071746826171875, -0.41461181640625, -0.39850616455078125, -0.3824005126953125, -0.36629486083984375, -0.350189208984375, -0.33408355712890625, -0.3179779052734375, -0.30187225341796875, -0.2857666015625, -0.26966094970703125, -0.2535552978515625, -0.23744964599609375, -0.221343994140625, -0.20523834228515625, -0.1891326904296875, -0.17302703857421875, -0.15692138671875, -0.14081573486328125, -0.1247100830078125, -0.10860443115234375, -0.092498779296875, -0.07639312744140625, -0.0602874755859375, -0.04418182373046875, -0.028076171875, -0.01197052001953125, 0.0041351318359375, 0.02024078369140625, 0.036346435546875, 0.05245208740234375, 0.0685577392578125, 0.08466339111328125, 0.10076904296875, 0.11687469482421875, 0.1329803466796875, 0.14908599853515625, 0.165191650390625, 0.18129730224609375, 0.1974029541015625, 0.21350860595703125, 0.2296142578125, 0.24571990966796875, 0.2618255615234375, 0.27793121337890625, 0.294036865234375, 0.31014251708984375, 0.3262481689453125, 0.34235382080078125, 0.35845947265625, 0.37456512451171875, 0.3906707763671875, 0.40677642822265625, 0.422882080078125, 0.43898773193359375, 0.4550933837890625, 0.47119903564453125, 0.4873046875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 4.0, 8.0, 4.0, 7.0, 12.0, 17.0, 19.0, 36.0, 52.0, 55.0, 60.0, 89.0, 73.0, 93.0, 93.0, 80.0, 64.0, 54.0, 45.0, 38.0, 27.0, 20.0, 10.0, 5.0, 12.0, 6.0, 1.0, 5.0, 2.0, 2.0, 3.0, 3.0, 0.0, 4.0, 1.0, 1.0, 1.0], "bins": [-0.65087890625, -0.6347808837890625, -0.618682861328125, -0.6025848388671875, -0.58648681640625, -0.5703887939453125, -0.554290771484375, -0.5381927490234375, -0.5220947265625, -0.5059967041015625, -0.489898681640625, -0.4738006591796875, -0.45770263671875, -0.4416046142578125, -0.425506591796875, -0.4094085693359375, -0.393310546875, -0.3772125244140625, -0.361114501953125, -0.3450164794921875, -0.32891845703125, -0.3128204345703125, -0.296722412109375, -0.2806243896484375, -0.2645263671875, -0.2484283447265625, -0.232330322265625, -0.2162322998046875, -0.20013427734375, -0.1840362548828125, -0.167938232421875, -0.1518402099609375, -0.1357421875, -0.1196441650390625, -0.103546142578125, -0.0874481201171875, -0.07135009765625, -0.0552520751953125, -0.039154052734375, -0.0230560302734375, -0.0069580078125, 0.0091400146484375, 0.025238037109375, 0.0413360595703125, 0.05743408203125, 0.0735321044921875, 0.089630126953125, 0.1057281494140625, 0.121826171875, 0.1379241943359375, 0.154022216796875, 0.1701202392578125, 0.18621826171875, 0.2023162841796875, 0.218414306640625, 0.2345123291015625, 0.2506103515625, 0.2667083740234375, 0.282806396484375, 0.2989044189453125, 0.31500244140625, 0.3311004638671875, 0.347198486328125, 0.3632965087890625, 0.37939453125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 6.0, 3.0, 6.0, 3.0, 8.0, 21.0, 13.0, 36.0, 45.0, 46.0, 87.0, 119.0, 157.0, 267.0, 401.0, 609.0, 1069.0, 1887.0, 3883.0, 10519.0, 37420.0, 688278.0, 258670.0, 28580.0, 8676.0, 3415.0, 1688.0, 931.0, 566.0, 371.0, 247.0, 158.0, 115.0, 87.0, 49.0, 38.0, 27.0, 14.0, 11.0, 7.0, 9.0, 11.0, 7.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.369384765625, -0.358489990234375, -0.34759521484375, -0.336700439453125, -0.3258056640625, -0.314910888671875, -0.30401611328125, -0.293121337890625, -0.2822265625, -0.271331787109375, -0.26043701171875, -0.249542236328125, -0.2386474609375, -0.227752685546875, -0.21685791015625, -0.205963134765625, -0.195068359375, -0.184173583984375, -0.17327880859375, -0.162384033203125, -0.1514892578125, -0.140594482421875, -0.12969970703125, -0.118804931640625, -0.10791015625, -0.097015380859375, -0.08612060546875, -0.075225830078125, -0.0643310546875, -0.053436279296875, -0.04254150390625, -0.031646728515625, -0.020751953125, -0.009857177734375, 0.00103759765625, 0.011932373046875, 0.0228271484375, 0.033721923828125, 0.04461669921875, 0.055511474609375, 0.06640625, 0.077301025390625, 0.08819580078125, 0.099090576171875, 0.1099853515625, 0.120880126953125, 0.13177490234375, 0.142669677734375, 0.153564453125, 0.164459228515625, 0.17535400390625, 0.186248779296875, 0.1971435546875, 0.208038330078125, 0.21893310546875, 0.229827880859375, 0.24072265625, 0.251617431640625, 0.26251220703125, 0.273406982421875, 0.2843017578125, 0.295196533203125, 0.30609130859375, 0.316986083984375, 0.327880859375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 5.0, 5.0, 7.0, 4.0, 11.0, 16.0, 26.0, 34.0, 109.0, 311.0, 288.0, 89.0, 39.0, 18.0, 14.0, 13.0, 8.0, 6.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001456737518310547, -0.00014095008373260498, -0.00013622641563415527, -0.00013150274753570557, -0.00012677907943725586, -0.00012205541133880615, -0.00011733174324035645, -0.00011260807514190674, -0.00010788440704345703, -0.00010316073894500732, -9.843707084655762e-05, -9.371340274810791e-05, -8.89897346496582e-05, -8.42660665512085e-05, -7.954239845275879e-05, -7.481873035430908e-05, -7.009506225585938e-05, -6.537139415740967e-05, -6.064772605895996e-05, -5.5924057960510254e-05, -5.120038986206055e-05, -4.647672176361084e-05, -4.175305366516113e-05, -3.7029385566711426e-05, -3.230571746826172e-05, -2.7582049369812012e-05, -2.2858381271362305e-05, -1.8134713172912598e-05, -1.341104507446289e-05, -8.687376976013184e-06, -3.9637088775634766e-06, 7.599592208862305e-07, 5.4836273193359375e-06, 1.0207295417785645e-05, 1.4930963516235352e-05, 1.965463161468506e-05, 2.4378299713134766e-05, 2.9101967811584473e-05, 3.382563591003418e-05, 3.854930400848389e-05, 4.3272972106933594e-05, 4.79966402053833e-05, 5.272030830383301e-05, 5.7443976402282715e-05, 6.216764450073242e-05, 6.689131259918213e-05, 7.161498069763184e-05, 7.633864879608154e-05, 8.106231689453125e-05, 8.578598499298096e-05, 9.050965309143066e-05, 9.523332118988037e-05, 9.995698928833008e-05, 0.00010468065738677979, 0.00010940432548522949, 0.0001141279935836792, 0.0001188516616821289, 0.0001235753297805786, 0.00012829899787902832, 0.00013302266597747803, 0.00013774633407592773, 0.00014247000217437744, 0.00014719367027282715, 0.00015191733837127686, 0.00015664100646972656]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 7.0, 2.0, 6.0, 3.0, 6.0, 10.0, 12.0, 12.0, 32.0, 34.0, 88.0, 84.0, 154.0, 238.0, 362.0, 512.0, 740.0, 1026.0, 1720.0, 3059.0, 6684.0, 17857.0, 74302.0, 829378.0, 78661.0, 18521.0, 6735.0, 3167.0, 1743.0, 1088.0, 699.0, 500.0, 368.0, 202.0, 175.0, 102.0, 83.0, 49.0, 44.0, 16.0, 18.0, 20.0, 10.0, 4.0, 0.0, 6.0, 1.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.34033203125, -0.3295326232910156, -0.31873321533203125, -0.3079338073730469, -0.2971343994140625, -0.2863349914550781, -0.27553558349609375, -0.2647361755371094, -0.253936767578125, -0.24313735961914062, -0.23233795166015625, -0.22153854370117188, -0.2107391357421875, -0.19993972778320312, -0.18914031982421875, -0.17834091186523438, -0.16754150390625, -0.15674209594726562, -0.14594268798828125, -0.13514328002929688, -0.1243438720703125, -0.11354446411132812, -0.10274505615234375, -0.09194564819335938, -0.081146240234375, -0.07034683227539062, -0.05954742431640625, -0.048748016357421875, -0.0379486083984375, -0.027149200439453125, -0.01634979248046875, -0.005550384521484375, 0.0052490234375, 0.016048431396484375, 0.02684783935546875, 0.037647247314453125, 0.0484466552734375, 0.059246063232421875, 0.07004547119140625, 0.08084487915039062, 0.091644287109375, 0.10244369506835938, 0.11324310302734375, 0.12404251098632812, 0.1348419189453125, 0.14564132690429688, 0.15644073486328125, 0.16724014282226562, 0.17803955078125, 0.18883895874023438, 0.19963836669921875, 0.21043777465820312, 0.2212371826171875, 0.23203659057617188, 0.24283599853515625, 0.2536354064941406, 0.264434814453125, 0.2752342224121094, 0.28603363037109375, 0.2968330383300781, 0.3076324462890625, 0.3184318542480469, 0.32923126220703125, 0.3400306701660156, 0.350830078125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 4.0, 8.0, 5.0, 10.0, 14.0, 14.0, 14.0, 32.0, 62.0, 178.0, 328.0, 139.0, 62.0, 35.0, 17.0, 16.0, 10.0, 14.0, 4.0, 5.0, 4.0, 8.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.36865234375, -0.3587989807128906, -0.34894561767578125, -0.3390922546386719, -0.3292388916015625, -0.3193855285644531, -0.30953216552734375, -0.2996788024902344, -0.289825439453125, -0.2799720764160156, -0.27011871337890625, -0.2602653503417969, -0.2504119873046875, -0.24055862426757812, -0.23070526123046875, -0.22085189819335938, -0.21099853515625, -0.20114517211914062, -0.19129180908203125, -0.18143844604492188, -0.1715850830078125, -0.16173171997070312, -0.15187835693359375, -0.14202499389648438, -0.132171630859375, -0.12231826782226562, -0.11246490478515625, -0.10261154174804688, -0.0927581787109375, -0.08290481567382812, -0.07305145263671875, -0.06319808959960938, -0.0533447265625, -0.043491363525390625, -0.03363800048828125, -0.023784637451171875, -0.0139312744140625, -0.004077911376953125, 0.00577545166015625, 0.015628814697265625, 0.025482177734375, 0.035335540771484375, 0.04518890380859375, 0.055042266845703125, 0.0648956298828125, 0.07474899291992188, 0.08460235595703125, 0.09445571899414062, 0.10430908203125, 0.11416244506835938, 0.12401580810546875, 0.13386917114257812, 0.1437225341796875, 0.15357589721679688, 0.16342926025390625, 0.17328262329101562, 0.183135986328125, 0.19298934936523438, 0.20284271240234375, 0.21269607543945312, 0.2225494384765625, 0.23240280151367188, 0.24225616455078125, 0.2521095275878906, 0.261962890625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 6.0, 5.0, 28.0, 37.0, 90.0, 139.0, 206.0, 215.0, 141.0, 74.0, 29.0, 26.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.804680109024048, -3.663499355316162, -3.5223186016082764, -3.3811378479003906, -3.239956855773926, -3.098776340484619, -2.9575953483581543, -2.8164145946502686, -2.675233840942383, -2.534053087234497, -2.3928723335266113, -2.2516915798187256, -2.11051082611084, -1.9693299531936646, -1.8281490802764893, -1.6869683265686035, -1.5457875728607178, -1.404606819152832, -1.2634260654449463, -1.122245192527771, -0.9810644388198853, -0.8398836851119995, -0.698702871799469, -0.5575220584869385, -0.41634130477905273, -0.2751605212688446, -0.13397973775863647, 0.007201045751571655, 0.14838182926177979, 0.2895625829696655, 0.43074339628219604, 0.5719242095947266, 0.7131052017211914, 0.8542859554290771, 0.9954667687416077, 1.1366475820541382, 1.277828335762024, 1.4190090894699097, 1.560189962387085, 1.7013707160949707, 1.8425514698028564, 1.9837322235107422, 2.124912977218628, 2.2660937309265137, 2.4072747230529785, 2.548455238342285, 2.68963623046875, 2.8308169841766357, 2.9719977378845215, 3.1131784915924072, 3.254359245300293, 3.3955399990081787, 3.5367207527160645, 3.6779017448425293, 3.819082498550415, 3.960263252258301, 4.101444244384766, 4.2426252365112305, 4.383805751800537, 4.524986743927002, 4.666167259216309, 4.807348251342773, 4.94852876663208, 5.089709758758545, 5.230890274047852]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 3.0, 5.0, 5.0, 9.0, 11.0, 8.0, 12.0, 16.0, 22.0, 27.0, 24.0, 22.0, 30.0, 35.0, 37.0, 33.0, 31.0, 38.0, 47.0, 41.0, 58.0, 42.0, 42.0, 38.0, 49.0, 35.0, 34.0, 33.0, 33.0, 28.0, 26.0, 18.0, 11.0, 22.0, 12.0, 15.0, 5.0, 10.0, 6.0, 4.0, 8.0, 6.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5043754577636719, -1.4553288221359253, -1.4062821865081787, -1.3572355508804321, -1.3081889152526855, -1.259142279624939, -1.2100956439971924, -1.1610491275787354, -1.1120023727416992, -1.0629557371139526, -1.013909101486206, -0.9648624658584595, -0.9158158302307129, -0.8667691946029663, -0.8177226185798645, -0.7686759829521179, -0.7196294069290161, -0.6705827713012695, -0.621536135673523, -0.5724895000457764, -0.5234428644180298, -0.4743962585926056, -0.4253496527671814, -0.3763030171394348, -0.32725638151168823, -0.27820974588394165, -0.22916312515735626, -0.18011650443077087, -0.1310698688030243, -0.08202323317527771, -0.032976627349853516, 0.016070008277893066, 0.06511664390563965, 0.11416327208280563, 0.16320990025997162, 0.212256520986557, 0.2613031566143036, 0.31034979224205017, 0.35939639806747437, 0.40844303369522095, 0.45748966932296753, 0.5065363049507141, 0.5555829405784607, 0.6046295166015625, 0.6536761522293091, 0.7027227878570557, 0.7517694234848022, 0.8008160591125488, 0.8498626947402954, 0.898909330368042, 0.9479559659957886, 0.9970026016235352, 1.0460492372512817, 1.0950958728790283, 1.1441423892974854, 1.1931891441345215, 1.2422356605529785, 1.291282296180725, 1.3403289318084717, 1.3893755674362183, 1.4384222030639648, 1.4874688386917114, 1.536515474319458, 1.585561990737915, 1.6346087455749512]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 1.0, 11.0, 10.0, 14.0, 23.0, 26.0, 37.0, 65.0, 83.0, 156.0, 215.0, 354.0, 674.0, 1249.0, 2543.0, 5499.0, 14515.0, 51157.0, 692791.0, 3331799.0, 64389.0, 16950.0, 6213.0, 2601.0, 1332.0, 651.0, 357.0, 191.0, 136.0, 81.0, 53.0, 39.0, 23.0, 12.0, 7.0, 11.0, 4.0, 3.0, 2.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.525390625, -0.5108261108398438, -0.4962615966796875, -0.48169708251953125, -0.467132568359375, -0.45256805419921875, -0.4380035400390625, -0.42343902587890625, -0.40887451171875, -0.39430999755859375, -0.3797454833984375, -0.36518096923828125, -0.350616455078125, -0.33605194091796875, -0.3214874267578125, -0.30692291259765625, -0.2923583984375, -0.27779388427734375, -0.2632293701171875, -0.24866485595703125, -0.234100341796875, -0.21953582763671875, -0.2049713134765625, -0.19040679931640625, -0.17584228515625, -0.16127777099609375, -0.1467132568359375, -0.13214874267578125, -0.117584228515625, -0.10301971435546875, -0.0884552001953125, -0.07389068603515625, -0.059326171875, -0.04476165771484375, -0.0301971435546875, -0.01563262939453125, -0.001068115234375, 0.01349639892578125, 0.0280609130859375, 0.04262542724609375, 0.05718994140625, 0.07175445556640625, 0.0863189697265625, 0.10088348388671875, 0.115447998046875, 0.13001251220703125, 0.1445770263671875, 0.15914154052734375, 0.1737060546875, 0.18827056884765625, 0.2028350830078125, 0.21739959716796875, 0.231964111328125, 0.24652862548828125, 0.2610931396484375, 0.27565765380859375, 0.29022216796875, 0.30478668212890625, 0.3193511962890625, 0.33391571044921875, 0.348480224609375, 0.36304473876953125, 0.3776092529296875, 0.39217376708984375, 0.40673828125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 6.0, 3.0, 4.0, 8.0, 14.0, 15.0, 12.0, 13.0, 21.0, 25.0, 25.0, 38.0, 36.0, 38.0, 51.0, 55.0, 44.0, 45.0, 40.0, 56.0, 36.0, 58.0, 39.0, 46.0, 49.0, 38.0, 30.0, 38.0, 23.0, 22.0, 23.0, 13.0, 4.0, 11.0, 13.0, 5.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.08831787109375, -0.08587169647216797, -0.08342552185058594, -0.0809793472290039, -0.07853317260742188, -0.07608699798583984, -0.07364082336425781, -0.07119464874267578, -0.06874847412109375, -0.06630229949951172, -0.06385612487792969, -0.061409950256347656, -0.058963775634765625, -0.056517601013183594, -0.05407142639160156, -0.05162525177001953, -0.0491790771484375, -0.04673290252685547, -0.04428672790527344, -0.041840553283691406, -0.039394378662109375, -0.036948204040527344, -0.03450202941894531, -0.03205585479736328, -0.02960968017578125, -0.02716350555419922, -0.024717330932617188, -0.022271156311035156, -0.019824981689453125, -0.017378807067871094, -0.014932632446289062, -0.012486457824707031, -0.010040283203125, -0.007594108581542969, -0.0051479339599609375, -0.0027017593383789062, -0.000255584716796875, 0.0021905899047851562, 0.0046367645263671875, 0.007082939147949219, 0.00952911376953125, 0.011975288391113281, 0.014421463012695312, 0.016867637634277344, 0.019313812255859375, 0.021759986877441406, 0.024206161499023438, 0.02665233612060547, 0.0290985107421875, 0.03154468536376953, 0.03399085998535156, 0.036437034606933594, 0.038883209228515625, 0.041329383850097656, 0.04377555847167969, 0.04622173309326172, 0.04866790771484375, 0.05111408233642578, 0.05356025695800781, 0.056006431579589844, 0.058452606201171875, 0.060898780822753906, 0.06334495544433594, 0.06579113006591797, 0.0682373046875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 14.0, 20.0, 23.0, 28.0, 48.0, 62.0, 76.0, 121.0, 200.0, 286.0, 448.0, 639.0, 972.0, 1637.0, 2577.0, 4430.0, 8439.0, 18132.0, 48368.0, 219672.0, 3604008.0, 200659.0, 46226.0, 17715.0, 8248.0, 4358.0, 2551.0, 1518.0, 966.0, 551.0, 400.0, 288.0, 170.0, 125.0, 93.0, 73.0, 45.0, 39.0, 22.0, 14.0, 8.0, 8.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44970703125, -0.4349517822265625, -0.420196533203125, -0.4054412841796875, -0.39068603515625, -0.3759307861328125, -0.361175537109375, -0.3464202880859375, -0.3316650390625, -0.3169097900390625, -0.302154541015625, -0.2873992919921875, -0.27264404296875, -0.2578887939453125, -0.243133544921875, -0.2283782958984375, -0.213623046875, -0.1988677978515625, -0.184112548828125, -0.1693572998046875, -0.15460205078125, -0.1398468017578125, -0.125091552734375, -0.1103363037109375, -0.0955810546875, -0.0808258056640625, -0.066070556640625, -0.0513153076171875, -0.03656005859375, -0.0218048095703125, -0.007049560546875, 0.0077056884765625, 0.0224609375, 0.0372161865234375, 0.051971435546875, 0.0667266845703125, 0.08148193359375, 0.0962371826171875, 0.110992431640625, 0.1257476806640625, 0.1405029296875, 0.1552581787109375, 0.170013427734375, 0.1847686767578125, 0.19952392578125, 0.2142791748046875, 0.229034423828125, 0.2437896728515625, 0.258544921875, 0.2733001708984375, 0.288055419921875, 0.3028106689453125, 0.31756591796875, 0.3323211669921875, 0.347076416015625, 0.3618316650390625, 0.3765869140625, 0.3913421630859375, 0.406097412109375, 0.4208526611328125, 0.43560791015625, 0.4503631591796875, 0.465118408203125, 0.4798736572265625, 0.49462890625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 2.0, 3.0, 5.0, 1.0, 4.0, 3.0, 9.0, 10.0, 9.0, 12.0, 22.0, 30.0, 33.0, 61.0, 108.0, 304.0, 2340.0, 643.0, 196.0, 96.0, 55.0, 37.0, 23.0, 15.0, 14.0, 12.0, 8.0, 2.0, 3.0, 4.0, 7.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2193603515625, -0.21198463439941406, -0.20460891723632812, -0.1972332000732422, -0.18985748291015625, -0.1824817657470703, -0.17510604858398438, -0.16773033142089844, -0.1603546142578125, -0.15297889709472656, -0.14560317993164062, -0.1382274627685547, -0.13085174560546875, -0.12347602844238281, -0.11610031127929688, -0.10872459411621094, -0.101348876953125, -0.09397315979003906, -0.08659744262695312, -0.07922172546386719, -0.07184600830078125, -0.06447029113769531, -0.057094573974609375, -0.04971885681152344, -0.0423431396484375, -0.03496742248535156, -0.027591705322265625, -0.020215988159179688, -0.01284027099609375, -0.0054645538330078125, 0.001911163330078125, 0.009286880493164062, 0.01666259765625, 0.024038314819335938, 0.031414031982421875, 0.03878974914550781, 0.04616546630859375, 0.05354118347167969, 0.060916900634765625, 0.06829261779785156, 0.0756683349609375, 0.08304405212402344, 0.09041976928710938, 0.09779548645019531, 0.10517120361328125, 0.11254692077636719, 0.11992263793945312, 0.12729835510253906, 0.134674072265625, 0.14204978942871094, 0.14942550659179688, 0.1568012237548828, 0.16417694091796875, 0.1715526580810547, 0.17892837524414062, 0.18630409240722656, 0.1936798095703125, 0.20105552673339844, 0.20843124389648438, 0.2158069610595703, 0.22318267822265625, 0.2305583953857422, 0.23793411254882812, 0.24530982971191406, 0.252685546875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 6.0, 10.0, 21.0, 41.0, 69.0, 87.0, 124.0, 144.0, 156.0, 110.0, 86.0, 62.0, 34.0, 25.0, 14.0, 5.0, 1.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8972572684288025, -0.8539426922798157, -0.8106281757354736, -0.7673135995864868, -0.7239990234375, -0.6806844472885132, -0.6373698711395264, -0.5940553545951843, -0.5507407784461975, -0.5074262022972107, -0.46411165595054626, -0.42079710960388184, -0.377482533454895, -0.3341679573059082, -0.2908534109592438, -0.24753886461257935, -0.20422428846359253, -0.1609097272157669, -0.11759516596794128, -0.07428060472011566, -0.03096604347229004, 0.012348517775535583, 0.055663079023361206, 0.09897762537002563, 0.14229220151901245, 0.18560676276683807, 0.2289213240146637, 0.2722358703613281, 0.31555044651031494, 0.35886502265930176, 0.4021795690059662, 0.4454941153526306, 0.48880863189697266, 0.5321232080459595, 0.5754377841949463, 0.6187523007392883, 0.6620668768882751, 0.705381453037262, 0.748695969581604, 0.7920105457305908, 0.8353251218795776, 0.8786396980285645, 0.9219542741775513, 0.9652687907218933, 1.0085833072662354, 1.0518978834152222, 1.095212459564209, 1.1385270357131958, 1.1818416118621826, 1.2251561880111694, 1.2684707641601562, 1.311785340309143, 1.3550999164581299, 1.3984143733978271, 1.441728949546814, 1.4850435256958008, 1.5283581018447876, 1.5716726779937744, 1.6149872541427612, 1.658301830291748, 1.7016162872314453, 1.7449308633804321, 1.788245439529419, 1.8315600156784058, 1.8748745918273926]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 7.0, 9.0, 11.0, 11.0, 11.0, 12.0, 10.0, 16.0, 20.0, 11.0, 25.0, 21.0, 30.0, 33.0, 27.0, 30.0, 53.0, 39.0, 40.0, 39.0, 45.0, 48.0, 32.0, 35.0, 33.0, 35.0, 35.0, 36.0, 19.0, 27.0, 26.0, 30.0, 17.0, 19.0, 23.0, 16.0, 13.0, 16.0, 10.0, 5.0, 8.0, 4.0, 2.0, 7.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.5524599552154541, -0.5349141359329224, -0.5173683166503906, -0.4998224973678589, -0.48227664828300476, -0.464730829000473, -0.4471850097179413, -0.42963919043540955, -0.4120933413505554, -0.3945475220680237, -0.37700170278549194, -0.3594558835029602, -0.3419100344181061, -0.32436421513557434, -0.3068183958530426, -0.28927257657051086, -0.2717267572879791, -0.2541809380054474, -0.23663510382175446, -0.21908928453922272, -0.20154345035552979, -0.18399763107299805, -0.1664518117904663, -0.14890599250793457, -0.13136015832424164, -0.1138143315911293, -0.09626850485801697, -0.07872268557548523, -0.061176858842372894, -0.04363103210926056, -0.02608521282672882, -0.008539386093616486, 0.00900644063949585, 0.026552265509963036, 0.04409809038043022, 0.06164391338825226, 0.0791897401213646, 0.09673556685447693, 0.11428138613700867, 0.1318272054195404, 0.14937303960323334, 0.16691885888576508, 0.184464693069458, 0.20201051235198975, 0.21955633163452148, 0.23710216581821442, 0.25464797019958496, 0.2721938192844391, 0.2897396385669708, 0.30728545784950256, 0.3248312771320343, 0.3423771262168884, 0.35992294549942017, 0.3774687647819519, 0.39501458406448364, 0.4125604033470154, 0.4301062226295471, 0.44765204191207886, 0.4651978611946106, 0.48274368047714233, 0.5002894997596741, 0.5178353786468506, 0.5353811979293823, 0.5529270172119141, 0.5704728364944458]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 6.0, 4.0, 4.0, 2.0, 7.0, 6.0, 14.0, 24.0, 19.0, 46.0, 49.0, 93.0, 91.0, 185.0, 257.0, 436.0, 651.0, 1039.0, 1705.0, 2930.0, 4793.0, 8325.0, 14451.0, 25542.0, 46654.0, 88678.0, 190621.0, 312192.0, 169476.0, 80725.0, 43242.0, 23781.0, 13584.0, 7601.0, 4408.0, 2596.0, 1556.0, 973.0, 647.0, 372.0, 269.0, 164.0, 103.0, 80.0, 43.0, 46.0, 22.0, 18.0, 10.0, 9.0, 3.0, 6.0, 3.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1846923828125, -0.17862319946289062, -0.17255401611328125, -0.16648483276367188, -0.1604156494140625, -0.15434646606445312, -0.14827728271484375, -0.14220809936523438, -0.136138916015625, -0.13006973266601562, -0.12400054931640625, -0.11793136596679688, -0.1118621826171875, -0.10579299926757812, -0.09972381591796875, -0.09365463256835938, -0.08758544921875, -0.08151626586914062, -0.07544708251953125, -0.06937789916992188, -0.0633087158203125, -0.057239532470703125, -0.05117034912109375, -0.045101165771484375, -0.039031982421875, -0.032962799072265625, -0.02689361572265625, -0.020824432373046875, -0.0147552490234375, -0.008686065673828125, -0.00261688232421875, 0.003452301025390625, 0.009521484375, 0.015590667724609375, 0.02165985107421875, 0.027729034423828125, 0.0337982177734375, 0.039867401123046875, 0.04593658447265625, 0.052005767822265625, 0.058074951171875, 0.06414413452148438, 0.07021331787109375, 0.07628250122070312, 0.0823516845703125, 0.08842086791992188, 0.09449005126953125, 0.10055923461914062, 0.10662841796875, 0.11269760131835938, 0.11876678466796875, 0.12483596801757812, 0.1309051513671875, 0.13697433471679688, 0.14304351806640625, 0.14911270141601562, 0.155181884765625, 0.16125106811523438, 0.16732025146484375, 0.17338943481445312, 0.1794586181640625, 0.18552780151367188, 0.19159698486328125, 0.19766616821289062, 0.2037353515625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 6.0, 9.0, 7.0, 8.0, 9.0, 15.0, 10.0, 18.0, 19.0, 24.0, 24.0, 18.0, 36.0, 29.0, 33.0, 50.0, 52.0, 40.0, 51.0, 37.0, 31.0, 41.0, 44.0, 33.0, 40.0, 41.0, 50.0, 38.0, 31.0, 22.0, 27.0, 21.0, 18.0, 22.0, 9.0, 9.0, 11.0, 7.0, 5.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0819091796875, -0.07945442199707031, -0.07699966430664062, -0.07454490661621094, -0.07209014892578125, -0.06963539123535156, -0.06718063354492188, -0.06472587585449219, -0.0622711181640625, -0.05981636047363281, -0.057361602783203125, -0.05490684509277344, -0.05245208740234375, -0.04999732971191406, -0.047542572021484375, -0.04508781433105469, -0.042633056640625, -0.04017829895019531, -0.037723541259765625, -0.03526878356933594, -0.03281402587890625, -0.030359268188476562, -0.027904510498046875, -0.025449752807617188, -0.0229949951171875, -0.020540237426757812, -0.018085479736328125, -0.015630722045898438, -0.01317596435546875, -0.010721206665039062, -0.008266448974609375, -0.0058116912841796875, -0.00335693359375, -0.0009021759033203125, 0.001552581787109375, 0.0040073394775390625, 0.00646209716796875, 0.008916854858398438, 0.011371612548828125, 0.013826370239257812, 0.0162811279296875, 0.018735885620117188, 0.021190643310546875, 0.023645401000976562, 0.02610015869140625, 0.028554916381835938, 0.031009674072265625, 0.03346443176269531, 0.035919189453125, 0.03837394714355469, 0.040828704833984375, 0.04328346252441406, 0.04573822021484375, 0.04819297790527344, 0.050647735595703125, 0.05310249328613281, 0.0555572509765625, 0.05801200866699219, 0.060466766357421875, 0.06292152404785156, 0.06537628173828125, 0.06783103942871094, 0.07028579711914062, 0.07274055480957031, 0.0751953125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 9.0, 3.0, 9.0, 23.0, 16.0, 29.0, 28.0, 39.0, 59.0, 97.0, 161.0, 215.0, 307.0, 489.0, 837.0, 1556.0, 3521.0, 8939.0, 26640.0, 89165.0, 437279.0, 361724.0, 78566.0, 23545.0, 8218.0, 3346.0, 1545.0, 766.0, 471.0, 291.0, 181.0, 138.0, 94.0, 86.0, 36.0, 32.0, 28.0, 17.0, 15.0, 10.0, 4.0, 7.0, 4.0, 5.0, 1.0, 1.0, 0.0, 3.0, 3.0], "bins": [-0.455322265625, -0.442657470703125, -0.42999267578125, -0.417327880859375, -0.4046630859375, -0.391998291015625, -0.37933349609375, -0.366668701171875, -0.35400390625, -0.341339111328125, -0.32867431640625, -0.316009521484375, -0.3033447265625, -0.290679931640625, -0.27801513671875, -0.265350341796875, -0.252685546875, -0.240020751953125, -0.22735595703125, -0.214691162109375, -0.2020263671875, -0.189361572265625, -0.17669677734375, -0.164031982421875, -0.1513671875, -0.138702392578125, -0.12603759765625, -0.113372802734375, -0.1007080078125, -0.088043212890625, -0.07537841796875, -0.062713623046875, -0.050048828125, -0.037384033203125, -0.02471923828125, -0.012054443359375, 0.0006103515625, 0.013275146484375, 0.02593994140625, 0.038604736328125, 0.05126953125, 0.063934326171875, 0.07659912109375, 0.089263916015625, 0.1019287109375, 0.114593505859375, 0.12725830078125, 0.139923095703125, 0.152587890625, 0.165252685546875, 0.17791748046875, 0.190582275390625, 0.2032470703125, 0.215911865234375, 0.22857666015625, 0.241241455078125, 0.25390625, 0.266571044921875, 0.27923583984375, 0.291900634765625, 0.3045654296875, 0.317230224609375, 0.32989501953125, 0.342559814453125, 0.355224609375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 5.0, 7.0, 10.0, 5.0, 18.0, 10.0, 16.0, 20.0, 22.0, 31.0, 27.0, 39.0, 44.0, 34.0, 49.0, 55.0, 50.0, 58.0, 49.0, 41.0, 45.0, 41.0, 48.0, 39.0, 37.0, 31.0, 25.0, 24.0, 26.0, 24.0, 16.0, 10.0, 11.0, 4.0, 9.0, 9.0, 3.0, 5.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.379638671875, -0.3658714294433594, -0.35210418701171875, -0.3383369445800781, -0.3245697021484375, -0.3108024597167969, -0.29703521728515625, -0.2832679748535156, -0.269500732421875, -0.2557334899902344, -0.24196624755859375, -0.22819900512695312, -0.2144317626953125, -0.20066452026367188, -0.18689727783203125, -0.17313003540039062, -0.15936279296875, -0.14559555053710938, -0.13182830810546875, -0.11806106567382812, -0.1042938232421875, -0.09052658081054688, -0.07675933837890625, -0.06299209594726562, -0.049224853515625, -0.035457611083984375, -0.02169036865234375, -0.007923126220703125, 0.0058441162109375, 0.019611358642578125, 0.03337860107421875, 0.047145843505859375, 0.0609130859375, 0.07468032836914062, 0.08844757080078125, 0.10221481323242188, 0.1159820556640625, 0.12974929809570312, 0.14351654052734375, 0.15728378295898438, 0.171051025390625, 0.18481826782226562, 0.19858551025390625, 0.21235275268554688, 0.2261199951171875, 0.23988723754882812, 0.25365447998046875, 0.2674217224121094, 0.28118896484375, 0.2949562072753906, 0.30872344970703125, 0.3224906921386719, 0.3362579345703125, 0.3500251770019531, 0.36379241943359375, 0.3775596618652344, 0.391326904296875, 0.4050941467285156, 0.41886138916015625, 0.4326286315917969, 0.4463958740234375, 0.4601631164550781, 0.47393035888671875, 0.4876976013183594, 0.50146484375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 11.0, 9.0, 16.0, 21.0, 27.0, 48.0, 61.0, 80.0, 147.0, 221.0, 275.0, 453.0, 858.0, 1643.0, 3606.0, 10581.0, 43776.0, 343158.0, 564245.0, 57702.0, 13039.0, 4306.0, 1844.0, 878.0, 561.0, 340.0, 199.0, 138.0, 111.0, 66.0, 45.0, 22.0, 25.0, 17.0, 7.0, 12.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.302490234375, -0.29132080078125, -0.2801513671875, -0.26898193359375, -0.2578125, -0.24664306640625, -0.2354736328125, -0.22430419921875, -0.213134765625, -0.20196533203125, -0.1907958984375, -0.17962646484375, -0.16845703125, -0.15728759765625, -0.1461181640625, -0.13494873046875, -0.123779296875, -0.11260986328125, -0.1014404296875, -0.09027099609375, -0.0791015625, -0.06793212890625, -0.0567626953125, -0.04559326171875, -0.034423828125, -0.02325439453125, -0.0120849609375, -0.00091552734375, 0.01025390625, 0.02142333984375, 0.0325927734375, 0.04376220703125, 0.054931640625, 0.06610107421875, 0.0772705078125, 0.08843994140625, 0.099609375, 0.11077880859375, 0.1219482421875, 0.13311767578125, 0.144287109375, 0.15545654296875, 0.1666259765625, 0.17779541015625, 0.18896484375, 0.20013427734375, 0.2113037109375, 0.22247314453125, 0.233642578125, 0.24481201171875, 0.2559814453125, 0.26715087890625, 0.2783203125, 0.28948974609375, 0.3006591796875, 0.31182861328125, 0.322998046875, 0.33416748046875, 0.3453369140625, 0.35650634765625, 0.36767578125, 0.37884521484375, 0.3900146484375, 0.40118408203125, 0.412353515625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 5.0, 6.0, 8.0, 13.0, 27.0, 41.0, 55.0, 98.0, 150.0, 243.0, 150.0, 89.0, 49.0, 31.0, 17.0, 5.0, 6.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014066696166992188, -0.00013689789921045303, -0.0001331288367509842, -0.00012935977429151535, -0.0001255907118320465, -0.00012182164937257767, -0.00011805258691310883, -0.00011428352445363998, -0.00011051446199417114, -0.0001067453995347023, -0.00010297633707523346, -9.920727461576462e-05, -9.543821215629578e-05, -9.166914969682693e-05, -8.79000872373581e-05, -8.413102477788925e-05, -8.036196231842041e-05, -7.659289985895157e-05, -7.282383739948273e-05, -6.905477494001389e-05, -6.528571248054504e-05, -6.15166500210762e-05, -5.774758756160736e-05, -5.397852510213852e-05, -5.020946264266968e-05, -4.6440400183200836e-05, -4.2671337723731995e-05, -3.890227526426315e-05, -3.513321280479431e-05, -3.136415034532547e-05, -2.759508788585663e-05, -2.3826025426387787e-05, -2.0056962966918945e-05, -1.6287900507450104e-05, -1.2518838047981262e-05, -8.74977558851242e-06, -4.980713129043579e-06, -1.2116506695747375e-06, 2.557411789894104e-06, 6.3264742493629456e-06, 1.0095536708831787e-05, 1.3864599168300629e-05, 1.763366162776947e-05, 2.1402724087238312e-05, 2.5171786546707153e-05, 2.8940849006175995e-05, 3.2709911465644836e-05, 3.647897392511368e-05, 4.024803638458252e-05, 4.401709884405136e-05, 4.77861613035202e-05, 5.1555223762989044e-05, 5.5324286222457886e-05, 5.909334868192673e-05, 6.286241114139557e-05, 6.663147360086441e-05, 7.040053606033325e-05, 7.41695985198021e-05, 7.793866097927094e-05, 8.170772343873978e-05, 8.547678589820862e-05, 8.924584835767746e-05, 9.30149108171463e-05, 9.678397327661514e-05, 0.00010055303573608398]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 1.0, 8.0, 4.0, 4.0, 8.0, 8.0, 10.0, 15.0, 29.0, 46.0, 63.0, 117.0, 209.0, 349.0, 626.0, 1273.0, 2605.0, 6917.0, 23644.0, 130796.0, 714788.0, 130835.0, 23705.0, 7060.0, 2647.0, 1220.0, 664.0, 378.0, 190.0, 129.0, 77.0, 45.0, 25.0, 15.0, 14.0, 11.0, 6.0, 2.0, 4.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.377197265625, -0.36483001708984375, -0.3524627685546875, -0.34009552001953125, -0.327728271484375, -0.31536102294921875, -0.3029937744140625, -0.29062652587890625, -0.27825927734375, -0.26589202880859375, -0.2535247802734375, -0.24115753173828125, -0.228790283203125, -0.21642303466796875, -0.2040557861328125, -0.19168853759765625, -0.1793212890625, -0.16695404052734375, -0.1545867919921875, -0.14221954345703125, -0.129852294921875, -0.11748504638671875, -0.1051177978515625, -0.09275054931640625, -0.08038330078125, -0.06801605224609375, -0.0556488037109375, -0.04328155517578125, -0.030914306640625, -0.01854705810546875, -0.0061798095703125, 0.00618743896484375, 0.0185546875, 0.03092193603515625, 0.0432891845703125, 0.05565643310546875, 0.068023681640625, 0.08039093017578125, 0.0927581787109375, 0.10512542724609375, 0.11749267578125, 0.12985992431640625, 0.1422271728515625, 0.15459442138671875, 0.166961669921875, 0.17932891845703125, 0.1916961669921875, 0.20406341552734375, 0.2164306640625, 0.22879791259765625, 0.2411651611328125, 0.25353240966796875, 0.265899658203125, 0.27826690673828125, 0.2906341552734375, 0.30300140380859375, 0.31536865234375, 0.32773590087890625, 0.3401031494140625, 0.35247039794921875, 0.364837646484375, 0.37720489501953125, 0.3895721435546875, 0.40193939208984375, 0.414306640625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 5.0, 7.0, 11.0, 4.0, 20.0, 10.0, 25.0, 32.0, 44.0, 61.0, 88.0, 131.0, 137.0, 122.0, 77.0, 59.0, 43.0, 37.0, 25.0, 12.0, 14.0, 7.0, 7.0, 7.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25390625, -0.24465560913085938, -0.23540496826171875, -0.22615432739257812, -0.2169036865234375, -0.20765304565429688, -0.19840240478515625, -0.18915176391601562, -0.179901123046875, -0.17065048217773438, -0.16139984130859375, -0.15214920043945312, -0.1428985595703125, -0.13364791870117188, -0.12439727783203125, -0.11514663696289062, -0.10589599609375, -0.09664535522460938, -0.08739471435546875, -0.07814407348632812, -0.0688934326171875, -0.059642791748046875, -0.05039215087890625, -0.041141510009765625, -0.031890869140625, -0.022640228271484375, -0.01338958740234375, -0.004138946533203125, 0.0051116943359375, 0.014362335205078125, 0.02361297607421875, 0.032863616943359375, 0.0421142578125, 0.051364898681640625, 0.06061553955078125, 0.06986618041992188, 0.0791168212890625, 0.08836746215820312, 0.09761810302734375, 0.10686874389648438, 0.116119384765625, 0.12537002563476562, 0.13462066650390625, 0.14387130737304688, 0.1531219482421875, 0.16237258911132812, 0.17162322998046875, 0.18087387084960938, 0.19012451171875, 0.19937515258789062, 0.20862579345703125, 0.21787643432617188, 0.2271270751953125, 0.23637771606445312, 0.24562835693359375, 0.2548789978027344, 0.264129638671875, 0.2733802795410156, 0.28263092041015625, 0.2918815612792969, 0.3011322021484375, 0.3103828430175781, 0.31963348388671875, 0.3288841247558594, 0.338134765625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 7.0, 13.0, 84.0, 165.0, 313.0, 268.0, 105.0, 37.0, 8.0, 5.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7446107864379883, -3.470951795578003, -3.1972928047180176, -2.9236338138580322, -2.649974822998047, -2.3763158321380615, -2.102656841278076, -1.8289978504180908, -1.5553388595581055, -1.2816798686981201, -1.0080208778381348, -0.7343618869781494, -0.46070289611816406, -0.1870439052581787, 0.08661508560180664, 0.360274076461792, 0.6339330673217773, 0.9075920581817627, 1.181251049041748, 1.4549100399017334, 1.7285690307617188, 2.002228021621704, 2.2758870124816895, 2.549546003341675, 2.82320499420166, 3.0968639850616455, 3.370522975921631, 3.644181966781616, 3.9178409576416016, 4.191499710083008, 4.465158939361572, 4.738818168640137, 5.012475967407227, 5.286134719848633, 5.559793949127197, 5.833453178405762, 6.107111930847168, 6.380770683288574, 6.654429912567139, 6.928089141845703, 7.201747894287109, 7.475406646728516, 7.74906587600708, 8.022725105285645, 8.29638385772705, 8.570042610168457, 8.84370231628418, 9.117361068725586, 9.391019821166992, 9.664678573608398, 9.938337326049805, 10.211997032165527, 10.485655784606934, 10.75931453704834, 11.032974243164062, 11.306632995605469, 11.580291748046875, 11.853950500488281, 12.127609252929688, 12.40126895904541, 12.674927711486816, 12.948586463928223, 13.222246170043945, 13.495904922485352, 13.769563674926758]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 1.0, 6.0, 4.0, 4.0, 7.0, 12.0, 9.0, 9.0, 20.0, 15.0, 16.0, 17.0, 27.0, 32.0, 31.0, 36.0, 50.0, 47.0, 50.0, 49.0, 40.0, 51.0, 35.0, 39.0, 31.0, 45.0, 33.0, 37.0, 40.0, 29.0, 37.0, 26.0, 22.0, 21.0, 18.0, 20.0, 9.0, 5.0, 7.0, 4.0, 3.0, 6.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.277494430541992, -2.2030272483825684, -2.1285598278045654, -2.0540926456451416, -1.9796253442764282, -1.9051580429077148, -1.830690860748291, -1.7562235593795776, -1.6817562580108643, -1.6072889566421509, -1.532821774482727, -1.4583544731140137, -1.3838871717453003, -1.309419870376587, -1.234952688217163, -1.1604853868484497, -1.0860182046890259, -1.0115509033203125, -0.9370836615562439, -0.8626164197921753, -0.7881491184234619, -0.7136818766593933, -0.6392146348953247, -0.5647473335266113, -0.4902800917625427, -0.41581282019615173, -0.34134554862976074, -0.26687830686569214, -0.19241103529930115, -0.11794376373291016, -0.04347652196884155, 0.030990779399871826, 0.10545802116394043, 0.17992529273033142, 0.2543925642967224, 0.328859806060791, 0.403327077627182, 0.477794349193573, 0.5522615909576416, 0.626728892326355, 0.7011961340904236, 0.7756633758544922, 0.8501306772232056, 0.9245979189872742, 0.9990651607513428, 1.0735324621200562, 1.1479997634887695, 1.2224669456481934, 1.2969342470169067, 1.3714015483856201, 1.445868730545044, 1.5203360319137573, 1.5948033332824707, 1.6692705154418945, 1.743737816810608, 1.8182051181793213, 1.8926723003387451, 1.9671396017074585, 2.041606903076172, 2.1160740852355957, 2.1905412673950195, 2.2650086879730225, 2.3394758701324463, 2.413943290710449, 2.488410472869873]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 6.0, 8.0, 9.0, 6.0, 14.0, 14.0, 20.0, 29.0, 38.0, 52.0, 92.0, 106.0, 181.0, 213.0, 310.0, 424.0, 680.0, 1043.0, 1646.0, 2768.0, 4803.0, 9031.0, 19490.0, 52281.0, 239593.0, 3558583.0, 212822.0, 50300.0, 19098.0, 8816.0, 4683.0, 2631.0, 1512.0, 983.0, 686.0, 442.0, 285.0, 172.0, 132.0, 77.0, 59.0, 50.0, 34.0, 25.0, 13.0, 12.0, 7.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.40283203125, -0.3914756774902344, -0.38011932373046875, -0.3687629699707031, -0.3574066162109375, -0.3460502624511719, -0.33469390869140625, -0.3233375549316406, -0.311981201171875, -0.3006248474121094, -0.28926849365234375, -0.2779121398925781, -0.2665557861328125, -0.2551994323730469, -0.24384307861328125, -0.23248672485351562, -0.22113037109375, -0.20977401733398438, -0.19841766357421875, -0.18706130981445312, -0.1757049560546875, -0.16434860229492188, -0.15299224853515625, -0.14163589477539062, -0.130279541015625, -0.11892318725585938, -0.10756683349609375, -0.09621047973632812, -0.0848541259765625, -0.07349777221679688, -0.06214141845703125, -0.050785064697265625, -0.0394287109375, -0.028072357177734375, -0.01671600341796875, -0.005359649658203125, 0.0059967041015625, 0.017353057861328125, 0.02870941162109375, 0.040065765380859375, 0.051422119140625, 0.06277847290039062, 0.07413482666015625, 0.08549118041992188, 0.0968475341796875, 0.10820388793945312, 0.11956024169921875, 0.13091659545898438, 0.14227294921875, 0.15362930297851562, 0.16498565673828125, 0.17634201049804688, 0.1876983642578125, 0.19905471801757812, 0.21041107177734375, 0.22176742553710938, 0.233123779296875, 0.24448013305664062, 0.25583648681640625, 0.2671928405761719, 0.2785491943359375, 0.2899055480957031, 0.30126190185546875, 0.3126182556152344, 0.323974609375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 5.0, 3.0, 1.0, 4.0, 4.0, 6.0, 5.0, 5.0, 9.0, 8.0, 7.0, 19.0, 19.0, 13.0, 28.0, 19.0, 24.0, 29.0, 44.0, 32.0, 37.0, 39.0, 39.0, 46.0, 35.0, 39.0, 48.0, 30.0, 30.0, 40.0, 35.0, 41.0, 38.0, 41.0, 26.0, 18.0, 24.0, 15.0, 25.0, 14.0, 7.0, 13.0, 8.0, 10.0, 10.0, 3.0, 3.0, 4.0, 5.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.08551025390625, -0.08304214477539062, -0.08057403564453125, -0.07810592651367188, -0.0756378173828125, -0.07316970825195312, -0.07070159912109375, -0.06823348999023438, -0.065765380859375, -0.06329727172851562, -0.06082916259765625, -0.058361053466796875, -0.0558929443359375, -0.053424835205078125, -0.05095672607421875, -0.048488616943359375, -0.0460205078125, -0.043552398681640625, -0.04108428955078125, -0.038616180419921875, -0.0361480712890625, -0.033679962158203125, -0.03121185302734375, -0.028743743896484375, -0.026275634765625, -0.023807525634765625, -0.02133941650390625, -0.018871307373046875, -0.0164031982421875, -0.013935089111328125, -0.01146697998046875, -0.008998870849609375, -0.00653076171875, -0.004062652587890625, -0.00159454345703125, 0.000873565673828125, 0.0033416748046875, 0.005809783935546875, 0.00827789306640625, 0.010746002197265625, 0.013214111328125, 0.015682220458984375, 0.01815032958984375, 0.020618438720703125, 0.0230865478515625, 0.025554656982421875, 0.02802276611328125, 0.030490875244140625, 0.032958984375, 0.035427093505859375, 0.03789520263671875, 0.040363311767578125, 0.0428314208984375, 0.045299530029296875, 0.04776763916015625, 0.050235748291015625, 0.052703857421875, 0.055171966552734375, 0.05764007568359375, 0.060108184814453125, 0.0625762939453125, 0.06504440307617188, 0.06751251220703125, 0.06998062133789062, 0.07244873046875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 8.0, 1.0, 8.0, 2.0, 8.0, 11.0, 12.0, 20.0, 21.0, 37.0, 33.0, 47.0, 74.0, 120.0, 168.0, 267.0, 465.0, 622.0, 1116.0, 2008.0, 3811.0, 8433.0, 22410.0, 86781.0, 2497476.0, 1450241.0, 81340.0, 21879.0, 8166.0, 3832.0, 1854.0, 1089.0, 719.0, 412.0, 261.0, 156.0, 110.0, 80.0, 54.0, 42.0, 17.0, 17.0, 17.0, 14.0, 10.0, 6.0, 2.0, 5.0, 3.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.677734375, -0.6551284790039062, -0.6325225830078125, -0.6099166870117188, -0.587310791015625, -0.5647048950195312, -0.5420989990234375, -0.5194931030273438, -0.49688720703125, -0.47428131103515625, -0.4516754150390625, -0.42906951904296875, -0.406463623046875, -0.38385772705078125, -0.3612518310546875, -0.33864593505859375, -0.3160400390625, -0.29343414306640625, -0.2708282470703125, -0.24822235107421875, -0.225616455078125, -0.20301055908203125, -0.1804046630859375, -0.15779876708984375, -0.13519287109375, -0.11258697509765625, -0.0899810791015625, -0.06737518310546875, -0.044769287109375, -0.02216339111328125, 0.0004425048828125, 0.02304840087890625, 0.045654296875, 0.06826019287109375, 0.0908660888671875, 0.11347198486328125, 0.136077880859375, 0.15868377685546875, 0.1812896728515625, 0.20389556884765625, 0.22650146484375, 0.24910736083984375, 0.2717132568359375, 0.29431915283203125, 0.316925048828125, 0.33953094482421875, 0.3621368408203125, 0.38474273681640625, 0.4073486328125, 0.42995452880859375, 0.4525604248046875, 0.47516632080078125, 0.497772216796875, 0.5203781127929688, 0.5429840087890625, 0.5655899047851562, 0.58819580078125, 0.6108016967773438, 0.6334075927734375, 0.6560134887695312, 0.678619384765625, 0.7012252807617188, 0.7238311767578125, 0.7464370727539062, 0.76904296875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 1.0, 3.0, 5.0, 7.0, 11.0, 21.0, 27.0, 43.0, 73.0, 134.0, 356.0, 2337.0, 658.0, 168.0, 98.0, 47.0, 23.0, 23.0, 10.0, 7.0, 6.0, 5.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4443359375, -0.4303131103515625, -0.416290283203125, -0.4022674560546875, -0.38824462890625, -0.3742218017578125, -0.360198974609375, -0.3461761474609375, -0.3321533203125, -0.3181304931640625, -0.304107666015625, -0.2900848388671875, -0.27606201171875, -0.2620391845703125, -0.248016357421875, -0.2339935302734375, -0.219970703125, -0.2059478759765625, -0.191925048828125, -0.1779022216796875, -0.16387939453125, -0.1498565673828125, -0.135833740234375, -0.1218109130859375, -0.1077880859375, -0.0937652587890625, -0.079742431640625, -0.0657196044921875, -0.05169677734375, -0.0376739501953125, -0.023651123046875, -0.0096282958984375, 0.00439453125, 0.0184173583984375, 0.032440185546875, 0.0464630126953125, 0.06048583984375, 0.0745086669921875, 0.088531494140625, 0.1025543212890625, 0.1165771484375, 0.1305999755859375, 0.144622802734375, 0.1586456298828125, 0.17266845703125, 0.1866912841796875, 0.200714111328125, 0.2147369384765625, 0.228759765625, 0.2427825927734375, 0.256805419921875, 0.2708282470703125, 0.28485107421875, 0.2988739013671875, 0.312896728515625, 0.3269195556640625, 0.3409423828125, 0.3549652099609375, 0.368988037109375, 0.3830108642578125, 0.39703369140625, 0.4110565185546875, 0.425079345703125, 0.4391021728515625, 0.453125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 10.0, 6.0, 11.0, 33.0, 45.0, 64.0, 121.0, 162.0, 165.0, 154.0, 107.0, 49.0, 33.0, 21.0, 13.0, 4.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.4327988624572754, -3.3454413414001465, -3.2580835819244385, -3.1707260608673096, -3.0833685398101807, -2.9960107803344727, -2.9086532592773438, -2.821295738220215, -2.733938217163086, -2.646580696105957, -2.559222936630249, -2.47186541557312, -2.384507894515991, -2.297150135040283, -2.2097926139831543, -2.1224350929260254, -2.0350773334503174, -1.947719693183899, -1.86036217212677, -1.7730045318603516, -1.6856470108032227, -1.5982893705368042, -1.5109317302703857, -1.4235742092132568, -1.3362165689468384, -1.24885892868042, -1.161501407623291, -1.0741437673568726, -0.9867861866950989, -0.8994286060333252, -0.8120709657669067, -0.7247133851051331, -0.6373560428619385, -0.5499984622001648, -0.4626408517360687, -0.37528324127197266, -0.287925660610199, -0.2005680799484253, -0.11321043968200684, -0.025852859020233154, 0.06150472164154053, 0.1488623172044754, 0.23621991276741028, 0.32357752323150635, 0.41093510389328003, 0.4982926845550537, 0.5856503248214722, 0.6730079054832458, 0.7603654861450195, 0.8477230668067932, 0.9350806474685669, 1.0224382877349854, 1.1097958087921143, 1.1971534490585327, 1.2845110893249512, 1.37186861038208, 1.4592262506484985, 1.546583890914917, 1.633941411972046, 1.7212990522384644, 1.8086566925048828, 1.8960142135620117, 1.9833718538284302, 2.0707294940948486, 2.1580870151519775]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 4.0, 5.0, 9.0, 5.0, 9.0, 8.0, 9.0, 14.0, 15.0, 9.0, 23.0, 23.0, 26.0, 29.0, 35.0, 33.0, 43.0, 40.0, 54.0, 47.0, 34.0, 37.0, 44.0, 45.0, 38.0, 26.0, 46.0, 45.0, 45.0, 25.0, 26.0, 30.0, 26.0, 16.0, 20.0, 7.0, 8.0, 14.0, 11.0, 5.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.1031018495559692, -1.0700597763061523, -1.037017822265625, -1.0039758682250977, -0.9709337949752808, -0.9378917813301086, -0.9048497676849365, -0.8718077540397644, -0.8387657403945923, -0.8057237267494202, -0.772681713104248, -0.7396396994590759, -0.7065976858139038, -0.6735556721687317, -0.6405136585235596, -0.6074716448783875, -0.5744296312332153, -0.5413876175880432, -0.5083456039428711, -0.475303590297699, -0.44226157665252686, -0.40921956300735474, -0.3761775493621826, -0.3431355357170105, -0.3100935220718384, -0.27705150842666626, -0.24400949478149414, -0.21096748113632202, -0.1779254674911499, -0.14488345384597778, -0.11184144020080566, -0.07879942655563354, -0.045757293701171875, -0.012715280055999756, 0.020326733589172363, 0.05336874723434448, 0.0864107608795166, 0.11945277452468872, 0.15249478816986084, 0.18553680181503296, 0.21857881546020508, 0.2516208291053772, 0.2846628427505493, 0.31770485639572144, 0.35074687004089355, 0.3837888836860657, 0.4168308973312378, 0.4498729109764099, 0.48291492462158203, 0.5159569382667542, 0.5489989519119263, 0.5820409655570984, 0.6150829792022705, 0.6481249928474426, 0.6811670064926147, 0.7142090201377869, 0.747251033782959, 0.7802930474281311, 0.8133350610733032, 0.8463770747184753, 0.8794190883636475, 0.9124611020088196, 0.9455031156539917, 0.9785451292991638, 1.011587142944336]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 11.0, 8.0, 17.0, 18.0, 29.0, 35.0, 55.0, 108.0, 134.0, 190.0, 332.0, 501.0, 793.0, 1214.0, 2054.0, 3435.0, 5803.0, 10425.0, 20567.0, 42894.0, 104386.0, 258389.0, 325445.0, 152079.0, 60587.0, 27226.0, 13575.0, 7475.0, 4185.0, 2441.0, 1474.0, 974.0, 559.0, 386.0, 254.0, 153.0, 94.0, 75.0, 54.0, 38.0, 33.0, 16.0, 11.0, 10.0, 8.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29541015625, -0.28594207763671875, -0.2764739990234375, -0.26700592041015625, -0.257537841796875, -0.24806976318359375, -0.2386016845703125, -0.22913360595703125, -0.21966552734375, -0.21019744873046875, -0.2007293701171875, -0.19126129150390625, -0.181793212890625, -0.17232513427734375, -0.1628570556640625, -0.15338897705078125, -0.1439208984375, -0.13445281982421875, -0.1249847412109375, -0.11551666259765625, -0.106048583984375, -0.09658050537109375, -0.0871124267578125, -0.07764434814453125, -0.06817626953125, -0.05870819091796875, -0.0492401123046875, -0.03977203369140625, -0.030303955078125, -0.02083587646484375, -0.0113677978515625, -0.00189971923828125, 0.007568359375, 0.01703643798828125, 0.0265045166015625, 0.03597259521484375, 0.045440673828125, 0.05490875244140625, 0.0643768310546875, 0.07384490966796875, 0.08331298828125, 0.09278106689453125, 0.1022491455078125, 0.11171722412109375, 0.121185302734375, 0.13065338134765625, 0.1401214599609375, 0.14958953857421875, 0.1590576171875, 0.16852569580078125, 0.1779937744140625, 0.18746185302734375, 0.196929931640625, 0.20639801025390625, 0.2158660888671875, 0.22533416748046875, 0.23480224609375, 0.24427032470703125, 0.2537384033203125, 0.26320648193359375, 0.272674560546875, 0.28214263916015625, 0.2916107177734375, 0.30107879638671875, 0.310546875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 5.0, 4.0, 9.0, 14.0, 12.0, 14.0, 12.0, 23.0, 19.0, 22.0, 38.0, 27.0, 41.0, 39.0, 42.0, 47.0, 52.0, 57.0, 42.0, 53.0, 36.0, 65.0, 50.0, 46.0, 33.0, 34.0, 21.0, 25.0, 27.0, 17.0, 14.0, 14.0, 19.0, 10.0, 4.0, 5.0, 2.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10546875, -0.10201168060302734, -0.09855461120605469, -0.09509754180908203, -0.09164047241210938, -0.08818340301513672, -0.08472633361816406, -0.0812692642211914, -0.07781219482421875, -0.0743551254272461, -0.07089805603027344, -0.06744098663330078, -0.06398391723632812, -0.06052684783935547, -0.05706977844238281, -0.053612709045410156, -0.0501556396484375, -0.046698570251464844, -0.04324150085449219, -0.03978443145751953, -0.036327362060546875, -0.03287029266357422, -0.029413223266601562, -0.025956153869628906, -0.02249908447265625, -0.019042015075683594, -0.015584945678710938, -0.012127876281738281, -0.008670806884765625, -0.005213737487792969, -0.0017566680908203125, 0.0017004013061523438, 0.005157470703125, 0.008614540100097656, 0.012071609497070312, 0.015528678894042969, 0.018985748291015625, 0.02244281768798828, 0.025899887084960938, 0.029356956481933594, 0.03281402587890625, 0.036271095275878906, 0.03972816467285156, 0.04318523406982422, 0.046642303466796875, 0.05009937286376953, 0.05355644226074219, 0.057013511657714844, 0.0604705810546875, 0.06392765045166016, 0.06738471984863281, 0.07084178924560547, 0.07429885864257812, 0.07775592803955078, 0.08121299743652344, 0.0846700668334961, 0.08812713623046875, 0.0915842056274414, 0.09504127502441406, 0.09849834442138672, 0.10195541381835938, 0.10541248321533203, 0.10886955261230469, 0.11232662200927734, 0.11578369140625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 1.0, 1.0, 4.0, 4.0, 1.0, 4.0, 9.0, 10.0, 8.0, 15.0, 26.0, 29.0, 41.0, 71.0, 118.0, 204.0, 370.0, 868.0, 2330.0, 8798.0, 44156.0, 380054.0, 532958.0, 61980.0, 11372.0, 3094.0, 1011.0, 440.0, 202.0, 124.0, 72.0, 53.0, 35.0, 18.0, 24.0, 9.0, 10.0, 10.0, 5.0, 4.0, 2.0, 4.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6845703125, -0.6618194580078125, -0.639068603515625, -0.6163177490234375, -0.59356689453125, -0.5708160400390625, -0.548065185546875, -0.5253143310546875, -0.5025634765625, -0.4798126220703125, -0.457061767578125, -0.4343109130859375, -0.41156005859375, -0.3888092041015625, -0.366058349609375, -0.3433074951171875, -0.320556640625, -0.2978057861328125, -0.275054931640625, -0.2523040771484375, -0.22955322265625, -0.2068023681640625, -0.184051513671875, -0.1613006591796875, -0.1385498046875, -0.1157989501953125, -0.093048095703125, -0.0702972412109375, -0.04754638671875, -0.0247955322265625, -0.002044677734375, 0.0207061767578125, 0.04345703125, 0.0662078857421875, 0.088958740234375, 0.1117095947265625, 0.13446044921875, 0.1572113037109375, 0.179962158203125, 0.2027130126953125, 0.2254638671875, 0.2482147216796875, 0.270965576171875, 0.2937164306640625, 0.31646728515625, 0.3392181396484375, 0.361968994140625, 0.3847198486328125, 0.407470703125, 0.4302215576171875, 0.452972412109375, 0.4757232666015625, 0.49847412109375, 0.5212249755859375, 0.543975830078125, 0.5667266845703125, 0.5894775390625, 0.6122283935546875, 0.634979248046875, 0.6577301025390625, 0.68048095703125, 0.7032318115234375, 0.725982666015625, 0.7487335205078125, 0.771484375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 2.0, 4.0, 4.0, 5.0, 2.0, 3.0, 8.0, 7.0, 15.0, 14.0, 12.0, 23.0, 31.0, 25.0, 23.0, 22.0, 28.0, 43.0, 36.0, 35.0, 47.0, 40.0, 44.0, 55.0, 46.0, 47.0, 33.0, 32.0, 38.0, 40.0, 33.0, 21.0, 34.0, 20.0, 25.0, 26.0, 10.0, 18.0, 9.0, 9.0, 10.0, 5.0, 6.0, 7.0, 5.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5419921875, -0.5248336791992188, -0.5076751708984375, -0.49051666259765625, -0.473358154296875, -0.45619964599609375, -0.4390411376953125, -0.42188262939453125, -0.40472412109375, -0.38756561279296875, -0.3704071044921875, -0.35324859619140625, -0.336090087890625, -0.31893157958984375, -0.3017730712890625, -0.28461456298828125, -0.2674560546875, -0.25029754638671875, -0.2331390380859375, -0.21598052978515625, -0.198822021484375, -0.18166351318359375, -0.1645050048828125, -0.14734649658203125, -0.13018798828125, -0.11302947998046875, -0.0958709716796875, -0.07871246337890625, -0.061553955078125, -0.04439544677734375, -0.0272369384765625, -0.01007843017578125, 0.007080078125, 0.02423858642578125, 0.0413970947265625, 0.05855560302734375, 0.075714111328125, 0.09287261962890625, 0.1100311279296875, 0.12718963623046875, 0.14434814453125, 0.16150665283203125, 0.1786651611328125, 0.19582366943359375, 0.212982177734375, 0.23014068603515625, 0.2472991943359375, 0.26445770263671875, 0.2816162109375, 0.29877471923828125, 0.3159332275390625, 0.33309173583984375, 0.350250244140625, 0.36740875244140625, 0.3845672607421875, 0.40172576904296875, 0.41888427734375, 0.43604278564453125, 0.4532012939453125, 0.47035980224609375, 0.487518310546875, 0.5046768188476562, 0.5218353271484375, 0.5389938354492188, 0.55615234375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 6.0, 3.0, 6.0, 6.0, 14.0, 21.0, 31.0, 66.0, 129.0, 222.0, 543.0, 1503.0, 5319.0, 24280.0, 234395.0, 693604.0, 72556.0, 11369.0, 2818.0, 923.0, 376.0, 168.0, 74.0, 42.0, 24.0, 21.0, 16.0, 9.0, 4.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36572265625, -0.35124969482421875, -0.3367767333984375, -0.32230377197265625, -0.307830810546875, -0.29335784912109375, -0.2788848876953125, -0.26441192626953125, -0.24993896484375, -0.23546600341796875, -0.2209930419921875, -0.20652008056640625, -0.192047119140625, -0.17757415771484375, -0.1631011962890625, -0.14862823486328125, -0.1341552734375, -0.11968231201171875, -0.1052093505859375, -0.09073638916015625, -0.076263427734375, -0.06179046630859375, -0.0473175048828125, -0.03284454345703125, -0.01837158203125, -0.00389862060546875, 0.0105743408203125, 0.02504730224609375, 0.039520263671875, 0.05399322509765625, 0.0684661865234375, 0.08293914794921875, 0.097412109375, 0.11188507080078125, 0.1263580322265625, 0.14083099365234375, 0.155303955078125, 0.16977691650390625, 0.1842498779296875, 0.19872283935546875, 0.21319580078125, 0.22766876220703125, 0.2421417236328125, 0.25661468505859375, 0.271087646484375, 0.28556060791015625, 0.3000335693359375, 0.31450653076171875, 0.3289794921875, 0.34345245361328125, 0.3579254150390625, 0.37239837646484375, 0.386871337890625, 0.40134429931640625, 0.4158172607421875, 0.43029022216796875, 0.44476318359375, 0.45923614501953125, 0.4737091064453125, 0.48818206787109375, 0.502655029296875, 0.5171279907226562, 0.5316009521484375, 0.5460739135742188, 0.560546875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 2.0, 5.0, 4.0, 5.0, 9.0, 13.0, 23.0, 27.0, 49.0, 57.0, 74.0, 109.0, 138.0, 146.0, 94.0, 87.0, 53.0, 38.0, 14.0, 19.0, 9.0, 9.0, 10.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.328126907348633e-05, -9.015202522277832e-05, -8.702278137207031e-05, -8.38935375213623e-05, -8.07642936706543e-05, -7.763504981994629e-05, -7.450580596923828e-05, -7.137656211853027e-05, -6.824731826782227e-05, -6.511807441711426e-05, -6.198883056640625e-05, -5.885958671569824e-05, -5.5730342864990234e-05, -5.2601099014282227e-05, -4.947185516357422e-05, -4.634261131286621e-05, -4.32133674621582e-05, -4.0084123611450195e-05, -3.695487976074219e-05, -3.382563591003418e-05, -3.069639205932617e-05, -2.7567148208618164e-05, -2.4437904357910156e-05, -2.130866050720215e-05, -1.817941665649414e-05, -1.5050172805786133e-05, -1.1920928955078125e-05, -8.791685104370117e-06, -5.662441253662109e-06, -2.5331974029541016e-06, 5.960464477539062e-07, 3.725290298461914e-06, 6.854534149169922e-06, 9.98377799987793e-06, 1.3113021850585938e-05, 1.6242265701293945e-05, 1.9371509552001953e-05, 2.250075340270996e-05, 2.562999725341797e-05, 2.8759241104125977e-05, 3.1888484954833984e-05, 3.501772880554199e-05, 3.814697265625e-05, 4.127621650695801e-05, 4.4405460357666016e-05, 4.7534704208374023e-05, 5.066394805908203e-05, 5.379319190979004e-05, 5.692243576049805e-05, 6.0051679611206055e-05, 6.318092346191406e-05, 6.631016731262207e-05, 6.943941116333008e-05, 7.256865501403809e-05, 7.56978988647461e-05, 7.88271427154541e-05, 8.195638656616211e-05, 8.508563041687012e-05, 8.821487426757812e-05, 9.134411811828613e-05, 9.447336196899414e-05, 9.760260581970215e-05, 0.00010073184967041016, 0.00010386109352111816, 0.00010699033737182617]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 2.0, 6.0, 8.0, 5.0, 5.0, 6.0, 16.0, 31.0, 45.0, 53.0, 78.0, 103.0, 164.0, 303.0, 426.0, 825.0, 1509.0, 3065.0, 6448.0, 16102.0, 46941.0, 174048.0, 485243.0, 221205.0, 57728.0, 19089.0, 7536.0, 3400.0, 1773.0, 960.0, 516.0, 339.0, 198.0, 124.0, 81.0, 41.0, 34.0, 39.0, 15.0, 18.0, 7.0, 4.0, 5.0, 8.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.264404296875, -0.2562904357910156, -0.24817657470703125, -0.24006271362304688, -0.2319488525390625, -0.22383499145507812, -0.21572113037109375, -0.20760726928710938, -0.199493408203125, -0.19137954711914062, -0.18326568603515625, -0.17515182495117188, -0.1670379638671875, -0.15892410278320312, -0.15081024169921875, -0.14269638061523438, -0.13458251953125, -0.12646865844726562, -0.11835479736328125, -0.11024093627929688, -0.1021270751953125, -0.09401321411132812, -0.08589935302734375, -0.07778549194335938, -0.069671630859375, -0.061557769775390625, -0.05344390869140625, -0.045330047607421875, -0.0372161865234375, -0.029102325439453125, -0.02098846435546875, -0.012874603271484375, -0.0047607421875, 0.003353118896484375, 0.01146697998046875, 0.019580841064453125, 0.0276947021484375, 0.035808563232421875, 0.04392242431640625, 0.052036285400390625, 0.060150146484375, 0.06826400756835938, 0.07637786865234375, 0.08449172973632812, 0.0926055908203125, 0.10071945190429688, 0.10883331298828125, 0.11694717407226562, 0.12506103515625, 0.13317489624023438, 0.14128875732421875, 0.14940261840820312, 0.1575164794921875, 0.16563034057617188, 0.17374420166015625, 0.18185806274414062, 0.189971923828125, 0.19808578491210938, 0.20619964599609375, 0.21431350708007812, 0.2224273681640625, 0.23054122924804688, 0.23865509033203125, 0.24676895141601562, 0.2548828125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 9.0, 20.0, 26.0, 26.0, 41.0, 73.0, 68.0, 105.0, 139.0, 125.0, 113.0, 94.0, 54.0, 33.0, 23.0, 11.0, 14.0, 7.0, 8.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.273193359375, -0.26171875, -0.250244140625, -0.23876953125, -0.227294921875, -0.2158203125, -0.204345703125, -0.19287109375, -0.181396484375, -0.169921875, -0.158447265625, -0.14697265625, -0.135498046875, -0.1240234375, -0.112548828125, -0.10107421875, -0.089599609375, -0.078125, -0.066650390625, -0.05517578125, -0.043701171875, -0.0322265625, -0.020751953125, -0.00927734375, 0.002197265625, 0.013671875, 0.025146484375, 0.03662109375, 0.048095703125, 0.0595703125, 0.071044921875, 0.08251953125, 0.093994140625, 0.10546875, 0.116943359375, 0.12841796875, 0.139892578125, 0.1513671875, 0.162841796875, 0.17431640625, 0.185791015625, 0.197265625, 0.208740234375, 0.22021484375, 0.231689453125, 0.2431640625, 0.254638671875, 0.26611328125, 0.277587890625, 0.2890625, 0.300537109375, 0.31201171875, 0.323486328125, 0.3349609375, 0.346435546875, 0.35791015625, 0.369384765625, 0.380859375, 0.392333984375, 0.40380859375, 0.415283203125, 0.4267578125, 0.438232421875, 0.44970703125, 0.461181640625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 7.0, 15.0, 33.0, 68.0, 120.0, 216.0, 215.0, 155.0, 109.0, 38.0, 22.0, 11.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.987802028656006, -2.7788026332855225, -2.569803237915039, -2.3608040809631348, -2.1518044471740723, -1.9428051710128784, -1.7338058948516846, -1.5248064994812012, -1.3158071041107178, -1.1068077087402344, -0.8978083729743958, -0.6888090372085571, -0.47980964183807373, -0.27081024646759033, -0.061810970306396484, 0.14718842506408691, 0.3561878204345703, 0.5651872158050537, 0.7741865515708923, 0.983185887336731, 1.1921852827072144, 1.4011846780776978, 1.6101839542388916, 1.819183349609375, 2.0281827449798584, 2.237182140350342, 2.446181535720825, 2.6551809310913086, 2.864180088043213, 3.0731797218322754, 3.2821788787841797, 3.491178274154663, 3.7001771926879883, 3.9091765880584717, 4.118175983428955, 4.327175140380859, 4.536174774169922, 4.745173931121826, 4.9541730880737305, 5.163172721862793, 5.3721723556518555, 5.58117151260376, 5.790171146392822, 5.999170303344727, 6.208169937133789, 6.417169094085693, 6.626168251037598, 6.83516788482666, 7.0441670417785645, 7.253166198730469, 7.462165832519531, 7.6711649894714355, 7.880164623260498, 8.089163780212402, 8.298163414001465, 8.507162094116211, 8.716161727905273, 8.925161361694336, 9.134160041809082, 9.343159675598145, 9.552159309387207, 9.76115894317627, 9.970157623291016, 10.179157257080078, 10.38815689086914]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 4.0, 1.0, 7.0, 11.0, 10.0, 13.0, 17.0, 14.0, 18.0, 21.0, 23.0, 14.0, 25.0, 41.0, 37.0, 40.0, 33.0, 33.0, 41.0, 44.0, 42.0, 52.0, 31.0, 43.0, 35.0, 39.0, 43.0, 38.0, 32.0, 27.0, 36.0, 20.0, 19.0, 23.0, 19.0, 7.0, 9.0, 8.0, 5.0, 3.0, 8.0, 4.0, 4.0, 4.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3804855346679688, -2.2952613830566406, -2.2100374698638916, -2.1248135566711426, -2.0395894050598145, -1.9543653726577759, -1.8691413402557373, -1.7839173078536987, -1.6986932754516602, -1.6134692430496216, -1.528245210647583, -1.4430211782455444, -1.3577971458435059, -1.2725731134414673, -1.1873490810394287, -1.1021250486373901, -1.0169010162353516, -0.931676983833313, -0.8464529514312744, -0.7612289190292358, -0.6760048866271973, -0.5907808542251587, -0.5055568218231201, -0.42033278942108154, -0.33510875701904297, -0.2498847246170044, -0.16466069221496582, -0.07943665981292725, 0.005787372589111328, 0.0910114049911499, 0.17623543739318848, 0.26145946979522705, 0.3466835021972656, 0.4319075345993042, 0.5171315670013428, 0.6023555994033813, 0.6875796318054199, 0.7728036642074585, 0.8580276966094971, 0.9432517290115356, 1.0284757614135742, 1.1136997938156128, 1.1989238262176514, 1.28414785861969, 1.3693718910217285, 1.454595923423767, 1.5398199558258057, 1.6250439882278442, 1.7102680206298828, 1.7954920530319214, 1.88071608543396, 1.9659401178359985, 2.051164150238037, 2.1363883018493652, 2.2216122150421143, 2.3068361282348633, 2.3920602798461914, 2.4772844314575195, 2.5625083446502686, 2.6477322578430176, 2.7329564094543457, 2.818180561065674, 2.903404474258423, 2.988628387451172, 3.0738525390625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 1.0, 4.0, 8.0, 5.0, 12.0, 17.0, 9.0, 22.0, 35.0, 43.0, 50.0, 70.0, 86.0, 133.0, 188.0, 274.0, 468.0, 751.0, 1324.0, 2525.0, 6502.0, 34900.0, 4116277.0, 20235.0, 5024.0, 2191.0, 1123.0, 719.0, 411.0, 229.0, 169.0, 116.0, 93.0, 60.0, 53.0, 34.0, 35.0, 27.0, 14.0, 16.0, 6.0, 6.0, 6.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0], "bins": [-1.244140625, -1.208984375, -1.173828125, -1.138671875, -1.103515625, -1.068359375, -1.033203125, -0.998046875, -0.962890625, -0.927734375, -0.892578125, -0.857421875, -0.822265625, -0.787109375, -0.751953125, -0.716796875, -0.681640625, -0.646484375, -0.611328125, -0.576171875, -0.541015625, -0.505859375, -0.470703125, -0.435546875, -0.400390625, -0.365234375, -0.330078125, -0.294921875, -0.259765625, -0.224609375, -0.189453125, -0.154296875, -0.119140625, -0.083984375, -0.048828125, -0.013671875, 0.021484375, 0.056640625, 0.091796875, 0.126953125, 0.162109375, 0.197265625, 0.232421875, 0.267578125, 0.302734375, 0.337890625, 0.373046875, 0.408203125, 0.443359375, 0.478515625, 0.513671875, 0.548828125, 0.583984375, 0.619140625, 0.654296875, 0.689453125, 0.724609375, 0.759765625, 0.794921875, 0.830078125, 0.865234375, 0.900390625, 0.935546875, 0.970703125, 1.005859375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 7.0, 7.0, 11.0, 11.0, 13.0, 15.0, 21.0, 20.0, 26.0, 19.0, 32.0, 44.0, 47.0, 49.0, 47.0, 50.0, 40.0, 60.0, 51.0, 55.0, 56.0, 41.0, 35.0, 43.0, 34.0, 29.0, 24.0, 19.0, 29.0, 12.0, 13.0, 9.0, 8.0, 3.0, 7.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11187744140625, -0.10806751251220703, -0.10425758361816406, -0.1004476547241211, -0.09663772583007812, -0.09282779693603516, -0.08901786804199219, -0.08520793914794922, -0.08139801025390625, -0.07758808135986328, -0.07377815246582031, -0.06996822357177734, -0.06615829467773438, -0.062348365783691406, -0.05853843688964844, -0.05472850799560547, -0.0509185791015625, -0.04710865020751953, -0.04329872131347656, -0.039488792419433594, -0.035678863525390625, -0.031868934631347656, -0.028059005737304688, -0.02424907684326172, -0.02043914794921875, -0.01662921905517578, -0.012819290161132812, -0.009009361267089844, -0.005199432373046875, -0.0013895034790039062, 0.0024204254150390625, 0.006230354309082031, 0.010040283203125, 0.013850212097167969, 0.017660140991210938, 0.021470069885253906, 0.025279998779296875, 0.029089927673339844, 0.03289985656738281, 0.03670978546142578, 0.04051971435546875, 0.04432964324951172, 0.04813957214355469, 0.051949501037597656, 0.055759429931640625, 0.059569358825683594, 0.06337928771972656, 0.06718921661376953, 0.0709991455078125, 0.07480907440185547, 0.07861900329589844, 0.0824289321899414, 0.08623886108398438, 0.09004878997802734, 0.09385871887207031, 0.09766864776611328, 0.10147857666015625, 0.10528850555419922, 0.10909843444824219, 0.11290836334228516, 0.11671829223632812, 0.1205282211303711, 0.12433815002441406, 0.12814807891845703, 0.1319580078125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 6.0, 7.0, 8.0, 11.0, 16.0, 19.0, 19.0, 29.0, 45.0, 53.0, 53.0, 61.0, 89.0, 109.0, 163.0, 228.0, 351.0, 613.0, 1298.0, 2966.0, 8976.0, 77439.0, 4074369.0, 18222.0, 4843.0, 1885.0, 892.0, 435.0, 272.0, 208.0, 137.0, 99.0, 82.0, 61.0, 41.0, 48.0, 29.0, 26.0, 20.0, 14.0, 8.0, 12.0, 6.0, 1.0, 5.0, 1.0, 5.0, 1.0, 2.0, 4.0, 5.0], "bins": [-1.6728515625, -1.6253662109375, -1.577880859375, -1.5303955078125, -1.48291015625, -1.4354248046875, -1.387939453125, -1.3404541015625, -1.29296875, -1.2454833984375, -1.197998046875, -1.1505126953125, -1.10302734375, -1.0555419921875, -1.008056640625, -0.9605712890625, -0.9130859375, -0.8656005859375, -0.818115234375, -0.7706298828125, -0.72314453125, -0.6756591796875, -0.628173828125, -0.5806884765625, -0.533203125, -0.4857177734375, -0.438232421875, -0.3907470703125, -0.34326171875, -0.2957763671875, -0.248291015625, -0.2008056640625, -0.1533203125, -0.1058349609375, -0.058349609375, -0.0108642578125, 0.03662109375, 0.0841064453125, 0.131591796875, 0.1790771484375, 0.2265625, 0.2740478515625, 0.321533203125, 0.3690185546875, 0.41650390625, 0.4639892578125, 0.511474609375, 0.5589599609375, 0.6064453125, 0.6539306640625, 0.701416015625, 0.7489013671875, 0.79638671875, 0.8438720703125, 0.891357421875, 0.9388427734375, 0.986328125, 1.0338134765625, 1.081298828125, 1.1287841796875, 1.17626953125, 1.2237548828125, 1.271240234375, 1.3187255859375, 1.3662109375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 8.0, 21.0, 26.0, 266.0, 3634.0, 55.0, 35.0, 10.0, 6.0, 7.0, 3.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.421875, -0.41082000732421875, -0.3997650146484375, -0.38871002197265625, -0.377655029296875, -0.36660003662109375, -0.3555450439453125, -0.34449005126953125, -0.33343505859375, -0.32238006591796875, -0.3113250732421875, -0.30027008056640625, -0.289215087890625, -0.27816009521484375, -0.2671051025390625, -0.25605010986328125, -0.2449951171875, -0.23394012451171875, -0.2228851318359375, -0.21183013916015625, -0.200775146484375, -0.18972015380859375, -0.1786651611328125, -0.16761016845703125, -0.15655517578125, -0.14550018310546875, -0.1344451904296875, -0.12339019775390625, -0.112335205078125, -0.10128021240234375, -0.0902252197265625, -0.07917022705078125, -0.068115234375, -0.05706024169921875, -0.0460052490234375, -0.03495025634765625, -0.023895263671875, -0.01284027099609375, -0.0017852783203125, 0.00926971435546875, 0.02032470703125, 0.03137969970703125, 0.0424346923828125, 0.05348968505859375, 0.064544677734375, 0.07559967041015625, 0.0866546630859375, 0.09770965576171875, 0.1087646484375, 0.11981964111328125, 0.1308746337890625, 0.14192962646484375, 0.152984619140625, 0.16403961181640625, 0.1750946044921875, 0.18614959716796875, 0.19720458984375, 0.20825958251953125, 0.2193145751953125, 0.23036956787109375, 0.241424560546875, 0.25247955322265625, 0.2635345458984375, 0.27458953857421875, 0.28564453125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 8.0, 5.0, 15.0, 21.0, 40.0, 50.0, 101.0, 126.0, 126.0, 155.0, 102.0, 55.0, 63.0, 40.0, 34.0, 23.0, 17.0, 7.0, 5.0, 6.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.322012186050415, -1.2915350198745728, -1.26105797290802, -1.2305808067321777, -1.200103759765625, -1.1696265935897827, -1.1391494274139404, -1.1086723804473877, -1.0781952142715454, -1.0477180480957031, -1.0172410011291504, -0.9867638349533081, -0.9562867283821106, -0.9258096218109131, -0.8953325152397156, -0.8648554086685181, -0.8343782424926758, -0.8039011359214783, -0.7734240293502808, -0.7429468631744385, -0.712469756603241, -0.6819926500320435, -0.651515543460846, -0.6210384368896484, -0.5905613303184509, -0.5600842237472534, -0.5296071171760559, -0.499129980802536, -0.4686528444290161, -0.4381757378578186, -0.4076986312866211, -0.3772214949131012, -0.3467443585395813, -0.3162672519683838, -0.2857901155948639, -0.2553130090236664, -0.22483587265014648, -0.19435876607894897, -0.16388164460659027, -0.13340452313423157, -0.10292740166187286, -0.07245028018951416, -0.041973162442445755, -0.01149604469537735, 0.018981076776981354, 0.04945819079875946, 0.07993531227111816, 0.11041243374347687, 0.14088955521583557, 0.17136667668819427, 0.20184379816055298, 0.2323209047317505, 0.2627980411052704, 0.2932751476764679, 0.3237522840499878, 0.3542293906211853, 0.3847064971923828, 0.4151836037635803, 0.4456607401371002, 0.47613784670829773, 0.5066149830818176, 0.5370920896530151, 0.5675691962242126, 0.5980463027954102, 0.6285234689712524]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 5.0, 5.0, 10.0, 9.0, 15.0, 16.0, 17.0, 20.0, 26.0, 19.0, 39.0, 39.0, 39.0, 24.0, 36.0, 44.0, 39.0, 43.0, 30.0, 38.0, 29.0, 37.0, 32.0, 41.0, 37.0, 38.0, 34.0, 36.0, 29.0, 32.0, 27.0, 26.0, 25.0, 13.0, 17.0, 8.0, 7.0, 4.0, 5.0, 5.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5178878903388977, -0.5019795298576355, -0.4860711693763733, -0.47016283869743347, -0.45425447821617126, -0.43834611773490906, -0.42243778705596924, -0.40652942657470703, -0.3906210660934448, -0.3747127056121826, -0.3588043451309204, -0.3428960144519806, -0.3269876539707184, -0.3110792934894562, -0.29517096281051636, -0.27926260232925415, -0.26335424184799194, -0.24744588136672974, -0.23153753578662872, -0.2156291902065277, -0.1997208297252655, -0.1838124692440033, -0.16790412366390228, -0.15199577808380127, -0.13608741760253906, -0.12017906457185745, -0.10427071154117584, -0.08836235851049423, -0.07245400547981262, -0.05654565244913101, -0.0406372994184494, -0.024728946387767792, -0.008820533752441406, 0.007087819278240204, 0.022996172308921814, 0.038904525339603424, 0.054812878370285034, 0.07072123140096664, 0.08662958443164825, 0.10253793746232986, 0.11844629049301147, 0.13435465097427368, 0.1502629965543747, 0.1661713421344757, 0.18207970261573792, 0.19798806309700012, 0.21389640867710114, 0.22980475425720215, 0.24571311473846436, 0.26162147521972656, 0.27752983570098877, 0.2934381663799286, 0.3093465268611908, 0.325254887342453, 0.3411632180213928, 0.35707157850265503, 0.37297993898391724, 0.38888829946517944, 0.40479665994644165, 0.42070499062538147, 0.4366133511066437, 0.4525217115879059, 0.4684300422668457, 0.4843384027481079, 0.5002467632293701]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 4.0, 16.0, 19.0, 16.0, 33.0, 63.0, 75.0, 120.0, 191.0, 289.0, 495.0, 830.0, 1393.0, 2509.0, 4797.0, 9345.0, 19601.0, 47541.0, 133874.0, 362436.0, 295145.0, 99701.0, 37069.0, 15934.0, 7808.0, 4028.0, 2152.0, 1209.0, 723.0, 405.0, 245.0, 162.0, 112.0, 59.0, 47.0, 30.0, 20.0, 16.0, 12.0, 17.0, 4.0, 3.0, 2.0, 2.0, 5.0, 1.0, 0.0, 1.0], "bins": [-0.52880859375, -0.5140647888183594, -0.49932098388671875, -0.4845771789550781, -0.4698333740234375, -0.4550895690917969, -0.44034576416015625, -0.4256019592285156, -0.410858154296875, -0.3961143493652344, -0.38137054443359375, -0.3666267395019531, -0.3518829345703125, -0.3371391296386719, -0.32239532470703125, -0.3076515197753906, -0.29290771484375, -0.2781639099121094, -0.26342010498046875, -0.24867630004882812, -0.2339324951171875, -0.21918869018554688, -0.20444488525390625, -0.18970108032226562, -0.174957275390625, -0.16021347045898438, -0.14546966552734375, -0.13072586059570312, -0.1159820556640625, -0.10123825073242188, -0.08649444580078125, -0.07175064086914062, -0.0570068359375, -0.042263031005859375, -0.02751922607421875, -0.012775421142578125, 0.0019683837890625, 0.016712188720703125, 0.03145599365234375, 0.046199798583984375, 0.060943603515625, 0.07568740844726562, 0.09043121337890625, 0.10517501831054688, 0.1199188232421875, 0.13466262817382812, 0.14940643310546875, 0.16415023803710938, 0.17889404296875, 0.19363784790039062, 0.20838165283203125, 0.22312545776367188, 0.2378692626953125, 0.2526130676269531, 0.26735687255859375, 0.2821006774902344, 0.296844482421875, 0.3115882873535156, 0.32633209228515625, 0.3410758972167969, 0.3558197021484375, 0.3705635070800781, 0.38530731201171875, 0.4000511169433594, 0.414794921875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 7.0, 2.0, 9.0, 12.0, 9.0, 14.0, 14.0, 16.0, 19.0, 24.0, 16.0, 27.0, 37.0, 36.0, 35.0, 38.0, 38.0, 46.0, 43.0, 37.0, 50.0, 45.0, 46.0, 43.0, 44.0, 38.0, 43.0, 34.0, 24.0, 27.0, 27.0, 27.0, 15.0, 14.0, 9.0, 3.0, 9.0, 4.0, 8.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1260986328125, -0.12201881408691406, -0.11793899536132812, -0.11385917663574219, -0.10977935791015625, -0.10569953918457031, -0.10161972045898438, -0.09753990173339844, -0.0934600830078125, -0.08938026428222656, -0.08530044555664062, -0.08122062683105469, -0.07714080810546875, -0.07306098937988281, -0.06898117065429688, -0.06490135192871094, -0.060821533203125, -0.05674171447753906, -0.052661895751953125, -0.04858207702636719, -0.04450225830078125, -0.04042243957519531, -0.036342620849609375, -0.03226280212402344, -0.0281829833984375, -0.024103164672851562, -0.020023345947265625, -0.015943527221679688, -0.01186370849609375, -0.0077838897705078125, -0.003704071044921875, 0.0003757476806640625, 0.00445556640625, 0.008535385131835938, 0.012615203857421875, 0.016695022583007812, 0.02077484130859375, 0.024854660034179688, 0.028934478759765625, 0.03301429748535156, 0.0370941162109375, 0.04117393493652344, 0.045253753662109375, 0.04933357238769531, 0.05341339111328125, 0.05749320983886719, 0.061573028564453125, 0.06565284729003906, 0.069732666015625, 0.07381248474121094, 0.07789230346679688, 0.08197212219238281, 0.08605194091796875, 0.09013175964355469, 0.09421157836914062, 0.09829139709472656, 0.1023712158203125, 0.10645103454589844, 0.11053085327148438, 0.11461067199707031, 0.11869049072265625, 0.12277030944824219, 0.12685012817382812, 0.13092994689941406, 0.135009765625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 6.0, 5.0, 11.0, 10.0, 13.0, 17.0, 24.0, 42.0, 50.0, 61.0, 102.0, 149.0, 227.0, 339.0, 511.0, 864.0, 1501.0, 2480.0, 5107.0, 11059.0, 28469.0, 89941.0, 332654.0, 404642.0, 110637.0, 33801.0, 13031.0, 5753.0, 2872.0, 1511.0, 899.0, 542.0, 401.0, 247.0, 180.0, 98.0, 76.0, 66.0, 37.0, 27.0, 22.0, 15.0, 17.0, 10.0, 7.0, 6.0, 5.0, 4.0, 2.0, 5.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.433837890625, -0.4198799133300781, -0.40592193603515625, -0.3919639587402344, -0.3780059814453125, -0.3640480041503906, -0.35009002685546875, -0.3361320495605469, -0.322174072265625, -0.3082160949707031, -0.29425811767578125, -0.2803001403808594, -0.2663421630859375, -0.2523841857910156, -0.23842620849609375, -0.22446823120117188, -0.21051025390625, -0.19655227661132812, -0.18259429931640625, -0.16863632202148438, -0.1546783447265625, -0.14072036743164062, -0.12676239013671875, -0.11280441284179688, -0.098846435546875, -0.08488845825195312, -0.07093048095703125, -0.056972503662109375, -0.0430145263671875, -0.029056549072265625, -0.01509857177734375, -0.001140594482421875, 0.0128173828125, 0.026775360107421875, 0.04073333740234375, 0.054691314697265625, 0.0686492919921875, 0.08260726928710938, 0.09656524658203125, 0.11052322387695312, 0.124481201171875, 0.13843917846679688, 0.15239715576171875, 0.16635513305664062, 0.1803131103515625, 0.19427108764648438, 0.20822906494140625, 0.22218704223632812, 0.23614501953125, 0.2501029968261719, 0.26406097412109375, 0.2780189514160156, 0.2919769287109375, 0.3059349060058594, 0.31989288330078125, 0.3338508605957031, 0.347808837890625, 0.3617668151855469, 0.37572479248046875, 0.3896827697753906, 0.4036407470703125, 0.4175987243652344, 0.43155670166015625, 0.4455146789550781, 0.45947265625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 1.0, 4.0, 5.0, 6.0, 9.0, 12.0, 19.0, 18.0, 35.0, 15.0, 44.0, 37.0, 50.0, 48.0, 41.0, 51.0, 61.0, 50.0, 51.0, 50.0, 52.0, 42.0, 42.0, 57.0, 31.0, 36.0, 30.0, 24.0, 18.0, 22.0, 10.0, 12.0, 10.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.642578125, -0.617431640625, -0.59228515625, -0.567138671875, -0.5419921875, -0.516845703125, -0.49169921875, -0.466552734375, -0.44140625, -0.416259765625, -0.39111328125, -0.365966796875, -0.3408203125, -0.315673828125, -0.29052734375, -0.265380859375, -0.240234375, -0.215087890625, -0.18994140625, -0.164794921875, -0.1396484375, -0.114501953125, -0.08935546875, -0.064208984375, -0.0390625, -0.013916015625, 0.01123046875, 0.036376953125, 0.0615234375, 0.086669921875, 0.11181640625, 0.136962890625, 0.162109375, 0.187255859375, 0.21240234375, 0.237548828125, 0.2626953125, 0.287841796875, 0.31298828125, 0.338134765625, 0.36328125, 0.388427734375, 0.41357421875, 0.438720703125, 0.4638671875, 0.489013671875, 0.51416015625, 0.539306640625, 0.564453125, 0.589599609375, 0.61474609375, 0.639892578125, 0.6650390625, 0.690185546875, 0.71533203125, 0.740478515625, 0.765625, 0.790771484375, 0.81591796875, 0.841064453125, 0.8662109375, 0.891357421875, 0.91650390625, 0.941650390625, 0.966796875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 7.0, 4.0, 6.0, 4.0, 11.0, 18.0, 20.0, 29.0, 35.0, 58.0, 86.0, 120.0, 172.0, 282.0, 478.0, 851.0, 1786.0, 3753.0, 9491.0, 31748.0, 179988.0, 644234.0, 133647.0, 26105.0, 8497.0, 3401.0, 1633.0, 848.0, 465.0, 272.0, 155.0, 102.0, 65.0, 50.0, 31.0, 27.0, 23.0, 10.0, 14.0, 5.0, 7.0, 4.0, 2.0, 4.0, 4.0, 1.0, 1.0, 2.0], "bins": [-0.43603515625, -0.42438507080078125, -0.4127349853515625, -0.40108489990234375, -0.389434814453125, -0.37778472900390625, -0.3661346435546875, -0.35448455810546875, -0.34283447265625, -0.33118438720703125, -0.3195343017578125, -0.30788421630859375, -0.296234130859375, -0.28458404541015625, -0.2729339599609375, -0.26128387451171875, -0.2496337890625, -0.23798370361328125, -0.2263336181640625, -0.21468353271484375, -0.203033447265625, -0.19138336181640625, -0.1797332763671875, -0.16808319091796875, -0.15643310546875, -0.14478302001953125, -0.1331329345703125, -0.12148284912109375, -0.109832763671875, -0.09818267822265625, -0.0865325927734375, -0.07488250732421875, -0.063232421875, -0.05158233642578125, -0.0399322509765625, -0.02828216552734375, -0.016632080078125, -0.00498199462890625, 0.0066680908203125, 0.01831817626953125, 0.02996826171875, 0.04161834716796875, 0.0532684326171875, 0.06491851806640625, 0.076568603515625, 0.08821868896484375, 0.0998687744140625, 0.11151885986328125, 0.1231689453125, 0.13481903076171875, 0.1464691162109375, 0.15811920166015625, 0.169769287109375, 0.18141937255859375, 0.1930694580078125, 0.20471954345703125, 0.21636962890625, 0.22801971435546875, 0.2396697998046875, 0.25131988525390625, 0.262969970703125, 0.27462005615234375, 0.2862701416015625, 0.29792022705078125, 0.3095703125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 6.0, 7.0, 2.0, 14.0, 17.0, 26.0, 35.0, 36.0, 46.0, 72.0, 95.0, 96.0, 110.0, 105.0, 86.0, 65.0, 56.0, 34.0, 30.0, 17.0, 14.0, 10.0, 6.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.343292236328125e-05, -7.093511521816254e-05, -6.843730807304382e-05, -6.593950092792511e-05, -6.34416937828064e-05, -6.094388663768768e-05, -5.844607949256897e-05, -5.5948272347450256e-05, -5.345046520233154e-05, -5.095265805721283e-05, -4.8454850912094116e-05, -4.59570437669754e-05, -4.345923662185669e-05, -4.0961429476737976e-05, -3.846362233161926e-05, -3.596581518650055e-05, -3.3468008041381836e-05, -3.097020089626312e-05, -2.847239375114441e-05, -2.5974586606025696e-05, -2.3476779460906982e-05, -2.097897231578827e-05, -1.8481165170669556e-05, -1.5983358025550842e-05, -1.3485550880432129e-05, -1.0987743735313416e-05, -8.489936590194702e-06, -5.992129445075989e-06, -3.4943222999572754e-06, -9.96515154838562e-07, 1.5012919902801514e-06, 3.999099135398865e-06, 6.496906280517578e-06, 8.994713425636292e-06, 1.1492520570755005e-05, 1.3990327715873718e-05, 1.648813486099243e-05, 1.8985942006111145e-05, 2.148374915122986e-05, 2.3981556296348572e-05, 2.6479363441467285e-05, 2.8977170586586e-05, 3.147497773170471e-05, 3.3972784876823425e-05, 3.647059202194214e-05, 3.896839916706085e-05, 4.1466206312179565e-05, 4.396401345729828e-05, 4.646182060241699e-05, 4.8959627747535706e-05, 5.145743489265442e-05, 5.395524203777313e-05, 5.6453049182891846e-05, 5.895085632801056e-05, 6.144866347312927e-05, 6.394647061824799e-05, 6.64442777633667e-05, 6.894208490848541e-05, 7.143989205360413e-05, 7.393769919872284e-05, 7.643550634384155e-05, 7.893331348896027e-05, 8.143112063407898e-05, 8.392892777919769e-05, 8.64267349243164e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 3.0, 1.0, 4.0, 8.0, 10.0, 24.0, 28.0, 51.0, 73.0, 106.0, 210.0, 322.0, 753.0, 1645.0, 4920.0, 19530.0, 171505.0, 749913.0, 81004.0, 12441.0, 3440.0, 1294.0, 510.0, 331.0, 183.0, 91.0, 55.0, 36.0, 26.0, 15.0, 6.0, 6.0, 5.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.625, -0.6073226928710938, -0.5896453857421875, -0.5719680786132812, -0.554290771484375, -0.5366134643554688, -0.5189361572265625, -0.5012588500976562, -0.48358154296875, -0.46590423583984375, -0.4482269287109375, -0.43054962158203125, -0.412872314453125, -0.39519500732421875, -0.3775177001953125, -0.35984039306640625, -0.3421630859375, -0.32448577880859375, -0.3068084716796875, -0.28913116455078125, -0.271453857421875, -0.25377655029296875, -0.2360992431640625, -0.21842193603515625, -0.20074462890625, -0.18306732177734375, -0.1653900146484375, -0.14771270751953125, -0.130035400390625, -0.11235809326171875, -0.0946807861328125, -0.07700347900390625, -0.059326171875, -0.04164886474609375, -0.0239715576171875, -0.00629425048828125, 0.011383056640625, 0.02906036376953125, 0.0467376708984375, 0.06441497802734375, 0.08209228515625, 0.09976959228515625, 0.1174468994140625, 0.13512420654296875, 0.152801513671875, 0.17047882080078125, 0.1881561279296875, 0.20583343505859375, 0.2235107421875, 0.24118804931640625, 0.2588653564453125, 0.27654266357421875, 0.294219970703125, 0.31189727783203125, 0.3295745849609375, 0.34725189208984375, 0.36492919921875, 0.38260650634765625, 0.4002838134765625, 0.41796112060546875, 0.435638427734375, 0.45331573486328125, 0.4709930419921875, 0.48867034912109375, 0.50634765625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 5.0, 4.0, 14.0, 28.0, 30.0, 53.0, 96.0, 141.0, 159.0, 154.0, 131.0, 82.0, 41.0, 28.0, 14.0, 12.0, 6.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.8369140625, -0.8194084167480469, -0.8019027709960938, -0.7843971252441406, -0.7668914794921875, -0.7493858337402344, -0.7318801879882812, -0.7143745422363281, -0.696868896484375, -0.6793632507324219, -0.6618576049804688, -0.6443519592285156, -0.6268463134765625, -0.6093406677246094, -0.5918350219726562, -0.5743293762207031, -0.55682373046875, -0.5393180847167969, -0.5218124389648438, -0.5043067932128906, -0.4868011474609375, -0.4692955017089844, -0.45178985595703125, -0.4342842102050781, -0.416778564453125, -0.3992729187011719, -0.38176727294921875, -0.3642616271972656, -0.3467559814453125, -0.3292503356933594, -0.31174468994140625, -0.2942390441894531, -0.2767333984375, -0.2592277526855469, -0.24172210693359375, -0.22421646118164062, -0.2067108154296875, -0.18920516967773438, -0.17169952392578125, -0.15419387817382812, -0.136688232421875, -0.11918258666992188, -0.10167694091796875, -0.08417129516601562, -0.0666656494140625, -0.049160003662109375, -0.03165435791015625, -0.014148712158203125, 0.00335693359375, 0.020862579345703125, 0.03836822509765625, 0.055873870849609375, 0.0733795166015625, 0.09088516235351562, 0.10839080810546875, 0.12589645385742188, 0.143402099609375, 0.16090774536132812, 0.17841339111328125, 0.19591903686523438, 0.2134246826171875, 0.23093032836914062, 0.24843597412109375, 0.2659416198730469, 0.283447265625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 8.0, 15.0, 13.0, 25.0, 53.0, 75.0, 98.0, 143.0, 132.0, 118.0, 90.0, 86.0, 61.0, 30.0, 10.0, 17.0, 9.0, 6.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.910872220993042, -3.7437593936920166, -3.576646566390991, -3.409533739089966, -3.2424209117889404, -3.075308084487915, -2.9081954956054688, -2.7410826683044434, -2.573969841003418, -2.4068570137023926, -2.239744186401367, -2.072631359100342, -1.9055185317993164, -1.738405704498291, -1.5712929964065552, -1.4041801691055298, -1.2370672225952148, -1.0699543952941895, -0.9028415679931641, -0.7357288002967834, -0.5686159729957581, -0.40150314569473267, -0.23439037799835205, -0.06727755069732666, 0.09983527660369873, 0.2669481039047241, 0.4340609014034271, 0.6011736989021301, 0.7682865262031555, 0.9353993535041809, 1.1025121212005615, 1.269624948501587, 1.4367375373840332, 1.6038503646850586, 1.770963191986084, 1.9380760192871094, 2.1051888465881348, 2.27230167388916, 2.4394145011901855, 2.606527328491211, 2.7736401557922363, 2.9407529830932617, 3.107865810394287, 3.2749786376953125, 3.442091464996338, 3.6092042922973633, 3.7763171195983887, 3.943429946899414, 4.110542297363281, 4.277655124664307, 4.444767951965332, 4.611880779266357, 4.778993606567383, 4.946106433868408, 5.113219261169434, 5.280332088470459, 5.447444915771484, 5.61455774307251, 5.781670570373535, 5.9487833976745605, 6.115896224975586, 6.283009052276611, 6.450121879577637, 6.617234706878662, 6.7843475341796875]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 5.0, 2.0, 5.0, 6.0, 6.0, 4.0, 7.0, 11.0, 8.0, 19.0, 13.0, 17.0, 26.0, 26.0, 31.0, 31.0, 32.0, 36.0, 33.0, 47.0, 41.0, 34.0, 50.0, 53.0, 50.0, 43.0, 53.0, 37.0, 36.0, 34.0, 26.0, 31.0, 18.0, 20.0, 23.0, 11.0, 11.0, 8.0, 11.0, 13.0, 8.0, 11.0, 3.0, 9.0, 2.0, 2.0, 2.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.3878402709960938, -3.2825968265533447, -3.1773533821105957, -3.072110176086426, -2.9668667316436768, -2.8616232872009277, -2.7563798427581787, -2.6511363983154297, -2.5458931922912598, -2.4406497478485107, -2.3354063034057617, -2.230163097381592, -2.1249196529388428, -2.0196762084960938, -1.9144327640533447, -1.8091894388198853, -1.7039459943771362, -1.5987025499343872, -1.4934592247009277, -1.3882157802581787, -1.2829724550247192, -1.1777290105819702, -1.0724856853485107, -0.9672422409057617, -0.8619988560676575, -0.7567554712295532, -0.651512086391449, -0.5462687015533447, -0.4410252869129181, -0.33578187227249146, -0.2305384874343872, -0.12529510259628296, -0.02005171775817871, 0.08519167453050613, 0.19043506681919098, 0.2956784665584564, 0.40092185139656067, 0.5061652660369873, 0.6114086508750916, 0.7166520357131958, 0.8218954205513, 0.9271388053894043, 1.0323822498321533, 1.1376255750656128, 1.2428690195083618, 1.3481123447418213, 1.4533557891845703, 1.5585992336273193, 1.6638425588607788, 1.7690860033035278, 1.8743293285369873, 1.9795727729797363, 2.0848162174224854, 2.1900596618652344, 2.2953028678894043, 2.4005463123321533, 2.5057897567749023, 2.6110332012176514, 2.7162766456604004, 2.8215198516845703, 2.9267632961273193, 3.0320067405700684, 3.1372501850128174, 3.2424936294555664, 3.3477368354797363]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 9.0, 9.0, 6.0, 12.0, 11.0, 12.0, 31.0, 25.0, 39.0, 46.0, 57.0, 78.0, 109.0, 141.0, 255.0, 375.0, 590.0, 963.0, 1684.0, 3071.0, 6573.0, 20916.0, 3949820.0, 180957.0, 16214.0, 5651.0, 2691.0, 1400.0, 901.0, 486.0, 361.0, 252.0, 123.0, 103.0, 78.0, 62.0, 48.0, 29.0, 25.0, 29.0, 10.0, 8.0, 8.0, 8.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.87451171875, -0.8487167358398438, -0.8229217529296875, -0.7971267700195312, -0.771331787109375, -0.7455368041992188, -0.7197418212890625, -0.6939468383789062, -0.66815185546875, -0.6423568725585938, -0.6165618896484375, -0.5907669067382812, -0.564971923828125, -0.5391769409179688, -0.5133819580078125, -0.48758697509765625, -0.4617919921875, -0.43599700927734375, -0.4102020263671875, -0.38440704345703125, -0.358612060546875, -0.33281707763671875, -0.3070220947265625, -0.28122711181640625, -0.25543212890625, -0.22963714599609375, -0.2038421630859375, -0.17804718017578125, -0.152252197265625, -0.12645721435546875, -0.1006622314453125, -0.07486724853515625, -0.049072265625, -0.02327728271484375, 0.0025177001953125, 0.02831268310546875, 0.054107666015625, 0.07990264892578125, 0.1056976318359375, 0.13149261474609375, 0.15728759765625, 0.18308258056640625, 0.2088775634765625, 0.23467254638671875, 0.260467529296875, 0.28626251220703125, 0.3120574951171875, 0.33785247802734375, 0.3636474609375, 0.38944244384765625, 0.4152374267578125, 0.44103240966796875, 0.466827392578125, 0.49262237548828125, 0.5184173583984375, 0.5442123413085938, 0.57000732421875, 0.5958023071289062, 0.6215972900390625, 0.6473922729492188, 0.673187255859375, 0.6989822387695312, 0.7247772216796875, 0.7505722045898438, 0.7763671875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 3.0, 1.0, 1.0, 3.0, 5.0, 4.0, 5.0, 7.0, 9.0, 17.0, 15.0, 11.0, 24.0, 24.0, 35.0, 34.0, 38.0, 43.0, 43.0, 52.0, 55.0, 42.0, 57.0, 57.0, 51.0, 52.0, 59.0, 42.0, 45.0, 26.0, 26.0, 21.0, 23.0, 15.0, 19.0, 10.0, 8.0, 3.0, 5.0, 3.0, 3.0, 4.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1492919921875, -0.14480018615722656, -0.14030838012695312, -0.1358165740966797, -0.13132476806640625, -0.1268329620361328, -0.12234115600585938, -0.11784934997558594, -0.1133575439453125, -0.10886573791503906, -0.10437393188476562, -0.09988212585449219, -0.09539031982421875, -0.09089851379394531, -0.08640670776367188, -0.08191490173339844, -0.077423095703125, -0.07293128967285156, -0.06843948364257812, -0.06394767761230469, -0.05945587158203125, -0.05496406555175781, -0.050472259521484375, -0.04598045349121094, -0.0414886474609375, -0.03699684143066406, -0.032505035400390625, -0.028013229370117188, -0.02352142333984375, -0.019029617309570312, -0.014537811279296875, -0.010046005249023438, -0.00555419921875, -0.0010623931884765625, 0.003429412841796875, 0.007921218872070312, 0.01241302490234375, 0.016904830932617188, 0.021396636962890625, 0.025888442993164062, 0.0303802490234375, 0.03487205505371094, 0.039363861083984375, 0.04385566711425781, 0.04834747314453125, 0.05283927917480469, 0.057331085205078125, 0.06182289123535156, 0.066314697265625, 0.07080650329589844, 0.07529830932617188, 0.07979011535644531, 0.08428192138671875, 0.08877372741699219, 0.09326553344726562, 0.09775733947753906, 0.1022491455078125, 0.10674095153808594, 0.11123275756835938, 0.11572456359863281, 0.12021636962890625, 0.12470817565917969, 0.12919998168945312, 0.13369178771972656, 0.13818359375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 6.0, 9.0, 11.0, 10.0, 12.0, 22.0, 34.0, 29.0, 46.0, 54.0, 75.0, 134.0, 171.0, 343.0, 701.0, 1316.0, 2972.0, 8733.0, 44805.0, 4093357.0, 29494.0, 6811.0, 2550.0, 1142.0, 561.0, 320.0, 155.0, 106.0, 79.0, 53.0, 45.0, 29.0, 26.0, 15.0, 14.0, 9.0, 10.0, 13.0, 4.0, 2.0, 3.0, 0.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.90234375, -1.8486175537109375, -1.794891357421875, -1.7411651611328125, -1.68743896484375, -1.6337127685546875, -1.579986572265625, -1.5262603759765625, -1.4725341796875, -1.4188079833984375, -1.365081787109375, -1.3113555908203125, -1.25762939453125, -1.2039031982421875, -1.150177001953125, -1.0964508056640625, -1.042724609375, -0.9889984130859375, -0.935272216796875, -0.8815460205078125, -0.82781982421875, -0.7740936279296875, -0.720367431640625, -0.6666412353515625, -0.6129150390625, -0.5591888427734375, -0.505462646484375, -0.4517364501953125, -0.39801025390625, -0.3442840576171875, -0.290557861328125, -0.2368316650390625, -0.18310546875, -0.1293792724609375, -0.075653076171875, -0.0219268798828125, 0.03179931640625, 0.0855255126953125, 0.139251708984375, 0.1929779052734375, 0.2467041015625, 0.3004302978515625, 0.354156494140625, 0.4078826904296875, 0.46160888671875, 0.5153350830078125, 0.569061279296875, 0.6227874755859375, 0.676513671875, 0.7302398681640625, 0.783966064453125, 0.8376922607421875, 0.89141845703125, 0.9451446533203125, 0.998870849609375, 1.0525970458984375, 1.1063232421875, 1.1600494384765625, 1.213775634765625, 1.2675018310546875, 1.32122802734375, 1.3749542236328125, 1.428680419921875, 1.4824066162109375, 1.5361328125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 1.0, 7.0, 9.0, 18.0, 20.0, 85.0, 3673.0, 189.0, 30.0, 18.0, 7.0, 8.0, 3.0, 3.0, 2.0, 6.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53271484375, -0.517791748046875, -0.50286865234375, -0.487945556640625, -0.4730224609375, -0.458099365234375, -0.44317626953125, -0.428253173828125, -0.413330078125, -0.398406982421875, -0.38348388671875, -0.368560791015625, -0.3536376953125, -0.338714599609375, -0.32379150390625, -0.308868408203125, -0.2939453125, -0.279022216796875, -0.26409912109375, -0.249176025390625, -0.2342529296875, -0.219329833984375, -0.20440673828125, -0.189483642578125, -0.174560546875, -0.159637451171875, -0.14471435546875, -0.129791259765625, -0.1148681640625, -0.099945068359375, -0.08502197265625, -0.070098876953125, -0.05517578125, -0.040252685546875, -0.02532958984375, -0.010406494140625, 0.0045166015625, 0.019439697265625, 0.03436279296875, 0.049285888671875, 0.064208984375, 0.079132080078125, 0.09405517578125, 0.108978271484375, 0.1239013671875, 0.138824462890625, 0.15374755859375, 0.168670654296875, 0.18359375, 0.198516845703125, 0.21343994140625, 0.228363037109375, 0.2432861328125, 0.258209228515625, 0.27313232421875, 0.288055419921875, 0.302978515625, 0.317901611328125, 0.33282470703125, 0.347747802734375, 0.3626708984375, 0.377593994140625, 0.39251708984375, 0.407440185546875, 0.42236328125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 8.0, 5.0, 10.0, 8.0, 18.0, 27.0, 24.0, 44.0, 73.0, 90.0, 93.0, 109.0, 131.0, 84.0, 87.0, 50.0, 36.0, 32.0, 24.0, 16.0, 8.0, 6.0, 7.0, 6.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0571504831314087, -1.0264272689819336, -0.9957041144371033, -0.964980959892273, -0.9342578053474426, -0.9035346508026123, -0.8728114366531372, -0.8420882821083069, -0.8113651275634766, -0.7806419730186462, -0.7499187588691711, -0.7191956043243408, -0.6884724497795105, -0.6577492952346802, -0.6270260810852051, -0.5963029265403748, -0.5655797719955444, -0.5348566174507141, -0.504133403301239, -0.4734102487564087, -0.44268709421157837, -0.41196390986442566, -0.38124072551727295, -0.3505175709724426, -0.31979435682296753, -0.2890711724758148, -0.2583480179309845, -0.2276248335838318, -0.19690167903900146, -0.16617849469184875, -0.13545532524585724, -0.10473215579986572, -0.0740090012550354, -0.043285831809043884, -0.01256265863776207, 0.018160514533519745, 0.04888368397951126, 0.07960686087608337, 0.11033003032207489, 0.1410531997680664, 0.17177636921405792, 0.20249953866004944, 0.23322270810604095, 0.26394587755203247, 0.2946690618991852, 0.3253922462463379, 0.3561154007911682, 0.38683855533599854, 0.41756173968315125, 0.44828492403030396, 0.4790080785751343, 0.5097312331199646, 0.5404544472694397, 0.57117760181427, 0.6019007563591003, 0.6326239109039307, 0.6633471250534058, 0.6940702795982361, 0.7247934937477112, 0.7555166482925415, 0.7862398028373718, 0.8169629573822021, 0.8476861715316772, 0.8784093260765076, 0.9091324806213379]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 7.0, 3.0, 7.0, 5.0, 12.0, 10.0, 9.0, 14.0, 12.0, 14.0, 28.0, 29.0, 16.0, 27.0, 32.0, 29.0, 43.0, 27.0, 38.0, 40.0, 40.0, 34.0, 48.0, 52.0, 35.0, 43.0, 40.0, 33.0, 43.0, 39.0, 24.0, 30.0, 23.0, 22.0, 13.0, 20.0, 19.0, 11.0, 8.0, 11.0, 3.0, 7.0, 3.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.5670897960662842, -0.5485234260559082, -0.5299570560455322, -0.5113906860351562, -0.4928243160247803, -0.4742579460144043, -0.45569154620170593, -0.43712517619132996, -0.418558806180954, -0.399992436170578, -0.381426066160202, -0.36285969614982605, -0.3442932963371277, -0.3257269263267517, -0.30716055631637573, -0.28859418630599976, -0.2700278162956238, -0.2514614462852478, -0.23289507627487183, -0.21432869136333466, -0.19576232135295868, -0.1771959513425827, -0.15862956643104553, -0.14006319642066956, -0.12149682641029358, -0.1029304563999176, -0.08436407893896103, -0.06579770147800446, -0.04723133146762848, -0.028664961457252502, -0.010098583996295929, 0.008467793464660645, 0.027034103870391846, 0.04560047760605812, 0.0641668513417244, 0.08273322880268097, 0.10129959881305695, 0.11986596882343292, 0.1384323537349701, 0.15699872374534607, 0.17556509375572205, 0.19413146376609802, 0.212697833776474, 0.23126421868801117, 0.24983058869838715, 0.2683969736099243, 0.2869633436203003, 0.30552971363067627, 0.32409608364105225, 0.3426624536514282, 0.3612288236618042, 0.3797951936721802, 0.39836156368255615, 0.41692793369293213, 0.4354943335056305, 0.45406070351600647, 0.47262707352638245, 0.4911934435367584, 0.5097598433494568, 0.5283262133598328, 0.5468925833702087, 0.5654589533805847, 0.5840253233909607, 0.6025916934013367, 0.6211580634117126]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 5.0, 6.0, 9.0, 15.0, 30.0, 34.0, 58.0, 89.0, 181.0, 347.0, 560.0, 1013.0, 1973.0, 4013.0, 8240.0, 18621.0, 47117.0, 144742.0, 395093.0, 282105.0, 88009.0, 31174.0, 12979.0, 5871.0, 2983.0, 1486.0, 800.0, 451.0, 219.0, 138.0, 73.0, 41.0, 38.0, 16.0, 10.0, 8.0, 6.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4248046875, -0.4110069274902344, -0.39720916748046875, -0.3834114074707031, -0.3696136474609375, -0.3558158874511719, -0.34201812744140625, -0.3282203674316406, -0.314422607421875, -0.3006248474121094, -0.28682708740234375, -0.2730293273925781, -0.2592315673828125, -0.24543380737304688, -0.23163604736328125, -0.21783828735351562, -0.20404052734375, -0.19024276733398438, -0.17644500732421875, -0.16264724731445312, -0.1488494873046875, -0.13505172729492188, -0.12125396728515625, -0.10745620727539062, -0.093658447265625, -0.07986068725585938, -0.06606292724609375, -0.052265167236328125, -0.0384674072265625, -0.024669647216796875, -0.01087188720703125, 0.002925872802734375, 0.0167236328125, 0.030521392822265625, 0.04431915283203125, 0.058116912841796875, 0.0719146728515625, 0.08571243286132812, 0.09951019287109375, 0.11330795288085938, 0.127105712890625, 0.14090347290039062, 0.15470123291015625, 0.16849899291992188, 0.1822967529296875, 0.19609451293945312, 0.20989227294921875, 0.22369003295898438, 0.23748779296875, 0.2512855529785156, 0.26508331298828125, 0.2788810729980469, 0.2926788330078125, 0.3064765930175781, 0.32027435302734375, 0.3340721130371094, 0.347869873046875, 0.3616676330566406, 0.37546539306640625, 0.3892631530761719, 0.4030609130859375, 0.4168586730957031, 0.43065643310546875, 0.4444541931152344, 0.458251953125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 2.0, 3.0, 10.0, 8.0, 7.0, 17.0, 13.0, 22.0, 32.0, 13.0, 31.0, 42.0, 48.0, 43.0, 45.0, 44.0, 57.0, 55.0, 58.0, 52.0, 52.0, 67.0, 47.0, 62.0, 33.0, 26.0, 21.0, 21.0, 14.0, 17.0, 13.0, 9.0, 1.0, 7.0, 4.0, 4.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.2374267578125, -0.23132705688476562, -0.22522735595703125, -0.21912765502929688, -0.2130279541015625, -0.20692825317382812, -0.20082855224609375, -0.19472885131835938, -0.188629150390625, -0.18252944946289062, -0.17642974853515625, -0.17033004760742188, -0.1642303466796875, -0.15813064575195312, -0.15203094482421875, -0.14593124389648438, -0.13983154296875, -0.13373184204101562, -0.12763214111328125, -0.12153244018554688, -0.1154327392578125, -0.10933303833007812, -0.10323333740234375, -0.09713363647460938, -0.091033935546875, -0.08493423461914062, -0.07883453369140625, -0.07273483276367188, -0.0666351318359375, -0.060535430908203125, -0.05443572998046875, -0.048336029052734375, -0.042236328125, -0.036136627197265625, -0.03003692626953125, -0.023937225341796875, -0.0178375244140625, -0.011737823486328125, -0.00563812255859375, 0.000461578369140625, 0.006561279296875, 0.012660980224609375, 0.01876068115234375, 0.024860382080078125, 0.0309600830078125, 0.037059783935546875, 0.04315948486328125, 0.049259185791015625, 0.05535888671875, 0.061458587646484375, 0.06755828857421875, 0.07365798950195312, 0.0797576904296875, 0.08585739135742188, 0.09195709228515625, 0.09805679321289062, 0.104156494140625, 0.11025619506835938, 0.11635589599609375, 0.12245559692382812, 0.1285552978515625, 0.13465499877929688, 0.14075469970703125, 0.14685440063476562, 0.1529541015625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 6.0, 7.0, 3.0, 11.0, 14.0, 14.0, 20.0, 34.0, 60.0, 101.0, 116.0, 241.0, 370.0, 662.0, 1615.0, 4415.0, 17222.0, 130962.0, 765196.0, 105614.0, 14859.0, 3981.0, 1505.0, 644.0, 337.0, 193.0, 119.0, 60.0, 54.0, 35.0, 20.0, 19.0, 12.0, 8.0, 8.0, 3.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.748046875, -0.7208023071289062, -0.6935577392578125, -0.6663131713867188, -0.639068603515625, -0.6118240356445312, -0.5845794677734375, -0.5573348999023438, -0.53009033203125, -0.5028457641601562, -0.4756011962890625, -0.44835662841796875, -0.421112060546875, -0.39386749267578125, -0.3666229248046875, -0.33937835693359375, -0.3121337890625, -0.28488922119140625, -0.2576446533203125, -0.23040008544921875, -0.203155517578125, -0.17591094970703125, -0.1486663818359375, -0.12142181396484375, -0.09417724609375, -0.06693267822265625, -0.0396881103515625, -0.01244354248046875, 0.014801025390625, 0.04204559326171875, 0.0692901611328125, 0.09653472900390625, 0.123779296875, 0.15102386474609375, 0.1782684326171875, 0.20551300048828125, 0.232757568359375, 0.26000213623046875, 0.2872467041015625, 0.31449127197265625, 0.34173583984375, 0.36898040771484375, 0.3962249755859375, 0.42346954345703125, 0.450714111328125, 0.47795867919921875, 0.5052032470703125, 0.5324478149414062, 0.5596923828125, 0.5869369506835938, 0.6141815185546875, 0.6414260864257812, 0.668670654296875, 0.6959152221679688, 0.7231597900390625, 0.7504043579101562, 0.77764892578125, 0.8048934936523438, 0.8321380615234375, 0.8593826293945312, 0.886627197265625, 0.9138717651367188, 0.9411163330078125, 0.9683609008789062, 0.99560546875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 7.0, 6.0, 11.0, 12.0, 15.0, 16.0, 13.0, 31.0, 25.0, 24.0, 41.0, 36.0, 45.0, 47.0, 49.0, 71.0, 57.0, 52.0, 59.0, 61.0, 45.0, 45.0, 54.0, 27.0, 25.0, 27.0, 28.0, 17.0, 19.0, 10.0, 8.0, 5.0, 8.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.1357421875, -1.1058578491210938, -1.0759735107421875, -1.0460891723632812, -1.016204833984375, -0.9863204956054688, -0.9564361572265625, -0.9265518188476562, -0.89666748046875, -0.8667831420898438, -0.8368988037109375, -0.8070144653320312, -0.777130126953125, -0.7472457885742188, -0.7173614501953125, -0.6874771118164062, -0.6575927734375, -0.6277084350585938, -0.5978240966796875, -0.5679397583007812, -0.538055419921875, -0.5081710815429688, -0.4782867431640625, -0.44840240478515625, -0.41851806640625, -0.38863372802734375, -0.3587493896484375, -0.32886505126953125, -0.298980712890625, -0.26909637451171875, -0.2392120361328125, -0.20932769775390625, -0.179443359375, -0.14955902099609375, -0.1196746826171875, -0.08979034423828125, -0.059906005859375, -0.03002166748046875, -0.0001373291015625, 0.02974700927734375, 0.05963134765625, 0.08951568603515625, 0.1194000244140625, 0.14928436279296875, 0.179168701171875, 0.20905303955078125, 0.2389373779296875, 0.26882171630859375, 0.2987060546875, 0.32859039306640625, 0.3584747314453125, 0.38835906982421875, 0.418243408203125, 0.44812774658203125, 0.4780120849609375, 0.5078964233398438, 0.53778076171875, 0.5676651000976562, 0.5975494384765625, 0.6274337768554688, 0.657318115234375, 0.6872024536132812, 0.7170867919921875, 0.7469711303710938, 0.77685546875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 8.0, 11.0, 10.0, 17.0, 26.0, 51.0, 67.0, 109.0, 169.0, 247.0, 406.0, 814.0, 1728.0, 4718.0, 18604.0, 134708.0, 730058.0, 130443.0, 17943.0, 4717.0, 1695.0, 823.0, 437.0, 251.0, 166.0, 121.0, 65.0, 29.0, 14.0, 29.0, 29.0, 12.0, 15.0, 2.0, 3.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.394775390625, -0.3813896179199219, -0.36800384521484375, -0.3546180725097656, -0.3412322998046875, -0.3278465270996094, -0.31446075439453125, -0.3010749816894531, -0.287689208984375, -0.2743034362792969, -0.26091766357421875, -0.24753189086914062, -0.2341461181640625, -0.22076034545898438, -0.20737457275390625, -0.19398880004882812, -0.18060302734375, -0.16721725463867188, -0.15383148193359375, -0.14044570922851562, -0.1270599365234375, -0.11367416381835938, -0.10028839111328125, -0.08690261840820312, -0.073516845703125, -0.060131072998046875, -0.04674530029296875, -0.033359527587890625, -0.0199737548828125, -0.006587982177734375, 0.00679779052734375, 0.020183563232421875, 0.0335693359375, 0.046955108642578125, 0.06034088134765625, 0.07372665405273438, 0.0871124267578125, 0.10049819946289062, 0.11388397216796875, 0.12726974487304688, 0.140655517578125, 0.15404129028320312, 0.16742706298828125, 0.18081283569335938, 0.1941986083984375, 0.20758438110351562, 0.22097015380859375, 0.23435592651367188, 0.24774169921875, 0.2611274719238281, 0.27451324462890625, 0.2878990173339844, 0.3012847900390625, 0.3146705627441406, 0.32805633544921875, 0.3414421081542969, 0.354827880859375, 0.3682136535644531, 0.38159942626953125, 0.3949851989746094, 0.4083709716796875, 0.4217567443847656, 0.43514251708984375, 0.4485282897949219, 0.4619140625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 8.0, 2.0, 9.0, 10.0, 16.0, 39.0, 45.0, 72.0, 96.0, 119.0, 150.0, 103.0, 102.0, 70.0, 45.0, 32.0, 35.0, 17.0, 9.0, 8.0, 3.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00010126829147338867, -9.826663881540298e-05, -9.52649861574173e-05, -9.226333349943161e-05, -8.926168084144592e-05, -8.626002818346024e-05, -8.325837552547455e-05, -8.025672286748886e-05, -7.725507020950317e-05, -7.425341755151749e-05, -7.12517648935318e-05, -6.825011223554611e-05, -6.524845957756042e-05, -6.224680691957474e-05, -5.924515426158905e-05, -5.624350160360336e-05, -5.3241848945617676e-05, -5.024019628763199e-05, -4.72385436296463e-05, -4.4236890971660614e-05, -4.123523831367493e-05, -3.823358565568924e-05, -3.523193299770355e-05, -3.2230280339717865e-05, -2.9228627681732178e-05, -2.622697502374649e-05, -2.3225322365760803e-05, -2.0223669707775116e-05, -1.722201704978943e-05, -1.4220364391803741e-05, -1.1218711733818054e-05, -8.217059075832367e-06, -5.21540641784668e-06, -2.2137537598609924e-06, 7.878988981246948e-07, 3.789551556110382e-06, 6.791204214096069e-06, 9.792856872081757e-06, 1.2794509530067444e-05, 1.579616218805313e-05, 1.879781484603882e-05, 2.1799467504024506e-05, 2.4801120162010193e-05, 2.780277281999588e-05, 3.080442547798157e-05, 3.3806078135967255e-05, 3.680773079395294e-05, 3.980938345193863e-05, 4.2811036109924316e-05, 4.5812688767910004e-05, 4.881434142589569e-05, 5.181599408388138e-05, 5.4817646741867065e-05, 5.781929939985275e-05, 6.082095205783844e-05, 6.382260471582413e-05, 6.682425737380981e-05, 6.98259100317955e-05, 7.282756268978119e-05, 7.582921534776688e-05, 7.883086800575256e-05, 8.183252066373825e-05, 8.483417332172394e-05, 8.783582597970963e-05, 9.083747863769531e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 3.0, 1.0, 3.0, 7.0, 13.0, 15.0, 25.0, 31.0, 39.0, 94.0, 103.0, 214.0, 372.0, 693.0, 1408.0, 3473.0, 12579.0, 80242.0, 712014.0, 205298.0, 22494.0, 5440.0, 1934.0, 938.0, 444.0, 268.0, 143.0, 87.0, 54.0, 38.0, 36.0, 16.0, 13.0, 8.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.455078125, -0.44024658203125, -0.4254150390625, -0.41058349609375, -0.395751953125, -0.38092041015625, -0.3660888671875, -0.35125732421875, -0.33642578125, -0.32159423828125, -0.3067626953125, -0.29193115234375, -0.277099609375, -0.26226806640625, -0.2474365234375, -0.23260498046875, -0.2177734375, -0.20294189453125, -0.1881103515625, -0.17327880859375, -0.158447265625, -0.14361572265625, -0.1287841796875, -0.11395263671875, -0.09912109375, -0.08428955078125, -0.0694580078125, -0.05462646484375, -0.039794921875, -0.02496337890625, -0.0101318359375, 0.00469970703125, 0.01953125, 0.03436279296875, 0.0491943359375, 0.06402587890625, 0.078857421875, 0.09368896484375, 0.1085205078125, 0.12335205078125, 0.13818359375, 0.15301513671875, 0.1678466796875, 0.18267822265625, 0.197509765625, 0.21234130859375, 0.2271728515625, 0.24200439453125, 0.2568359375, 0.27166748046875, 0.2864990234375, 0.30133056640625, 0.316162109375, 0.33099365234375, 0.3458251953125, 0.36065673828125, 0.37548828125, 0.39031982421875, 0.4051513671875, 0.41998291015625, 0.434814453125, 0.44964599609375, 0.4644775390625, 0.47930908203125, 0.494140625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 8.0, 11.0, 19.0, 25.0, 25.0, 61.0, 82.0, 103.0, 128.0, 132.0, 118.0, 92.0, 67.0, 45.0, 36.0, 17.0, 12.0, 11.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.460693359375, -0.4444541931152344, -0.42821502685546875, -0.4119758605957031, -0.3957366943359375, -0.3794975280761719, -0.36325836181640625, -0.3470191955566406, -0.330780029296875, -0.3145408630371094, -0.29830169677734375, -0.2820625305175781, -0.2658233642578125, -0.24958419799804688, -0.23334503173828125, -0.21710586547851562, -0.20086669921875, -0.18462753295898438, -0.16838836669921875, -0.15214920043945312, -0.1359100341796875, -0.11967086791992188, -0.10343170166015625, -0.08719253540039062, -0.070953369140625, -0.054714202880859375, -0.03847503662109375, -0.022235870361328125, -0.0059967041015625, 0.010242462158203125, 0.02648162841796875, 0.042720794677734375, 0.0589599609375, 0.07519912719726562, 0.09143829345703125, 0.10767745971679688, 0.1239166259765625, 0.14015579223632812, 0.15639495849609375, 0.17263412475585938, 0.188873291015625, 0.20511245727539062, 0.22135162353515625, 0.23759078979492188, 0.2538299560546875, 0.2700691223144531, 0.28630828857421875, 0.3025474548339844, 0.31878662109375, 0.3350257873535156, 0.35126495361328125, 0.3675041198730469, 0.3837432861328125, 0.3999824523925781, 0.41622161865234375, 0.4324607849121094, 0.448699951171875, 0.4649391174316406, 0.48117828369140625, 0.4974174499511719, 0.5136566162109375, 0.5298957824707031, 0.5461349487304688, 0.5623741149902344, 0.57861328125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 8.0, 20.0, 87.0, 272.0, 361.0, 193.0, 51.0, 14.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.31913423538208, -3.7977378368377686, -3.276341438293457, -2.7549452781677246, -2.233548879623413, -1.7121524810791016, -1.1907563209533691, -0.6693599224090576, -0.1479635238647461, 0.37343281507492065, 0.8948291540145874, 1.4162254333496094, 1.937621831893921, 2.4590182304382324, 2.980414390563965, 3.5018107891082764, 4.023207187652588, 4.54460334777832, 5.065999984741211, 5.587396144866943, 6.108792304992676, 6.630188941955566, 7.151585102081299, 7.672981262207031, 8.194377899169922, 8.715774536132812, 9.237170219421387, 9.758566856384277, 10.279963493347168, 10.801359176635742, 11.322755813598633, 11.844152450561523, 12.365547180175781, 12.886943817138672, 13.408339500427246, 13.929736137390137, 14.451132774353027, 14.972528457641602, 15.493925094604492, 16.015321731567383, 16.536718368530273, 17.058115005493164, 17.579511642456055, 18.100906372070312, 18.622303009033203, 19.143699645996094, 19.665096282958984, 20.186492919921875, 20.707889556884766, 21.229286193847656, 21.750682830810547, 22.272079467773438, 22.793474197387695, 23.314870834350586, 23.836267471313477, 24.357664108276367, 24.879058837890625, 25.400455474853516, 25.921852111816406, 26.443248748779297, 26.964643478393555, 27.486040115356445, 28.007436752319336, 28.528833389282227, 29.050230026245117]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 8.0, 4.0, 8.0, 8.0, 17.0, 17.0, 26.0, 18.0, 30.0, 27.0, 28.0, 45.0, 39.0, 70.0, 54.0, 52.0, 60.0, 60.0, 44.0, 55.0, 48.0, 40.0, 38.0, 31.0, 32.0, 27.0, 20.0, 19.0, 16.0, 12.0, 14.0, 8.0, 5.0, 3.0, 7.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-5.067383766174316, -4.918712615966797, -4.770041465759277, -4.621370315551758, -4.472699165344238, -4.3240275382995605, -4.175356388092041, -4.0266852378845215, -3.878014087677002, -3.7293429374694824, -3.580671787261963, -3.4320003986358643, -3.2833292484283447, -3.134658098220825, -2.9859867095947266, -2.837315559387207, -2.6886444091796875, -2.539973258972168, -2.3913021087646484, -2.24263072013855, -2.0939595699310303, -1.9452884197235107, -1.7966171503067017, -1.6479458808898926, -1.499274730682373, -1.3506035804748535, -1.2019323110580444, -1.0532610416412354, -0.9045898914337158, -0.7559186816215515, -0.6072474718093872, -0.4585762023925781, -0.3099050521850586, -0.1612338423728943, -0.01256263256072998, 0.13610857725143433, 0.28477978706359863, 0.43345099687576294, 0.5821222066879272, 0.7307934761047363, 0.8794646263122559, 1.0281357765197754, 1.1768070459365845, 1.3254783153533936, 1.474149465560913, 1.6228206157684326, 1.7714918851852417, 1.9201631546020508, 2.0688343048095703, 2.21750545501709, 2.3661766052246094, 2.514847993850708, 2.6635191440582275, 2.812190294265747, 2.9608616828918457, 3.1095328330993652, 3.2582039833068848, 3.4068751335144043, 3.555546283721924, 3.7042176723480225, 3.852888822555542, 4.001560211181641, 4.15023136138916, 4.29890251159668, 4.447573661804199]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 7.0, 10.0, 10.0, 7.0, 19.0, 23.0, 37.0, 36.0, 64.0, 123.0, 151.0, 245.0, 433.0, 739.0, 1639.0, 4853.0, 44110.0, 4126263.0, 10418.0, 2590.0, 1060.0, 527.0, 310.0, 194.0, 115.0, 88.0, 64.0, 50.0, 31.0, 25.0, 17.0, 14.0, 5.0, 6.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2314453125, -1.1907196044921875, -1.149993896484375, -1.1092681884765625, -1.06854248046875, -1.0278167724609375, -0.987091064453125, -0.9463653564453125, -0.9056396484375, -0.8649139404296875, -0.824188232421875, -0.7834625244140625, -0.74273681640625, -0.7020111083984375, -0.661285400390625, -0.6205596923828125, -0.579833984375, -0.5391082763671875, -0.498382568359375, -0.4576568603515625, -0.41693115234375, -0.3762054443359375, -0.335479736328125, -0.2947540283203125, -0.2540283203125, -0.2133026123046875, -0.172576904296875, -0.1318511962890625, -0.09112548828125, -0.0503997802734375, -0.009674072265625, 0.0310516357421875, 0.07177734375, 0.1125030517578125, 0.153228759765625, 0.1939544677734375, 0.23468017578125, 0.2754058837890625, 0.316131591796875, 0.3568572998046875, 0.3975830078125, 0.4383087158203125, 0.479034423828125, 0.5197601318359375, 0.56048583984375, 0.6012115478515625, 0.641937255859375, 0.6826629638671875, 0.723388671875, 0.7641143798828125, 0.804840087890625, 0.8455657958984375, 0.88629150390625, 0.9270172119140625, 0.967742919921875, 1.0084686279296875, 1.0491943359375, 1.0899200439453125, 1.130645751953125, 1.1713714599609375, 1.21209716796875, 1.2528228759765625, 1.293548583984375, 1.3342742919921875, 1.375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 1.0, 5.0, 2.0, 7.0, 1.0, 5.0, 6.0, 8.0, 20.0, 14.0, 18.0, 17.0, 33.0, 28.0, 40.0, 32.0, 53.0, 43.0, 62.0, 61.0, 64.0, 48.0, 45.0, 61.0, 52.0, 48.0, 51.0, 36.0, 27.0, 25.0, 22.0, 14.0, 12.0, 10.0, 6.0, 12.0, 5.0, 4.0, 4.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.20703125, -0.2007007598876953, -0.19437026977539062, -0.18803977966308594, -0.18170928955078125, -0.17537879943847656, -0.16904830932617188, -0.1627178192138672, -0.1563873291015625, -0.1500568389892578, -0.14372634887695312, -0.13739585876464844, -0.13106536865234375, -0.12473487854003906, -0.11840438842773438, -0.11207389831542969, -0.105743408203125, -0.09941291809082031, -0.09308242797851562, -0.08675193786621094, -0.08042144775390625, -0.07409095764160156, -0.06776046752929688, -0.06142997741699219, -0.0550994873046875, -0.04876899719238281, -0.042438507080078125, -0.03610801696777344, -0.02977752685546875, -0.023447036743164062, -0.017116546630859375, -0.010786056518554688, -0.00445556640625, 0.0018749237060546875, 0.008205413818359375, 0.014535903930664062, 0.02086639404296875, 0.027196884155273438, 0.033527374267578125, 0.03985786437988281, 0.0461883544921875, 0.05251884460449219, 0.058849334716796875, 0.06517982482910156, 0.07151031494140625, 0.07784080505371094, 0.08417129516601562, 0.09050178527832031, 0.096832275390625, 0.10316276550292969, 0.10949325561523438, 0.11582374572753906, 0.12215423583984375, 0.12848472595214844, 0.13481521606445312, 0.1411457061767578, 0.1474761962890625, 0.1538066864013672, 0.16013717651367188, 0.16646766662597656, 0.17279815673828125, 0.17912864685058594, 0.18545913696289062, 0.1917896270751953, 0.1981201171875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 6.0, 13.0, 24.0, 13.0, 39.0, 44.0, 68.0, 132.0, 154.0, 257.0, 360.0, 552.0, 869.0, 1260.0, 2133.0, 3649.0, 7864.0, 30385.0, 4072336.0, 53173.0, 10068.0, 4238.0, 2381.0, 1428.0, 942.0, 610.0, 452.0, 279.0, 173.0, 116.0, 101.0, 60.0, 30.0, 29.0, 13.0, 14.0, 7.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.0625, -1.0326690673828125, -1.002838134765625, -0.9730072021484375, -0.94317626953125, -0.9133453369140625, -0.883514404296875, -0.8536834716796875, -0.8238525390625, -0.7940216064453125, -0.764190673828125, -0.7343597412109375, -0.70452880859375, -0.6746978759765625, -0.644866943359375, -0.6150360107421875, -0.585205078125, -0.5553741455078125, -0.525543212890625, -0.4957122802734375, -0.46588134765625, -0.4360504150390625, -0.406219482421875, -0.3763885498046875, -0.3465576171875, -0.3167266845703125, -0.286895751953125, -0.2570648193359375, -0.22723388671875, -0.1974029541015625, -0.167572021484375, -0.1377410888671875, -0.10791015625, -0.0780792236328125, -0.048248291015625, -0.0184173583984375, 0.01141357421875, 0.0412445068359375, 0.071075439453125, 0.1009063720703125, 0.1307373046875, 0.1605682373046875, 0.190399169921875, 0.2202301025390625, 0.25006103515625, 0.2798919677734375, 0.309722900390625, 0.3395538330078125, 0.369384765625, 0.3992156982421875, 0.429046630859375, 0.4588775634765625, 0.48870849609375, 0.5185394287109375, 0.548370361328125, 0.5782012939453125, 0.6080322265625, 0.6378631591796875, 0.667694091796875, 0.6975250244140625, 0.72735595703125, 0.7571868896484375, 0.787017822265625, 0.8168487548828125, 0.8466796875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 6.0, 4.0, 5.0, 10.0, 25.0, 29.0, 222.0, 3597.0, 79.0, 32.0, 15.0, 16.0, 4.0, 7.0, 1.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.248779296875, -0.24190711975097656, -0.23503494262695312, -0.2281627655029297, -0.22129058837890625, -0.2144184112548828, -0.20754623413085938, -0.20067405700683594, -0.1938018798828125, -0.18692970275878906, -0.18005752563476562, -0.1731853485107422, -0.16631317138671875, -0.1594409942626953, -0.15256881713867188, -0.14569664001464844, -0.138824462890625, -0.13195228576660156, -0.12508010864257812, -0.11820793151855469, -0.11133575439453125, -0.10446357727050781, -0.09759140014648438, -0.09071922302246094, -0.0838470458984375, -0.07697486877441406, -0.07010269165039062, -0.06323051452636719, -0.05635833740234375, -0.04948616027832031, -0.042613983154296875, -0.03574180603027344, -0.02886962890625, -0.021997451782226562, -0.015125274658203125, -0.008253097534179688, -0.00138092041015625, 0.0054912567138671875, 0.012363433837890625, 0.019235610961914062, 0.0261077880859375, 0.03297996520996094, 0.039852142333984375, 0.04672431945800781, 0.05359649658203125, 0.06046867370605469, 0.06734085083007812, 0.07421302795410156, 0.081085205078125, 0.08795738220214844, 0.09482955932617188, 0.10170173645019531, 0.10857391357421875, 0.11544609069824219, 0.12231826782226562, 0.12919044494628906, 0.1360626220703125, 0.14293479919433594, 0.14980697631835938, 0.1566791534423828, 0.16355133056640625, 0.1704235076904297, 0.17729568481445312, 0.18416786193847656, 0.1910400390625]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 4.0, 8.0, 12.0, 25.0, 23.0, 33.0, 53.0, 70.0, 71.0, 96.0, 114.0, 121.0, 84.0, 80.0, 68.0, 47.0, 34.0, 27.0, 9.0, 4.0, 4.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6498937010765076, -0.624650239944458, -0.5994067788124084, -0.5741633176803589, -0.5489199161529541, -0.5236764550209045, -0.498432993888855, -0.4731895327568054, -0.44794610142707825, -0.4227026402950287, -0.3974592089653015, -0.37221574783325195, -0.3469722867012024, -0.3217288553714752, -0.29648539423942566, -0.2712419629096985, -0.24599850177764893, -0.22075505554676056, -0.1955116093158722, -0.17026814818382263, -0.14502470195293427, -0.1197812557220459, -0.09453779458999634, -0.06929434835910797, -0.044050902128219604, -0.01880745217204094, 0.006435997784137726, 0.03167945146560669, 0.056922897696495056, 0.08216634392738342, 0.10740980505943298, 0.13265325129032135, 0.15789663791656494, 0.1831400841474533, 0.20838353037834167, 0.23362699151039124, 0.2588704228401184, 0.28411388397216797, 0.30935734510421753, 0.3346008062362671, 0.35984423756599426, 0.3850876986980438, 0.410331130027771, 0.43557459115982056, 0.4608180522918701, 0.4860614836215973, 0.5113049745559692, 0.536548376083374, 0.5617918372154236, 0.5870352983474731, 0.6122787594795227, 0.6375222206115723, 0.662765622138977, 0.6880090832710266, 0.7132525444030762, 0.7384960055351257, 0.7637394666671753, 0.7889829277992249, 0.8142263889312744, 0.8394697904586792, 0.8647132515907288, 0.8899567127227783, 0.9152001738548279, 0.9404436349868774, 0.9656870365142822]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 4.0, 3.0, 4.0, 4.0, 8.0, 4.0, 16.0, 19.0, 13.0, 9.0, 13.0, 13.0, 24.0, 23.0, 23.0, 17.0, 33.0, 43.0, 33.0, 36.0, 34.0, 40.0, 37.0, 49.0, 41.0, 39.0, 38.0, 27.0, 33.0, 33.0, 38.0, 33.0, 34.0, 25.0, 19.0, 22.0, 15.0, 20.0, 13.0, 11.0, 12.0, 13.0, 7.0, 8.0, 5.0, 7.0, 1.0, 6.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.3959835171699524, -0.38427460193634033, -0.37256571650505066, -0.360856831073761, -0.3491479158401489, -0.33743900060653687, -0.3257301151752472, -0.3140212297439575, -0.30231231451034546, -0.2906033992767334, -0.2788945138454437, -0.26718562841415405, -0.255476713180542, -0.24376781284809113, -0.23205891251564026, -0.2203500121831894, -0.20864111185073853, -0.19693221151828766, -0.1852233111858368, -0.17351441085338593, -0.16180551052093506, -0.1500966101884842, -0.13838770985603333, -0.12667880952358246, -0.11496990919113159, -0.10326100885868073, -0.09155210852622986, -0.07984320819377899, -0.06813430786132812, -0.05642540752887726, -0.04471650719642639, -0.033007606863975525, -0.021298706531524658, -0.009589806199073792, 0.002119094133377075, 0.013827994465827942, 0.02553689479827881, 0.037245795130729675, 0.04895469546318054, 0.06066359579563141, 0.07237249612808228, 0.08408139646053314, 0.09579029679298401, 0.10749919712543488, 0.11920809745788574, 0.1309169977903366, 0.14262589812278748, 0.15433479845523834, 0.1660436987876892, 0.17775259912014008, 0.18946149945259094, 0.2011703997850418, 0.21287930011749268, 0.22458820044994354, 0.2362971007823944, 0.24800600111484528, 0.25971490144729614, 0.2714238166809082, 0.2831327021121979, 0.29484158754348755, 0.3065505027770996, 0.31825941801071167, 0.32996830344200134, 0.341677188873291, 0.3533861041069031]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 5.0, 4.0, 4.0, 12.0, 6.0, 13.0, 18.0, 22.0, 24.0, 35.0, 51.0, 73.0, 95.0, 160.0, 235.0, 354.0, 612.0, 1013.0, 1840.0, 3624.0, 7221.0, 16232.0, 39815.0, 103427.0, 267419.0, 350156.0, 153904.0, 58530.0, 23257.0, 9990.0, 4711.0, 2399.0, 1292.0, 730.0, 441.0, 273.0, 183.0, 107.0, 76.0, 56.0, 40.0, 30.0, 22.0, 15.0, 10.0, 7.0, 7.0, 4.0, 6.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.363525390625, -0.35257720947265625, -0.3416290283203125, -0.33068084716796875, -0.319732666015625, -0.30878448486328125, -0.2978363037109375, -0.28688812255859375, -0.27593994140625, -0.26499176025390625, -0.2540435791015625, -0.24309539794921875, -0.232147216796875, -0.22119903564453125, -0.2102508544921875, -0.19930267333984375, -0.1883544921875, -0.17740631103515625, -0.1664581298828125, -0.15550994873046875, -0.144561767578125, -0.13361358642578125, -0.1226654052734375, -0.11171722412109375, -0.10076904296875, -0.08982086181640625, -0.0788726806640625, -0.06792449951171875, -0.056976318359375, -0.04602813720703125, -0.0350799560546875, -0.02413177490234375, -0.01318359375, -0.00223541259765625, 0.0087127685546875, 0.01966094970703125, 0.030609130859375, 0.04155731201171875, 0.0525054931640625, 0.06345367431640625, 0.07440185546875, 0.08535003662109375, 0.0962982177734375, 0.10724639892578125, 0.118194580078125, 0.12914276123046875, 0.1400909423828125, 0.15103912353515625, 0.1619873046875, 0.17293548583984375, 0.1838836669921875, 0.19483184814453125, 0.205780029296875, 0.21672821044921875, 0.2276763916015625, 0.23862457275390625, 0.24957275390625, 0.26052093505859375, 0.2714691162109375, 0.28241729736328125, 0.293365478515625, 0.30431365966796875, 0.3152618408203125, 0.32621002197265625, 0.337158203125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 6.0, 2.0, 5.0, 5.0, 5.0, 6.0, 10.0, 12.0, 11.0, 12.0, 12.0, 15.0, 21.0, 23.0, 27.0, 33.0, 28.0, 31.0, 32.0, 54.0, 58.0, 46.0, 45.0, 38.0, 58.0, 46.0, 42.0, 47.0, 41.0, 32.0, 29.0, 29.0, 20.0, 21.0, 16.0, 13.0, 13.0, 12.0, 14.0, 5.0, 11.0, 6.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1837158203125, -0.17815017700195312, -0.17258453369140625, -0.16701889038085938, -0.1614532470703125, -0.15588760375976562, -0.15032196044921875, -0.14475631713867188, -0.139190673828125, -0.13362503051757812, -0.12805938720703125, -0.12249374389648438, -0.1169281005859375, -0.11136245727539062, -0.10579681396484375, -0.10023117065429688, -0.09466552734375, -0.08909988403320312, -0.08353424072265625, -0.07796859741210938, -0.0724029541015625, -0.06683731079101562, -0.06127166748046875, -0.055706024169921875, -0.050140380859375, -0.044574737548828125, -0.03900909423828125, -0.033443450927734375, -0.0278778076171875, -0.022312164306640625, -0.01674652099609375, -0.011180877685546875, -0.005615234375, -4.9591064453125e-05, 0.00551605224609375, 0.011081695556640625, 0.0166473388671875, 0.022212982177734375, 0.02777862548828125, 0.033344268798828125, 0.038909912109375, 0.044475555419921875, 0.05004119873046875, 0.055606842041015625, 0.0611724853515625, 0.06673812866210938, 0.07230377197265625, 0.07786941528320312, 0.08343505859375, 0.08900070190429688, 0.09456634521484375, 0.10013198852539062, 0.1056976318359375, 0.11126327514648438, 0.11682891845703125, 0.12239456176757812, 0.127960205078125, 0.13352584838867188, 0.13909149169921875, 0.14465713500976562, 0.1502227783203125, 0.15578842163085938, 0.16135406494140625, 0.16691970825195312, 0.1724853515625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 3.0, 6.0, 6.0, 8.0, 7.0, 8.0, 9.0, 22.0, 25.0, 29.0, 39.0, 49.0, 96.0, 102.0, 194.0, 288.0, 450.0, 731.0, 1457.0, 3450.0, 10922.0, 56817.0, 546957.0, 371302.0, 40953.0, 8539.0, 2812.0, 1307.0, 662.0, 457.0, 267.0, 163.0, 117.0, 74.0, 68.0, 37.0, 24.0, 23.0, 11.0, 11.0, 17.0, 10.0, 5.0, 9.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 4.0], "bins": [-0.5830078125, -0.56414794921875, -0.5452880859375, -0.52642822265625, -0.507568359375, -0.48870849609375, -0.4698486328125, -0.45098876953125, -0.43212890625, -0.41326904296875, -0.3944091796875, -0.37554931640625, -0.356689453125, -0.33782958984375, -0.3189697265625, -0.30010986328125, -0.28125, -0.26239013671875, -0.2435302734375, -0.22467041015625, -0.205810546875, -0.18695068359375, -0.1680908203125, -0.14923095703125, -0.13037109375, -0.11151123046875, -0.0926513671875, -0.07379150390625, -0.054931640625, -0.03607177734375, -0.0172119140625, 0.00164794921875, 0.0205078125, 0.03936767578125, 0.0582275390625, 0.07708740234375, 0.095947265625, 0.11480712890625, 0.1336669921875, 0.15252685546875, 0.17138671875, 0.19024658203125, 0.2091064453125, 0.22796630859375, 0.246826171875, 0.26568603515625, 0.2845458984375, 0.30340576171875, 0.322265625, 0.34112548828125, 0.3599853515625, 0.37884521484375, 0.397705078125, 0.41656494140625, 0.4354248046875, 0.45428466796875, 0.47314453125, 0.49200439453125, 0.5108642578125, 0.52972412109375, 0.548583984375, 0.56744384765625, 0.5863037109375, 0.60516357421875, 0.6240234375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 7.0, 4.0, 4.0, 10.0, 13.0, 14.0, 10.0, 18.0, 21.0, 24.0, 24.0, 42.0, 40.0, 42.0, 36.0, 49.0, 38.0, 49.0, 42.0, 51.0, 53.0, 53.0, 42.0, 32.0, 38.0, 32.0, 42.0, 31.0, 24.0, 25.0, 13.0, 18.0, 14.0, 11.0, 6.0, 10.0, 5.0, 4.0, 5.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.837890625, -0.8110275268554688, -0.7841644287109375, -0.7573013305664062, -0.730438232421875, -0.7035751342773438, -0.6767120361328125, -0.6498489379882812, -0.62298583984375, -0.5961227416992188, -0.5692596435546875, -0.5423965454101562, -0.515533447265625, -0.48867034912109375, -0.4618072509765625, -0.43494415283203125, -0.4080810546875, -0.38121795654296875, -0.3543548583984375, -0.32749176025390625, -0.300628662109375, -0.27376556396484375, -0.2469024658203125, -0.22003936767578125, -0.19317626953125, -0.16631317138671875, -0.1394500732421875, -0.11258697509765625, -0.085723876953125, -0.05886077880859375, -0.0319976806640625, -0.00513458251953125, 0.021728515625, 0.04859161376953125, 0.0754547119140625, 0.10231781005859375, 0.129180908203125, 0.15604400634765625, 0.1829071044921875, 0.20977020263671875, 0.23663330078125, 0.26349639892578125, 0.2903594970703125, 0.31722259521484375, 0.344085693359375, 0.37094879150390625, 0.3978118896484375, 0.42467498779296875, 0.4515380859375, 0.47840118408203125, 0.5052642822265625, 0.5321273803710938, 0.558990478515625, 0.5858535766601562, 0.6127166748046875, 0.6395797729492188, 0.66644287109375, 0.6933059692382812, 0.7201690673828125, 0.7470321655273438, 0.773895263671875, 0.8007583618164062, 0.8276214599609375, 0.8544845581054688, 0.88134765625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 2.0, 5.0, 9.0, 10.0, 13.0, 26.0, 41.0, 93.0, 134.0, 316.0, 889.0, 3959.0, 48595.0, 967921.0, 22551.0, 2726.0, 673.0, 273.0, 126.0, 75.0, 39.0, 26.0, 10.0, 15.0, 9.0, 4.0, 6.0, 1.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-1.4541015625, -1.4180984497070312, -1.3820953369140625, -1.3460922241210938, -1.310089111328125, -1.2740859985351562, -1.2380828857421875, -1.2020797729492188, -1.16607666015625, -1.1300735473632812, -1.0940704345703125, -1.0580673217773438, -1.022064208984375, -0.9860610961914062, -0.9500579833984375, -0.9140548706054688, -0.8780517578125, -0.8420486450195312, -0.8060455322265625, -0.7700424194335938, -0.734039306640625, -0.6980361938476562, -0.6620330810546875, -0.6260299682617188, -0.59002685546875, -0.5540237426757812, -0.5180206298828125, -0.48201751708984375, -0.446014404296875, -0.41001129150390625, -0.3740081787109375, -0.33800506591796875, -0.302001953125, -0.26599884033203125, -0.2299957275390625, -0.19399261474609375, -0.157989501953125, -0.12198638916015625, -0.0859832763671875, -0.04998016357421875, -0.01397705078125, 0.02202606201171875, 0.0580291748046875, 0.09403228759765625, 0.130035400390625, 0.16603851318359375, 0.2020416259765625, 0.23804473876953125, 0.2740478515625, 0.31005096435546875, 0.3460540771484375, 0.38205718994140625, 0.418060302734375, 0.45406341552734375, 0.4900665283203125, 0.5260696411132812, 0.56207275390625, 0.5980758666992188, 0.6340789794921875, 0.6700820922851562, 0.706085205078125, 0.7420883178710938, 0.7780914306640625, 0.8140945434570312, 0.85009765625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 11.0, 15.0, 27.0, 45.0, 68.0, 132.0, 161.0, 192.0, 138.0, 86.0, 51.0, 32.0, 24.0, 10.0, 5.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014579296112060547, -0.00014187581837177277, -0.00013795867562294006, -0.00013404153287410736, -0.00013012439012527466, -0.00012620724737644196, -0.00012229010462760925, -0.00011837296187877655, -0.00011445581912994385, -0.00011053867638111115, -0.00010662153363227844, -0.00010270439088344574, -9.878724813461304e-05, -9.487010538578033e-05, -9.095296263694763e-05, -8.703581988811493e-05, -8.311867713928223e-05, -7.920153439044952e-05, -7.528439164161682e-05, -7.136724889278412e-05, -6.745010614395142e-05, -6.353296339511871e-05, -5.961582064628601e-05, -5.569867789745331e-05, -5.1781535148620605e-05, -4.78643923997879e-05, -4.39472496509552e-05, -4.00301069021225e-05, -3.6112964153289795e-05, -3.219582140445709e-05, -2.827867865562439e-05, -2.4361535906791687e-05, -2.0444393157958984e-05, -1.6527250409126282e-05, -1.2610107660293579e-05, -8.692964911460876e-06, -4.775822162628174e-06, -8.586794137954712e-07, 3.0584633350372314e-06, 6.975606083869934e-06, 1.0892748832702637e-05, 1.480989158153534e-05, 1.8727034330368042e-05, 2.2644177079200745e-05, 2.6561319828033447e-05, 3.047846257686615e-05, 3.439560532569885e-05, 3.8312748074531555e-05, 4.222989082336426e-05, 4.614703357219696e-05, 5.006417632102966e-05, 5.3981319069862366e-05, 5.789846181869507e-05, 6.181560456752777e-05, 6.573274731636047e-05, 6.964989006519318e-05, 7.356703281402588e-05, 7.748417556285858e-05, 8.140131831169128e-05, 8.531846106052399e-05, 8.923560380935669e-05, 9.315274655818939e-05, 9.70698893070221e-05, 0.0001009870320558548, 0.0001049041748046875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 5.0, 8.0, 12.0, 27.0, 36.0, 59.0, 113.0, 185.0, 384.0, 1074.0, 4561.0, 54405.0, 946373.0, 35794.0, 3795.0, 946.0, 370.0, 165.0, 101.0, 47.0, 32.0, 17.0, 17.0, 10.0, 6.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.1748046875, -1.1416549682617188, -1.1085052490234375, -1.0753555297851562, -1.042205810546875, -1.0090560913085938, -0.9759063720703125, -0.9427566528320312, -0.90960693359375, -0.8764572143554688, -0.8433074951171875, -0.8101577758789062, -0.777008056640625, -0.7438583374023438, -0.7107086181640625, -0.6775588989257812, -0.6444091796875, -0.6112594604492188, -0.5781097412109375, -0.5449600219726562, -0.511810302734375, -0.47866058349609375, -0.4455108642578125, -0.41236114501953125, -0.37921142578125, -0.34606170654296875, -0.3129119873046875, -0.27976226806640625, -0.246612548828125, -0.21346282958984375, -0.1803131103515625, -0.14716339111328125, -0.114013671875, -0.08086395263671875, -0.0477142333984375, -0.01456451416015625, 0.018585205078125, 0.05173492431640625, 0.0848846435546875, 0.11803436279296875, 0.15118408203125, 0.18433380126953125, 0.2174835205078125, 0.25063323974609375, 0.283782958984375, 0.31693267822265625, 0.3500823974609375, 0.38323211669921875, 0.4163818359375, 0.44953155517578125, 0.4826812744140625, 0.5158309936523438, 0.548980712890625, 0.5821304321289062, 0.6152801513671875, 0.6484298706054688, 0.68157958984375, 0.7147293090820312, 0.7478790283203125, 0.7810287475585938, 0.814178466796875, 0.8473281860351562, 0.8804779052734375, 0.9136276245117188, 0.94677734375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 2.0, 4.0, 7.0, 5.0, 17.0, 12.0, 32.0, 50.0, 96.0, 174.0, 210.0, 175.0, 90.0, 59.0, 19.0, 17.0, 9.0, 3.0, 9.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60498046875, -0.5792770385742188, -0.5535736083984375, -0.5278701782226562, -0.502166748046875, -0.47646331787109375, -0.4507598876953125, -0.42505645751953125, -0.39935302734375, -0.37364959716796875, -0.3479461669921875, -0.32224273681640625, -0.296539306640625, -0.27083587646484375, -0.2451324462890625, -0.21942901611328125, -0.1937255859375, -0.16802215576171875, -0.1423187255859375, -0.11661529541015625, -0.090911865234375, -0.06520843505859375, -0.0395050048828125, -0.01380157470703125, 0.01190185546875, 0.03760528564453125, 0.0633087158203125, 0.08901214599609375, 0.114715576171875, 0.14041900634765625, 0.1661224365234375, 0.19182586669921875, 0.217529296875, 0.24323272705078125, 0.2689361572265625, 0.29463958740234375, 0.320343017578125, 0.34604644775390625, 0.3717498779296875, 0.39745330810546875, 0.42315673828125, 0.44886016845703125, 0.4745635986328125, 0.5002670288085938, 0.525970458984375, 0.5516738891601562, 0.5773773193359375, 0.6030807495117188, 0.6287841796875, 0.6544876098632812, 0.6801910400390625, 0.7058944702148438, 0.731597900390625, 0.7573013305664062, 0.7830047607421875, 0.8087081909179688, 0.83441162109375, 0.8601150512695312, 0.8858184814453125, 0.9115219116210938, 0.937225341796875, 0.9629287719726562, 0.9886322021484375, 1.0143356323242188, 1.0400390625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 2.0, 3.0, 5.0, 16.0, 30.0, 59.0, 96.0, 188.0, 247.0, 160.0, 92.0, 51.0, 23.0, 13.0, 4.0, 5.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.260588645935059, -11.970691680908203, -11.680793762207031, -11.390896797180176, -11.10099983215332, -10.811101913452148, -10.521204948425293, -10.231307983398438, -9.941410064697266, -9.65151309967041, -9.361615180969238, -9.071718215942383, -8.781820297241211, -8.491923332214355, -8.2020263671875, -7.912128925323486, -7.622231483459473, -7.332334041595459, -7.042436599731445, -6.75253963470459, -6.462642192840576, -6.1727447509765625, -5.882847785949707, -5.592950344085693, -5.30305290222168, -5.013155460357666, -4.723258018493652, -4.433361053466797, -4.143463611602783, -3.8535661697387695, -3.563668966293335, -3.2737717628479004, -2.9838733673095703, -2.6939759254455566, -2.404078722000122, -2.1141815185546875, -1.8242840766906738, -1.5343867540359497, -1.2444894313812256, -0.954592227935791, -0.6646947860717773, -0.3747974634170532, -0.0849001407623291, 0.20499718189239502, 0.49489450454711914, 0.7847918272018433, 1.0746891498565674, 1.364586353302002, 1.6544837951660156, 1.9443811178207397, 2.234278440475464, 2.5241756439208984, 2.814073085784912, 3.103970527648926, 3.3938677310943604, 3.683764934539795, 3.9736623764038086, 4.263559818267822, 4.553457260131836, 4.843354225158691, 5.133251667022705, 5.423149108886719, 5.713046073913574, 6.002943515777588, 6.292840957641602]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 3.0, 5.0, 7.0, 10.0, 5.0, 12.0, 11.0, 14.0, 22.0, 22.0, 25.0, 28.0, 24.0, 38.0, 37.0, 36.0, 49.0, 44.0, 44.0, 50.0, 43.0, 54.0, 47.0, 49.0, 36.0, 37.0, 44.0, 24.0, 28.0, 21.0, 24.0, 20.0, 19.0, 16.0, 16.0, 6.0, 7.0, 10.0, 4.0, 5.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.166521072387695, -4.029800891876221, -3.893080949783325, -3.7563610076904297, -3.619640827178955, -3.4829208850860596, -3.346200942993164, -3.2094807624816895, -3.072760581970215, -2.9360406398773193, -2.7993204593658447, -2.662600517272949, -2.5258803367614746, -2.389160394668579, -2.2524404525756836, -2.115720272064209, -1.9790003299713135, -1.8422802686691284, -1.7055602073669434, -1.5688402652740479, -1.4321200847625732, -1.2954001426696777, -1.1586800813674927, -1.0219600200653076, -0.8852399587631226, -0.7485198974609375, -0.6117998361587524, -0.47507983446121216, -0.3383597731590271, -0.20163971185684204, -0.06491971015930176, 0.0718003511428833, 0.20852041244506836, 0.3452404737472534, 0.4819605052471161, 0.6186805367469788, 0.7554005980491638, 0.8921206593513489, 1.0288406610488892, 1.1655607223510742, 1.3022807836532593, 1.4390008449554443, 1.5757209062576294, 1.7124409675598145, 1.84916090965271, 1.9858810901641846, 2.12260103225708, 2.2593212127685547, 2.39604115486145, 2.5327610969543457, 2.6694812774658203, 2.806201219558716, 2.9429214000701904, 3.079641342163086, 3.2163615226745605, 3.353081464767456, 3.4898014068603516, 3.626521348953247, 3.7632415294647217, 3.899961471557617, 4.036681652069092, 4.173401832580566, 4.310121536254883, 4.446841716766357, 4.583561897277832]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 4.0, 6.0, 5.0, 16.0, 16.0, 29.0, 65.0, 72.0, 102.0, 169.0, 297.0, 475.0, 850.0, 1513.0, 3107.0, 6960.0, 22890.0, 3744290.0, 380744.0, 19848.0, 6531.0, 2931.0, 1427.0, 781.0, 455.0, 269.0, 157.0, 107.0, 46.0, 36.0, 21.0, 18.0, 18.0, 7.0, 7.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.71728515625, -0.691619873046875, -0.66595458984375, -0.640289306640625, -0.6146240234375, -0.588958740234375, -0.56329345703125, -0.537628173828125, -0.511962890625, -0.486297607421875, -0.46063232421875, -0.434967041015625, -0.4093017578125, -0.383636474609375, -0.35797119140625, -0.332305908203125, -0.306640625, -0.280975341796875, -0.25531005859375, -0.229644775390625, -0.2039794921875, -0.178314208984375, -0.15264892578125, -0.126983642578125, -0.101318359375, -0.075653076171875, -0.04998779296875, -0.024322509765625, 0.0013427734375, 0.027008056640625, 0.05267333984375, 0.078338623046875, 0.10400390625, 0.129669189453125, 0.15533447265625, 0.180999755859375, 0.2066650390625, 0.232330322265625, 0.25799560546875, 0.283660888671875, 0.309326171875, 0.334991455078125, 0.36065673828125, 0.386322021484375, 0.4119873046875, 0.437652587890625, 0.46331787109375, 0.488983154296875, 0.5146484375, 0.540313720703125, 0.56597900390625, 0.591644287109375, 0.6173095703125, 0.642974853515625, 0.66864013671875, 0.694305419921875, 0.719970703125, 0.745635986328125, 0.77130126953125, 0.796966552734375, 0.8226318359375, 0.848297119140625, 0.87396240234375, 0.899627685546875, 0.92529296875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 6.0, 2.0, 3.0, 7.0, 10.0, 8.0, 18.0, 16.0, 23.0, 30.0, 32.0, 36.0, 31.0, 48.0, 48.0, 55.0, 52.0, 57.0, 69.0, 59.0, 66.0, 65.0, 40.0, 50.0, 46.0, 24.0, 22.0, 22.0, 13.0, 7.0, 13.0, 7.0, 6.0, 4.0, 3.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.21484375, -0.20786666870117188, -0.20088958740234375, -0.19391250610351562, -0.1869354248046875, -0.17995834350585938, -0.17298126220703125, -0.16600418090820312, -0.159027099609375, -0.15205001831054688, -0.14507293701171875, -0.13809585571289062, -0.1311187744140625, -0.12414169311523438, -0.11716461181640625, -0.11018753051757812, -0.10321044921875, -0.09623336791992188, -0.08925628662109375, -0.08227920532226562, -0.0753021240234375, -0.06832504272460938, -0.06134796142578125, -0.054370880126953125, -0.047393798828125, -0.040416717529296875, -0.03343963623046875, -0.026462554931640625, -0.0194854736328125, -0.012508392333984375, -0.00553131103515625, 0.001445770263671875, 0.0084228515625, 0.015399932861328125, 0.02237701416015625, 0.029354095458984375, 0.0363311767578125, 0.043308258056640625, 0.05028533935546875, 0.057262420654296875, 0.064239501953125, 0.07121658325195312, 0.07819366455078125, 0.08517074584960938, 0.0921478271484375, 0.09912490844726562, 0.10610198974609375, 0.11307907104492188, 0.12005615234375, 0.12703323364257812, 0.13401031494140625, 0.14098739624023438, 0.1479644775390625, 0.15494155883789062, 0.16191864013671875, 0.16889572143554688, 0.175872802734375, 0.18284988403320312, 0.18982696533203125, 0.19680404663085938, 0.2037811279296875, 0.21075820922851562, 0.21773529052734375, 0.22471237182617188, 0.231689453125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 6.0, 12.0, 17.0, 18.0, 48.0, 62.0, 120.0, 185.0, 324.0, 617.0, 1297.0, 2959.0, 8225.0, 32494.0, 3843624.0, 272007.0, 21347.0, 6236.0, 2390.0, 1112.0, 506.0, 255.0, 149.0, 98.0, 63.0, 35.0, 22.0, 18.0, 10.0, 8.0, 3.0, 4.0, 3.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.02734375, -0.992950439453125, -0.95855712890625, -0.924163818359375, -0.8897705078125, -0.855377197265625, -0.82098388671875, -0.786590576171875, -0.752197265625, -0.717803955078125, -0.68341064453125, -0.649017333984375, -0.6146240234375, -0.580230712890625, -0.54583740234375, -0.511444091796875, -0.47705078125, -0.442657470703125, -0.40826416015625, -0.373870849609375, -0.3394775390625, -0.305084228515625, -0.27069091796875, -0.236297607421875, -0.201904296875, -0.167510986328125, -0.13311767578125, -0.098724365234375, -0.0643310546875, -0.029937744140625, 0.00445556640625, 0.038848876953125, 0.0732421875, 0.107635498046875, 0.14202880859375, 0.176422119140625, 0.2108154296875, 0.245208740234375, 0.27960205078125, 0.313995361328125, 0.348388671875, 0.382781982421875, 0.41717529296875, 0.451568603515625, 0.4859619140625, 0.520355224609375, 0.55474853515625, 0.589141845703125, 0.62353515625, 0.657928466796875, 0.69232177734375, 0.726715087890625, 0.7611083984375, 0.795501708984375, 0.82989501953125, 0.864288330078125, 0.898681640625, 0.933074951171875, 0.96746826171875, 1.001861572265625, 1.0362548828125, 1.070648193359375, 1.10504150390625, 1.139434814453125, 1.173828125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 4.0, 7.0, 9.0, 18.0, 22.0, 30.0, 86.0, 252.0, 3271.0, 213.0, 53.0, 43.0, 18.0, 14.0, 6.0, 8.0, 5.0, 1.0, 5.0, 4.0, 4.0, 1.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39306640625, -0.3781890869140625, -0.363311767578125, -0.3484344482421875, -0.33355712890625, -0.3186798095703125, -0.303802490234375, -0.2889251708984375, -0.2740478515625, -0.2591705322265625, -0.244293212890625, -0.2294158935546875, -0.21453857421875, -0.1996612548828125, -0.184783935546875, -0.1699066162109375, -0.155029296875, -0.1401519775390625, -0.125274658203125, -0.1103973388671875, -0.09552001953125, -0.0806427001953125, -0.065765380859375, -0.0508880615234375, -0.0360107421875, -0.0211334228515625, -0.006256103515625, 0.0086212158203125, 0.02349853515625, 0.0383758544921875, 0.053253173828125, 0.0681304931640625, 0.0830078125, 0.0978851318359375, 0.112762451171875, 0.1276397705078125, 0.14251708984375, 0.1573944091796875, 0.172271728515625, 0.1871490478515625, 0.2020263671875, 0.2169036865234375, 0.231781005859375, 0.2466583251953125, 0.26153564453125, 0.2764129638671875, 0.291290283203125, 0.3061676025390625, 0.321044921875, 0.3359222412109375, 0.350799560546875, 0.3656768798828125, 0.38055419921875, 0.3954315185546875, 0.410308837890625, 0.4251861572265625, 0.4400634765625, 0.4549407958984375, 0.469818115234375, 0.4846954345703125, 0.49957275390625, 0.5144500732421875, 0.529327392578125, 0.5442047119140625, 0.55908203125]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 10.0, 7.0, 17.0, 22.0, 52.0, 71.0, 103.0, 142.0, 137.0, 114.0, 86.0, 73.0, 48.0, 31.0, 32.0, 14.0, 9.0, 9.0, 5.0, 5.0, 5.0, 6.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.506753921508789, -1.4527078866958618, -1.3986618518829346, -1.3446158170700073, -1.29056978225708, -1.2365237474441528, -1.1824777126312256, -1.1284316778182983, -1.074385643005371, -1.0203396081924438, -0.9662935733795166, -0.9122475385665894, -0.8582015037536621, -0.8041554689407349, -0.7501094341278076, -0.6960633993148804, -0.6420173048973083, -0.5879712700843811, -0.5339252352714539, -0.4798792004585266, -0.42583316564559937, -0.37178710103034973, -0.3177410662174225, -0.26369503140449524, -0.209648996591568, -0.15560296177864075, -0.1015569195151329, -0.04751087725162506, 0.006535157561302185, 0.060581207275390625, 0.11462724208831787, 0.16867327690124512, 0.22271931171417236, 0.2767653465270996, 0.33081138134002686, 0.3848574161529541, 0.43890345096588135, 0.492949515581131, 0.5469955205917358, 0.6010415554046631, 0.6550875902175903, 0.7091336250305176, 0.7631796598434448, 0.8172256946563721, 0.8712717294692993, 0.9253177642822266, 0.9793637990951538, 1.033409833908081, 1.0874559879302979, 1.141502022743225, 1.1955480575561523, 1.2495940923690796, 1.3036401271820068, 1.357686161994934, 1.4117321968078613, 1.4657782316207886, 1.5198242664337158, 1.573870301246643, 1.6279163360595703, 1.6819623708724976, 1.7360084056854248, 1.790054440498352, 1.8441004753112793, 1.8981465101242065, 1.9521925449371338]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 7.0, 9.0, 9.0, 10.0, 12.0, 21.0, 29.0, 19.0, 20.0, 32.0, 29.0, 27.0, 40.0, 46.0, 34.0, 46.0, 44.0, 40.0, 41.0, 41.0, 43.0, 48.0, 45.0, 38.0, 33.0, 41.0, 34.0, 27.0, 29.0, 16.0, 20.0, 16.0, 12.0, 7.0, 11.0, 8.0, 5.0, 4.0, 3.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.1297924518585205, -1.098103404045105, -1.0664143562316895, -1.0347254276275635, -1.003036379814148, -0.9713473320007324, -0.9396582841873169, -0.9079692363739014, -0.8762801885604858, -0.8445911407470703, -0.8129021525382996, -0.781213104724884, -0.7495240569114685, -0.7178350687026978, -0.6861460208892822, -0.6544569730758667, -0.622767984867096, -0.5910789370536804, -0.5593899488449097, -0.5277009010314941, -0.4960118532180786, -0.4643228352069855, -0.43263381719589233, -0.4009447693824768, -0.36925575137138367, -0.3375667333602905, -0.305877685546875, -0.27418866753578186, -0.24249963462352753, -0.2108106017112732, -0.17912158370018005, -0.14743255078792572, -0.11574351787567139, -0.08405448496341705, -0.05236545950174332, -0.02067643404006958, 0.011012598872184753, 0.04270163178443909, 0.07439064979553223, 0.10607968270778656, 0.1377687156200409, 0.16945774853229523, 0.20114678144454956, 0.2328357994556427, 0.26452481746673584, 0.29621386528015137, 0.3279028832912445, 0.35959190130233765, 0.3912809491157532, 0.4229699671268463, 0.45465901494026184, 0.486348032951355, 0.5180370807647705, 0.549726128578186, 0.5814151167869568, 0.6131041646003723, 0.6447931528091431, 0.6764822006225586, 0.7081711888313293, 0.7398602366447449, 0.7715492844581604, 0.8032382726669312, 0.8349273204803467, 0.8666163682937622, 0.8983054161071777]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 1.0, 6.0, 3.0, 8.0, 12.0, 9.0, 23.0, 27.0, 40.0, 50.0, 82.0, 109.0, 172.0, 230.0, 374.0, 564.0, 893.0, 1474.0, 2404.0, 4112.0, 7825.0, 15552.0, 33230.0, 73323.0, 173120.0, 361926.0, 209085.0, 86504.0, 38444.0, 18116.0, 8926.0, 4817.0, 2691.0, 1546.0, 1014.0, 592.0, 426.0, 258.0, 176.0, 139.0, 75.0, 53.0, 36.0, 29.0, 18.0, 11.0, 18.0, 7.0, 2.0, 6.0, 4.0, 2.0, 2.0], "bins": [-0.488525390625, -0.4751777648925781, -0.46183013916015625, -0.4484825134277344, -0.4351348876953125, -0.4217872619628906, -0.40843963623046875, -0.3950920104980469, -0.381744384765625, -0.3683967590332031, -0.35504913330078125, -0.3417015075683594, -0.3283538818359375, -0.3150062561035156, -0.30165863037109375, -0.2883110046386719, -0.27496337890625, -0.2616157531738281, -0.24826812744140625, -0.23492050170898438, -0.2215728759765625, -0.20822525024414062, -0.19487762451171875, -0.18152999877929688, -0.168182373046875, -0.15483474731445312, -0.14148712158203125, -0.12813949584960938, -0.1147918701171875, -0.10144424438476562, -0.08809661865234375, -0.07474899291992188, -0.0614013671875, -0.048053741455078125, -0.03470611572265625, -0.021358489990234375, -0.0080108642578125, 0.005336761474609375, 0.01868438720703125, 0.032032012939453125, 0.045379638671875, 0.058727264404296875, 0.07207489013671875, 0.08542251586914062, 0.0987701416015625, 0.11211776733398438, 0.12546539306640625, 0.13881301879882812, 0.15216064453125, 0.16550827026367188, 0.17885589599609375, 0.19220352172851562, 0.2055511474609375, 0.21889877319335938, 0.23224639892578125, 0.24559402465820312, 0.258941650390625, 0.2722892761230469, 0.28563690185546875, 0.2989845275878906, 0.3123321533203125, 0.3256797790527344, 0.33902740478515625, 0.3523750305175781, 0.36572265625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 8.0, 7.0, 6.0, 8.0, 14.0, 17.0, 23.0, 21.0, 29.0, 42.0, 42.0, 44.0, 46.0, 46.0, 62.0, 66.0, 57.0, 51.0, 48.0, 60.0, 45.0, 45.0, 40.0, 38.0, 25.0, 24.0, 18.0, 20.0, 11.0, 9.0, 5.0, 7.0, 3.0, 1.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2469482421875, -0.23929405212402344, -0.23163986206054688, -0.2239856719970703, -0.21633148193359375, -0.2086772918701172, -0.20102310180664062, -0.19336891174316406, -0.1857147216796875, -0.17806053161621094, -0.17040634155273438, -0.1627521514892578, -0.15509796142578125, -0.1474437713623047, -0.13978958129882812, -0.13213539123535156, -0.124481201171875, -0.11682701110839844, -0.10917282104492188, -0.10151863098144531, -0.09386444091796875, -0.08621025085449219, -0.07855606079101562, -0.07090187072753906, -0.0632476806640625, -0.05559349060058594, -0.047939300537109375, -0.04028511047363281, -0.03263092041015625, -0.024976730346679688, -0.017322540283203125, -0.009668350219726562, -0.00201416015625, 0.0056400299072265625, 0.013294219970703125, 0.020948410034179688, 0.02860260009765625, 0.03625679016113281, 0.043910980224609375, 0.05156517028808594, 0.0592193603515625, 0.06687355041503906, 0.07452774047851562, 0.08218193054199219, 0.08983612060546875, 0.09749031066894531, 0.10514450073242188, 0.11279869079589844, 0.120452880859375, 0.12810707092285156, 0.13576126098632812, 0.1434154510498047, 0.15106964111328125, 0.1587238311767578, 0.16637802124023438, 0.17403221130371094, 0.1816864013671875, 0.18934059143066406, 0.19699478149414062, 0.2046489715576172, 0.21230316162109375, 0.2199573516845703, 0.22761154174804688, 0.23526573181152344, 0.242919921875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 4.0, 6.0, 5.0, 14.0, 22.0, 42.0, 61.0, 81.0, 117.0, 190.0, 250.0, 435.0, 703.0, 1128.0, 2485.0, 7198.0, 35315.0, 377298.0, 560090.0, 48357.0, 8575.0, 2820.0, 1367.0, 674.0, 420.0, 264.0, 191.0, 132.0, 87.0, 62.0, 49.0, 38.0, 18.0, 20.0, 7.0, 10.0, 7.0, 4.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0380859375, -1.0066986083984375, -0.975311279296875, -0.9439239501953125, -0.91253662109375, -0.8811492919921875, -0.849761962890625, -0.8183746337890625, -0.7869873046875, -0.7555999755859375, -0.724212646484375, -0.6928253173828125, -0.66143798828125, -0.6300506591796875, -0.598663330078125, -0.5672760009765625, -0.535888671875, -0.5045013427734375, -0.473114013671875, -0.4417266845703125, -0.41033935546875, -0.3789520263671875, -0.347564697265625, -0.3161773681640625, -0.2847900390625, -0.2534027099609375, -0.222015380859375, -0.1906280517578125, -0.15924072265625, -0.1278533935546875, -0.096466064453125, -0.0650787353515625, -0.03369140625, -0.0023040771484375, 0.029083251953125, 0.0604705810546875, 0.09185791015625, 0.1232452392578125, 0.154632568359375, 0.1860198974609375, 0.2174072265625, 0.2487945556640625, 0.280181884765625, 0.3115692138671875, 0.34295654296875, 0.3743438720703125, 0.405731201171875, 0.4371185302734375, 0.468505859375, 0.4998931884765625, 0.531280517578125, 0.5626678466796875, 0.59405517578125, 0.6254425048828125, 0.656829833984375, 0.6882171630859375, 0.7196044921875, 0.7509918212890625, 0.782379150390625, 0.8137664794921875, 0.84515380859375, 0.8765411376953125, 0.907928466796875, 0.9393157958984375, 0.970703125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 3.0, 2.0, 6.0, 10.0, 15.0, 11.0, 15.0, 19.0, 25.0, 16.0, 27.0, 26.0, 40.0, 44.0, 39.0, 54.0, 50.0, 44.0, 49.0, 53.0, 31.0, 53.0, 44.0, 47.0, 39.0, 41.0, 28.0, 27.0, 23.0, 19.0, 16.0, 21.0, 15.0, 13.0, 8.0, 6.0, 8.0, 6.0, 5.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.974609375, -0.94317626953125, -0.9117431640625, -0.88031005859375, -0.848876953125, -0.81744384765625, -0.7860107421875, -0.75457763671875, -0.72314453125, -0.69171142578125, -0.6602783203125, -0.62884521484375, -0.597412109375, -0.56597900390625, -0.5345458984375, -0.50311279296875, -0.4716796875, -0.44024658203125, -0.4088134765625, -0.37738037109375, -0.345947265625, -0.31451416015625, -0.2830810546875, -0.25164794921875, -0.22021484375, -0.18878173828125, -0.1573486328125, -0.12591552734375, -0.094482421875, -0.06304931640625, -0.0316162109375, -0.00018310546875, 0.03125, 0.06268310546875, 0.0941162109375, 0.12554931640625, 0.156982421875, 0.18841552734375, 0.2198486328125, 0.25128173828125, 0.28271484375, 0.31414794921875, 0.3455810546875, 0.37701416015625, 0.408447265625, 0.43988037109375, 0.4713134765625, 0.50274658203125, 0.5341796875, 0.56561279296875, 0.5970458984375, 0.62847900390625, 0.659912109375, 0.69134521484375, 0.7227783203125, 0.75421142578125, 0.78564453125, 0.81707763671875, 0.8485107421875, 0.87994384765625, 0.911376953125, 0.94281005859375, 0.9742431640625, 1.00567626953125, 1.037109375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 7.0, 9.0, 5.0, 9.0, 9.0, 9.0, 18.0, 17.0, 41.0, 37.0, 59.0, 87.0, 110.0, 210.0, 337.0, 775.0, 1659.0, 4715.0, 20415.0, 231242.0, 724721.0, 50774.0, 8440.0, 2530.0, 999.0, 502.0, 286.0, 180.0, 116.0, 79.0, 41.0, 32.0, 22.0, 18.0, 15.0, 5.0, 4.0, 3.0, 4.0, 2.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.449951171875, -0.4350624084472656, -0.42017364501953125, -0.4052848815917969, -0.3903961181640625, -0.3755073547363281, -0.36061859130859375, -0.3457298278808594, -0.330841064453125, -0.3159523010253906, -0.30106353759765625, -0.2861747741699219, -0.2712860107421875, -0.2563972473144531, -0.24150848388671875, -0.22661972045898438, -0.21173095703125, -0.19684219360351562, -0.18195343017578125, -0.16706466674804688, -0.1521759033203125, -0.13728713989257812, -0.12239837646484375, -0.10750961303710938, -0.092620849609375, -0.07773208618164062, -0.06284332275390625, -0.047954559326171875, -0.0330657958984375, -0.018177032470703125, -0.00328826904296875, 0.011600494384765625, 0.0264892578125, 0.041378021240234375, 0.05626678466796875, 0.07115554809570312, 0.0860443115234375, 0.10093307495117188, 0.11582183837890625, 0.13071060180664062, 0.145599365234375, 0.16048812866210938, 0.17537689208984375, 0.19026565551757812, 0.2051544189453125, 0.22004318237304688, 0.23493194580078125, 0.24982070922851562, 0.26470947265625, 0.2795982360839844, 0.29448699951171875, 0.3093757629394531, 0.3242645263671875, 0.3391532897949219, 0.35404205322265625, 0.3689308166503906, 0.383819580078125, 0.3987083435058594, 0.41359710693359375, 0.4284858703613281, 0.4433746337890625, 0.4582633972167969, 0.47315216064453125, 0.4880409240722656, 0.5029296875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 4.0, 5.0, 6.0, 4.0, 14.0, 14.0, 21.0, 33.0, 46.0, 68.0, 90.0, 134.0, 176.0, 127.0, 73.0, 44.0, 44.0, 27.0, 13.0, 12.0, 18.0, 5.0, 5.0, 4.0, 2.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.423494338989258e-05, -9.020697325468063e-05, -8.617900311946869e-05, -8.215103298425674e-05, -7.81230628490448e-05, -7.409509271383286e-05, -7.006712257862091e-05, -6.603915244340897e-05, -6.201118230819702e-05, -5.798321217298508e-05, -5.395524203777313e-05, -4.992727190256119e-05, -4.589930176734924e-05, -4.18713316321373e-05, -3.7843361496925354e-05, -3.381539136171341e-05, -2.9787421226501465e-05, -2.575945109128952e-05, -2.1731480956077576e-05, -1.770351082086563e-05, -1.3675540685653687e-05, -9.647570550441742e-06, -5.619600415229797e-06, -1.5916302800178528e-06, 2.436339855194092e-06, 6.464309990406036e-06, 1.0492280125617981e-05, 1.4520250260829926e-05, 1.854822039604187e-05, 2.2576190531253815e-05, 2.660416066646576e-05, 3.0632130801677704e-05, 3.466010093688965e-05, 3.868807107210159e-05, 4.271604120731354e-05, 4.674401134252548e-05, 5.077198147773743e-05, 5.479995161294937e-05, 5.8827921748161316e-05, 6.285589188337326e-05, 6.68838620185852e-05, 7.091183215379715e-05, 7.49398022890091e-05, 7.896777242422104e-05, 8.299574255943298e-05, 8.702371269464493e-05, 9.105168282985687e-05, 9.507965296506882e-05, 9.910762310028076e-05, 0.0001031355932354927, 0.00010716356337070465, 0.0001111915335059166, 0.00011521950364112854, 0.00011924747377634048, 0.00012327544391155243, 0.00012730341404676437, 0.00013133138418197632, 0.00013535935431718826, 0.0001393873244524002, 0.00014341529458761215, 0.0001474432647228241, 0.00015147123485803604, 0.00015549920499324799, 0.00015952717512845993, 0.00016355514526367188]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 1.0, 4.0, 11.0, 6.0, 16.0, 15.0, 27.0, 40.0, 45.0, 74.0, 102.0, 168.0, 258.0, 493.0, 976.0, 2311.0, 7116.0, 36179.0, 542531.0, 416807.0, 30599.0, 6524.0, 2120.0, 924.0, 459.0, 233.0, 174.0, 108.0, 69.0, 52.0, 37.0, 22.0, 23.0, 7.0, 10.0, 9.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.427490234375, -0.4136810302734375, -0.399871826171875, -0.3860626220703125, -0.37225341796875, -0.3584442138671875, -0.344635009765625, -0.3308258056640625, -0.3170166015625, -0.3032073974609375, -0.289398193359375, -0.2755889892578125, -0.26177978515625, -0.2479705810546875, -0.234161376953125, -0.2203521728515625, -0.20654296875, -0.1927337646484375, -0.178924560546875, -0.1651153564453125, -0.15130615234375, -0.1374969482421875, -0.123687744140625, -0.1098785400390625, -0.0960693359375, -0.0822601318359375, -0.068450927734375, -0.0546417236328125, -0.04083251953125, -0.0270233154296875, -0.013214111328125, 0.0005950927734375, 0.014404296875, 0.0282135009765625, 0.042022705078125, 0.0558319091796875, 0.06964111328125, 0.0834503173828125, 0.097259521484375, 0.1110687255859375, 0.1248779296875, 0.1386871337890625, 0.152496337890625, 0.1663055419921875, 0.18011474609375, 0.1939239501953125, 0.207733154296875, 0.2215423583984375, 0.2353515625, 0.2491607666015625, 0.262969970703125, 0.2767791748046875, 0.29058837890625, 0.3043975830078125, 0.318206787109375, 0.3320159912109375, 0.3458251953125, 0.3596343994140625, 0.373443603515625, 0.3872528076171875, 0.40106201171875, 0.4148712158203125, 0.428680419921875, 0.4424896240234375, 0.456298828125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 6.0, 8.0, 3.0, 8.0, 14.0, 15.0, 25.0, 35.0, 53.0, 66.0, 107.0, 96.0, 116.0, 109.0, 79.0, 79.0, 47.0, 37.0, 24.0, 19.0, 12.0, 9.0, 8.0, 11.0, 9.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48974609375, -0.475921630859375, -0.46209716796875, -0.448272705078125, -0.4344482421875, -0.420623779296875, -0.40679931640625, -0.392974853515625, -0.379150390625, -0.365325927734375, -0.35150146484375, -0.337677001953125, -0.3238525390625, -0.310028076171875, -0.29620361328125, -0.282379150390625, -0.2685546875, -0.254730224609375, -0.24090576171875, -0.227081298828125, -0.2132568359375, -0.199432373046875, -0.18560791015625, -0.171783447265625, -0.157958984375, -0.144134521484375, -0.13031005859375, -0.116485595703125, -0.1026611328125, -0.088836669921875, -0.07501220703125, -0.061187744140625, -0.04736328125, -0.033538818359375, -0.01971435546875, -0.005889892578125, 0.0079345703125, 0.021759033203125, 0.03558349609375, 0.049407958984375, 0.063232421875, 0.077056884765625, 0.09088134765625, 0.104705810546875, 0.1185302734375, 0.132354736328125, 0.14617919921875, 0.160003662109375, 0.173828125, 0.187652587890625, 0.20147705078125, 0.215301513671875, 0.2291259765625, 0.242950439453125, 0.25677490234375, 0.270599365234375, 0.284423828125, 0.298248291015625, 0.31207275390625, 0.325897216796875, 0.3397216796875, 0.353546142578125, 0.36737060546875, 0.381195068359375, 0.39501953125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 5.0, 13.0, 39.0, 143.0, 399.0, 300.0, 80.0, 21.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.629871368408203, -14.041703224182129, -13.453536033630371, -12.865367889404297, -12.277200698852539, -11.689032554626465, -11.10086441040039, -10.512697219848633, -9.924530029296875, -9.3363618850708, -8.748194694519043, -8.160026550292969, -7.571859359741211, -6.983691215515137, -6.395523548126221, -5.807355880737305, -5.2191877365112305, -4.6310200691223145, -4.042852401733398, -3.4546844959259033, -2.8665168285369873, -2.2783491611480713, -1.6901812553405762, -1.1020135879516602, -0.5138459205627441, 0.07432180643081665, 0.6624895334243774, 1.250657320022583, 1.838824987411499, 2.426992654800415, 3.01516056060791, 3.603328227996826, 4.191495895385742, 4.779663562774658, 5.367831230163574, 5.955999374389648, 6.544166564941406, 7.1323347091674805, 7.7205023765563965, 8.308670043945312, 8.89683723449707, 9.485005378723145, 10.073172569274902, 10.661340713500977, 11.249507904052734, 11.837676048278809, 12.425844192504883, 13.01401138305664, 13.602179527282715, 14.190347671508789, 14.778514862060547, 15.366683006286621, 15.954850196838379, 16.543018341064453, 17.13118553161621, 17.71935272216797, 18.30752182006836, 18.895689010620117, 19.483858108520508, 20.072025299072266, 20.660192489624023, 21.24835968017578, 21.836528778076172, 22.42469596862793, 23.012863159179688]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 4.0, 4.0, 3.0, 8.0, 8.0, 21.0, 17.0, 13.0, 17.0, 19.0, 33.0, 29.0, 27.0, 45.0, 39.0, 50.0, 51.0, 49.0, 52.0, 50.0, 47.0, 59.0, 38.0, 47.0, 35.0, 37.0, 29.0, 19.0, 24.0, 26.0, 18.0, 12.0, 15.0, 10.0, 13.0, 9.0, 5.0, 7.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.276425838470459, -4.143445014953613, -4.010463714599609, -3.8774826526641846, -3.7445015907287598, -3.611520528793335, -3.47853946685791, -3.3455584049224854, -3.2125773429870605, -3.0795962810516357, -2.946615219116211, -2.813634157180786, -2.6806530952453613, -2.5476720333099365, -2.4146909713745117, -2.281709909439087, -2.148728847503662, -2.0157477855682373, -1.8827667236328125, -1.7497856616973877, -1.616804599761963, -1.483823537826538, -1.3508424758911133, -1.2178614139556885, -1.0848803520202637, -0.9518992900848389, -0.8189182281494141, -0.6859371662139893, -0.5529561042785645, -0.41997504234313965, -0.28699398040771484, -0.15401291847229004, -0.02103137969970703, 0.11194968223571777, 0.24493074417114258, 0.3779118061065674, 0.5108928680419922, 0.643873929977417, 0.7768549919128418, 0.9098360538482666, 1.0428171157836914, 1.1757981777191162, 1.308779239654541, 1.4417603015899658, 1.5747413635253906, 1.7077224254608154, 1.8407034873962402, 1.973684549331665, 2.10666561126709, 2.2396466732025146, 2.3726277351379395, 2.5056087970733643, 2.638589859008789, 2.771570920944214, 2.9045519828796387, 3.0375330448150635, 3.1705141067504883, 3.303495168685913, 3.436476230621338, 3.5694572925567627, 3.7024383544921875, 3.8354194164276123, 3.968400478363037, 4.101381301879883, 4.234362602233887]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 4.0, 4.0, 11.0, 6.0, 9.0, 6.0, 15.0, 12.0, 12.0, 27.0, 29.0, 46.0, 61.0, 94.0, 142.0, 206.0, 311.0, 552.0, 963.0, 1695.0, 2953.0, 5955.0, 12699.0, 34459.0, 149941.0, 2067632.0, 1722704.0, 135134.0, 33464.0, 12736.0, 5604.0, 2906.0, 1544.0, 877.0, 499.0, 325.0, 228.0, 153.0, 69.0, 61.0, 43.0, 29.0, 19.0, 15.0, 9.0, 7.0, 8.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.43505859375, -0.4226188659667969, -0.41017913818359375, -0.3977394104003906, -0.3852996826171875, -0.3728599548339844, -0.36042022705078125, -0.3479804992675781, -0.335540771484375, -0.3231010437011719, -0.31066131591796875, -0.2982215881347656, -0.2857818603515625, -0.2733421325683594, -0.26090240478515625, -0.24846267700195312, -0.23602294921875, -0.22358322143554688, -0.21114349365234375, -0.19870376586914062, -0.1862640380859375, -0.17382431030273438, -0.16138458251953125, -0.14894485473632812, -0.136505126953125, -0.12406539916992188, -0.11162567138671875, -0.09918594360351562, -0.0867462158203125, -0.07430648803710938, -0.06186676025390625, -0.049427032470703125, -0.0369873046875, -0.024547576904296875, -0.01210784912109375, 0.000331878662109375, 0.0127716064453125, 0.025211334228515625, 0.03765106201171875, 0.050090789794921875, 0.062530517578125, 0.07497024536132812, 0.08740997314453125, 0.09984970092773438, 0.1122894287109375, 0.12472915649414062, 0.13716888427734375, 0.14960861206054688, 0.16204833984375, 0.17448806762695312, 0.18692779541015625, 0.19936752319335938, 0.2118072509765625, 0.22424697875976562, 0.23668670654296875, 0.24912643432617188, 0.261566162109375, 0.2740058898925781, 0.28644561767578125, 0.2988853454589844, 0.3113250732421875, 0.3237648010253906, 0.33620452880859375, 0.3486442565917969, 0.361083984375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 6.0, 5.0, 4.0, 7.0, 15.0, 22.0, 28.0, 55.0, 65.0, 82.0, 95.0, 77.0, 101.0, 103.0, 90.0, 57.0, 63.0, 51.0, 28.0, 25.0, 11.0, 9.0, 7.0, 5.0, 3.0, 2.0, 1.0], "bins": [-0.5966796875, -0.5845756530761719, -0.5724716186523438, -0.5603675842285156, -0.5482635498046875, -0.5361595153808594, -0.5240554809570312, -0.5119514465332031, -0.499847412109375, -0.4877433776855469, -0.47563934326171875, -0.4635353088378906, -0.4514312744140625, -0.4393272399902344, -0.42722320556640625, -0.4151191711425781, -0.40301513671875, -0.3909111022949219, -0.37880706787109375, -0.3667030334472656, -0.3545989990234375, -0.3424949645996094, -0.33039093017578125, -0.3182868957519531, -0.306182861328125, -0.2940788269042969, -0.28197479248046875, -0.2698707580566406, -0.2577667236328125, -0.24566268920898438, -0.23355865478515625, -0.22145462036132812, -0.2093505859375, -0.19724655151367188, -0.18514251708984375, -0.17303848266601562, -0.1609344482421875, -0.14883041381835938, -0.13672637939453125, -0.12462234497070312, -0.112518310546875, -0.10041427612304688, -0.08831024169921875, -0.07620620727539062, -0.0641021728515625, -0.051998138427734375, -0.03989410400390625, -0.027790069580078125, -0.01568603515625, -0.003582000732421875, 0.00852203369140625, 0.020626068115234375, 0.0327301025390625, 0.044834136962890625, 0.05693817138671875, 0.06904220581054688, 0.081146240234375, 0.09325027465820312, 0.10535430908203125, 0.11745834350585938, 0.1295623779296875, 0.14166641235351562, 0.15377044677734375, 0.16587448120117188, 0.177978515625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 6.0, 1.0, 1.0, 6.0, 7.0, 7.0, 10.0, 12.0, 27.0, 43.0, 41.0, 75.0, 113.0, 225.0, 466.0, 876.0, 1866.0, 4726.0, 13872.0, 53293.0, 449267.0, 3443797.0, 179175.0, 31229.0, 9025.0, 3225.0, 1351.0, 703.0, 314.0, 185.0, 104.0, 82.0, 38.0, 38.0, 20.0, 24.0, 17.0, 4.0, 5.0, 7.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6943359375, -0.6728591918945312, -0.6513824462890625, -0.6299057006835938, -0.608428955078125, -0.5869522094726562, -0.5654754638671875, -0.5439987182617188, -0.52252197265625, -0.5010452270507812, -0.4795684814453125, -0.45809173583984375, -0.436614990234375, -0.41513824462890625, -0.3936614990234375, -0.37218475341796875, -0.3507080078125, -0.32923126220703125, -0.3077545166015625, -0.28627777099609375, -0.264801025390625, -0.24332427978515625, -0.2218475341796875, -0.20037078857421875, -0.17889404296875, -0.15741729736328125, -0.1359405517578125, -0.11446380615234375, -0.092987060546875, -0.07151031494140625, -0.0500335693359375, -0.02855682373046875, -0.007080078125, 0.01439666748046875, 0.0358734130859375, 0.05735015869140625, 0.078826904296875, 0.10030364990234375, 0.1217803955078125, 0.14325714111328125, 0.16473388671875, 0.18621063232421875, 0.2076873779296875, 0.22916412353515625, 0.250640869140625, 0.27211761474609375, 0.2935943603515625, 0.31507110595703125, 0.3365478515625, 0.35802459716796875, 0.3795013427734375, 0.40097808837890625, 0.422454833984375, 0.44393157958984375, 0.4654083251953125, 0.48688507080078125, 0.50836181640625, 0.5298385620117188, 0.5513153076171875, 0.5727920532226562, 0.594268798828125, 0.6157455444335938, 0.6372222900390625, 0.6586990356445312, 0.68017578125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 3.0, 7.0, 5.0, 6.0, 9.0, 18.0, 16.0, 25.0, 24.0, 53.0, 47.0, 78.0, 113.0, 137.0, 295.0, 615.0, 1070.0, 717.0, 353.0, 164.0, 100.0, 60.0, 41.0, 26.0, 22.0, 15.0, 11.0, 16.0, 6.0, 3.0, 4.0, 3.0, 1.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.7373046875, -0.7152328491210938, -0.6931610107421875, -0.6710891723632812, -0.649017333984375, -0.6269454956054688, -0.6048736572265625, -0.5828018188476562, -0.56072998046875, -0.5386581420898438, -0.5165863037109375, -0.49451446533203125, -0.472442626953125, -0.45037078857421875, -0.4282989501953125, -0.40622711181640625, -0.3841552734375, -0.36208343505859375, -0.3400115966796875, -0.31793975830078125, -0.295867919921875, -0.27379608154296875, -0.2517242431640625, -0.22965240478515625, -0.20758056640625, -0.18550872802734375, -0.1634368896484375, -0.14136505126953125, -0.119293212890625, -0.09722137451171875, -0.0751495361328125, -0.05307769775390625, -0.031005859375, -0.00893402099609375, 0.0131378173828125, 0.03520965576171875, 0.057281494140625, 0.07935333251953125, 0.1014251708984375, 0.12349700927734375, 0.14556884765625, 0.16764068603515625, 0.1897125244140625, 0.21178436279296875, 0.233856201171875, 0.25592803955078125, 0.2779998779296875, 0.30007171630859375, 0.3221435546875, 0.34421539306640625, 0.3662872314453125, 0.38835906982421875, 0.410430908203125, 0.43250274658203125, 0.4545745849609375, 0.47664642333984375, 0.49871826171875, 0.5207901000976562, 0.5428619384765625, 0.5649337768554688, 0.587005615234375, 0.6090774536132812, 0.6311492919921875, 0.6532211303710938, 0.67529296875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 3.0, 3.0, 24.0, 45.0, 119.0, 287.0, 295.0, 162.0, 46.0, 13.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.010629653930664, -9.642141342163086, -9.273652076721191, -8.905163764953613, -8.536675453186035, -8.16818618774414, -7.7996978759765625, -7.431209564208984, -7.062720775604248, -6.694231986999512, -6.325743675231934, -5.957254886627197, -5.588766098022461, -5.220277786254883, -4.8517889976501465, -4.48330020904541, -4.114811897277832, -3.746323347091675, -3.3778347969055176, -3.0093460083007812, -2.640857458114624, -2.272368907928467, -1.9038801193237305, -1.5353915691375732, -1.166903018951416, -0.798414409160614, -0.429925799369812, -0.061437129974365234, 0.307051420211792, 0.6755399703979492, 1.0440287590026855, 1.4125173091888428, 1.781005859375, 2.1494944095611572, 2.5179829597473145, 2.886471748352051, 3.254960298538208, 3.6234488487243652, 3.9919376373291016, 4.36042594909668, 4.728914737701416, 5.097403526306152, 5.4658918380737305, 5.834380626678467, 6.202869415283203, 6.571357727050781, 6.939846515655518, 7.308335304260254, 7.676823616027832, 8.04531192779541, 8.413801193237305, 8.782289505004883, 9.150777816772461, 9.519266128540039, 9.887755393981934, 10.256243705749512, 10.624732971191406, 10.993221282958984, 11.361710548400879, 11.730198860168457, 12.098687171936035, 12.46717643737793, 12.835664749145508, 13.204153060913086, 13.572641372680664]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 6.0, 8.0, 10.0, 9.0, 12.0, 11.0, 16.0, 31.0, 35.0, 44.0, 45.0, 49.0, 58.0, 60.0, 64.0, 62.0, 67.0, 50.0, 57.0, 44.0, 40.0, 51.0, 40.0, 35.0, 26.0, 15.0, 19.0, 14.0, 3.0, 8.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.513559341430664, -3.3802833557128906, -3.247007369995117, -3.1137313842773438, -2.9804553985595703, -2.847179412841797, -2.7139036655426025, -2.580627679824829, -2.4473516941070557, -2.3140757083892822, -2.180799722671509, -2.0475237369537354, -1.9142478704452515, -1.780971884727478, -1.6476960182189941, -1.5144200325012207, -1.3811440467834473, -1.2478680610656738, -1.1145920753479004, -0.9813162088394165, -0.8480402231216431, -0.7147642374038696, -0.581488311290741, -0.4482123851776123, -0.31493639945983887, -0.18166044354438782, -0.04838448762893677, 0.08489146828651428, 0.21816742420196533, 0.35144340991973877, 0.48471933603286743, 0.6179952621459961, 0.7512707710266113, 0.8845467567443848, 1.0178227424621582, 1.151098608970642, 1.2843745946884155, 1.417650580406189, 1.5509264469146729, 1.6842024326324463, 1.8174784183502197, 1.9507544040679932, 2.0840303897857666, 2.21730637550354, 2.3505821228027344, 2.483858108520508, 2.6171340942382812, 2.7504100799560547, 2.883686065673828, 3.0169620513916016, 3.150238037109375, 3.2835140228271484, 3.416790008544922, 3.5500659942626953, 3.6833417415618896, 3.816617727279663, 3.9498937129974365, 4.083169460296631, 4.216445446014404, 4.349721431732178, 4.482997417449951, 4.616273403167725, 4.749549388885498, 4.8828253746032715, 5.016101360321045]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 7.0, 10.0, 15.0, 21.0, 31.0, 55.0, 113.0, 163.0, 358.0, 731.0, 1732.0, 4244.0, 12245.0, 45587.0, 285128.0, 588577.0, 80181.0, 19118.0, 5972.0, 2303.0, 963.0, 463.0, 228.0, 115.0, 68.0, 35.0, 29.0, 15.0, 13.0, 10.0, 6.0, 7.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.60693359375, -0.5818328857421875, -0.556732177734375, -0.5316314697265625, -0.50653076171875, -0.4814300537109375, -0.456329345703125, -0.4312286376953125, -0.4061279296875, -0.3810272216796875, -0.355926513671875, -0.3308258056640625, -0.30572509765625, -0.2806243896484375, -0.255523681640625, -0.2304229736328125, -0.205322265625, -0.1802215576171875, -0.155120849609375, -0.1300201416015625, -0.10491943359375, -0.0798187255859375, -0.054718017578125, -0.0296173095703125, -0.0045166015625, 0.0205841064453125, 0.045684814453125, 0.0707855224609375, 0.09588623046875, 0.1209869384765625, 0.146087646484375, 0.1711883544921875, 0.1962890625, 0.2213897705078125, 0.246490478515625, 0.2715911865234375, 0.29669189453125, 0.3217926025390625, 0.346893310546875, 0.3719940185546875, 0.3970947265625, 0.4221954345703125, 0.447296142578125, 0.4723968505859375, 0.49749755859375, 0.5225982666015625, 0.547698974609375, 0.5727996826171875, 0.597900390625, 0.6230010986328125, 0.648101806640625, 0.6732025146484375, 0.69830322265625, 0.7234039306640625, 0.748504638671875, 0.7736053466796875, 0.7987060546875, 0.8238067626953125, 0.848907470703125, 0.8740081787109375, 0.89910888671875, 0.9242095947265625, 0.949310302734375, 0.9744110107421875, 0.99951171875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 8.0, 3.0, 11.0, 9.0, 4.0, 28.0, 25.0, 24.0, 35.0, 38.0, 53.0, 62.0, 75.0, 62.0, 66.0, 71.0, 67.0, 56.0, 61.0, 51.0, 32.0, 40.0, 34.0, 20.0, 22.0, 18.0, 10.0, 4.0, 7.0, 5.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.365478515625, -0.3565330505371094, -0.34758758544921875, -0.3386421203613281, -0.3296966552734375, -0.3207511901855469, -0.31180572509765625, -0.3028602600097656, -0.293914794921875, -0.2849693298339844, -0.27602386474609375, -0.2670783996582031, -0.2581329345703125, -0.24918746948242188, -0.24024200439453125, -0.23129653930664062, -0.22235107421875, -0.21340560913085938, -0.20446014404296875, -0.19551467895507812, -0.1865692138671875, -0.17762374877929688, -0.16867828369140625, -0.15973281860351562, -0.150787353515625, -0.14184188842773438, -0.13289642333984375, -0.12395095825195312, -0.1150054931640625, -0.10606002807617188, -0.09711456298828125, -0.08816909790039062, -0.0792236328125, -0.07027816772460938, -0.06133270263671875, -0.052387237548828125, -0.0434417724609375, -0.034496307373046875, -0.02555084228515625, -0.016605377197265625, -0.007659912109375, 0.001285552978515625, 0.01023101806640625, 0.019176483154296875, 0.0281219482421875, 0.037067413330078125, 0.04601287841796875, 0.054958343505859375, 0.06390380859375, 0.07284927368164062, 0.08179473876953125, 0.09074020385742188, 0.0996856689453125, 0.10863113403320312, 0.11757659912109375, 0.12652206420898438, 0.135467529296875, 0.14441299438476562, 0.15335845947265625, 0.16230392456054688, 0.1712493896484375, 0.18019485473632812, 0.18914031982421875, 0.19808578491210938, 0.20703125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 1.0, 7.0, 17.0, 6.0, 14.0, 22.0, 29.0, 36.0, 53.0, 67.0, 113.0, 163.0, 260.0, 410.0, 775.0, 1710.0, 4584.0, 19113.0, 258453.0, 720479.0, 31742.0, 6153.0, 2064.0, 910.0, 471.0, 288.0, 190.0, 142.0, 92.0, 65.0, 30.0, 26.0, 15.0, 16.0, 11.0, 9.0, 8.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0712890625, -1.03179931640625, -0.9923095703125, -0.95281982421875, -0.913330078125, -0.87384033203125, -0.8343505859375, -0.79486083984375, -0.75537109375, -0.71588134765625, -0.6763916015625, -0.63690185546875, -0.597412109375, -0.55792236328125, -0.5184326171875, -0.47894287109375, -0.439453125, -0.39996337890625, -0.3604736328125, -0.32098388671875, -0.281494140625, -0.24200439453125, -0.2025146484375, -0.16302490234375, -0.12353515625, -0.08404541015625, -0.0445556640625, -0.00506591796875, 0.034423828125, 0.07391357421875, 0.1134033203125, 0.15289306640625, 0.1923828125, 0.23187255859375, 0.2713623046875, 0.31085205078125, 0.350341796875, 0.38983154296875, 0.4293212890625, 0.46881103515625, 0.50830078125, 0.54779052734375, 0.5872802734375, 0.62677001953125, 0.666259765625, 0.70574951171875, 0.7452392578125, 0.78472900390625, 0.82421875, 0.86370849609375, 0.9031982421875, 0.94268798828125, 0.982177734375, 1.02166748046875, 1.0611572265625, 1.10064697265625, 1.14013671875, 1.17962646484375, 1.2191162109375, 1.25860595703125, 1.298095703125, 1.33758544921875, 1.3770751953125, 1.41656494140625, 1.4560546875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 6.0, 9.0, 7.0, 10.0, 11.0, 13.0, 20.0, 20.0, 33.0, 36.0, 31.0, 51.0, 39.0, 46.0, 53.0, 41.0, 52.0, 61.0, 48.0, 50.0, 47.0, 54.0, 39.0, 29.0, 32.0, 30.0, 21.0, 22.0, 10.0, 10.0, 14.0, 10.0, 11.0, 10.0, 4.0, 3.0, 5.0, 6.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.982421875, -0.949920654296875, -0.91741943359375, -0.884918212890625, -0.8524169921875, -0.819915771484375, -0.78741455078125, -0.754913330078125, -0.722412109375, -0.689910888671875, -0.65740966796875, -0.624908447265625, -0.5924072265625, -0.559906005859375, -0.52740478515625, -0.494903564453125, -0.46240234375, -0.429901123046875, -0.39739990234375, -0.364898681640625, -0.3323974609375, -0.299896240234375, -0.26739501953125, -0.234893798828125, -0.202392578125, -0.169891357421875, -0.13739013671875, -0.104888916015625, -0.0723876953125, -0.039886474609375, -0.00738525390625, 0.025115966796875, 0.0576171875, 0.090118408203125, 0.12261962890625, 0.155120849609375, 0.1876220703125, 0.220123291015625, 0.25262451171875, 0.285125732421875, 0.317626953125, 0.350128173828125, 0.38262939453125, 0.415130615234375, 0.4476318359375, 0.480133056640625, 0.51263427734375, 0.545135498046875, 0.57763671875, 0.610137939453125, 0.64263916015625, 0.675140380859375, 0.7076416015625, 0.740142822265625, 0.77264404296875, 0.805145263671875, 0.837646484375, 0.870147705078125, 0.90264892578125, 0.935150146484375, 0.9676513671875, 1.000152587890625, 1.03265380859375, 1.065155029296875, 1.09765625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 8.0, 6.0, 6.0, 10.0, 18.0, 34.0, 43.0, 74.0, 73.0, 176.0, 310.0, 607.0, 1566.0, 4492.0, 19866.0, 203253.0, 755706.0, 49621.0, 8347.0, 2442.0, 876.0, 393.0, 225.0, 139.0, 91.0, 59.0, 34.0, 19.0, 19.0, 10.0, 4.0, 8.0, 5.0, 3.0, 2.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.425537109375, -0.4123344421386719, -0.39913177490234375, -0.3859291076660156, -0.3727264404296875, -0.3595237731933594, -0.34632110595703125, -0.3331184387207031, -0.319915771484375, -0.3067131042480469, -0.29351043701171875, -0.2803077697753906, -0.2671051025390625, -0.2539024353027344, -0.24069976806640625, -0.22749710083007812, -0.21429443359375, -0.20109176635742188, -0.18788909912109375, -0.17468643188476562, -0.1614837646484375, -0.14828109741210938, -0.13507843017578125, -0.12187576293945312, -0.108673095703125, -0.09547042846679688, -0.08226776123046875, -0.06906509399414062, -0.0558624267578125, -0.042659759521484375, -0.02945709228515625, -0.016254425048828125, -0.0030517578125, 0.010150909423828125, 0.02335357666015625, 0.036556243896484375, 0.0497589111328125, 0.06296157836914062, 0.07616424560546875, 0.08936691284179688, 0.102569580078125, 0.11577224731445312, 0.12897491455078125, 0.14217758178710938, 0.1553802490234375, 0.16858291625976562, 0.18178558349609375, 0.19498825073242188, 0.20819091796875, 0.22139358520507812, 0.23459625244140625, 0.24779891967773438, 0.2610015869140625, 0.2742042541503906, 0.28740692138671875, 0.3006095886230469, 0.313812255859375, 0.3270149230957031, 0.34021759033203125, 0.3534202575683594, 0.3666229248046875, 0.3798255920410156, 0.39302825927734375, 0.4062309265136719, 0.41943359375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0, 4.0, 4.0, 9.0, 14.0, 20.0, 16.0, 29.0, 38.0, 61.0, 97.0, 149.0, 164.0, 136.0, 66.0, 60.0, 35.0, 26.0, 14.0, 12.0, 11.0, 7.0, 2.0, 7.0, 3.0, 7.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0001131296157836914, -0.00011009536683559418, -0.00010706111788749695, -0.00010402686893939972, -0.00010099261999130249, -9.795837104320526e-05, -9.492412209510803e-05, -9.18898731470108e-05, -8.885562419891357e-05, -8.582137525081635e-05, -8.278712630271912e-05, -7.975287735462189e-05, -7.671862840652466e-05, -7.368437945842743e-05, -7.06501305103302e-05, -6.761588156223297e-05, -6.458163261413574e-05, -6.154738366603851e-05, -5.8513134717941284e-05, -5.5478885769844055e-05, -5.2444636821746826e-05, -4.94103878736496e-05, -4.637613892555237e-05, -4.334188997745514e-05, -4.030764102935791e-05, -3.727339208126068e-05, -3.423914313316345e-05, -3.120489418506622e-05, -2.8170645236968994e-05, -2.5136396288871765e-05, -2.2102147340774536e-05, -1.9067898392677307e-05, -1.6033649444580078e-05, -1.2999400496482849e-05, -9.96515154838562e-06, -6.930902600288391e-06, -3.896653652191162e-06, -8.624047040939331e-07, 2.171844244003296e-06, 5.206093192100525e-06, 8.240342140197754e-06, 1.1274591088294983e-05, 1.4308840036392212e-05, 1.734308898448944e-05, 2.037733793258667e-05, 2.34115868806839e-05, 2.6445835828781128e-05, 2.9480084776878357e-05, 3.2514333724975586e-05, 3.5548582673072815e-05, 3.8582831621170044e-05, 4.161708056926727e-05, 4.46513295173645e-05, 4.768557846546173e-05, 5.071982741355896e-05, 5.375407636165619e-05, 5.678832530975342e-05, 5.982257425785065e-05, 6.285682320594788e-05, 6.58910721540451e-05, 6.892532110214233e-05, 7.195957005023956e-05, 7.499381899833679e-05, 7.802806794643402e-05, 8.106231689453125e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 7.0, 10.0, 10.0, 8.0, 11.0, 34.0, 28.0, 42.0, 73.0, 95.0, 125.0, 190.0, 330.0, 545.0, 1017.0, 2182.0, 5759.0, 24874.0, 228758.0, 704347.0, 62658.0, 10870.0, 3288.0, 1476.0, 684.0, 402.0, 238.0, 140.0, 98.0, 65.0, 54.0, 35.0, 32.0, 17.0, 11.0, 10.0, 7.0, 4.0, 10.0, 7.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.326416015625, -0.31562042236328125, -0.3048248291015625, -0.29402923583984375, -0.283233642578125, -0.27243804931640625, -0.2616424560546875, -0.25084686279296875, -0.24005126953125, -0.22925567626953125, -0.2184600830078125, -0.20766448974609375, -0.196868896484375, -0.18607330322265625, -0.1752777099609375, -0.16448211669921875, -0.1536865234375, -0.14289093017578125, -0.1320953369140625, -0.12129974365234375, -0.110504150390625, -0.09970855712890625, -0.0889129638671875, -0.07811737060546875, -0.06732177734375, -0.05652618408203125, -0.0457305908203125, -0.03493499755859375, -0.024139404296875, -0.01334381103515625, -0.0025482177734375, 0.00824737548828125, 0.01904296875, 0.02983856201171875, 0.0406341552734375, 0.05142974853515625, 0.062225341796875, 0.07302093505859375, 0.0838165283203125, 0.09461212158203125, 0.10540771484375, 0.11620330810546875, 0.1269989013671875, 0.13779449462890625, 0.148590087890625, 0.15938568115234375, 0.1701812744140625, 0.18097686767578125, 0.1917724609375, 0.20256805419921875, 0.2133636474609375, 0.22415924072265625, 0.234954833984375, 0.24575042724609375, 0.2565460205078125, 0.26734161376953125, 0.27813720703125, 0.28893280029296875, 0.2997283935546875, 0.31052398681640625, 0.321319580078125, 0.33211517333984375, 0.3429107666015625, 0.35370635986328125, 0.364501953125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 5.0, 3.0, 4.0, 6.0, 5.0, 8.0, 11.0, 10.0, 20.0, 15.0, 17.0, 23.0, 42.0, 40.0, 44.0, 53.0, 59.0, 76.0, 76.0, 81.0, 83.0, 50.0, 39.0, 40.0, 36.0, 33.0, 22.0, 28.0, 16.0, 8.0, 9.0, 7.0, 2.0, 5.0, 5.0, 4.0, 4.0, 3.0, 6.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.28076171875, -0.2729034423828125, -0.265045166015625, -0.2571868896484375, -0.24932861328125, -0.2414703369140625, -0.233612060546875, -0.2257537841796875, -0.2178955078125, -0.2100372314453125, -0.202178955078125, -0.1943206787109375, -0.18646240234375, -0.1786041259765625, -0.170745849609375, -0.1628875732421875, -0.155029296875, -0.1471710205078125, -0.139312744140625, -0.1314544677734375, -0.12359619140625, -0.1157379150390625, -0.107879638671875, -0.1000213623046875, -0.0921630859375, -0.0843048095703125, -0.076446533203125, -0.0685882568359375, -0.06072998046875, -0.0528717041015625, -0.045013427734375, -0.0371551513671875, -0.029296875, -0.0214385986328125, -0.013580322265625, -0.0057220458984375, 0.00213623046875, 0.0099945068359375, 0.017852783203125, 0.0257110595703125, 0.0335693359375, 0.0414276123046875, 0.049285888671875, 0.0571441650390625, 0.06500244140625, 0.0728607177734375, 0.080718994140625, 0.0885772705078125, 0.096435546875, 0.1042938232421875, 0.112152099609375, 0.1200103759765625, 0.12786865234375, 0.1357269287109375, 0.143585205078125, 0.1514434814453125, 0.1593017578125, 0.1671600341796875, 0.175018310546875, 0.1828765869140625, 0.19073486328125, 0.1985931396484375, 0.206451416015625, 0.2143096923828125, 0.22216796875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 7.0, 2.0, 11.0, 23.0, 59.0, 108.0, 201.0, 241.0, 173.0, 97.0, 44.0, 15.0, 8.0, 1.0, 4.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.356454849243164, -10.087518692016602, -9.818582534790039, -9.549646377563477, -9.280710220336914, -9.011774063110352, -8.742837905883789, -8.473901748657227, -8.204965591430664, -7.936029434204102, -7.667093276977539, -7.398157119750977, -7.129220962524414, -6.860284805297852, -6.591349124908447, -6.322412967681885, -6.0534772872924805, -5.784541130065918, -5.5156049728393555, -5.246668815612793, -4.9777326583862305, -4.708796501159668, -4.439860820770264, -4.170924663543701, -3.9019885063171387, -3.633052349090576, -3.3641161918640137, -3.0951802730560303, -2.8262441158294678, -2.5573079586029053, -2.288372039794922, -2.0194358825683594, -1.7505006790161133, -1.4815645217895508, -1.2126284837722778, -0.9436923861503601, -0.6747562885284424, -0.4058201313018799, -0.13688409328460693, 0.13205194473266602, 0.4009881019592285, 0.6699241995811462, 0.938860297203064, 1.207796335220337, 1.4767324924468994, 1.745668649673462, 2.0146045684814453, 2.283540725708008, 2.5524768829345703, 2.821413040161133, 3.0903491973876953, 3.3592851161956787, 3.628221273422241, 3.8971574306488037, 4.166093349456787, 4.43502950668335, 4.703965663909912, 4.972901821136475, 5.241837978363037, 5.5107741355896, 5.779709815979004, 6.048645973205566, 6.317582130432129, 6.586518287658691, 6.855454444885254]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 6.0, 12.0, 13.0, 8.0, 12.0, 22.0, 13.0, 17.0, 27.0, 29.0, 24.0, 36.0, 39.0, 54.0, 51.0, 68.0, 71.0, 73.0, 67.0, 49.0, 46.0, 44.0, 26.0, 31.0, 31.0, 31.0, 19.0, 19.0, 11.0, 14.0, 11.0, 6.0, 7.0, 6.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.709228277206421, -3.574207067489624, -3.439185857772827, -3.3041646480560303, -3.1691434383392334, -3.0341222286224365, -2.8991007804870605, -2.7640795707702637, -2.629058361053467, -2.49403715133667, -2.359015941619873, -2.223994731903076, -2.0889735221862793, -1.9539523124694824, -1.818930983543396, -1.6839097738265991, -1.5488886833190918, -1.413867473602295, -1.278846263885498, -1.1438250541687012, -1.0088038444519043, -0.8737825751304626, -0.738761305809021, -0.6037400960922241, -0.46871888637542725, -0.33369767665863037, -0.1986764371395111, -0.06365519762039185, 0.07136601209640503, 0.2063872218132019, 0.34140849113464355, 0.47642970085144043, 0.6114506721496582, 0.7464718818664551, 0.881493091583252, 1.0165143013000488, 1.1515355110168457, 1.2865567207336426, 1.421578049659729, 1.5565992593765259, 1.6916204690933228, 1.8266416788101196, 1.9616628885269165, 2.096684217453003, 2.2317054271698, 2.3667266368865967, 2.5017478466033936, 2.6367690563201904, 2.7717902660369873, 2.906811475753784, 3.041832685470581, 3.176853895187378, 3.311875104904175, 3.4468963146209717, 3.5819177627563477, 3.7169389724731445, 3.8519601821899414, 3.9869813919067383, 4.122002601623535, 4.257023811340332, 4.392045021057129, 4.527066230773926, 4.662087440490723, 4.7971086502075195, 4.932129859924316]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 5.0, 3.0, 10.0, 9.0, 18.0, 13.0, 24.0, 42.0, 51.0, 72.0, 123.0, 226.0, 778.0, 7441.0, 2378182.0, 1798728.0, 7054.0, 856.0, 265.0, 130.0, 65.0, 69.0, 42.0, 19.0, 19.0, 10.0, 12.0, 5.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6806640625, -1.6281280517578125, -1.575592041015625, -1.5230560302734375, -1.47052001953125, -1.4179840087890625, -1.365447998046875, -1.3129119873046875, -1.2603759765625, -1.2078399658203125, -1.155303955078125, -1.1027679443359375, -1.05023193359375, -0.9976959228515625, -0.945159912109375, -0.8926239013671875, -0.840087890625, -0.7875518798828125, -0.735015869140625, -0.6824798583984375, -0.62994384765625, -0.5774078369140625, -0.524871826171875, -0.4723358154296875, -0.4197998046875, -0.3672637939453125, -0.314727783203125, -0.2621917724609375, -0.20965576171875, -0.1571197509765625, -0.104583740234375, -0.0520477294921875, 0.00048828125, 0.0530242919921875, 0.105560302734375, 0.1580963134765625, 0.21063232421875, 0.2631683349609375, 0.315704345703125, 0.3682403564453125, 0.4207763671875, 0.4733123779296875, 0.525848388671875, 0.5783843994140625, 0.63092041015625, 0.6834564208984375, 0.735992431640625, 0.7885284423828125, 0.841064453125, 0.8936004638671875, 0.946136474609375, 0.9986724853515625, 1.05120849609375, 1.1037445068359375, 1.156280517578125, 1.2088165283203125, 1.2613525390625, 1.3138885498046875, 1.366424560546875, 1.4189605712890625, 1.47149658203125, 1.5240325927734375, 1.576568603515625, 1.6291046142578125, 1.681640625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 6.0, 7.0, 8.0, 12.0, 14.0, 17.0, 27.0, 32.0, 46.0, 59.0, 49.0, 60.0, 58.0, 67.0, 66.0, 61.0, 74.0, 55.0, 53.0, 50.0, 36.0, 33.0, 27.0, 28.0, 18.0, 11.0, 10.0, 8.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.217529296875, -0.20933151245117188, -0.20113372802734375, -0.19293594360351562, -0.1847381591796875, -0.17654037475585938, -0.16834259033203125, -0.16014480590820312, -0.151947021484375, -0.14374923706054688, -0.13555145263671875, -0.12735366821289062, -0.1191558837890625, -0.11095809936523438, -0.10276031494140625, -0.09456253051757812, -0.08636474609375, -0.07816696166992188, -0.06996917724609375, -0.061771392822265625, -0.0535736083984375, -0.045375823974609375, -0.03717803955078125, -0.028980255126953125, -0.020782470703125, -0.012584686279296875, -0.00438690185546875, 0.003810882568359375, 0.0120086669921875, 0.020206451416015625, 0.02840423583984375, 0.036602020263671875, 0.0447998046875, 0.052997589111328125, 0.06119537353515625, 0.06939315795898438, 0.0775909423828125, 0.08578872680664062, 0.09398651123046875, 0.10218429565429688, 0.110382080078125, 0.11857986450195312, 0.12677764892578125, 0.13497543334960938, 0.1431732177734375, 0.15137100219726562, 0.15956878662109375, 0.16776657104492188, 0.17596435546875, 0.18416213989257812, 0.19235992431640625, 0.20055770874023438, 0.2087554931640625, 0.21695327758789062, 0.22515106201171875, 0.23334884643554688, 0.241546630859375, 0.24974441528320312, 0.25794219970703125, 0.2661399841308594, 0.2743377685546875, 0.2825355529785156, 0.29073333740234375, 0.2989311218261719, 0.30712890625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 1.0, 8.0, 4.0, 14.0, 13.0, 30.0, 22.0, 29.0, 51.0, 99.0, 165.0, 293.0, 608.0, 1219.0, 2736.0, 6349.0, 15554.0, 43774.0, 189702.0, 2945377.0, 850390.0, 92443.0, 26969.0, 10156.0, 4333.0, 1910.0, 921.0, 462.0, 237.0, 150.0, 88.0, 53.0, 36.0, 22.0, 15.0, 9.0, 7.0, 12.0, 6.0, 8.0, 3.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5205078125, -0.5046310424804688, -0.4887542724609375, -0.47287750244140625, -0.457000732421875, -0.44112396240234375, -0.4252471923828125, -0.40937042236328125, -0.39349365234375, -0.37761688232421875, -0.3617401123046875, -0.34586334228515625, -0.329986572265625, -0.31410980224609375, -0.2982330322265625, -0.28235626220703125, -0.2664794921875, -0.25060272216796875, -0.2347259521484375, -0.21884918212890625, -0.202972412109375, -0.18709564208984375, -0.1712188720703125, -0.15534210205078125, -0.13946533203125, -0.12358856201171875, -0.1077117919921875, -0.09183502197265625, -0.075958251953125, -0.06008148193359375, -0.0442047119140625, -0.02832794189453125, -0.012451171875, 0.00342559814453125, 0.0193023681640625, 0.03517913818359375, 0.051055908203125, 0.06693267822265625, 0.0828094482421875, 0.09868621826171875, 0.11456298828125, 0.13043975830078125, 0.1463165283203125, 0.16219329833984375, 0.178070068359375, 0.19394683837890625, 0.2098236083984375, 0.22570037841796875, 0.2415771484375, 0.25745391845703125, 0.2733306884765625, 0.28920745849609375, 0.305084228515625, 0.32096099853515625, 0.3368377685546875, 0.35271453857421875, 0.36859130859375, 0.38446807861328125, 0.4003448486328125, 0.41622161865234375, 0.432098388671875, 0.44797515869140625, 0.4638519287109375, 0.47972869873046875, 0.49560546875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 5.0, 5.0, 5.0, 8.0, 6.0, 7.0, 9.0, 10.0, 20.0, 24.0, 24.0, 28.0, 43.0, 75.0, 108.0, 164.0, 314.0, 630.0, 993.0, 686.0, 319.0, 191.0, 106.0, 85.0, 52.0, 34.0, 27.0, 17.0, 16.0, 16.0, 6.0, 9.0, 7.0, 4.0, 9.0, 5.0, 3.0, 3.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.55908203125, -0.5419082641601562, -0.5247344970703125, -0.5075607299804688, -0.490386962890625, -0.47321319580078125, -0.4560394287109375, -0.43886566162109375, -0.42169189453125, -0.40451812744140625, -0.3873443603515625, -0.37017059326171875, -0.352996826171875, -0.33582305908203125, -0.3186492919921875, -0.30147552490234375, -0.2843017578125, -0.26712799072265625, -0.2499542236328125, -0.23278045654296875, -0.215606689453125, -0.19843292236328125, -0.1812591552734375, -0.16408538818359375, -0.14691162109375, -0.12973785400390625, -0.1125640869140625, -0.09539031982421875, -0.078216552734375, -0.06104278564453125, -0.0438690185546875, -0.02669525146484375, -0.009521484375, 0.00765228271484375, 0.0248260498046875, 0.04199981689453125, 0.059173583984375, 0.07634735107421875, 0.0935211181640625, 0.11069488525390625, 0.12786865234375, 0.14504241943359375, 0.1622161865234375, 0.17938995361328125, 0.196563720703125, 0.21373748779296875, 0.2309112548828125, 0.24808502197265625, 0.2652587890625, 0.28243255615234375, 0.2996063232421875, 0.31678009033203125, 0.333953857421875, 0.35112762451171875, 0.3683013916015625, 0.38547515869140625, 0.40264892578125, 0.41982269287109375, 0.4369964599609375, 0.45417022705078125, 0.471343994140625, 0.48851776123046875, 0.5056915283203125, 0.5228652954101562, 0.5400390625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 13.0, 18.0, 54.0, 129.0, 260.0, 243.0, 162.0, 54.0, 28.0, 10.0, 10.0, 5.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.792000770568848, -7.556621551513672, -7.321242809295654, -7.0858635902404785, -6.850484371185303, -6.615105628967285, -6.379726409912109, -6.144347190856934, -5.908967971801758, -5.673588752746582, -5.4382100105285645, -5.202830791473389, -4.967451572418213, -4.732072830200195, -4.4966936111450195, -4.261314392089844, -4.025935649871826, -3.7905566692352295, -3.5551774501800537, -3.319798469543457, -3.0844192504882812, -2.8490402698516846, -2.613661289215088, -2.378282070159912, -2.1429030895233154, -1.9075239896774292, -1.672144889831543, -1.4367659091949463, -1.20138680934906, -0.9660077095031738, -0.7306287288665771, -0.4952496290206909, -0.2598705291748047, -0.024491459131240845, 0.210887610912323, 0.44626665115356445, 0.6816457509994507, 0.9170248508453369, 1.1524038314819336, 1.3877829313278198, 1.623162031173706, 1.8585411310195923, 2.0939202308654785, 2.329299211502075, 2.564678192138672, 2.8000574111938477, 3.0354363918304443, 3.270815372467041, 3.506194591522217, 3.7415735721588135, 3.9769527912139893, 4.212331771850586, 4.447710990905762, 4.6830902099609375, 4.918468952178955, 5.153848171234131, 5.389226913452148, 5.624606132507324, 5.859984874725342, 6.095364093780518, 6.330743312835693, 6.566122055053711, 6.801501274108887, 7.0368804931640625, 7.272259712219238]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 3.0, 2.0, 2.0, 3.0, 2.0, 7.0, 2.0, 4.0, 6.0, 12.0, 11.0, 10.0, 11.0, 5.0, 11.0, 22.0, 21.0, 30.0, 22.0, 26.0, 36.0, 36.0, 29.0, 32.0, 37.0, 40.0, 44.0, 46.0, 37.0, 41.0, 40.0, 40.0, 31.0, 41.0, 31.0, 29.0, 30.0, 19.0, 22.0, 26.0, 17.0, 14.0, 8.0, 16.0, 8.0, 9.0, 2.0, 6.0, 9.0, 3.0, 6.0, 4.0, 4.0, 1.0, 1.0, 3.0, 5.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.027822256088257, -1.9634045362472534, -1.89898681640625, -1.8345690965652466, -1.7701513767242432, -1.7057336568832397, -1.6413159370422363, -1.576898217201233, -1.5124804973602295, -1.448062777519226, -1.3836450576782227, -1.3192273378372192, -1.2548096179962158, -1.1903918981552124, -1.125974178314209, -1.0615564584732056, -0.9971387386322021, -0.9327210187911987, -0.8683032989501953, -0.8038855791091919, -0.7394678592681885, -0.6750501394271851, -0.6106324195861816, -0.5462146997451782, -0.4817969799041748, -0.4173792600631714, -0.35296154022216797, -0.28854382038116455, -0.22412610054016113, -0.15970838069915771, -0.0952906608581543, -0.03087294101715088, 0.03354454040527344, 0.09796226024627686, 0.16237998008728027, 0.2267976999282837, 0.2912154197692871, 0.3556331396102905, 0.42005085945129395, 0.48446857929229736, 0.5488862991333008, 0.6133040189743042, 0.6777217388153076, 0.742139458656311, 0.8065571784973145, 0.8709748983383179, 0.9353926181793213, 0.9998103380203247, 1.0642280578613281, 1.1286457777023315, 1.193063497543335, 1.2574812173843384, 1.3218989372253418, 1.3863166570663452, 1.4507343769073486, 1.515152096748352, 1.5795698165893555, 1.6439875364303589, 1.7084052562713623, 1.7728229761123657, 1.8372406959533691, 1.9016584157943726, 1.966076135635376, 2.03049373626709, 2.094911575317383]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 7.0, 3.0, 4.0, 11.0, 9.0, 20.0, 30.0, 40.0, 71.0, 88.0, 148.0, 258.0, 387.0, 605.0, 1158.0, 1998.0, 3731.0, 7177.0, 14897.0, 34069.0, 95264.0, 326651.0, 377093.0, 111514.0, 39534.0, 16713.0, 7827.0, 3956.0, 2143.0, 1217.0, 733.0, 454.0, 313.0, 135.0, 111.0, 59.0, 51.0, 30.0, 18.0, 10.0, 9.0, 5.0, 3.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.3876953125, -0.3752174377441406, -0.36273956298828125, -0.3502616882324219, -0.3377838134765625, -0.3253059387207031, -0.31282806396484375, -0.3003501892089844, -0.287872314453125, -0.2753944396972656, -0.26291656494140625, -0.2504386901855469, -0.2379608154296875, -0.22548294067382812, -0.21300506591796875, -0.20052719116210938, -0.18804931640625, -0.17557144165039062, -0.16309356689453125, -0.15061569213867188, -0.1381378173828125, -0.12565994262695312, -0.11318206787109375, -0.10070419311523438, -0.088226318359375, -0.07574844360351562, -0.06327056884765625, -0.050792694091796875, -0.0383148193359375, -0.025836944580078125, -0.01335906982421875, -0.000881195068359375, 0.0115966796875, 0.024074554443359375, 0.03655242919921875, 0.049030303955078125, 0.0615081787109375, 0.07398605346679688, 0.08646392822265625, 0.09894180297851562, 0.111419677734375, 0.12389755249023438, 0.13637542724609375, 0.14885330200195312, 0.1613311767578125, 0.17380905151367188, 0.18628692626953125, 0.19876480102539062, 0.21124267578125, 0.22372055053710938, 0.23619842529296875, 0.24867630004882812, 0.2611541748046875, 0.2736320495605469, 0.28610992431640625, 0.2985877990722656, 0.311065673828125, 0.3235435485839844, 0.33602142333984375, 0.3484992980957031, 0.3609771728515625, 0.3734550476074219, 0.38593292236328125, 0.3984107971191406, 0.410888671875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 8.0, 7.0, 7.0, 11.0, 24.0, 21.0, 22.0, 24.0, 31.0, 27.0, 40.0, 49.0, 60.0, 55.0, 59.0, 56.0, 54.0, 50.0, 54.0, 51.0, 52.0, 33.0, 33.0, 36.0, 23.0, 17.0, 26.0, 14.0, 10.0, 15.0, 8.0, 5.0, 5.0, 6.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2440185546875, -0.23657608032226562, -0.22913360595703125, -0.22169113159179688, -0.2142486572265625, -0.20680618286132812, -0.19936370849609375, -0.19192123413085938, -0.184478759765625, -0.17703628540039062, -0.16959381103515625, -0.16215133666992188, -0.1547088623046875, -0.14726638793945312, -0.13982391357421875, -0.13238143920898438, -0.12493896484375, -0.11749649047851562, -0.11005401611328125, -0.10261154174804688, -0.0951690673828125, -0.08772659301757812, -0.08028411865234375, -0.07284164428710938, -0.065399169921875, -0.057956695556640625, -0.05051422119140625, -0.043071746826171875, -0.0356292724609375, -0.028186798095703125, -0.02074432373046875, -0.013301849365234375, -0.005859375, 0.001583099365234375, 0.00902557373046875, 0.016468048095703125, 0.0239105224609375, 0.031352996826171875, 0.03879547119140625, 0.046237945556640625, 0.053680419921875, 0.061122894287109375, 0.06856536865234375, 0.07600784301757812, 0.0834503173828125, 0.09089279174804688, 0.09833526611328125, 0.10577774047851562, 0.11322021484375, 0.12066268920898438, 0.12810516357421875, 0.13554763793945312, 0.1429901123046875, 0.15043258666992188, 0.15787506103515625, 0.16531753540039062, 0.172760009765625, 0.18020248413085938, 0.18764495849609375, 0.19508743286132812, 0.2025299072265625, 0.20997238159179688, 0.21741485595703125, 0.22485733032226562, 0.2322998046875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 3.0, 7.0, 7.0, 17.0, 14.0, 22.0, 25.0, 34.0, 51.0, 78.0, 97.0, 159.0, 274.0, 451.0, 865.0, 1593.0, 4513.0, 18232.0, 133195.0, 787923.0, 81025.0, 13095.0, 3645.0, 1441.0, 693.0, 422.0, 220.0, 151.0, 86.0, 51.0, 38.0, 33.0, 22.0, 21.0, 16.0, 13.0, 4.0, 5.0, 2.0, 2.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.77392578125, -0.7446060180664062, -0.7152862548828125, -0.6859664916992188, -0.656646728515625, -0.6273269653320312, -0.5980072021484375, -0.5686874389648438, -0.53936767578125, -0.5100479125976562, -0.4807281494140625, -0.45140838623046875, -0.422088623046875, -0.39276885986328125, -0.3634490966796875, -0.33412933349609375, -0.3048095703125, -0.27548980712890625, -0.2461700439453125, -0.21685028076171875, -0.187530517578125, -0.15821075439453125, -0.1288909912109375, -0.09957122802734375, -0.07025146484375, -0.04093170166015625, -0.0116119384765625, 0.01770782470703125, 0.047027587890625, 0.07634735107421875, 0.1056671142578125, 0.13498687744140625, 0.164306640625, 0.19362640380859375, 0.2229461669921875, 0.25226593017578125, 0.281585693359375, 0.31090545654296875, 0.3402252197265625, 0.36954498291015625, 0.39886474609375, 0.42818450927734375, 0.4575042724609375, 0.48682403564453125, 0.516143798828125, 0.5454635620117188, 0.5747833251953125, 0.6041030883789062, 0.6334228515625, 0.6627426147460938, 0.6920623779296875, 0.7213821411132812, 0.750701904296875, 0.7800216674804688, 0.8093414306640625, 0.8386611938476562, 0.86798095703125, 0.8973007202148438, 0.9266204833984375, 0.9559402465820312, 0.985260009765625, 1.0145797729492188, 1.0438995361328125, 1.0732192993164062, 1.1025390625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 5.0, 3.0, 4.0, 1.0, 5.0, 8.0, 10.0, 4.0, 18.0, 19.0, 12.0, 26.0, 28.0, 22.0, 37.0, 42.0, 42.0, 52.0, 62.0, 56.0, 59.0, 61.0, 69.0, 56.0, 46.0, 51.0, 37.0, 36.0, 28.0, 21.0, 24.0, 13.0, 6.0, 16.0, 14.0, 7.0, 4.0, 6.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2587890625, -1.2254409790039062, -1.1920928955078125, -1.1587448120117188, -1.125396728515625, -1.0920486450195312, -1.0587005615234375, -1.0253524780273438, -0.99200439453125, -0.9586563110351562, -0.9253082275390625, -0.8919601440429688, -0.858612060546875, -0.8252639770507812, -0.7919158935546875, -0.7585678100585938, -0.7252197265625, -0.6918716430664062, -0.6585235595703125, -0.6251754760742188, -0.591827392578125, -0.5584793090820312, -0.5251312255859375, -0.49178314208984375, -0.45843505859375, -0.42508697509765625, -0.3917388916015625, -0.35839080810546875, -0.325042724609375, -0.29169464111328125, -0.2583465576171875, -0.22499847412109375, -0.191650390625, -0.15830230712890625, -0.1249542236328125, -0.09160614013671875, -0.058258056640625, -0.02490997314453125, 0.0084381103515625, 0.04178619384765625, 0.07513427734375, 0.10848236083984375, 0.1418304443359375, 0.17517852783203125, 0.208526611328125, 0.24187469482421875, 0.2752227783203125, 0.30857086181640625, 0.3419189453125, 0.37526702880859375, 0.4086151123046875, 0.44196319580078125, 0.475311279296875, 0.5086593627929688, 0.5420074462890625, 0.5753555297851562, 0.60870361328125, 0.6420516967773438, 0.6753997802734375, 0.7087478637695312, 0.742095947265625, 0.7754440307617188, 0.8087921142578125, 0.8421401977539062, 0.87548828125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 5.0, 8.0, 15.0, 18.0, 31.0, 59.0, 203.0, 625.0, 3319.0, 48707.0, 942639.0, 48514.0, 3393.0, 640.0, 206.0, 80.0, 38.0, 18.0, 15.0, 3.0, 5.0, 5.0, 7.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.138671875, -1.1124954223632812, -1.0863189697265625, -1.0601425170898438, -1.033966064453125, -1.0077896118164062, -0.9816131591796875, -0.9554367065429688, -0.92926025390625, -0.9030838012695312, -0.8769073486328125, -0.8507308959960938, -0.824554443359375, -0.7983779907226562, -0.7722015380859375, -0.7460250854492188, -0.7198486328125, -0.6936721801757812, -0.6674957275390625, -0.6413192749023438, -0.615142822265625, -0.5889663696289062, -0.5627899169921875, -0.5366134643554688, -0.51043701171875, -0.48426055908203125, -0.4580841064453125, -0.43190765380859375, -0.405731201171875, -0.37955474853515625, -0.3533782958984375, -0.32720184326171875, -0.301025390625, -0.27484893798828125, -0.2486724853515625, -0.22249603271484375, -0.196319580078125, -0.17014312744140625, -0.1439666748046875, -0.11779022216796875, -0.09161376953125, -0.06543731689453125, -0.0392608642578125, -0.01308441162109375, 0.013092041015625, 0.03926849365234375, 0.0654449462890625, 0.09162139892578125, 0.1177978515625, 0.14397430419921875, 0.1701507568359375, 0.19632720947265625, 0.222503662109375, 0.24868011474609375, 0.2748565673828125, 0.30103302001953125, 0.32720947265625, 0.35338592529296875, 0.3795623779296875, 0.40573883056640625, 0.431915283203125, 0.45809173583984375, 0.4842681884765625, 0.5104446411132812, 0.53662109375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 8.0, 4.0, 6.0, 8.0, 5.0, 14.0, 15.0, 24.0, 46.0, 43.0, 55.0, 76.0, 106.0, 148.0, 107.0, 87.0, 73.0, 55.0, 37.0, 21.0, 17.0, 10.0, 8.0, 9.0, 7.0, 2.0, 0.0, 3.0, 4.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.00011521577835083008, -0.00011245440691709518, -0.00010969303548336029, -0.0001069316640496254, -0.0001041702926158905, -0.00010140892118215561, -9.864754974842072e-05, -9.588617831468582e-05, -9.312480688095093e-05, -9.036343544721603e-05, -8.760206401348114e-05, -8.484069257974625e-05, -8.207932114601135e-05, -7.931794971227646e-05, -7.655657827854156e-05, -7.379520684480667e-05, -7.103383541107178e-05, -6.827246397733688e-05, -6.551109254360199e-05, -6.27497211098671e-05, -5.99883496761322e-05, -5.722697824239731e-05, -5.4465606808662415e-05, -5.170423537492752e-05, -4.894286394119263e-05, -4.618149250745773e-05, -4.342012107372284e-05, -4.0658749639987946e-05, -3.789737820625305e-05, -3.513600677251816e-05, -3.2374635338783264e-05, -2.961326390504837e-05, -2.6851892471313477e-05, -2.4090521037578583e-05, -2.132914960384369e-05, -1.8567778170108795e-05, -1.58064067363739e-05, -1.3045035302639008e-05, -1.0283663868904114e-05, -7.52229243516922e-06, -4.760921001434326e-06, -1.9995495676994324e-06, 7.618218660354614e-07, 3.5231932997703552e-06, 6.284564733505249e-06, 9.045936167240143e-06, 1.1807307600975037e-05, 1.456867903470993e-05, 1.7330050468444824e-05, 2.0091421902179718e-05, 2.2852793335914612e-05, 2.5614164769649506e-05, 2.83755362033844e-05, 3.113690763711929e-05, 3.389827907085419e-05, 3.665965050458908e-05, 3.9421021938323975e-05, 4.218239337205887e-05, 4.494376480579376e-05, 4.7705136239528656e-05, 5.046650767326355e-05, 5.3227879106998444e-05, 5.598925054073334e-05, 5.875062197446823e-05, 6.151199340820312e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 10.0, 16.0, 29.0, 68.0, 136.0, 310.0, 892.0, 4120.0, 55132.0, 926837.0, 55316.0, 4161.0, 923.0, 319.0, 154.0, 64.0, 30.0, 13.0, 13.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.83056640625, -0.8084182739257812, -0.7862701416015625, -0.7641220092773438, -0.741973876953125, -0.7198257446289062, -0.6976776123046875, -0.6755294799804688, -0.65338134765625, -0.6312332153320312, -0.6090850830078125, -0.5869369506835938, -0.564788818359375, -0.5426406860351562, -0.5204925537109375, -0.49834442138671875, -0.4761962890625, -0.45404815673828125, -0.4319000244140625, -0.40975189208984375, -0.387603759765625, -0.36545562744140625, -0.3433074951171875, -0.32115936279296875, -0.29901123046875, -0.27686309814453125, -0.2547149658203125, -0.23256683349609375, -0.210418701171875, -0.18827056884765625, -0.1661224365234375, -0.14397430419921875, -0.121826171875, -0.09967803955078125, -0.0775299072265625, -0.05538177490234375, -0.033233642578125, -0.01108551025390625, 0.0110626220703125, 0.03321075439453125, 0.05535888671875, 0.07750701904296875, 0.0996551513671875, 0.12180328369140625, 0.143951416015625, 0.16609954833984375, 0.1882476806640625, 0.21039581298828125, 0.2325439453125, 0.25469207763671875, 0.2768402099609375, 0.29898834228515625, 0.321136474609375, 0.34328460693359375, 0.3654327392578125, 0.38758087158203125, 0.40972900390625, 0.43187713623046875, 0.4540252685546875, 0.47617340087890625, 0.498321533203125, 0.5204696655273438, 0.5426177978515625, 0.5647659301757812, 0.5869140625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 5.0, 11.0, 12.0, 11.0, 21.0, 26.0, 35.0, 40.0, 75.0, 72.0, 103.0, 111.0, 108.0, 76.0, 66.0, 59.0, 50.0, 29.0, 28.0, 12.0, 11.0, 16.0, 6.0, 6.0, 2.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.331298828125, -0.3193626403808594, -0.30742645263671875, -0.2954902648925781, -0.2835540771484375, -0.2716178894042969, -0.25968170166015625, -0.24774551391601562, -0.235809326171875, -0.22387313842773438, -0.21193695068359375, -0.20000076293945312, -0.1880645751953125, -0.17612838745117188, -0.16419219970703125, -0.15225601196289062, -0.14031982421875, -0.12838363647460938, -0.11644744873046875, -0.10451126098632812, -0.0925750732421875, -0.08063888549804688, -0.06870269775390625, -0.056766510009765625, -0.044830322265625, -0.032894134521484375, -0.02095794677734375, -0.009021759033203125, 0.0029144287109375, 0.014850616455078125, 0.02678680419921875, 0.038722991943359375, 0.0506591796875, 0.06259536743164062, 0.07453155517578125, 0.08646774291992188, 0.0984039306640625, 0.11034011840820312, 0.12227630615234375, 0.13421249389648438, 0.146148681640625, 0.15808486938476562, 0.17002105712890625, 0.18195724487304688, 0.1938934326171875, 0.20582962036132812, 0.21776580810546875, 0.22970199584960938, 0.24163818359375, 0.2535743713378906, 0.26551055908203125, 0.2774467468261719, 0.2893829345703125, 0.3013191223144531, 0.31325531005859375, 0.3251914978027344, 0.337127685546875, 0.3490638732910156, 0.36100006103515625, 0.3729362487792969, 0.3848724365234375, 0.3968086242675781, 0.40874481201171875, 0.4206809997558594, 0.4326171875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 9.0, 8.0, 44.0, 143.0, 327.0, 294.0, 113.0, 39.0, 15.0, 11.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.595186233520508, -13.225724220275879, -12.856261253356934, -12.486799240112305, -12.11733627319336, -11.74787425994873, -11.378412246704102, -11.008949279785156, -10.639486312866211, -10.270024299621582, -9.900561332702637, -9.531099319458008, -9.161636352539062, -8.792174339294434, -8.422712326049805, -8.05324935913086, -7.6837873458862305, -7.314324855804443, -6.944862365722656, -6.575400352478027, -6.205937385559082, -5.836475372314453, -5.467012882232666, -5.097550392150879, -4.728087902069092, -4.358625411987305, -3.9891629219055176, -3.6197006702423096, -3.2502381801605225, -2.8807756900787354, -2.5113134384155273, -2.1418509483337402, -1.7723884582519531, -1.402925968170166, -1.0334635972976685, -0.6640012264251709, -0.2945387363433838, 0.07492375373840332, 0.44438600540161133, 0.8138484954833984, 1.1833109855651855, 1.5527734756469727, 1.9222358465194702, 2.2916982173919678, 2.661160707473755, 3.030623197555542, 3.40008544921875, 3.769547939300537, 4.139010429382324, 4.508472919464111, 4.877935409545898, 5.247397422790527, 5.616860389709473, 5.986322402954102, 6.355784893035889, 6.725247383117676, 7.094709873199463, 7.46417236328125, 7.833634853363037, 8.203097343444824, 8.572559356689453, 8.942022323608398, 9.311484336853027, 9.680946350097656, 10.050409317016602]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 4.0, 9.0, 3.0, 9.0, 14.0, 15.0, 16.0, 23.0, 29.0, 19.0, 34.0, 25.0, 26.0, 47.0, 58.0, 58.0, 60.0, 74.0, 60.0, 54.0, 41.0, 39.0, 38.0, 47.0, 26.0, 28.0, 23.0, 22.0, 23.0, 11.0, 21.0, 12.0, 9.0, 9.0, 9.0, 4.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.173884868621826, -4.039281368255615, -3.9046778678894043, -3.7700746059417725, -3.6354711055755615, -3.5008676052093506, -3.3662643432617188, -3.231660842895508, -3.097057342529297, -2.962453842163086, -2.827850341796875, -2.693247079849243, -2.5586435794830322, -2.4240400791168213, -2.2894368171691895, -2.1548333168029785, -2.0202298164367676, -1.8856263160705566, -1.7510229349136353, -1.6164195537567139, -1.481816053390503, -1.347212553024292, -1.2126091718673706, -1.0780057907104492, -0.9434022903442383, -0.8087988495826721, -0.674195408821106, -0.5395919680595398, -0.40498852729797363, -0.27038508653640747, -0.1357816457748413, -0.0011782050132751465, 0.1334247589111328, 0.268028199672699, 0.40263164043426514, 0.5372350811958313, 0.6718385219573975, 0.8064419627189636, 0.9410454034805298, 1.0756487846374512, 1.210252285003662, 1.344855785369873, 1.4794591665267944, 1.6140625476837158, 1.7486660480499268, 1.8832695484161377, 2.0178728103637695, 2.1524763107299805, 2.2870798110961914, 2.4216833114624023, 2.5562868118286133, 2.690890073776245, 2.825493574142456, 2.960097074508667, 3.094700336456299, 3.2293038368225098, 3.3639073371887207, 3.4985108375549316, 3.6331143379211426, 3.7677175998687744, 3.9023211002349854, 4.036924362182617, 4.171527862548828, 4.306131362915039, 4.44073486328125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 8.0, 12.0, 17.0, 40.0, 50.0, 105.0, 143.0, 208.0, 344.0, 602.0, 1124.0, 2122.0, 4198.0, 8782.0, 19756.0, 51365.0, 170507.0, 854504.0, 2279647.0, 602980.0, 126518.0, 40069.0, 16222.0, 7144.0, 3471.0, 1870.0, 1003.0, 545.0, 316.0, 196.0, 131.0, 89.0, 60.0, 40.0, 23.0, 14.0, 13.0, 15.0, 3.0, 7.0, 7.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.2401123046875, -0.2316570281982422, -0.22320175170898438, -0.21474647521972656, -0.20629119873046875, -0.19783592224121094, -0.18938064575195312, -0.1809253692626953, -0.1724700927734375, -0.1640148162841797, -0.15555953979492188, -0.14710426330566406, -0.13864898681640625, -0.13019371032714844, -0.12173843383789062, -0.11328315734863281, -0.104827880859375, -0.09637260437011719, -0.08791732788085938, -0.07946205139160156, -0.07100677490234375, -0.06255149841308594, -0.054096221923828125, -0.04564094543457031, -0.0371856689453125, -0.028730392456054688, -0.020275115966796875, -0.011819839477539062, -0.00336456298828125, 0.0050907135009765625, 0.013545989990234375, 0.022001266479492188, 0.03045654296875, 0.03891181945800781, 0.047367095947265625, 0.05582237243652344, 0.06427764892578125, 0.07273292541503906, 0.08118820190429688, 0.08964347839355469, 0.0980987548828125, 0.10655403137207031, 0.11500930786132812, 0.12346458435058594, 0.13191986083984375, 0.14037513732910156, 0.14883041381835938, 0.1572856903076172, 0.165740966796875, 0.1741962432861328, 0.18265151977539062, 0.19110679626464844, 0.19956207275390625, 0.20801734924316406, 0.21647262573242188, 0.2249279022216797, 0.2333831787109375, 0.2418384552001953, 0.2502937316894531, 0.25874900817871094, 0.26720428466796875, 0.27565956115722656, 0.2841148376464844, 0.2925701141357422, 0.301025390625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 11.0, 19.0, 15.0, 20.0, 30.0, 39.0, 38.0, 61.0, 66.0, 71.0, 74.0, 91.0, 92.0, 80.0, 81.0, 58.0, 50.0, 34.0, 24.0, 17.0, 17.0, 6.0, 7.0, 6.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15771484375, -0.14758682250976562, -0.13745880126953125, -0.12733078002929688, -0.1172027587890625, -0.10707473754882812, -0.09694671630859375, -0.08681869506835938, -0.076690673828125, -0.06656265258789062, -0.05643463134765625, -0.046306610107421875, -0.0361785888671875, -0.026050567626953125, -0.01592254638671875, -0.005794525146484375, 0.00433349609375, 0.014461517333984375, 0.02458953857421875, 0.034717559814453125, 0.0448455810546875, 0.054973602294921875, 0.06510162353515625, 0.07522964477539062, 0.085357666015625, 0.09548568725585938, 0.10561370849609375, 0.11574172973632812, 0.1258697509765625, 0.13599777221679688, 0.14612579345703125, 0.15625381469726562, 0.1663818359375, 0.17650985717773438, 0.18663787841796875, 0.19676589965820312, 0.2068939208984375, 0.21702194213867188, 0.22714996337890625, 0.23727798461914062, 0.247406005859375, 0.2575340270996094, 0.26766204833984375, 0.2777900695800781, 0.2879180908203125, 0.2980461120605469, 0.30817413330078125, 0.3183021545410156, 0.32843017578125, 0.3385581970214844, 0.34868621826171875, 0.3588142395019531, 0.3689422607421875, 0.3790702819824219, 0.38919830322265625, 0.3993263244628906, 0.409454345703125, 0.4195823669433594, 0.42971038818359375, 0.4398384094238281, 0.4499664306640625, 0.4600944519042969, 0.47022247314453125, 0.4803504943847656, 0.490478515625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 2.0, 0.0, 10.0, 10.0, 9.0, 12.0, 15.0, 30.0, 31.0, 61.0, 93.0, 164.0, 235.0, 407.0, 675.0, 1338.0, 3037.0, 7986.0, 25472.0, 103899.0, 845978.0, 2868886.0, 260332.0, 51336.0, 14715.0, 5085.0, 2108.0, 1058.0, 491.0, 290.0, 138.0, 116.0, 72.0, 62.0, 33.0, 23.0, 13.0, 18.0, 9.0, 10.0, 5.0, 8.0, 5.0, 1.0, 2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44873046875, -0.43285369873046875, -0.4169769287109375, -0.40110015869140625, -0.385223388671875, -0.36934661865234375, -0.3534698486328125, -0.33759307861328125, -0.32171630859375, -0.30583953857421875, -0.2899627685546875, -0.27408599853515625, -0.258209228515625, -0.24233245849609375, -0.2264556884765625, -0.21057891845703125, -0.1947021484375, -0.17882537841796875, -0.1629486083984375, -0.14707183837890625, -0.131195068359375, -0.11531829833984375, -0.0994415283203125, -0.08356475830078125, -0.06768798828125, -0.05181121826171875, -0.0359344482421875, -0.02005767822265625, -0.004180908203125, 0.01169586181640625, 0.0275726318359375, 0.04344940185546875, 0.059326171875, 0.07520294189453125, 0.0910797119140625, 0.10695648193359375, 0.122833251953125, 0.13871002197265625, 0.1545867919921875, 0.17046356201171875, 0.18634033203125, 0.20221710205078125, 0.2180938720703125, 0.23397064208984375, 0.249847412109375, 0.26572418212890625, 0.2816009521484375, 0.29747772216796875, 0.3133544921875, 0.32923126220703125, 0.3451080322265625, 0.36098480224609375, 0.376861572265625, 0.39273834228515625, 0.4086151123046875, 0.42449188232421875, 0.44036865234375, 0.45624542236328125, 0.4721221923828125, 0.48799896240234375, 0.503875732421875, 0.5197525024414062, 0.5356292724609375, 0.5515060424804688, 0.5673828125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 6.0, 3.0, 6.0, 4.0, 7.0, 18.0, 15.0, 21.0, 26.0, 38.0, 36.0, 65.0, 103.0, 158.0, 208.0, 324.0, 542.0, 698.0, 623.0, 410.0, 246.0, 142.0, 108.0, 65.0, 48.0, 40.0, 28.0, 17.0, 22.0, 13.0, 15.0, 9.0, 7.0, 7.0, 5.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.607421875, -0.5882797241210938, -0.5691375732421875, -0.5499954223632812, -0.530853271484375, -0.5117111206054688, -0.4925689697265625, -0.47342681884765625, -0.45428466796875, -0.43514251708984375, -0.4160003662109375, -0.39685821533203125, -0.377716064453125, -0.35857391357421875, -0.3394317626953125, -0.32028961181640625, -0.3011474609375, -0.28200531005859375, -0.2628631591796875, -0.24372100830078125, -0.224578857421875, -0.20543670654296875, -0.1862945556640625, -0.16715240478515625, -0.14801025390625, -0.12886810302734375, -0.1097259521484375, -0.09058380126953125, -0.071441650390625, -0.05229949951171875, -0.0331573486328125, -0.01401519775390625, 0.005126953125, 0.02426910400390625, 0.0434112548828125, 0.06255340576171875, 0.081695556640625, 0.10083770751953125, 0.1199798583984375, 0.13912200927734375, 0.15826416015625, 0.17740631103515625, 0.1965484619140625, 0.21569061279296875, 0.234832763671875, 0.25397491455078125, 0.2731170654296875, 0.29225921630859375, 0.3114013671875, 0.33054351806640625, 0.3496856689453125, 0.36882781982421875, 0.387969970703125, 0.40711212158203125, 0.4262542724609375, 0.44539642333984375, 0.46453857421875, 0.48368072509765625, 0.5028228759765625, 0.5219650268554688, 0.541107177734375, 0.5602493286132812, 0.5793914794921875, 0.5985336303710938, 0.61767578125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 20.0, 90.0, 337.0, 393.0, 116.0, 30.0, 8.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.909759521484375, -5.4194464683532715, -4.929133892059326, -4.438820838928223, -3.9485080242156982, -3.458195209503174, -2.9678821563720703, -2.477569341659546, -1.9872565269470215, -1.496943712234497, -1.006630778312683, -0.5163178443908691, -0.026005029678344727, 0.4643077850341797, 0.9546208381652832, 1.4449336528778076, 1.935246467590332, 2.4255592823028564, 2.915872097015381, 3.4061851501464844, 3.896497964859009, 4.386810779571533, 4.877123832702637, 5.367436408996582, 5.8577494621276855, 6.348062515258789, 6.838375091552734, 7.328688144683838, 7.819001197814941, 8.309313774108887, 8.799627304077148, 9.289939880371094, 9.780252456665039, 10.270565032958984, 10.760878562927246, 11.251191139221191, 11.741503715515137, 12.231817245483398, 12.722129821777344, 13.212442398071289, 13.702754974365234, 14.19306755065918, 14.683381080627441, 15.173693656921387, 15.664006233215332, 16.154319763183594, 16.64463233947754, 17.134944915771484, 17.625259399414062, 18.115571975708008, 18.605884552001953, 19.09619903564453, 19.586511611938477, 20.076824188232422, 20.567136764526367, 21.057449340820312, 21.547761917114258, 22.038074493408203, 22.52838706970215, 23.018699645996094, 23.509014129638672, 23.999326705932617, 24.489639282226562, 24.979951858520508, 25.470264434814453]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 6.0, 11.0, 5.0, 17.0, 11.0, 24.0, 26.0, 47.0, 46.0, 45.0, 59.0, 70.0, 72.0, 76.0, 71.0, 58.0, 64.0, 64.0, 50.0, 32.0, 38.0, 27.0, 27.0, 12.0, 16.0, 6.0, 8.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.914650917053223, -5.772266387939453, -5.629881858825684, -5.487497329711914, -5.3451128005981445, -5.202728271484375, -5.0603437423706055, -4.917959213256836, -4.775574684143066, -4.633190155029297, -4.490805625915527, -4.348421096801758, -4.206036567687988, -4.063652038574219, -3.921267509460449, -3.7788829803466797, -3.63649845123291, -3.4941139221191406, -3.351729393005371, -3.2093448638916016, -3.066960334777832, -2.9245758056640625, -2.782191276550293, -2.6398067474365234, -2.497422218322754, -2.3550376892089844, -2.212653160095215, -2.0702686309814453, -1.9278841018676758, -1.7854995727539062, -1.6431150436401367, -1.5007305145263672, -1.3583455085754395, -1.21596097946167, -1.0735764503479004, -0.9311919212341309, -0.7888073921203613, -0.6464228630065918, -0.5040383338928223, -0.36165380477905273, -0.2192692756652832, -0.07688474655151367, 0.06549978256225586, 0.2078843116760254, 0.3502688407897949, 0.49265336990356445, 0.635037899017334, 0.7774224281311035, 0.919806957244873, 1.0621914863586426, 1.204576015472412, 1.3469605445861816, 1.4893450736999512, 1.6317296028137207, 1.7741141319274902, 1.9164986610412598, 2.0588831901550293, 2.201267719268799, 2.3436522483825684, 2.486036777496338, 2.6284213066101074, 2.770805835723877, 2.9131903648376465, 3.055574893951416, 3.1979594230651855]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 7.0, 2.0, 10.0, 12.0, 14.0, 25.0, 27.0, 67.0, 105.0, 139.0, 237.0, 399.0, 723.0, 1327.0, 2660.0, 5630.0, 12510.0, 30212.0, 74504.0, 200475.0, 398908.0, 195003.0, 73011.0, 29407.0, 12238.0, 5428.0, 2518.0, 1246.0, 684.0, 384.0, 248.0, 133.0, 96.0, 46.0, 37.0, 28.0, 22.0, 11.0, 12.0, 9.0, 7.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.493408203125, -0.4795036315917969, -0.46559906005859375, -0.4516944885253906, -0.4377899169921875, -0.4238853454589844, -0.40998077392578125, -0.3960762023925781, -0.382171630859375, -0.3682670593261719, -0.35436248779296875, -0.3404579162597656, -0.3265533447265625, -0.3126487731933594, -0.29874420166015625, -0.2848396301269531, -0.27093505859375, -0.2570304870605469, -0.24312591552734375, -0.22922134399414062, -0.2153167724609375, -0.20141220092773438, -0.18750762939453125, -0.17360305786132812, -0.159698486328125, -0.14579391479492188, -0.13188934326171875, -0.11798477172851562, -0.1040802001953125, -0.09017562866210938, -0.07627105712890625, -0.062366485595703125, -0.0484619140625, -0.034557342529296875, -0.02065277099609375, -0.006748199462890625, 0.0071563720703125, 0.021060943603515625, 0.03496551513671875, 0.048870086669921875, 0.062774658203125, 0.07667922973632812, 0.09058380126953125, 0.10448837280273438, 0.1183929443359375, 0.13229751586914062, 0.14620208740234375, 0.16010665893554688, 0.17401123046875, 0.18791580200195312, 0.20182037353515625, 0.21572494506835938, 0.2296295166015625, 0.24353408813476562, 0.25743865966796875, 0.2713432312011719, 0.285247802734375, 0.2991523742675781, 0.31305694580078125, 0.3269615173339844, 0.3408660888671875, 0.3547706604003906, 0.36867523193359375, 0.3825798034667969, 0.396484375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 6.0, 4.0, 5.0, 4.0, 15.0, 10.0, 14.0, 16.0, 19.0, 21.0, 21.0, 29.0, 18.0, 19.0, 49.0, 43.0, 42.0, 40.0, 32.0, 48.0, 36.0, 44.0, 42.0, 36.0, 39.0, 41.0, 41.0, 39.0, 28.0, 32.0, 17.0, 28.0, 23.0, 25.0, 13.0, 13.0, 9.0, 8.0, 6.0, 7.0, 4.0, 3.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.164794921875, -0.15927886962890625, -0.1537628173828125, -0.14824676513671875, -0.142730712890625, -0.13721466064453125, -0.1316986083984375, -0.12618255615234375, -0.12066650390625, -0.11515045166015625, -0.1096343994140625, -0.10411834716796875, -0.098602294921875, -0.09308624267578125, -0.0875701904296875, -0.08205413818359375, -0.0765380859375, -0.07102203369140625, -0.0655059814453125, -0.05998992919921875, -0.054473876953125, -0.04895782470703125, -0.0434417724609375, -0.03792572021484375, -0.03240966796875, -0.02689361572265625, -0.0213775634765625, -0.01586151123046875, -0.010345458984375, -0.00482940673828125, 0.0006866455078125, 0.00620269775390625, 0.01171875, 0.01723480224609375, 0.0227508544921875, 0.02826690673828125, 0.033782958984375, 0.03929901123046875, 0.0448150634765625, 0.05033111572265625, 0.05584716796875, 0.06136322021484375, 0.0668792724609375, 0.07239532470703125, 0.077911376953125, 0.08342742919921875, 0.0889434814453125, 0.09445953369140625, 0.0999755859375, 0.10549163818359375, 0.1110076904296875, 0.11652374267578125, 0.122039794921875, 0.12755584716796875, 0.1330718994140625, 0.13858795166015625, 0.14410400390625, 0.14962005615234375, 0.1551361083984375, 0.16065216064453125, 0.166168212890625, 0.17168426513671875, 0.1772003173828125, 0.18271636962890625, 0.188232421875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 8.0, 11.0, 11.0, 17.0, 18.0, 45.0, 68.0, 82.0, 152.0, 220.0, 425.0, 793.0, 1606.0, 3935.0, 15949.0, 191636.0, 781653.0, 40362.0, 6698.0, 2362.0, 1085.0, 537.0, 321.0, 207.0, 131.0, 58.0, 52.0, 32.0, 28.0, 14.0, 13.0, 13.0, 3.0, 5.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2744140625, -1.2335968017578125, -1.192779541015625, -1.1519622802734375, -1.11114501953125, -1.0703277587890625, -1.029510498046875, -0.9886932373046875, -0.9478759765625, -0.9070587158203125, -0.866241455078125, -0.8254241943359375, -0.78460693359375, -0.7437896728515625, -0.702972412109375, -0.6621551513671875, -0.621337890625, -0.5805206298828125, -0.539703369140625, -0.4988861083984375, -0.45806884765625, -0.4172515869140625, -0.376434326171875, -0.3356170654296875, -0.2947998046875, -0.2539825439453125, -0.213165283203125, -0.1723480224609375, -0.13153076171875, -0.0907135009765625, -0.049896240234375, -0.0090789794921875, 0.03173828125, 0.0725555419921875, 0.113372802734375, 0.1541900634765625, 0.19500732421875, 0.2358245849609375, 0.276641845703125, 0.3174591064453125, 0.3582763671875, 0.3990936279296875, 0.439910888671875, 0.4807281494140625, 0.52154541015625, 0.5623626708984375, 0.603179931640625, 0.6439971923828125, 0.684814453125, 0.7256317138671875, 0.766448974609375, 0.8072662353515625, 0.84808349609375, 0.8889007568359375, 0.929718017578125, 0.9705352783203125, 1.0113525390625, 1.0521697998046875, 1.092987060546875, 1.1338043212890625, 1.17462158203125, 1.2154388427734375, 1.256256103515625, 1.2970733642578125, 1.337890625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 4.0, 5.0, 15.0, 10.0, 13.0, 19.0, 22.0, 32.0, 37.0, 35.0, 40.0, 48.0, 56.0, 71.0, 72.0, 50.0, 54.0, 56.0, 40.0, 48.0, 37.0, 35.0, 48.0, 34.0, 33.0, 19.0, 15.0, 14.0, 18.0, 7.0, 1.0, 5.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.81689453125, -0.7822494506835938, -0.7476043701171875, -0.7129592895507812, -0.678314208984375, -0.6436691284179688, -0.6090240478515625, -0.5743789672851562, -0.53973388671875, -0.5050888061523438, -0.4704437255859375, -0.43579864501953125, -0.401153564453125, -0.36650848388671875, -0.3318634033203125, -0.29721832275390625, -0.2625732421875, -0.22792816162109375, -0.1932830810546875, -0.15863800048828125, -0.123992919921875, -0.08934783935546875, -0.0547027587890625, -0.02005767822265625, 0.01458740234375, 0.04923248291015625, 0.0838775634765625, 0.11852264404296875, 0.153167724609375, 0.18781280517578125, 0.2224578857421875, 0.25710296630859375, 0.291748046875, 0.32639312744140625, 0.3610382080078125, 0.39568328857421875, 0.430328369140625, 0.46497344970703125, 0.4996185302734375, 0.5342636108398438, 0.56890869140625, 0.6035537719726562, 0.6381988525390625, 0.6728439331054688, 0.707489013671875, 0.7421340942382812, 0.7767791748046875, 0.8114242553710938, 0.8460693359375, 0.8807144165039062, 0.9153594970703125, 0.9500045776367188, 0.984649658203125, 1.0192947387695312, 1.0539398193359375, 1.0885848999023438, 1.12322998046875, 1.1578750610351562, 1.1925201416015625, 1.2271652221679688, 1.261810302734375, 1.2964553833007812, 1.3311004638671875, 1.3657455444335938, 1.400390625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 2.0, 2.0, 6.0, 4.0, 8.0, 9.0, 9.0, 16.0, 20.0, 34.0, 35.0, 57.0, 75.0, 109.0, 187.0, 273.0, 447.0, 828.0, 1495.0, 3184.0, 7266.0, 20138.0, 63827.0, 247404.0, 546713.0, 105754.0, 31241.0, 10491.0, 4227.0, 2038.0, 1034.0, 576.0, 363.0, 210.0, 149.0, 91.0, 60.0, 47.0, 32.0, 24.0, 23.0, 14.0, 10.0, 5.0, 5.0, 2.0, 5.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0], "bins": [-0.226806640625, -0.21997451782226562, -0.21314239501953125, -0.20631027221679688, -0.1994781494140625, -0.19264602661132812, -0.18581390380859375, -0.17898178100585938, -0.172149658203125, -0.16531753540039062, -0.15848541259765625, -0.15165328979492188, -0.1448211669921875, -0.13798904418945312, -0.13115692138671875, -0.12432479858398438, -0.11749267578125, -0.11066055297851562, -0.10382843017578125, -0.09699630737304688, -0.0901641845703125, -0.08333206176757812, -0.07649993896484375, -0.06966781616210938, -0.062835693359375, -0.056003570556640625, -0.04917144775390625, -0.042339324951171875, -0.0355072021484375, -0.028675079345703125, -0.02184295654296875, -0.015010833740234375, -0.0081787109375, -0.001346588134765625, 0.00548553466796875, 0.012317657470703125, 0.0191497802734375, 0.025981903076171875, 0.03281402587890625, 0.039646148681640625, 0.046478271484375, 0.053310394287109375, 0.06014251708984375, 0.06697463989257812, 0.0738067626953125, 0.08063888549804688, 0.08747100830078125, 0.09430313110351562, 0.10113525390625, 0.10796737670898438, 0.11479949951171875, 0.12163162231445312, 0.1284637451171875, 0.13529586791992188, 0.14212799072265625, 0.14896011352539062, 0.155792236328125, 0.16262435913085938, 0.16945648193359375, 0.17628860473632812, 0.1831207275390625, 0.18995285034179688, 0.19678497314453125, 0.20361709594726562, 0.21044921875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 1.0, 2.0, 2.0, 9.0, 9.0, 13.0, 7.0, 9.0, 16.0, 22.0, 25.0, 18.0, 30.0, 39.0, 49.0, 68.0, 101.0, 124.0, 97.0, 75.0, 67.0, 36.0, 42.0, 26.0, 24.0, 18.0, 16.0, 13.0, 15.0, 12.0, 3.0, 5.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.808208465576172e-05, -7.543433457612991e-05, -7.278658449649811e-05, -7.01388344168663e-05, -6.74910843372345e-05, -6.484333425760269e-05, -6.219558417797089e-05, -5.954783409833908e-05, -5.6900084018707275e-05, -5.425233393907547e-05, -5.1604583859443665e-05, -4.895683377981186e-05, -4.6309083700180054e-05, -4.366133362054825e-05, -4.101358354091644e-05, -3.836583346128464e-05, -3.571808338165283e-05, -3.3070333302021027e-05, -3.042258322238922e-05, -2.7774833142757416e-05, -2.512708306312561e-05, -2.2479332983493805e-05, -1.9831582903862e-05, -1.7183832824230194e-05, -1.4536082744598389e-05, -1.1888332664966583e-05, -9.240582585334778e-06, -6.592832505702972e-06, -3.945082426071167e-06, -1.2973323464393616e-06, 1.3504177331924438e-06, 3.998167812824249e-06, 6.645917892456055e-06, 9.29366797208786e-06, 1.1941418051719666e-05, 1.4589168131351471e-05, 1.7236918210983276e-05, 1.9884668290615082e-05, 2.2532418370246887e-05, 2.5180168449878693e-05, 2.7827918529510498e-05, 3.0475668609142303e-05, 3.312341868877411e-05, 3.5771168768405914e-05, 3.841891884803772e-05, 4.1066668927669525e-05, 4.371441900730133e-05, 4.6362169086933136e-05, 4.900991916656494e-05, 5.165766924619675e-05, 5.430541932582855e-05, 5.695316940546036e-05, 5.960091948509216e-05, 6.224866956472397e-05, 6.489641964435577e-05, 6.754416972398758e-05, 7.019191980361938e-05, 7.283966988325119e-05, 7.5487419962883e-05, 7.81351700425148e-05, 8.07829201221466e-05, 8.343067020177841e-05, 8.607842028141022e-05, 8.872617036104202e-05, 9.137392044067383e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 7.0, 2.0, 7.0, 12.0, 9.0, 28.0, 23.0, 56.0, 53.0, 124.0, 202.0, 368.0, 547.0, 1120.0, 2506.0, 7279.0, 38860.0, 528763.0, 419353.0, 37340.0, 6986.0, 2471.0, 1076.0, 564.0, 317.0, 181.0, 121.0, 70.0, 35.0, 34.0, 17.0, 9.0, 12.0, 6.0, 3.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29638671875, -0.2854042053222656, -0.27442169189453125, -0.2634391784667969, -0.2524566650390625, -0.24147415161132812, -0.23049163818359375, -0.21950912475585938, -0.208526611328125, -0.19754409790039062, -0.18656158447265625, -0.17557907104492188, -0.1645965576171875, -0.15361404418945312, -0.14263153076171875, -0.13164901733398438, -0.12066650390625, -0.10968399047851562, -0.09870147705078125, -0.08771896362304688, -0.0767364501953125, -0.06575393676757812, -0.05477142333984375, -0.043788909912109375, -0.032806396484375, -0.021823883056640625, -0.01084136962890625, 0.000141143798828125, 0.0111236572265625, 0.022106170654296875, 0.03308868408203125, 0.044071197509765625, 0.0550537109375, 0.06603622436523438, 0.07701873779296875, 0.08800125122070312, 0.0989837646484375, 0.10996627807617188, 0.12094879150390625, 0.13193130493164062, 0.142913818359375, 0.15389633178710938, 0.16487884521484375, 0.17586135864257812, 0.1868438720703125, 0.19782638549804688, 0.20880889892578125, 0.21979141235351562, 0.23077392578125, 0.24175643920898438, 0.25273895263671875, 0.2637214660644531, 0.2747039794921875, 0.2856864929199219, 0.29666900634765625, 0.3076515197753906, 0.318634033203125, 0.3296165466308594, 0.34059906005859375, 0.3515815734863281, 0.3625640869140625, 0.3735466003417969, 0.38452911376953125, 0.3955116271972656, 0.406494140625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 7.0, 2.0, 6.0, 8.0, 2.0, 10.0, 13.0, 16.0, 16.0, 19.0, 27.0, 24.0, 24.0, 37.0, 46.0, 55.0, 52.0, 75.0, 57.0, 74.0, 67.0, 64.0, 51.0, 40.0, 35.0, 25.0, 35.0, 23.0, 20.0, 8.0, 15.0, 11.0, 6.0, 8.0, 12.0, 3.0, 1.0, 4.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.232666015625, -0.22510147094726562, -0.21753692626953125, -0.20997238159179688, -0.2024078369140625, -0.19484329223632812, -0.18727874755859375, -0.17971420288085938, -0.172149658203125, -0.16458511352539062, -0.15702056884765625, -0.14945602416992188, -0.1418914794921875, -0.13432693481445312, -0.12676239013671875, -0.11919784545898438, -0.11163330078125, -0.10406875610351562, -0.09650421142578125, -0.08893966674804688, -0.0813751220703125, -0.07381057739257812, -0.06624603271484375, -0.058681488037109375, -0.051116943359375, -0.043552398681640625, -0.03598785400390625, -0.028423309326171875, -0.0208587646484375, -0.013294219970703125, -0.00572967529296875, 0.001834869384765625, 0.0093994140625, 0.016963958740234375, 0.02452850341796875, 0.032093048095703125, 0.0396575927734375, 0.047222137451171875, 0.05478668212890625, 0.062351226806640625, 0.069915771484375, 0.07748031616210938, 0.08504486083984375, 0.09260940551757812, 0.1001739501953125, 0.10773849487304688, 0.11530303955078125, 0.12286758422851562, 0.13043212890625, 0.13799667358398438, 0.14556121826171875, 0.15312576293945312, 0.1606903076171875, 0.16825485229492188, 0.17581939697265625, 0.18338394165039062, 0.190948486328125, 0.19851303100585938, 0.20607757568359375, 0.21364212036132812, 0.2212066650390625, 0.22877120971679688, 0.23633575439453125, 0.24390029907226562, 0.25146484375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 11.0, 25.0, 44.0, 119.0, 189.0, 286.0, 170.0, 75.0, 36.0, 17.0, 11.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.636467933654785, -9.363018035888672, -9.089569091796875, -8.816119194030762, -8.542670249938965, -8.269220352172852, -7.9957709312438965, -7.722321510314941, -7.448872089385986, -7.175422668457031, -6.901973247528076, -6.628523826599121, -6.355073928833008, -6.081624984741211, -5.808175086975098, -5.534725666046143, -5.2612762451171875, -4.987826824188232, -4.714377403259277, -4.440927982330322, -4.167478561401367, -3.894028902053833, -3.620579242706299, -3.3471298217773438, -3.0736804008483887, -2.8002309799194336, -2.5267815589904785, -2.2533318996429443, -1.9798824787139893, -1.7064330577850342, -1.4329835176467896, -1.159533977508545, -0.886085033416748, -0.6126355528831482, -0.33918607234954834, -0.06573659181594849, 0.20771288871765137, 0.48116230964660645, 0.7546118497848511, 1.0280613899230957, 1.3015108108520508, 1.5749602317810059, 1.8484097719192505, 2.121859312057495, 2.39530873298645, 2.6687581539154053, 2.9422078132629395, 3.2156572341918945, 3.4891066551208496, 3.7625560760498047, 4.03600549697876, 4.309454917907715, 4.582904815673828, 4.856353759765625, 5.129803657531738, 5.403253078460693, 5.676702499389648, 5.9501519203186035, 6.223601341247559, 6.497050762176514, 6.770500183105469, 7.043950080871582, 7.317399501800537, 7.590848922729492, 7.864298343658447]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 2.0, 9.0, 10.0, 7.0, 13.0, 16.0, 12.0, 14.0, 14.0, 33.0, 20.0, 23.0, 25.0, 39.0, 28.0, 28.0, 41.0, 50.0, 56.0, 61.0, 61.0, 49.0, 51.0, 34.0, 30.0, 40.0, 32.0, 26.0, 28.0, 25.0, 22.0, 17.0, 15.0, 9.0, 12.0, 5.0, 11.0, 11.0, 4.0, 2.0, 4.0, 5.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.4706637859344482, -3.365431785583496, -3.260199546813965, -3.1549675464630127, -3.0497355461120605, -2.9445033073425293, -2.839271306991577, -2.734039306640625, -2.628807306289673, -2.5235753059387207, -2.4183430671691895, -2.3131110668182373, -2.207879066467285, -2.102646827697754, -1.9974148273468018, -1.8921828269958496, -1.786950707435608, -1.6817185878753662, -1.576486587524414, -1.4712544679641724, -1.3660224676132202, -1.2607903480529785, -1.1555583477020264, -1.0503262281417847, -0.9450941681861877, -0.8398621082305908, -0.7346300482749939, -0.629397988319397, -0.5241658687591553, -0.41893380880355835, -0.3137017488479614, -0.2084696888923645, -0.10323762893676758, 0.0019944384694099426, 0.10722650587558746, 0.21245858073234558, 0.3176906406879425, 0.4229227304458618, 0.5281547904014587, 0.6333868503570557, 0.7386189103126526, 0.8438509702682495, 0.9490830302238464, 1.0543150901794434, 1.159547209739685, 1.2647793292999268, 1.370011329650879, 1.475243330001831, 1.5804754495620728, 1.6857075691223145, 1.7909395694732666, 1.8961716890335083, 2.00140380859375, 2.106635808944702, 2.2118678092956543, 2.3171000480651855, 2.4223320484161377, 2.52756404876709, 2.632796287536621, 2.7380282878875732, 2.8432602882385254, 2.9484925270080566, 3.053724527359009, 3.158956527709961, 3.264188528060913]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 7.0, 9.0, 15.0, 16.0, 27.0, 30.0, 57.0, 83.0, 127.0, 205.0, 350.0, 750.0, 1256.0, 2286.0, 4524.0, 9601.0, 21822.0, 56463.0, 198282.0, 1026061.0, 2146598.0, 537878.0, 119089.0, 38364.0, 15695.0, 6954.0, 3544.0, 1804.0, 981.0, 528.0, 325.0, 194.0, 122.0, 73.0, 52.0, 32.0, 27.0, 16.0, 10.0, 12.0, 7.0, 7.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2354736328125, -0.2277050018310547, -0.21993637084960938, -0.21216773986816406, -0.20439910888671875, -0.19663047790527344, -0.18886184692382812, -0.1810932159423828, -0.1733245849609375, -0.1655559539794922, -0.15778732299804688, -0.15001869201660156, -0.14225006103515625, -0.13448143005371094, -0.12671279907226562, -0.11894416809082031, -0.111175537109375, -0.10340690612792969, -0.09563827514648438, -0.08786964416503906, -0.08010101318359375, -0.07233238220214844, -0.06456375122070312, -0.05679512023925781, -0.0490264892578125, -0.04125785827636719, -0.033489227294921875, -0.025720596313476562, -0.01795196533203125, -0.010183334350585938, -0.002414703369140625, 0.0053539276123046875, 0.01312255859375, 0.020891189575195312, 0.028659820556640625, 0.03642845153808594, 0.04419708251953125, 0.05196571350097656, 0.059734344482421875, 0.06750297546386719, 0.0752716064453125, 0.08304023742675781, 0.09080886840820312, 0.09857749938964844, 0.10634613037109375, 0.11411476135253906, 0.12188339233398438, 0.1296520233154297, 0.137420654296875, 0.1451892852783203, 0.15295791625976562, 0.16072654724121094, 0.16849517822265625, 0.17626380920410156, 0.18403244018554688, 0.1918010711669922, 0.1995697021484375, 0.2073383331298828, 0.21510696411132812, 0.22287559509277344, 0.23064422607421875, 0.23841285705566406, 0.24618148803710938, 0.2539501190185547, 0.26171875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 6.0, 4.0, 10.0, 12.0, 9.0, 6.0, 15.0, 13.0, 20.0, 30.0, 23.0, 24.0, 29.0, 25.0, 20.0, 37.0, 37.0, 29.0, 45.0, 46.0, 38.0, 42.0, 37.0, 38.0, 35.0, 48.0, 39.0, 37.0, 31.0, 29.0, 22.0, 19.0, 24.0, 18.0, 22.0, 21.0, 9.0, 10.0, 11.0, 10.0, 8.0, 3.0, 0.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.16357421875, -0.15834617614746094, -0.15311813354492188, -0.1478900909423828, -0.14266204833984375, -0.1374340057373047, -0.13220596313476562, -0.12697792053222656, -0.1217498779296875, -0.11652183532714844, -0.11129379272460938, -0.10606575012207031, -0.10083770751953125, -0.09560966491699219, -0.09038162231445312, -0.08515357971191406, -0.079925537109375, -0.07469749450683594, -0.06946945190429688, -0.06424140930175781, -0.05901336669921875, -0.05378532409667969, -0.048557281494140625, -0.04332923889160156, -0.0381011962890625, -0.03287315368652344, -0.027645111083984375, -0.022417068481445312, -0.01718902587890625, -0.011960983276367188, -0.006732940673828125, -0.0015048980712890625, 0.00372314453125, 0.008951187133789062, 0.014179229736328125, 0.019407272338867188, 0.02463531494140625, 0.029863357543945312, 0.035091400146484375, 0.04031944274902344, 0.0455474853515625, 0.05077552795410156, 0.056003570556640625, 0.06123161315917969, 0.06645965576171875, 0.07168769836425781, 0.07691574096679688, 0.08214378356933594, 0.087371826171875, 0.09259986877441406, 0.09782791137695312, 0.10305595397949219, 0.10828399658203125, 0.11351203918457031, 0.11874008178710938, 0.12396812438964844, 0.1291961669921875, 0.13442420959472656, 0.13965225219726562, 0.1448802947998047, 0.15010833740234375, 0.1553363800048828, 0.16056442260742188, 0.16579246520996094, 0.1710205078125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 2.0, 1.0, 4.0, 8.0, 10.0, 17.0, 29.0, 28.0, 59.0, 110.0, 219.0, 468.0, 1076.0, 3079.0, 11437.0, 60609.0, 929045.0, 3037698.0, 125540.0, 17772.0, 4363.0, 1470.0, 606.0, 256.0, 146.0, 81.0, 52.0, 27.0, 23.0, 11.0, 16.0, 10.0, 3.0, 5.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.77197265625, -0.750030517578125, -0.72808837890625, -0.706146240234375, -0.6842041015625, -0.662261962890625, -0.64031982421875, -0.618377685546875, -0.596435546875, -0.574493408203125, -0.55255126953125, -0.530609130859375, -0.5086669921875, -0.486724853515625, -0.46478271484375, -0.442840576171875, -0.4208984375, -0.398956298828125, -0.37701416015625, -0.355072021484375, -0.3331298828125, -0.311187744140625, -0.28924560546875, -0.267303466796875, -0.245361328125, -0.223419189453125, -0.20147705078125, -0.179534912109375, -0.1575927734375, -0.135650634765625, -0.11370849609375, -0.091766357421875, -0.06982421875, -0.047882080078125, -0.02593994140625, -0.003997802734375, 0.0179443359375, 0.039886474609375, 0.06182861328125, 0.083770751953125, 0.105712890625, 0.127655029296875, 0.14959716796875, 0.171539306640625, 0.1934814453125, 0.215423583984375, 0.23736572265625, 0.259307861328125, 0.28125, 0.303192138671875, 0.32513427734375, 0.347076416015625, 0.3690185546875, 0.390960693359375, 0.41290283203125, 0.434844970703125, 0.456787109375, 0.478729248046875, 0.50067138671875, 0.522613525390625, 0.5445556640625, 0.566497802734375, 0.58843994140625, 0.610382080078125, 0.63232421875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 7.0, 4.0, 7.0, 7.0, 12.0, 19.0, 24.0, 26.0, 32.0, 35.0, 75.0, 90.0, 115.0, 228.0, 444.0, 648.0, 786.0, 569.0, 344.0, 190.0, 121.0, 85.0, 53.0, 47.0, 34.0, 25.0, 7.0, 13.0, 10.0, 5.0, 4.0, 2.0, 3.0, 1.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.525390625, -0.5054855346679688, -0.4855804443359375, -0.46567535400390625, -0.445770263671875, -0.42586517333984375, -0.4059600830078125, -0.38605499267578125, -0.36614990234375, -0.34624481201171875, -0.3263397216796875, -0.30643463134765625, -0.286529541015625, -0.26662445068359375, -0.2467193603515625, -0.22681427001953125, -0.2069091796875, -0.18700408935546875, -0.1670989990234375, -0.14719390869140625, -0.127288818359375, -0.10738372802734375, -0.0874786376953125, -0.06757354736328125, -0.04766845703125, -0.02776336669921875, -0.0078582763671875, 0.01204681396484375, 0.031951904296875, 0.05185699462890625, 0.0717620849609375, 0.09166717529296875, 0.111572265625, 0.13147735595703125, 0.1513824462890625, 0.17128753662109375, 0.191192626953125, 0.21109771728515625, 0.2310028076171875, 0.25090789794921875, 0.27081298828125, 0.29071807861328125, 0.3106231689453125, 0.33052825927734375, 0.350433349609375, 0.37033843994140625, 0.3902435302734375, 0.41014862060546875, 0.4300537109375, 0.44995880126953125, 0.4698638916015625, 0.48976898193359375, 0.509674072265625, 0.5295791625976562, 0.5494842529296875, 0.5693893432617188, 0.58929443359375, 0.6091995239257812, 0.6291046142578125, 0.6490097045898438, 0.668914794921875, 0.6888198852539062, 0.7087249755859375, 0.7286300659179688, 0.74853515625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 7.0, 14.0, 18.0, 48.0, 73.0, 161.0, 188.0, 205.0, 141.0, 59.0, 31.0, 15.0, 7.0, 7.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-8.089385032653809, -7.897246837615967, -7.705108642578125, -7.512970447540283, -7.320832252502441, -7.128694534301758, -6.936555862426758, -6.744418144226074, -6.552279949188232, -6.360141754150391, -6.168003559112549, -5.975865364074707, -5.783727169036865, -5.591588973999023, -5.39945125579834, -5.207313060760498, -5.015174865722656, -4.8230366706848145, -4.630898475646973, -4.438760280609131, -4.246622085571289, -4.0544843673706055, -3.8623459339141846, -3.670207977294922, -3.478069305419922, -3.28593111038208, -3.0937929153442383, -2.9016547203063965, -2.709516763687134, -2.517378568649292, -2.32524037361145, -2.1331024169921875, -1.9409642219543457, -1.748826026916504, -1.5566879510879517, -1.3645497560501099, -1.1724116802215576, -0.9802734851837158, -0.788135290145874, -0.5959972143173218, -0.40385901927948, -0.21172086894512177, -0.01958271861076355, 0.17255544662475586, 0.3646935820579529, 0.5568317174911499, 0.7489699125289917, 0.941107988357544, 1.1332461833953857, 1.3253843784332275, 1.5175224542617798, 1.7096606492996216, 1.9017987251281738, 2.0939369201660156, 2.2860751152038574, 2.478213310241699, 2.670351505279541, 2.862489700317383, 3.0546278953552246, 3.2467660903930664, 3.438904047012329, 3.631042242050171, 3.8231804370880127, 4.015318393707275, 4.207456588745117]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 5.0, 2.0, 6.0, 5.0, 12.0, 7.0, 16.0, 9.0, 20.0, 22.0, 28.0, 36.0, 37.0, 48.0, 47.0, 38.0, 60.0, 53.0, 71.0, 53.0, 56.0, 45.0, 58.0, 45.0, 44.0, 35.0, 32.0, 27.0, 11.0, 15.0, 14.0, 9.0, 8.0, 12.0, 3.0, 5.0, 6.0, 3.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.811023712158203, -2.7054712772369385, -2.5999186038970947, -2.49436616897583, -2.3888137340545654, -2.283261299133301, -2.177708625793457, -2.0721561908721924, -1.9666036367416382, -1.861051082611084, -1.7554986476898193, -1.6499460935592651, -1.544393539428711, -1.4388411045074463, -1.333288550376892, -1.227735996246338, -1.1221835613250732, -1.016631007194519, -0.9110785722732544, -0.8055260181427002, -0.6999735236167908, -0.5944210290908813, -0.48886847496032715, -0.3833159804344177, -0.2777634859085083, -0.17221097648143768, -0.06665846705436707, 0.038894057273864746, 0.14444655179977417, 0.2499990463256836, 0.3555516004562378, 0.4611040949821472, 0.5666563510894775, 0.672208845615387, 0.7777613401412964, 0.8833138942718506, 0.98886638879776, 1.0944188833236694, 1.1999714374542236, 1.3055238723754883, 1.4110764265060425, 1.5166289806365967, 1.6221814155578613, 1.7277339696884155, 1.8332865238189697, 1.9388389587402344, 2.044391632080078, 2.1499440670013428, 2.2554965019226074, 2.361048936843872, 2.466601610183716, 2.5721540451049805, 2.677706480026245, 2.7832589149475098, 2.8888115882873535, 2.994364023208618, 3.099916458129883, 3.2054688930511475, 3.311021566390991, 3.416574001312256, 3.5221264362335205, 3.627678871154785, 3.733231544494629, 3.8387839794158936, 3.9443366527557373]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 3.0, 7.0, 13.0, 16.0, 22.0, 21.0, 46.0, 67.0, 98.0, 156.0, 240.0, 330.0, 533.0, 809.0, 1398.0, 2214.0, 3913.0, 7064.0, 13934.0, 28905.0, 67016.0, 175969.0, 376958.0, 217251.0, 81846.0, 34557.0, 16136.0, 8149.0, 4374.0, 2401.0, 1501.0, 872.0, 562.0, 358.0, 266.0, 175.0, 119.0, 78.0, 63.0, 28.0, 32.0, 27.0, 9.0, 5.0, 5.0, 5.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.329833984375, -0.3190574645996094, -0.30828094482421875, -0.2975044250488281, -0.2867279052734375, -0.2759513854980469, -0.26517486572265625, -0.2543983459472656, -0.243621826171875, -0.23284530639648438, -0.22206878662109375, -0.21129226684570312, -0.2005157470703125, -0.18973922729492188, -0.17896270751953125, -0.16818618774414062, -0.15740966796875, -0.14663314819335938, -0.13585662841796875, -0.12508010864257812, -0.1143035888671875, -0.10352706909179688, -0.09275054931640625, -0.08197402954101562, -0.071197509765625, -0.060420989990234375, -0.04964447021484375, -0.038867950439453125, -0.0280914306640625, -0.017314910888671875, -0.00653839111328125, 0.004238128662109375, 0.0150146484375, 0.025791168212890625, 0.03656768798828125, 0.047344207763671875, 0.0581207275390625, 0.06889724731445312, 0.07967376708984375, 0.09045028686523438, 0.101226806640625, 0.11200332641601562, 0.12277984619140625, 0.13355636596679688, 0.1443328857421875, 0.15510940551757812, 0.16588592529296875, 0.17666244506835938, 0.18743896484375, 0.19821548461914062, 0.20899200439453125, 0.21976852416992188, 0.2305450439453125, 0.24132156372070312, 0.25209808349609375, 0.2628746032714844, 0.273651123046875, 0.2844276428222656, 0.29520416259765625, 0.3059806823730469, 0.3167572021484375, 0.3275337219238281, 0.33831024169921875, 0.3490867614746094, 0.35986328125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 8.0, 4.0, 6.0, 6.0, 4.0, 4.0, 13.0, 10.0, 20.0, 23.0, 19.0, 26.0, 20.0, 28.0, 28.0, 34.0, 28.0, 41.0, 34.0, 40.0, 38.0, 40.0, 37.0, 36.0, 39.0, 40.0, 40.0, 41.0, 41.0, 37.0, 26.0, 28.0, 22.0, 29.0, 19.0, 12.0, 14.0, 9.0, 14.0, 8.0, 4.0, 6.0, 5.0, 7.0, 3.0, 5.0, 1.0, 4.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1807861328125, -0.17522621154785156, -0.16966629028320312, -0.1641063690185547, -0.15854644775390625, -0.1529865264892578, -0.14742660522460938, -0.14186668395996094, -0.1363067626953125, -0.13074684143066406, -0.12518692016601562, -0.11962699890136719, -0.11406707763671875, -0.10850715637207031, -0.10294723510742188, -0.09738731384277344, -0.091827392578125, -0.08626747131347656, -0.08070755004882812, -0.07514762878417969, -0.06958770751953125, -0.06402778625488281, -0.058467864990234375, -0.05290794372558594, -0.0473480224609375, -0.04178810119628906, -0.036228179931640625, -0.030668258666992188, -0.02510833740234375, -0.019548416137695312, -0.013988494873046875, -0.008428573608398438, -0.00286865234375, 0.0026912689208984375, 0.008251190185546875, 0.013811111450195312, 0.01937103271484375, 0.024930953979492188, 0.030490875244140625, 0.03605079650878906, 0.0416107177734375, 0.04717063903808594, 0.052730560302734375, 0.05829048156738281, 0.06385040283203125, 0.06941032409667969, 0.07497024536132812, 0.08053016662597656, 0.086090087890625, 0.09165000915527344, 0.09720993041992188, 0.10276985168457031, 0.10832977294921875, 0.11388969421386719, 0.11944961547851562, 0.12500953674316406, 0.1305694580078125, 0.13612937927246094, 0.14168930053710938, 0.1472492218017578, 0.15280914306640625, 0.1583690643310547, 0.16392898559570312, 0.16948890686035156, 0.175048828125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 0.0, 4.0, 5.0, 5.0, 2.0, 5.0, 9.0, 17.0, 22.0, 40.0, 48.0, 45.0, 70.0, 116.0, 202.0, 313.0, 528.0, 1003.0, 2219.0, 6539.0, 33606.0, 633257.0, 334903.0, 25942.0, 5377.0, 1930.0, 969.0, 519.0, 282.0, 190.0, 134.0, 72.0, 52.0, 36.0, 26.0, 19.0, 17.0, 13.0, 7.0, 8.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.84765625, -0.814971923828125, -0.78228759765625, -0.749603271484375, -0.7169189453125, -0.684234619140625, -0.65155029296875, -0.618865966796875, -0.586181640625, -0.553497314453125, -0.52081298828125, -0.488128662109375, -0.4554443359375, -0.422760009765625, -0.39007568359375, -0.357391357421875, -0.32470703125, -0.292022705078125, -0.25933837890625, -0.226654052734375, -0.1939697265625, -0.161285400390625, -0.12860107421875, -0.095916748046875, -0.063232421875, -0.030548095703125, 0.00213623046875, 0.034820556640625, 0.0675048828125, 0.100189208984375, 0.13287353515625, 0.165557861328125, 0.1982421875, 0.230926513671875, 0.26361083984375, 0.296295166015625, 0.3289794921875, 0.361663818359375, 0.39434814453125, 0.427032470703125, 0.459716796875, 0.492401123046875, 0.52508544921875, 0.557769775390625, 0.5904541015625, 0.623138427734375, 0.65582275390625, 0.688507080078125, 0.72119140625, 0.753875732421875, 0.78656005859375, 0.819244384765625, 0.8519287109375, 0.884613037109375, 0.91729736328125, 0.949981689453125, 0.982666015625, 1.015350341796875, 1.04803466796875, 1.080718994140625, 1.1134033203125, 1.146087646484375, 1.17877197265625, 1.211456298828125, 1.244140625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 7.0, 1.0, 6.0, 7.0, 2.0, 12.0, 15.0, 24.0, 25.0, 27.0, 29.0, 39.0, 47.0, 58.0, 56.0, 69.0, 71.0, 79.0, 62.0, 54.0, 47.0, 60.0, 42.0, 43.0, 37.0, 24.0, 10.0, 15.0, 16.0, 6.0, 9.0, 4.0, 8.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1806640625, -1.14300537109375, -1.1053466796875, -1.06768798828125, -1.030029296875, -0.99237060546875, -0.9547119140625, -0.91705322265625, -0.87939453125, -0.84173583984375, -0.8040771484375, -0.76641845703125, -0.728759765625, -0.69110107421875, -0.6534423828125, -0.61578369140625, -0.578125, -0.54046630859375, -0.5028076171875, -0.46514892578125, -0.427490234375, -0.38983154296875, -0.3521728515625, -0.31451416015625, -0.27685546875, -0.23919677734375, -0.2015380859375, -0.16387939453125, -0.126220703125, -0.08856201171875, -0.0509033203125, -0.01324462890625, 0.0244140625, 0.06207275390625, 0.0997314453125, 0.13739013671875, 0.175048828125, 0.21270751953125, 0.2503662109375, 0.28802490234375, 0.32568359375, 0.36334228515625, 0.4010009765625, 0.43865966796875, 0.476318359375, 0.51397705078125, 0.5516357421875, 0.58929443359375, 0.626953125, 0.66461181640625, 0.7022705078125, 0.73992919921875, 0.777587890625, 0.81524658203125, 0.8529052734375, 0.89056396484375, 0.92822265625, 0.96588134765625, 1.0035400390625, 1.04119873046875, 1.078857421875, 1.11651611328125, 1.1541748046875, 1.19183349609375, 1.2294921875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 6.0, 8.0, 6.0, 9.0, 24.0, 28.0, 26.0, 52.0, 85.0, 149.0, 256.0, 432.0, 679.0, 1390.0, 3154.0, 8714.0, 30127.0, 147238.0, 674794.0, 138682.0, 28288.0, 8222.0, 3127.0, 1391.0, 650.0, 414.0, 190.0, 132.0, 81.0, 48.0, 47.0, 29.0, 24.0, 17.0, 5.0, 6.0, 6.0, 4.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.261962890625, -0.2541389465332031, -0.24631500244140625, -0.23849105834960938, -0.2306671142578125, -0.22284317016601562, -0.21501922607421875, -0.20719528198242188, -0.199371337890625, -0.19154739379882812, -0.18372344970703125, -0.17589950561523438, -0.1680755615234375, -0.16025161743164062, -0.15242767333984375, -0.14460372924804688, -0.13677978515625, -0.12895584106445312, -0.12113189697265625, -0.11330795288085938, -0.1054840087890625, -0.09766006469726562, -0.08983612060546875, -0.08201217651367188, -0.074188232421875, -0.06636428833007812, -0.05854034423828125, -0.050716400146484375, -0.0428924560546875, -0.035068511962890625, -0.02724456787109375, -0.019420623779296875, -0.0115966796875, -0.003772735595703125, 0.00405120849609375, 0.011875152587890625, 0.0196990966796875, 0.027523040771484375, 0.03534698486328125, 0.043170928955078125, 0.050994873046875, 0.058818817138671875, 0.06664276123046875, 0.07446670532226562, 0.0822906494140625, 0.09011459350585938, 0.09793853759765625, 0.10576248168945312, 0.11358642578125, 0.12141036987304688, 0.12923431396484375, 0.13705825805664062, 0.1448822021484375, 0.15270614624023438, 0.16053009033203125, 0.16835403442382812, 0.176177978515625, 0.18400192260742188, 0.19182586669921875, 0.19964981079101562, 0.2074737548828125, 0.21529769897460938, 0.22312164306640625, 0.23094558715820312, 0.23876953125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 0.0, 4.0, 5.0, 9.0, 9.0, 13.0, 13.0, 18.0, 18.0, 29.0, 38.0, 46.0, 74.0, 98.0, 121.0, 116.0, 108.0, 74.0, 51.0, 39.0, 35.0, 21.0, 18.0, 12.0, 11.0, 9.0, 3.0, 4.0, 5.0, 0.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.0001061558723449707, -0.00010344944894313812, -0.00010074302554130554, -9.803660213947296e-05, -9.533017873764038e-05, -9.26237553358078e-05, -8.991733193397522e-05, -8.721090853214264e-05, -8.450448513031006e-05, -8.179806172847748e-05, -7.90916383266449e-05, -7.638521492481232e-05, -7.367879152297974e-05, -7.097236812114716e-05, -6.826594471931458e-05, -6.5559521317482e-05, -6.285309791564941e-05, -6.0146674513816833e-05, -5.744025111198425e-05, -5.473382771015167e-05, -5.202740430831909e-05, -4.932098090648651e-05, -4.661455750465393e-05, -4.390813410282135e-05, -4.120171070098877e-05, -3.849528729915619e-05, -3.578886389732361e-05, -3.308244049549103e-05, -3.0376017093658447e-05, -2.7669593691825867e-05, -2.4963170289993286e-05, -2.2256746888160706e-05, -1.9550323486328125e-05, -1.6843900084495544e-05, -1.4137476682662964e-05, -1.1431053280830383e-05, -8.724629878997803e-06, -6.018206477165222e-06, -3.3117830753326416e-06, -6.05359673500061e-07, 2.1010637283325195e-06, 4.8074871301651e-06, 7.513910531997681e-06, 1.0220333933830261e-05, 1.2926757335662842e-05, 1.5633180737495422e-05, 1.8339604139328003e-05, 2.1046027541160583e-05, 2.3752450942993164e-05, 2.6458874344825745e-05, 2.9165297746658325e-05, 3.1871721148490906e-05, 3.4578144550323486e-05, 3.728456795215607e-05, 3.999099135398865e-05, 4.269741475582123e-05, 4.540383815765381e-05, 4.811026155948639e-05, 5.081668496131897e-05, 5.352310836315155e-05, 5.622953176498413e-05, 5.893595516681671e-05, 6.164237856864929e-05, 6.434880197048187e-05, 6.705522537231445e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 4.0, 5.0, 0.0, 4.0, 5.0, 5.0, 4.0, 15.0, 13.0, 20.0, 35.0, 33.0, 44.0, 71.0, 134.0, 204.0, 330.0, 515.0, 974.0, 1879.0, 4443.0, 13318.0, 58731.0, 506193.0, 384495.0, 55569.0, 12782.0, 4418.0, 1902.0, 949.0, 558.0, 289.0, 215.0, 146.0, 65.0, 46.0, 46.0, 32.0, 19.0, 15.0, 8.0, 11.0, 4.0, 3.0, 4.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.2410888671875, -0.2337799072265625, -0.226470947265625, -0.2191619873046875, -0.21185302734375, -0.2045440673828125, -0.197235107421875, -0.1899261474609375, -0.1826171875, -0.1753082275390625, -0.167999267578125, -0.1606903076171875, -0.15338134765625, -0.1460723876953125, -0.138763427734375, -0.1314544677734375, -0.1241455078125, -0.1168365478515625, -0.109527587890625, -0.1022186279296875, -0.09490966796875, -0.0876007080078125, -0.080291748046875, -0.0729827880859375, -0.065673828125, -0.0583648681640625, -0.051055908203125, -0.0437469482421875, -0.03643798828125, -0.0291290283203125, -0.021820068359375, -0.0145111083984375, -0.0072021484375, 0.0001068115234375, 0.007415771484375, 0.0147247314453125, 0.02203369140625, 0.0293426513671875, 0.036651611328125, 0.0439605712890625, 0.05126953125, 0.0585784912109375, 0.065887451171875, 0.0731964111328125, 0.08050537109375, 0.0878143310546875, 0.095123291015625, 0.1024322509765625, 0.1097412109375, 0.1170501708984375, 0.124359130859375, 0.1316680908203125, 0.13897705078125, 0.1462860107421875, 0.153594970703125, 0.1609039306640625, 0.168212890625, 0.1755218505859375, 0.182830810546875, 0.1901397705078125, 0.19744873046875, 0.2047576904296875, 0.212066650390625, 0.2193756103515625, 0.2266845703125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 5.0, 6.0, 4.0, 12.0, 16.0, 13.0, 20.0, 34.0, 41.0, 56.0, 75.0, 101.0, 108.0, 91.0, 109.0, 93.0, 58.0, 44.0, 29.0, 25.0, 20.0, 7.0, 8.0, 7.0, 10.0, 9.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.219970703125, -0.21078109741210938, -0.20159149169921875, -0.19240188598632812, -0.1832122802734375, -0.17402267456054688, -0.16483306884765625, -0.15564346313476562, -0.146453857421875, -0.13726425170898438, -0.12807464599609375, -0.11888504028320312, -0.1096954345703125, -0.10050582885742188, -0.09131622314453125, -0.08212661743164062, -0.07293701171875, -0.06374740600585938, -0.05455780029296875, -0.045368194580078125, -0.0361785888671875, -0.026988983154296875, -0.01779937744140625, -0.008609771728515625, 0.000579833984375, 0.009769439697265625, 0.01895904541015625, 0.028148651123046875, 0.0373382568359375, 0.046527862548828125, 0.05571746826171875, 0.06490707397460938, 0.0740966796875, 0.08328628540039062, 0.09247589111328125, 0.10166549682617188, 0.1108551025390625, 0.12004470825195312, 0.12923431396484375, 0.13842391967773438, 0.147613525390625, 0.15680313110351562, 0.16599273681640625, 0.17518234252929688, 0.1843719482421875, 0.19356155395507812, 0.20275115966796875, 0.21194076538085938, 0.22113037109375, 0.23031997680664062, 0.23950958251953125, 0.24869918823242188, 0.2578887939453125, 0.2670783996582031, 0.27626800537109375, 0.2854576110839844, 0.294647216796875, 0.3038368225097656, 0.31302642822265625, 0.3222160339355469, 0.3314056396484375, 0.3405952453613281, 0.34978485107421875, 0.3589744567871094, 0.3681640625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 7.0, 2.0, 1.0, 3.0, 1.0, 2.0, 5.0, 9.0, 16.0, 31.0, 46.0, 80.0, 104.0, 175.0, 184.0, 126.0, 82.0, 49.0, 29.0, 22.0, 8.0, 5.0, 2.0, 6.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-5.8701324462890625, -5.723775386810303, -5.577418327331543, -5.431060791015625, -5.284703731536865, -5.1383466720581055, -4.9919891357421875, -4.845632076263428, -4.699275016784668, -4.552917957305908, -4.406560897827148, -4.2602033615112305, -4.113846302032471, -3.967489242553711, -3.821131944656372, -3.674774646759033, -3.5284175872802734, -3.3820605278015137, -3.235703229904175, -3.089345932006836, -2.942988872528076, -2.7966318130493164, -2.6502745151519775, -2.5039172172546387, -2.357560157775879, -2.211203098297119, -2.0648458003997803, -1.918488621711731, -1.7721314430236816, -1.6257742643356323, -1.479417085647583, -1.3330599069595337, -1.1867024898529053, -1.040345311164856, -0.8939881324768066, -0.7476309537887573, -0.601273775100708, -0.4549165964126587, -0.3085594177246094, -0.16220223903656006, -0.015845060348510742, 0.13051211833953857, 0.2768692970275879, 0.4232264757156372, 0.5695836544036865, 0.7159408330917358, 0.8622980117797852, 1.0086551904678345, 1.1550123691558838, 1.301369547843933, 1.4477267265319824, 1.5940839052200317, 1.740441083908081, 1.8867982625961304, 2.0331554412841797, 2.1795125007629395, 2.3258697986602783, 2.472227096557617, 2.618584156036377, 2.7649412155151367, 2.9112985134124756, 3.0576558113098145, 3.204012870788574, 3.350369930267334, 3.496727228164673]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 5.0, 4.0, 9.0, 7.0, 10.0, 11.0, 14.0, 19.0, 11.0, 20.0, 23.0, 23.0, 22.0, 30.0, 38.0, 30.0, 38.0, 32.0, 63.0, 72.0, 84.0, 80.0, 48.0, 48.0, 36.0, 23.0, 26.0, 22.0, 28.0, 20.0, 7.0, 22.0, 11.0, 16.0, 21.0, 6.0, 10.0, 8.0, 2.0, 7.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.274181365966797, -4.14931058883667, -4.024440288543701, -3.899569511413574, -3.7746989727020264, -3.6498284339904785, -3.5249578952789307, -3.400087356567383, -3.275216579437256, -3.150346040725708, -3.02547550201416, -2.900604724884033, -2.7757341861724854, -2.6508636474609375, -2.5259931087493896, -2.401122570037842, -2.276252031326294, -2.151381492614746, -2.0265109539031982, -1.9016402959823608, -1.7767696380615234, -1.6518990993499756, -1.5270285606384277, -1.4021580219268799, -1.2772873640060425, -1.1524168252944946, -1.0275461673736572, -0.9026756286621094, -0.7778050303459167, -0.6529344320297241, -0.5280638933181763, -0.40319329500198364, -0.278322696685791, -0.15345211327075958, -0.02858152985572815, 0.09628903865814209, 0.22115963697433472, 0.34603023529052734, 0.4709007740020752, 0.5957713723182678, 0.7206419706344604, 0.8455125689506531, 0.9703831672668457, 1.0952537059783936, 1.2201242446899414, 1.3449949026107788, 1.4698654413223267, 1.594736099243164, 1.719606637954712, 1.8444771766662598, 1.9693478345870972, 2.0942182540893555, 2.2190890312194824, 2.3439595699310303, 2.468830108642578, 2.593700647354126, 2.718571186065674, 2.8434417247772217, 2.9683122634887695, 3.0931830406188965, 3.2180535793304443, 3.342924118041992, 3.46779465675354, 3.592665195465088, 3.717535972595215]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 5.0, 9.0, 15.0, 19.0, 30.0, 49.0, 61.0, 96.0, 163.0, 250.0, 422.0, 701.0, 1246.0, 2461.0, 5230.0, 12887.0, 38719.0, 181671.0, 1643660.0, 2003345.0, 232041.0, 44923.0, 14368.0, 5787.0, 2743.0, 1391.0, 743.0, 420.0, 276.0, 170.0, 122.0, 78.0, 50.0, 38.0, 20.0, 18.0, 14.0, 9.0, 13.0, 7.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2666015625, -0.2574272155761719, -0.24825286865234375, -0.23907852172851562, -0.2299041748046875, -0.22072982788085938, -0.21155548095703125, -0.20238113403320312, -0.193206787109375, -0.18403244018554688, -0.17485809326171875, -0.16568374633789062, -0.1565093994140625, -0.14733505249023438, -0.13816070556640625, -0.12898635864257812, -0.11981201171875, -0.11063766479492188, -0.10146331787109375, -0.09228897094726562, -0.0831146240234375, -0.07394027709960938, -0.06476593017578125, -0.055591583251953125, -0.046417236328125, -0.037242889404296875, -0.02806854248046875, -0.018894195556640625, -0.0097198486328125, -0.000545501708984375, 0.00862884521484375, 0.017803192138671875, 0.0269775390625, 0.036151885986328125, 0.04532623291015625, 0.054500579833984375, 0.0636749267578125, 0.07284927368164062, 0.08202362060546875, 0.09119796752929688, 0.100372314453125, 0.10954666137695312, 0.11872100830078125, 0.12789535522460938, 0.1370697021484375, 0.14624404907226562, 0.15541839599609375, 0.16459274291992188, 0.17376708984375, 0.18294143676757812, 0.19211578369140625, 0.20129013061523438, 0.2104644775390625, 0.21963882446289062, 0.22881317138671875, 0.23798751831054688, 0.247161865234375, 0.2563362121582031, 0.26551055908203125, 0.2746849060058594, 0.2838592529296875, 0.2930335998535156, 0.30220794677734375, 0.3113822937011719, 0.320556640625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 3.0, 5.0, 6.0, 5.0, 6.0, 14.0, 12.0, 11.0, 12.0, 10.0, 10.0, 25.0, 26.0, 36.0, 41.0, 40.0, 29.0, 33.0, 39.0, 38.0, 48.0, 29.0, 58.0, 46.0, 45.0, 43.0, 36.0, 34.0, 39.0, 35.0, 39.0, 22.0, 19.0, 23.0, 13.0, 21.0, 11.0, 10.0, 11.0, 6.0, 7.0, 3.0, 2.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1861572265625, -0.18033218383789062, -0.17450714111328125, -0.16868209838867188, -0.1628570556640625, -0.15703201293945312, -0.15120697021484375, -0.14538192749023438, -0.139556884765625, -0.13373184204101562, -0.12790679931640625, -0.12208175659179688, -0.1162567138671875, -0.11043167114257812, -0.10460662841796875, -0.09878158569335938, -0.09295654296875, -0.08713150024414062, -0.08130645751953125, -0.07548141479492188, -0.0696563720703125, -0.06383132934570312, -0.05800628662109375, -0.052181243896484375, -0.046356201171875, -0.040531158447265625, -0.03470611572265625, -0.028881072998046875, -0.0230560302734375, -0.017230987548828125, -0.01140594482421875, -0.005580902099609375, 0.000244140625, 0.006069183349609375, 0.01189422607421875, 0.017719268798828125, 0.0235443115234375, 0.029369354248046875, 0.03519439697265625, 0.041019439697265625, 0.046844482421875, 0.052669525146484375, 0.05849456787109375, 0.06431961059570312, 0.0701446533203125, 0.07596969604492188, 0.08179473876953125, 0.08761978149414062, 0.09344482421875, 0.09926986694335938, 0.10509490966796875, 0.11091995239257812, 0.1167449951171875, 0.12257003784179688, 0.12839508056640625, 0.13422012329101562, 0.140045166015625, 0.14587020874023438, 0.15169525146484375, 0.15752029418945312, 0.1633453369140625, 0.16917037963867188, 0.17499542236328125, 0.18082046508789062, 0.1866455078125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 6.0, 9.0, 5.0, 15.0, 33.0, 59.0, 198.0, 649.0, 4825.0, 154960.0, 3994572.0, 36118.0, 2225.0, 407.0, 113.0, 48.0, 23.0, 12.0, 6.0, 6.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.95703125, -0.9121551513671875, -0.867279052734375, -0.8224029541015625, -0.77752685546875, -0.7326507568359375, -0.687774658203125, -0.6428985595703125, -0.5980224609375, -0.5531463623046875, -0.508270263671875, -0.4633941650390625, -0.41851806640625, -0.3736419677734375, -0.328765869140625, -0.2838897705078125, -0.239013671875, -0.1941375732421875, -0.149261474609375, -0.1043853759765625, -0.05950927734375, -0.0146331787109375, 0.030242919921875, 0.0751190185546875, 0.1199951171875, 0.1648712158203125, 0.209747314453125, 0.2546234130859375, 0.29949951171875, 0.3443756103515625, 0.389251708984375, 0.4341278076171875, 0.47900390625, 0.5238800048828125, 0.568756103515625, 0.6136322021484375, 0.65850830078125, 0.7033843994140625, 0.748260498046875, 0.7931365966796875, 0.8380126953125, 0.8828887939453125, 0.927764892578125, 0.9726409912109375, 1.01751708984375, 1.0623931884765625, 1.107269287109375, 1.1521453857421875, 1.197021484375, 1.2418975830078125, 1.286773681640625, 1.3316497802734375, 1.37652587890625, 1.4214019775390625, 1.466278076171875, 1.5111541748046875, 1.5560302734375, 1.6009063720703125, 1.645782470703125, 1.6906585693359375, 1.73553466796875, 1.7804107666015625, 1.825286865234375, 1.8701629638671875, 1.9150390625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 5.0, 5.0, 5.0, 13.0, 18.0, 17.0, 33.0, 43.0, 70.0, 120.0, 194.0, 450.0, 785.0, 1005.0, 591.0, 279.0, 154.0, 94.0, 61.0, 36.0, 29.0, 26.0, 12.0, 3.0, 8.0, 4.0, 6.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7568359375, -0.7365188598632812, -0.7162017822265625, -0.6958847045898438, -0.675567626953125, -0.6552505493164062, -0.6349334716796875, -0.6146163940429688, -0.59429931640625, -0.5739822387695312, -0.5536651611328125, -0.5333480834960938, -0.513031005859375, -0.49271392822265625, -0.4723968505859375, -0.45207977294921875, -0.4317626953125, -0.41144561767578125, -0.3911285400390625, -0.37081146240234375, -0.350494384765625, -0.33017730712890625, -0.3098602294921875, -0.28954315185546875, -0.26922607421875, -0.24890899658203125, -0.2285919189453125, -0.20827484130859375, -0.187957763671875, -0.16764068603515625, -0.1473236083984375, -0.12700653076171875, -0.106689453125, -0.08637237548828125, -0.0660552978515625, -0.04573822021484375, -0.025421142578125, -0.00510406494140625, 0.0152130126953125, 0.03553009033203125, 0.05584716796875, 0.07616424560546875, 0.0964813232421875, 0.11679840087890625, 0.137115478515625, 0.15743255615234375, 0.1777496337890625, 0.19806671142578125, 0.2183837890625, 0.23870086669921875, 0.2590179443359375, 0.27933502197265625, 0.299652099609375, 0.31996917724609375, 0.3402862548828125, 0.36060333251953125, 0.38092041015625, 0.40123748779296875, 0.4215545654296875, 0.44187164306640625, 0.462188720703125, 0.48250579833984375, 0.5028228759765625, 0.5231399536132812, 0.54345703125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 6.0, 11.0, 44.0, 120.0, 192.0, 230.0, 189.0, 102.0, 47.0, 15.0, 10.0, 9.0, 3.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.550397872924805, -6.359920978546143, -6.169444561004639, -5.978967666625977, -5.788491249084473, -5.5980143547058105, -5.407537937164307, -5.2170610427856445, -5.026584625244141, -4.8361077308654785, -4.645631313323975, -4.4551544189453125, -4.264678001403809, -4.0742011070251465, -3.8837246894836426, -3.6932477951049805, -3.5027711391448975, -3.3122944831848145, -3.1218178272247314, -2.9313411712646484, -2.7408645153045654, -2.5503878593444824, -2.3599109649658203, -2.1694345474243164, -1.9789577722549438, -1.7884811162948608, -1.5980044603347778, -1.4075276851654053, -1.2170510292053223, -1.0265743732452393, -0.8360977172851562, -0.6456210613250732, -0.45514440536499023, -0.2646677494049072, -0.07419106364250183, 0.11628562211990356, 0.3067622780799866, 0.4972389340400696, 0.6877156496047974, 0.8781923055648804, 1.0686689615249634, 1.2591456174850464, 1.4496222734451294, 1.640099048614502, 1.830575704574585, 2.021052360534668, 2.211529016494751, 2.402005672454834, 2.592482328414917, 2.782958984375, 2.973435640335083, 3.163912296295166, 3.354388952255249, 3.544865608215332, 3.735342502593994, 3.925818920135498, 4.11629581451416, 4.306772708892822, 4.497249126434326, 4.687726020812988, 4.878202438354492, 5.068679332733154, 5.259155750274658, 5.44963264465332, 5.640109062194824]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 8.0, 7.0, 8.0, 4.0, 10.0, 10.0, 11.0, 10.0, 12.0, 10.0, 15.0, 26.0, 23.0, 31.0, 35.0, 34.0, 41.0, 37.0, 30.0, 50.0, 59.0, 38.0, 52.0, 59.0, 32.0, 44.0, 31.0, 32.0, 32.0, 25.0, 35.0, 28.0, 19.0, 12.0, 9.0, 14.0, 16.0, 9.0, 14.0, 13.0, 9.0, 7.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8522539138793945, -1.790534496307373, -1.7288150787353516, -1.66709566116333, -1.6053762435913086, -1.543656826019287, -1.4819374084472656, -1.4202179908752441, -1.3584985733032227, -1.2967791557312012, -1.2350597381591797, -1.1733403205871582, -1.1116209030151367, -1.0499014854431152, -0.9881820678710938, -0.9264626502990723, -0.864743173122406, -0.8030237555503845, -0.741304337978363, -0.6795849204063416, -0.6178655028343201, -0.5561460256576538, -0.4944266378879547, -0.4327072203159332, -0.37098780274391174, -0.30926838517189026, -0.24754896759986877, -0.1858295351266861, -0.12411011755466461, -0.062390685081481934, -0.0006712675094604492, 0.061048150062561035, 0.12276756763458252, 0.184486985206604, 0.2462064027786255, 0.307925820350647, 0.36964523792266846, 0.43136468529701233, 0.4930841028690338, 0.5548034906387329, 0.6165229082107544, 0.6782423257827759, 0.7399617433547974, 0.8016811609268188, 0.8634005784988403, 0.9251199960708618, 0.9868394136428833, 1.0485588312149048, 1.1102783679962158, 1.1719977855682373, 1.2337172031402588, 1.2954366207122803, 1.3571560382843018, 1.4188754558563232, 1.4805948734283447, 1.5423142910003662, 1.6040337085723877, 1.6657531261444092, 1.7274725437164307, 1.7891919612884521, 1.8509113788604736, 1.9126307964324951, 1.9743502140045166, 2.036069631576538, 2.0977890491485596]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 6.0, 5.0, 3.0, 10.0, 16.0, 23.0, 37.0, 52.0, 76.0, 118.0, 206.0, 300.0, 503.0, 966.0, 1734.0, 3367.0, 6964.0, 15491.0, 41145.0, 121494.0, 328344.0, 331524.0, 123616.0, 42001.0, 15986.0, 7148.0, 3396.0, 1738.0, 940.0, 506.0, 322.0, 187.0, 112.0, 77.0, 56.0, 24.0, 22.0, 11.0, 11.0, 8.0, 5.0, 3.0, 4.0, 0.0, 5.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.306884765625, -0.29811859130859375, -0.2893524169921875, -0.28058624267578125, -0.271820068359375, -0.26305389404296875, -0.2542877197265625, -0.24552154541015625, -0.23675537109375, -0.22798919677734375, -0.2192230224609375, -0.21045684814453125, -0.201690673828125, -0.19292449951171875, -0.1841583251953125, -0.17539215087890625, -0.1666259765625, -0.15785980224609375, -0.1490936279296875, -0.14032745361328125, -0.131561279296875, -0.12279510498046875, -0.1140289306640625, -0.10526275634765625, -0.09649658203125, -0.08773040771484375, -0.0789642333984375, -0.07019805908203125, -0.061431884765625, -0.05266571044921875, -0.0438995361328125, -0.03513336181640625, -0.0263671875, -0.01760101318359375, -0.0088348388671875, -6.866455078125e-05, 0.008697509765625, 0.01746368408203125, 0.0262298583984375, 0.03499603271484375, 0.04376220703125, 0.05252838134765625, 0.0612945556640625, 0.07006072998046875, 0.078826904296875, 0.08759307861328125, 0.0963592529296875, 0.10512542724609375, 0.1138916015625, 0.12265777587890625, 0.1314239501953125, 0.14019012451171875, 0.148956298828125, 0.15772247314453125, 0.1664886474609375, 0.17525482177734375, 0.18402099609375, 0.19278717041015625, 0.2015533447265625, 0.21031951904296875, 0.219085693359375, 0.22785186767578125, 0.2366180419921875, 0.24538421630859375, 0.254150390625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 6.0, 8.0, 13.0, 5.0, 14.0, 20.0, 20.0, 24.0, 20.0, 26.0, 34.0, 34.0, 38.0, 34.0, 28.0, 45.0, 35.0, 39.0, 38.0, 43.0, 49.0, 43.0, 52.0, 34.0, 36.0, 32.0, 31.0, 29.0, 22.0, 23.0, 18.0, 17.0, 19.0, 12.0, 6.0, 13.0, 7.0, 6.0, 6.0, 4.0, 6.0, 5.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.20849609375, -0.2026805877685547, -0.19686508178710938, -0.19104957580566406, -0.18523406982421875, -0.17941856384277344, -0.17360305786132812, -0.1677875518798828, -0.1619720458984375, -0.1561565399169922, -0.15034103393554688, -0.14452552795410156, -0.13871002197265625, -0.13289451599121094, -0.12707901000976562, -0.12126350402832031, -0.115447998046875, -0.10963249206542969, -0.10381698608398438, -0.09800148010253906, -0.09218597412109375, -0.08637046813964844, -0.08055496215820312, -0.07473945617675781, -0.0689239501953125, -0.06310844421386719, -0.057292938232421875, -0.05147743225097656, -0.04566192626953125, -0.03984642028808594, -0.034030914306640625, -0.028215408325195312, -0.02239990234375, -0.016584396362304688, -0.010768890380859375, -0.0049533843994140625, 0.00086212158203125, 0.0066776275634765625, 0.012493133544921875, 0.018308639526367188, 0.0241241455078125, 0.029939651489257812, 0.035755157470703125, 0.04157066345214844, 0.04738616943359375, 0.05320167541503906, 0.059017181396484375, 0.06483268737792969, 0.070648193359375, 0.07646369934082031, 0.08227920532226562, 0.08809471130371094, 0.09391021728515625, 0.09972572326660156, 0.10554122924804688, 0.11135673522949219, 0.1171722412109375, 0.12298774719238281, 0.12880325317382812, 0.13461875915527344, 0.14043426513671875, 0.14624977111816406, 0.15206527709960938, 0.1578807830810547, 0.1636962890625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 5.0, 8.0, 9.0, 14.0, 20.0, 18.0, 27.0, 45.0, 65.0, 108.0, 188.0, 366.0, 892.0, 2355.0, 8555.0, 55067.0, 707147.0, 242614.0, 23429.0, 4809.0, 1477.0, 655.0, 261.0, 165.0, 80.0, 48.0, 33.0, 29.0, 22.0, 10.0, 11.0, 5.0, 4.0, 3.0, 2.0, 6.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57470703125, -0.555419921875, -0.5361328125, -0.516845703125, -0.49755859375, -0.478271484375, -0.458984375, -0.439697265625, -0.42041015625, -0.401123046875, -0.3818359375, -0.362548828125, -0.34326171875, -0.323974609375, -0.3046875, -0.285400390625, -0.26611328125, -0.246826171875, -0.2275390625, -0.208251953125, -0.18896484375, -0.169677734375, -0.150390625, -0.131103515625, -0.11181640625, -0.092529296875, -0.0732421875, -0.053955078125, -0.03466796875, -0.015380859375, 0.00390625, 0.023193359375, 0.04248046875, 0.061767578125, 0.0810546875, 0.100341796875, 0.11962890625, 0.138916015625, 0.158203125, 0.177490234375, 0.19677734375, 0.216064453125, 0.2353515625, 0.254638671875, 0.27392578125, 0.293212890625, 0.3125, 0.331787109375, 0.35107421875, 0.370361328125, 0.3896484375, 0.408935546875, 0.42822265625, 0.447509765625, 0.466796875, 0.486083984375, 0.50537109375, 0.524658203125, 0.5439453125, 0.563232421875, 0.58251953125, 0.601806640625, 0.62109375, 0.640380859375, 0.65966796875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 7.0, 3.0, 7.0, 13.0, 12.0, 18.0, 20.0, 24.0, 23.0, 34.0, 39.0, 50.0, 62.0, 78.0, 72.0, 72.0, 69.0, 83.0, 81.0, 58.0, 48.0, 35.0, 26.0, 14.0, 19.0, 15.0, 11.0, 9.0, 2.0, 6.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.26953125, -1.234832763671875, -1.20013427734375, -1.165435791015625, -1.1307373046875, -1.096038818359375, -1.06134033203125, -1.026641845703125, -0.991943359375, -0.957244873046875, -0.92254638671875, -0.887847900390625, -0.8531494140625, -0.818450927734375, -0.78375244140625, -0.749053955078125, -0.71435546875, -0.679656982421875, -0.64495849609375, -0.610260009765625, -0.5755615234375, -0.540863037109375, -0.50616455078125, -0.471466064453125, -0.436767578125, -0.402069091796875, -0.36737060546875, -0.332672119140625, -0.2979736328125, -0.263275146484375, -0.22857666015625, -0.193878173828125, -0.1591796875, -0.124481201171875, -0.08978271484375, -0.055084228515625, -0.0203857421875, 0.014312744140625, 0.04901123046875, 0.083709716796875, 0.118408203125, 0.153106689453125, 0.18780517578125, 0.222503662109375, 0.2572021484375, 0.291900634765625, 0.32659912109375, 0.361297607421875, 0.39599609375, 0.430694580078125, 0.46539306640625, 0.500091552734375, 0.5347900390625, 0.569488525390625, 0.60418701171875, 0.638885498046875, 0.673583984375, 0.708282470703125, 0.74298095703125, 0.777679443359375, 0.8123779296875, 0.847076416015625, 0.88177490234375, 0.916473388671875, 0.951171875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 4.0, 4.0, 4.0, 8.0, 8.0, 20.0, 16.0, 13.0, 32.0, 40.0, 106.0, 116.0, 194.0, 383.0, 922.0, 2554.0, 9414.0, 71371.0, 852835.0, 94550.0, 11164.0, 2796.0, 991.0, 441.0, 245.0, 108.0, 67.0, 48.0, 38.0, 18.0, 16.0, 9.0, 8.0, 3.0, 5.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.306884765625, -0.29613494873046875, -0.2853851318359375, -0.27463531494140625, -0.263885498046875, -0.25313568115234375, -0.2423858642578125, -0.23163604736328125, -0.22088623046875, -0.21013641357421875, -0.1993865966796875, -0.18863677978515625, -0.177886962890625, -0.16713714599609375, -0.1563873291015625, -0.14563751220703125, -0.1348876953125, -0.12413787841796875, -0.1133880615234375, -0.10263824462890625, -0.091888427734375, -0.08113861083984375, -0.0703887939453125, -0.05963897705078125, -0.04888916015625, -0.03813934326171875, -0.0273895263671875, -0.01663970947265625, -0.005889892578125, 0.00485992431640625, 0.0156097412109375, 0.02635955810546875, 0.037109375, 0.04785919189453125, 0.0586090087890625, 0.06935882568359375, 0.080108642578125, 0.09085845947265625, 0.1016082763671875, 0.11235809326171875, 0.12310791015625, 0.13385772705078125, 0.1446075439453125, 0.15535736083984375, 0.166107177734375, 0.17685699462890625, 0.1876068115234375, 0.19835662841796875, 0.2091064453125, 0.21985626220703125, 0.2306060791015625, 0.24135589599609375, 0.252105712890625, 0.26285552978515625, 0.2736053466796875, 0.28435516357421875, 0.29510498046875, 0.30585479736328125, 0.3166046142578125, 0.32735443115234375, 0.338104248046875, 0.34885406494140625, 0.3596038818359375, 0.37035369873046875, 0.381103515625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 4.0, 0.0, 5.0, 10.0, 9.0, 8.0, 26.0, 130.0, 362.0, 312.0, 89.0, 22.0, 6.0, 7.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002465248107910156, -0.00024002045392990112, -0.00023351609706878662, -0.00022701174020767212, -0.00022050738334655762, -0.00021400302648544312, -0.0002074986696243286, -0.0002009943127632141, -0.0001944899559020996, -0.0001879855990409851, -0.0001814812421798706, -0.0001749768853187561, -0.0001684725284576416, -0.0001619681715965271, -0.0001554638147354126, -0.0001489594578742981, -0.0001424551010131836, -0.0001359507441520691, -0.0001294463872909546, -0.0001229420304298401, -0.00011643767356872559, -0.00010993331670761108, -0.00010342895984649658, -9.692460298538208e-05, -9.042024612426758e-05, -8.391588926315308e-05, -7.741153240203857e-05, -7.090717554092407e-05, -6.440281867980957e-05, -5.789846181869507e-05, -5.1394104957580566e-05, -4.4889748096466064e-05, -3.838539123535156e-05, -3.188103437423706e-05, -2.537667751312256e-05, -1.8872320652008057e-05, -1.2367963790893555e-05, -5.863606929779053e-06, 6.407499313354492e-07, 7.145106792449951e-06, 1.3649463653564453e-05, 2.0153820514678955e-05, 2.6658177375793457e-05, 3.316253423690796e-05, 3.966689109802246e-05, 4.617124795913696e-05, 5.2675604820251465e-05, 5.917996168136597e-05, 6.568431854248047e-05, 7.218867540359497e-05, 7.869303226470947e-05, 8.519738912582397e-05, 9.170174598693848e-05, 9.820610284805298e-05, 0.00010471045970916748, 0.00011121481657028198, 0.00011771917343139648, 0.00012422353029251099, 0.0001307278871536255, 0.00013723224401474, 0.0001437366008758545, 0.000150240957736969, 0.0001567453145980835, 0.000163249671459198, 0.0001697540283203125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 1.0, 4.0, 7.0, 10.0, 21.0, 21.0, 49.0, 54.0, 91.0, 144.0, 277.0, 528.0, 1245.0, 3312.0, 12206.0, 95870.0, 819944.0, 96386.0, 12570.0, 3375.0, 1201.0, 574.0, 272.0, 149.0, 91.0, 53.0, 32.0, 23.0, 15.0, 10.0, 7.0, 1.0, 1.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.3056640625, -0.2956428527832031, -0.28562164306640625, -0.2756004333496094, -0.2655792236328125, -0.2555580139160156, -0.24553680419921875, -0.23551559448242188, -0.225494384765625, -0.21547317504882812, -0.20545196533203125, -0.19543075561523438, -0.1854095458984375, -0.17538833618164062, -0.16536712646484375, -0.15534591674804688, -0.14532470703125, -0.13530349731445312, -0.12528228759765625, -0.11526107788085938, -0.1052398681640625, -0.09521865844726562, -0.08519744873046875, -0.07517623901367188, -0.065155029296875, -0.055133819580078125, -0.04511260986328125, -0.035091400146484375, -0.0250701904296875, -0.015048980712890625, -0.00502777099609375, 0.004993438720703125, 0.0150146484375, 0.025035858154296875, 0.03505706787109375, 0.045078277587890625, 0.0550994873046875, 0.06512069702148438, 0.07514190673828125, 0.08516311645507812, 0.095184326171875, 0.10520553588867188, 0.11522674560546875, 0.12524795532226562, 0.1352691650390625, 0.14529037475585938, 0.15531158447265625, 0.16533279418945312, 0.17535400390625, 0.18537521362304688, 0.19539642333984375, 0.20541763305664062, 0.2154388427734375, 0.22546005249023438, 0.23548126220703125, 0.24550247192382812, 0.255523681640625, 0.2655448913574219, 0.27556610107421875, 0.2855873107910156, 0.2956085205078125, 0.3056297302246094, 0.31565093994140625, 0.3256721496582031, 0.335693359375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 1.0, 5.0, 2.0, 1.0, 5.0, 13.0, 10.0, 11.0, 19.0, 23.0, 44.0, 67.0, 106.0, 110.0, 127.0, 125.0, 97.0, 78.0, 44.0, 34.0, 23.0, 18.0, 7.0, 8.0, 8.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.252197265625, -0.24393463134765625, -0.2356719970703125, -0.22740936279296875, -0.219146728515625, -0.21088409423828125, -0.2026214599609375, -0.19435882568359375, -0.18609619140625, -0.17783355712890625, -0.1695709228515625, -0.16130828857421875, -0.153045654296875, -0.14478302001953125, -0.1365203857421875, -0.12825775146484375, -0.1199951171875, -0.11173248291015625, -0.1034698486328125, -0.09520721435546875, -0.086944580078125, -0.07868194580078125, -0.0704193115234375, -0.06215667724609375, -0.05389404296875, -0.04563140869140625, -0.0373687744140625, -0.02910614013671875, -0.020843505859375, -0.01258087158203125, -0.0043182373046875, 0.00394439697265625, 0.01220703125, 0.02046966552734375, 0.0287322998046875, 0.03699493408203125, 0.045257568359375, 0.05352020263671875, 0.0617828369140625, 0.07004547119140625, 0.07830810546875, 0.08657073974609375, 0.0948333740234375, 0.10309600830078125, 0.111358642578125, 0.11962127685546875, 0.1278839111328125, 0.13614654541015625, 0.1444091796875, 0.15267181396484375, 0.1609344482421875, 0.16919708251953125, 0.177459716796875, 0.18572235107421875, 0.1939849853515625, 0.20224761962890625, 0.21051025390625, 0.21877288818359375, 0.2270355224609375, 0.23529815673828125, 0.243560791015625, 0.25182342529296875, 0.2600860595703125, 0.26834869384765625, 0.276611328125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 11.0, 17.0, 101.0, 475.0, 303.0, 71.0, 22.0, 2.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0348992347717285, -3.6630659103393555, -3.2912325859069824, -2.9193992614746094, -2.5475659370422363, -2.1757326126098633, -1.8038995265960693, -1.4320662021636963, -1.0602328777313232, -0.6883995532989502, -0.3165662884712219, 0.05526697635650635, 0.4271003007888794, 0.7989336252212524, 1.170766830444336, 1.542600154876709, 1.914433479309082, 2.286266803741455, 2.658100128173828, 3.029933452606201, 3.401766777038574, 3.7736001014709473, 4.14543342590332, 4.517266273498535, 4.889100074768066, 5.2609333992004395, 5.6327667236328125, 6.0046000480651855, 6.376433372497559, 6.748266696929932, 7.120100021362305, 7.4919328689575195, 7.863766670227051, 8.235599517822266, 8.607433319091797, 8.979266166687012, 9.351099967956543, 9.722932815551758, 10.094766616821289, 10.466599464416504, 10.838433265686035, 11.21026611328125, 11.582099914550781, 11.953932762145996, 12.325766563415527, 12.697599411010742, 13.069433212280273, 13.441266059875488, 13.813098907470703, 14.184931755065918, 14.55676555633545, 14.928598403930664, 15.300432205200195, 15.67226505279541, 16.044097900390625, 16.415931701660156, 16.787765502929688, 17.15959930419922, 17.531431198120117, 17.90326499938965, 18.27509880065918, 18.64693260192871, 19.01876449584961, 19.39059829711914, 19.762432098388672]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 1.0, 2.0, 7.0, 6.0, 5.0, 12.0, 16.0, 16.0, 10.0, 11.0, 22.0, 21.0, 23.0, 25.0, 44.0, 34.0, 36.0, 49.0, 58.0, 79.0, 73.0, 66.0, 43.0, 42.0, 33.0, 37.0, 36.0, 23.0, 22.0, 24.0, 14.0, 21.0, 15.0, 11.0, 7.0, 14.0, 11.0, 5.0, 6.0, 3.0, 6.0, 4.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.664245843887329, -2.5767669677734375, -2.489287853240967, -2.401808977127075, -2.3143301010131836, -2.226851224899292, -2.1393723487854004, -2.0518932342529297, -1.964414358139038, -1.8769354820251465, -1.7894564867019653, -1.7019774913787842, -1.6144986152648926, -1.527019739151001, -1.4395407438278198, -1.3520617485046387, -1.264582872390747, -1.1771039962768555, -1.0896250009536743, -1.0021460056304932, -0.9146671295166016, -0.8271881937980652, -0.7397092580795288, -0.6522303223609924, -0.564751386642456, -0.4772724509239197, -0.3897935152053833, -0.3023145794868469, -0.21483564376831055, -0.12735670804977417, -0.03987777233123779, 0.047601163387298584, 0.13508033752441406, 0.22255927324295044, 0.3100382089614868, 0.3975171446800232, 0.48499608039855957, 0.572475016117096, 0.6599539518356323, 0.7474328875541687, 0.8349118232727051, 0.9223907589912415, 1.0098696947097778, 1.097348690032959, 1.1848275661468506, 1.2723064422607422, 1.3597854375839233, 1.4472644329071045, 1.534743309020996, 1.6222221851348877, 1.7097011804580688, 1.79718017578125, 1.8846590518951416, 1.9721379280090332, 2.059617042541504, 2.1470959186553955, 2.234574794769287, 2.3220536708831787, 2.4095325469970703, 2.497011661529541, 2.5844905376434326, 2.671969413757324, 2.759448528289795, 2.8469274044036865, 2.934406280517578]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 5.0, 11.0, 5.0, 26.0, 34.0, 47.0, 72.0, 155.0, 245.0, 442.0, 781.0, 1533.0, 2988.0, 6471.0, 16255.0, 58563.0, 374553.0, 2556402.0, 1002037.0, 126980.0, 28393.0, 9835.0, 4151.0, 2009.0, 1026.0, 533.0, 315.0, 187.0, 91.0, 51.0, 26.0, 22.0, 16.0, 10.0, 6.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.25146484375, -0.24271011352539062, -0.23395538330078125, -0.22520065307617188, -0.2164459228515625, -0.20769119262695312, -0.19893646240234375, -0.19018173217773438, -0.181427001953125, -0.17267227172851562, -0.16391754150390625, -0.15516281127929688, -0.1464080810546875, -0.13765335083007812, -0.12889862060546875, -0.12014389038085938, -0.11138916015625, -0.10263442993164062, -0.09387969970703125, -0.08512496948242188, -0.0763702392578125, -0.06761550903320312, -0.05886077880859375, -0.050106048583984375, -0.041351318359375, -0.032596588134765625, -0.02384185791015625, -0.015087127685546875, -0.0063323974609375, 0.002422332763671875, 0.01117706298828125, 0.019931793212890625, 0.0286865234375, 0.037441253662109375, 0.04619598388671875, 0.054950714111328125, 0.0637054443359375, 0.07246017456054688, 0.08121490478515625, 0.08996963500976562, 0.098724365234375, 0.10747909545898438, 0.11623382568359375, 0.12498855590820312, 0.1337432861328125, 0.14249801635742188, 0.15125274658203125, 0.16000747680664062, 0.16876220703125, 0.17751693725585938, 0.18627166748046875, 0.19502639770507812, 0.2037811279296875, 0.21253585815429688, 0.22129058837890625, 0.23004531860351562, 0.238800048828125, 0.24755477905273438, 0.25630950927734375, 0.2650642395019531, 0.2738189697265625, 0.2825736999511719, 0.29132843017578125, 0.3000831604003906, 0.308837890625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 4.0, 6.0, 2.0, 1.0, 4.0, 4.0, 4.0, 8.0, 12.0, 9.0, 12.0, 13.0, 13.0, 18.0, 18.0, 31.0, 28.0, 36.0, 41.0, 37.0, 40.0, 36.0, 39.0, 36.0, 34.0, 43.0, 41.0, 40.0, 40.0, 44.0, 28.0, 30.0, 41.0, 35.0, 26.0, 26.0, 19.0, 20.0, 14.0, 12.0, 16.0, 7.0, 9.0, 10.0, 5.0, 1.0, 7.0, 5.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.190185546875, -0.18480491638183594, -0.17942428588867188, -0.1740436553955078, -0.16866302490234375, -0.1632823944091797, -0.15790176391601562, -0.15252113342285156, -0.1471405029296875, -0.14175987243652344, -0.13637924194335938, -0.1309986114501953, -0.12561798095703125, -0.12023735046386719, -0.11485671997070312, -0.10947608947753906, -0.104095458984375, -0.09871482849121094, -0.09333419799804688, -0.08795356750488281, -0.08257293701171875, -0.07719230651855469, -0.07181167602539062, -0.06643104553222656, -0.0610504150390625, -0.05566978454589844, -0.050289154052734375, -0.04490852355957031, -0.03952789306640625, -0.03414726257324219, -0.028766632080078125, -0.023386001586914062, -0.01800537109375, -0.012624740600585938, -0.007244110107421875, -0.0018634796142578125, 0.00351715087890625, 0.008897781372070312, 0.014278411865234375, 0.019659042358398438, 0.0250396728515625, 0.030420303344726562, 0.035800933837890625, 0.04118156433105469, 0.04656219482421875, 0.05194282531738281, 0.057323455810546875, 0.06270408630371094, 0.068084716796875, 0.07346534729003906, 0.07884597778320312, 0.08422660827636719, 0.08960723876953125, 0.09498786926269531, 0.10036849975585938, 0.10574913024902344, 0.1111297607421875, 0.11651039123535156, 0.12189102172851562, 0.1272716522216797, 0.13265228271484375, 0.1380329132080078, 0.14341354370117188, 0.14879417419433594, 0.1541748046875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 10.0, 13.0, 17.0, 22.0, 45.0, 136.0, 428.0, 2143.0, 43832.0, 4103546.0, 41382.0, 2050.0, 392.0, 136.0, 61.0, 34.0, 19.0, 9.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6181640625, -1.568359375, -1.5185546875, -1.46875, -1.4189453125, -1.369140625, -1.3193359375, -1.26953125, -1.2197265625, -1.169921875, -1.1201171875, -1.0703125, -1.0205078125, -0.970703125, -0.9208984375, -0.87109375, -0.8212890625, -0.771484375, -0.7216796875, -0.671875, -0.6220703125, -0.572265625, -0.5224609375, -0.47265625, -0.4228515625, -0.373046875, -0.3232421875, -0.2734375, -0.2236328125, -0.173828125, -0.1240234375, -0.07421875, -0.0244140625, 0.025390625, 0.0751953125, 0.125, 0.1748046875, 0.224609375, 0.2744140625, 0.32421875, 0.3740234375, 0.423828125, 0.4736328125, 0.5234375, 0.5732421875, 0.623046875, 0.6728515625, 0.72265625, 0.7724609375, 0.822265625, 0.8720703125, 0.921875, 0.9716796875, 1.021484375, 1.0712890625, 1.12109375, 1.1708984375, 1.220703125, 1.2705078125, 1.3203125, 1.3701171875, 1.419921875, 1.4697265625, 1.51953125, 1.5693359375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 5.0, 8.0, 2.0, 9.0, 11.0, 12.0, 21.0, 18.0, 42.0, 89.0, 207.0, 381.0, 814.0, 1168.0, 605.0, 292.0, 150.0, 87.0, 60.0, 32.0, 17.0, 16.0, 10.0, 5.0, 3.0, 7.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5244140625, -0.5037384033203125, -0.483062744140625, -0.4623870849609375, -0.44171142578125, -0.4210357666015625, -0.400360107421875, -0.3796844482421875, -0.3590087890625, -0.3383331298828125, -0.317657470703125, -0.2969818115234375, -0.27630615234375, -0.2556304931640625, -0.234954833984375, -0.2142791748046875, -0.193603515625, -0.1729278564453125, -0.152252197265625, -0.1315765380859375, -0.11090087890625, -0.0902252197265625, -0.069549560546875, -0.0488739013671875, -0.0281982421875, -0.0075225830078125, 0.013153076171875, 0.0338287353515625, 0.05450439453125, 0.0751800537109375, 0.095855712890625, 0.1165313720703125, 0.13720703125, 0.1578826904296875, 0.178558349609375, 0.1992340087890625, 0.21990966796875, 0.2405853271484375, 0.261260986328125, 0.2819366455078125, 0.3026123046875, 0.3232879638671875, 0.343963623046875, 0.3646392822265625, 0.38531494140625, 0.4059906005859375, 0.426666259765625, 0.4473419189453125, 0.468017578125, 0.4886932373046875, 0.509368896484375, 0.5300445556640625, 0.55072021484375, 0.5713958740234375, 0.592071533203125, 0.6127471923828125, 0.6334228515625, 0.6540985107421875, 0.674774169921875, 0.6954498291015625, 0.71612548828125, 0.7368011474609375, 0.757476806640625, 0.7781524658203125, 0.798828125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 6.0, 7.0, 11.0, 25.0, 62.0, 159.0, 249.0, 249.0, 148.0, 53.0, 19.0, 9.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.129081726074219, -3.9313509464263916, -3.7336199283599854, -3.535889148712158, -3.338158369064331, -3.140427589416504, -2.9426965713500977, -2.7449657917022705, -2.5472350120544434, -2.349504232406616, -2.15177321434021, -1.9540424346923828, -1.7563116550445557, -1.558580756187439, -1.3608498573303223, -1.1631190776824951, -0.9653880596160889, -0.7676572203636169, -0.569926381111145, -0.3721954822540283, -0.1744646430015564, 0.023266196250915527, 0.22099709510803223, 0.4187278747558594, 0.6164587736129761, 0.814189612865448, 1.01192045211792, 1.2096513509750366, 1.4073822498321533, 1.6051130294799805, 1.8028439283370972, 2.0005745887756348, 2.198305606842041, 2.396036386489868, 2.5937674045562744, 2.7914981842041016, 2.9892289638519287, 3.186959743499756, 3.384690761566162, 3.5824215412139893, 3.7801523208618164, 3.9778831005096436, 4.175613880157471, 4.373344898223877, 4.571075916290283, 4.768806457519531, 4.9665374755859375, 5.164268493652344, 5.36199951171875, 5.559730529785156, 5.757461071014404, 5.9551920890808105, 6.152923107147217, 6.350653648376465, 6.548384666442871, 6.746115684509277, 6.943846225738525, 7.141577243804932, 7.33930778503418, 7.537038803100586, 7.734769821166992, 7.93250036239624, 8.130231857299805, 8.327961921691895, 8.5256929397583]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 6.0, 1.0, 5.0, 5.0, 3.0, 4.0, 7.0, 16.0, 14.0, 14.0, 9.0, 17.0, 23.0, 28.0, 24.0, 35.0, 35.0, 41.0, 33.0, 41.0, 48.0, 41.0, 37.0, 44.0, 40.0, 38.0, 42.0, 41.0, 31.0, 37.0, 34.0, 32.0, 25.0, 22.0, 21.0, 26.0, 10.0, 16.0, 14.0, 6.0, 9.0, 10.0, 7.0, 2.0, 2.0, 4.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.006152391433716, -1.9449986219406128, -1.8838447332382202, -1.8226909637451172, -1.7615370750427246, -1.7003833055496216, -1.6392295360565186, -1.578075647354126, -1.5169217586517334, -1.4557679891586304, -1.3946141004562378, -1.3334603309631348, -1.2723064422607422, -1.2111526727676392, -1.1499989032745361, -1.0888450145721436, -1.0276912450790405, -0.9665374159812927, -0.9053835868835449, -0.8442298173904419, -0.7830759286880493, -0.7219221591949463, -0.6607683300971985, -0.5996145009994507, -0.5384606719017029, -0.4773068428039551, -0.4161530137062073, -0.35499921441078186, -0.29384538531303406, -0.23269155621528625, -0.17153775691986084, -0.11038392782211304, -0.049230098724365234, 0.011923722922801971, 0.07307754456996918, 0.1342313587665558, 0.1953851878643036, 0.2565390169620514, 0.3176928162574768, 0.3788466453552246, 0.4400004744529724, 0.5011543035507202, 0.562308132648468, 0.6234619617462158, 0.6846157312393188, 0.7457696199417114, 0.8069233894348145, 0.8680772185325623, 0.9292310476303101, 0.9903848767280579, 1.0515387058258057, 1.1126924753189087, 1.1738463640213013, 1.2350001335144043, 1.2961540222167969, 1.3573077917099, 1.418461561203003, 1.479615330696106, 1.5407692193984985, 1.6019229888916016, 1.6630768775939941, 1.7242306470870972, 1.7853844165802002, 1.8465383052825928, 1.9076921939849854]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 4.0, 5.0, 8.0, 5.0, 13.0, 23.0, 30.0, 37.0, 61.0, 64.0, 112.0, 139.0, 218.0, 331.0, 489.0, 721.0, 1132.0, 1857.0, 3113.0, 5342.0, 9656.0, 18495.0, 38947.0, 88148.0, 214720.0, 335047.0, 182651.0, 75474.0, 33646.0, 16700.0, 8685.0, 5004.0, 2901.0, 1737.0, 1051.0, 677.0, 415.0, 275.0, 189.0, 122.0, 97.0, 62.0, 44.0, 41.0, 27.0, 16.0, 15.0, 3.0, 4.0, 6.0, 3.0, 2.0, 2.0, 1.0], "bins": [-0.2459716796875, -0.23902511596679688, -0.23207855224609375, -0.22513198852539062, -0.2181854248046875, -0.21123886108398438, -0.20429229736328125, -0.19734573364257812, -0.190399169921875, -0.18345260620117188, -0.17650604248046875, -0.16955947875976562, -0.1626129150390625, -0.15566635131835938, -0.14871978759765625, -0.14177322387695312, -0.13482666015625, -0.12788009643554688, -0.12093353271484375, -0.11398696899414062, -0.1070404052734375, -0.10009384155273438, -0.09314727783203125, -0.08620071411132812, -0.079254150390625, -0.07230758666992188, -0.06536102294921875, -0.058414459228515625, -0.0514678955078125, -0.044521331787109375, -0.03757476806640625, -0.030628204345703125, -0.023681640625, -0.016735076904296875, -0.00978851318359375, -0.002841949462890625, 0.0041046142578125, 0.011051177978515625, 0.01799774169921875, 0.024944305419921875, 0.031890869140625, 0.038837432861328125, 0.04578399658203125, 0.052730560302734375, 0.0596771240234375, 0.06662368774414062, 0.07357025146484375, 0.08051681518554688, 0.08746337890625, 0.09440994262695312, 0.10135650634765625, 0.10830307006835938, 0.1152496337890625, 0.12219619750976562, 0.12914276123046875, 0.13608932495117188, 0.143035888671875, 0.14998245239257812, 0.15692901611328125, 0.16387557983398438, 0.1708221435546875, 0.17776870727539062, 0.18471527099609375, 0.19166183471679688, 0.1986083984375]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 3.0, 2.0, 5.0, 2.0, 5.0, 12.0, 7.0, 13.0, 12.0, 28.0, 29.0, 20.0, 34.0, 24.0, 30.0, 36.0, 46.0, 25.0, 48.0, 44.0, 45.0, 41.0, 38.0, 39.0, 56.0, 40.0, 30.0, 35.0, 35.0, 33.0, 24.0, 32.0, 25.0, 16.0, 18.0, 22.0, 13.0, 5.0, 6.0, 4.0, 4.0, 6.0, 2.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.208251953125, -0.2019062042236328, -0.19556045532226562, -0.18921470642089844, -0.18286895751953125, -0.17652320861816406, -0.17017745971679688, -0.1638317108154297, -0.1574859619140625, -0.1511402130126953, -0.14479446411132812, -0.13844871520996094, -0.13210296630859375, -0.12575721740722656, -0.11941146850585938, -0.11306571960449219, -0.106719970703125, -0.10037422180175781, -0.09402847290039062, -0.08768272399902344, -0.08133697509765625, -0.07499122619628906, -0.06864547729492188, -0.06229972839355469, -0.0559539794921875, -0.04960823059082031, -0.043262481689453125, -0.03691673278808594, -0.03057098388671875, -0.024225234985351562, -0.017879486083984375, -0.011533737182617188, -0.00518798828125, 0.0011577606201171875, 0.007503509521484375, 0.013849258422851562, 0.02019500732421875, 0.026540756225585938, 0.032886505126953125, 0.03923225402832031, 0.0455780029296875, 0.05192375183105469, 0.058269500732421875, 0.06461524963378906, 0.07096099853515625, 0.07730674743652344, 0.08365249633789062, 0.08999824523925781, 0.096343994140625, 0.10268974304199219, 0.10903549194335938, 0.11538124084472656, 0.12172698974609375, 0.12807273864746094, 0.13441848754882812, 0.1407642364501953, 0.1471099853515625, 0.1534557342529297, 0.15980148315429688, 0.16614723205566406, 0.17249298095703125, 0.17883872985839844, 0.18518447875976562, 0.1915302276611328, 0.1978759765625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 8.0, 9.0, 7.0, 15.0, 21.0, 26.0, 31.0, 50.0, 83.0, 90.0, 171.0, 234.0, 398.0, 758.0, 1594.0, 4329.0, 16587.0, 116836.0, 779117.0, 105186.0, 15563.0, 4155.0, 1497.0, 708.0, 373.0, 245.0, 130.0, 93.0, 77.0, 43.0, 21.0, 22.0, 17.0, 16.0, 6.0, 11.0, 3.0, 5.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.51904296875, -0.5008163452148438, -0.4825897216796875, -0.46436309814453125, -0.446136474609375, -0.42790985107421875, -0.4096832275390625, -0.39145660400390625, -0.37322998046875, -0.35500335693359375, -0.3367767333984375, -0.31855010986328125, -0.300323486328125, -0.28209686279296875, -0.2638702392578125, -0.24564361572265625, -0.2274169921875, -0.20919036865234375, -0.1909637451171875, -0.17273712158203125, -0.154510498046875, -0.13628387451171875, -0.1180572509765625, -0.09983062744140625, -0.08160400390625, -0.06337738037109375, -0.0451507568359375, -0.02692413330078125, -0.008697509765625, 0.00952911376953125, 0.0277557373046875, 0.04598236083984375, 0.064208984375, 0.08243560791015625, 0.1006622314453125, 0.11888885498046875, 0.137115478515625, 0.15534210205078125, 0.1735687255859375, 0.19179534912109375, 0.21002197265625, 0.22824859619140625, 0.2464752197265625, 0.26470184326171875, 0.282928466796875, 0.30115509033203125, 0.3193817138671875, 0.33760833740234375, 0.3558349609375, 0.37406158447265625, 0.3922882080078125, 0.41051483154296875, 0.428741455078125, 0.44696807861328125, 0.4651947021484375, 0.48342132568359375, 0.50164794921875, 0.5198745727539062, 0.5381011962890625, 0.5563278198242188, 0.574554443359375, 0.5927810668945312, 0.6110076904296875, 0.6292343139648438, 0.6474609375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 6.0, 4.0, 4.0, 11.0, 14.0, 11.0, 13.0, 19.0, 25.0, 25.0, 31.0, 47.0, 58.0, 69.0, 62.0, 68.0, 73.0, 65.0, 60.0, 56.0, 53.0, 37.0, 37.0, 21.0, 24.0, 26.0, 22.0, 19.0, 12.0, 10.0, 8.0, 11.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2578125, -1.22528076171875, -1.1927490234375, -1.16021728515625, -1.127685546875, -1.09515380859375, -1.0626220703125, -1.03009033203125, -0.99755859375, -0.96502685546875, -0.9324951171875, -0.89996337890625, -0.867431640625, -0.83489990234375, -0.8023681640625, -0.76983642578125, -0.7373046875, -0.70477294921875, -0.6722412109375, -0.63970947265625, -0.607177734375, -0.57464599609375, -0.5421142578125, -0.50958251953125, -0.47705078125, -0.44451904296875, -0.4119873046875, -0.37945556640625, -0.346923828125, -0.31439208984375, -0.2818603515625, -0.24932861328125, -0.216796875, -0.18426513671875, -0.1517333984375, -0.11920166015625, -0.086669921875, -0.05413818359375, -0.0216064453125, 0.01092529296875, 0.04345703125, 0.07598876953125, 0.1085205078125, 0.14105224609375, 0.173583984375, 0.20611572265625, 0.2386474609375, 0.27117919921875, 0.3037109375, 0.33624267578125, 0.3687744140625, 0.40130615234375, 0.433837890625, 0.46636962890625, 0.4989013671875, 0.53143310546875, 0.56396484375, 0.59649658203125, 0.6290283203125, 0.66156005859375, 0.694091796875, 0.72662353515625, 0.7591552734375, 0.79168701171875, 0.82421875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 6.0, 6.0, 11.0, 10.0, 17.0, 24.0, 46.0, 64.0, 105.0, 200.0, 353.0, 681.0, 1566.0, 4437.0, 17104.0, 157211.0, 809686.0, 44132.0, 8268.0, 2474.0, 1051.0, 496.0, 242.0, 126.0, 80.0, 50.0, 29.0, 19.0, 15.0, 13.0, 14.0, 5.0, 6.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.272705078125, -0.26305389404296875, -0.2534027099609375, -0.24375152587890625, -0.234100341796875, -0.22444915771484375, -0.2147979736328125, -0.20514678955078125, -0.19549560546875, -0.18584442138671875, -0.1761932373046875, -0.16654205322265625, -0.156890869140625, -0.14723968505859375, -0.1375885009765625, -0.12793731689453125, -0.1182861328125, -0.10863494873046875, -0.0989837646484375, -0.08933258056640625, -0.079681396484375, -0.07003021240234375, -0.0603790283203125, -0.05072784423828125, -0.04107666015625, -0.03142547607421875, -0.0217742919921875, -0.01212310791015625, -0.002471923828125, 0.00717926025390625, 0.0168304443359375, 0.02648162841796875, 0.0361328125, 0.04578399658203125, 0.0554351806640625, 0.06508636474609375, 0.074737548828125, 0.08438873291015625, 0.0940399169921875, 0.10369110107421875, 0.11334228515625, 0.12299346923828125, 0.1326446533203125, 0.14229583740234375, 0.151947021484375, 0.16159820556640625, 0.1712493896484375, 0.18090057373046875, 0.1905517578125, 0.20020294189453125, 0.2098541259765625, 0.21950531005859375, 0.229156494140625, 0.23880767822265625, 0.2484588623046875, 0.25811004638671875, 0.26776123046875, 0.27741241455078125, 0.2870635986328125, 0.29671478271484375, 0.306365966796875, 0.31601715087890625, 0.3256683349609375, 0.33531951904296875, 0.344970703125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 6.0, 4.0, 1.0, 4.0, 5.0, 12.0, 9.0, 15.0, 22.0, 35.0, 54.0, 88.0, 153.0, 209.0, 155.0, 73.0, 55.0, 41.0, 15.0, 10.0, 9.0, 3.0, 5.0, 3.0, 3.0, 2.0, 4.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.594989776611328e-05, -8.311867713928223e-05, -8.028745651245117e-05, -7.745623588562012e-05, -7.462501525878906e-05, -7.179379463195801e-05, -6.896257400512695e-05, -6.61313533782959e-05, -6.330013275146484e-05, -6.046891212463379e-05, -5.7637691497802734e-05, -5.480647087097168e-05, -5.1975250244140625e-05, -4.914402961730957e-05, -4.6312808990478516e-05, -4.348158836364746e-05, -4.0650367736816406e-05, -3.781914710998535e-05, -3.49879264831543e-05, -3.215670585632324e-05, -2.9325485229492188e-05, -2.6494264602661133e-05, -2.3663043975830078e-05, -2.0831823348999023e-05, -1.800060272216797e-05, -1.5169382095336914e-05, -1.233816146850586e-05, -9.506940841674805e-06, -6.67572021484375e-06, -3.844499588012695e-06, -1.0132789611816406e-06, 1.817941665649414e-06, 4.649162292480469e-06, 7.4803829193115234e-06, 1.0311603546142578e-05, 1.3142824172973633e-05, 1.5974044799804688e-05, 1.8805265426635742e-05, 2.1636486053466797e-05, 2.446770668029785e-05, 2.7298927307128906e-05, 3.013014793395996e-05, 3.2961368560791016e-05, 3.579258918762207e-05, 3.8623809814453125e-05, 4.145503044128418e-05, 4.4286251068115234e-05, 4.711747169494629e-05, 4.9948692321777344e-05, 5.27799129486084e-05, 5.561113357543945e-05, 5.844235420227051e-05, 6.127357482910156e-05, 6.410479545593262e-05, 6.693601608276367e-05, 6.976723670959473e-05, 7.259845733642578e-05, 7.542967796325684e-05, 7.826089859008789e-05, 8.109211921691895e-05, 8.392333984375e-05, 8.675456047058105e-05, 8.958578109741211e-05, 9.241700172424316e-05, 9.524822235107422e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 5.0, 2.0, 0.0, 1.0, 3.0, 7.0, 8.0, 2.0, 9.0, 16.0, 18.0, 33.0, 53.0, 96.0, 147.0, 315.0, 643.0, 1332.0, 3891.0, 14781.0, 125403.0, 831099.0, 56443.0, 9341.0, 2743.0, 1057.0, 491.0, 251.0, 153.0, 79.0, 39.0, 27.0, 26.0, 23.0, 7.0, 6.0, 4.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2442626953125, -0.23462486267089844, -0.22498703002929688, -0.2153491973876953, -0.20571136474609375, -0.1960735321044922, -0.18643569946289062, -0.17679786682128906, -0.1671600341796875, -0.15752220153808594, -0.14788436889648438, -0.1382465362548828, -0.12860870361328125, -0.11897087097167969, -0.10933303833007812, -0.09969520568847656, -0.090057373046875, -0.08041954040527344, -0.07078170776367188, -0.06114387512207031, -0.05150604248046875, -0.04186820983886719, -0.032230377197265625, -0.022592544555664062, -0.0129547119140625, -0.0033168792724609375, 0.006320953369140625, 0.015958786010742188, 0.02559661865234375, 0.03523445129394531, 0.044872283935546875, 0.05451011657714844, 0.06414794921875, 0.07378578186035156, 0.08342361450195312, 0.09306144714355469, 0.10269927978515625, 0.11233711242675781, 0.12197494506835938, 0.13161277770996094, 0.1412506103515625, 0.15088844299316406, 0.16052627563476562, 0.1701641082763672, 0.17980194091796875, 0.1894397735595703, 0.19907760620117188, 0.20871543884277344, 0.218353271484375, 0.22799110412597656, 0.23762893676757812, 0.2472667694091797, 0.25690460205078125, 0.2665424346923828, 0.2761802673339844, 0.28581809997558594, 0.2954559326171875, 0.30509376525878906, 0.3147315979003906, 0.3243694305419922, 0.33400726318359375, 0.3436450958251953, 0.3532829284667969, 0.36292076110839844, 0.37255859375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 9.0, 6.0, 3.0, 8.0, 11.0, 7.0, 18.0, 21.0, 34.0, 53.0, 65.0, 93.0, 124.0, 135.0, 104.0, 88.0, 64.0, 41.0, 35.0, 23.0, 9.0, 4.0, 6.0, 12.0, 11.0, 8.0, 5.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.283203125, -0.27541351318359375, -0.2676239013671875, -0.25983428955078125, -0.252044677734375, -0.24425506591796875, -0.2364654541015625, -0.22867584228515625, -0.22088623046875, -0.21309661865234375, -0.2053070068359375, -0.19751739501953125, -0.189727783203125, -0.18193817138671875, -0.1741485595703125, -0.16635894775390625, -0.1585693359375, -0.15077972412109375, -0.1429901123046875, -0.13520050048828125, -0.127410888671875, -0.11962127685546875, -0.1118316650390625, -0.10404205322265625, -0.09625244140625, -0.08846282958984375, -0.0806732177734375, -0.07288360595703125, -0.065093994140625, -0.05730438232421875, -0.0495147705078125, -0.04172515869140625, -0.033935546875, -0.02614593505859375, -0.0183563232421875, -0.01056671142578125, -0.002777099609375, 0.00501251220703125, 0.0128021240234375, 0.02059173583984375, 0.02838134765625, 0.03617095947265625, 0.0439605712890625, 0.05175018310546875, 0.059539794921875, 0.06732940673828125, 0.0751190185546875, 0.08290863037109375, 0.0906982421875, 0.09848785400390625, 0.1062774658203125, 0.11406707763671875, 0.121856689453125, 0.12964630126953125, 0.1374359130859375, 0.14522552490234375, 0.15301513671875, 0.16080474853515625, 0.1685943603515625, 0.17638397216796875, 0.184173583984375, 0.19196319580078125, 0.1997528076171875, 0.20754241943359375, 0.21533203125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 12.0, 37.0, 133.0, 423.0, 250.0, 76.0, 38.0, 18.0, 7.0, 6.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4286065101623535, -5.153811454772949, -4.879016399383545, -4.604221343994141, -4.329425811767578, -4.054630756378174, -3.7798357009887695, -3.5050406455993652, -3.230245351791382, -2.9554502964019775, -2.680655002593994, -2.40585994720459, -2.1310648918151855, -1.8562695980072021, -1.5814745426177979, -1.306679368019104, -1.0318841934204102, -0.7570890188217163, -0.48229390382766724, -0.20749878883361816, 0.06729638576507568, 0.34209156036376953, 0.6168866157531738, 0.8916817903518677, 1.1664769649505615, 1.4412721395492554, 1.7160673141479492, 1.9908623695373535, 2.265657424926758, 2.540452718734741, 2.8152477741241455, 3.090043067932129, 3.364837646484375, 3.6396327018737793, 3.9144279956817627, 4.189223289489746, 4.46401834487915, 4.738813400268555, 5.013608455657959, 5.288403511047363, 5.563199043273926, 5.83799409866333, 6.112789154052734, 6.387584686279297, 6.662379741668701, 6.9371747970581055, 7.21196985244751, 7.486764907836914, 7.761559963226318, 8.036355018615723, 8.311150550842285, 8.585945129394531, 8.860740661621094, 9.135536193847656, 9.410330772399902, 9.685126304626465, 9.959920883178711, 10.234716415405273, 10.50951099395752, 10.784306526184082, 11.059101104736328, 11.33389663696289, 11.608692169189453, 11.8834867477417, 12.158282279968262]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 2.0, 6.0, 2.0, 4.0, 1.0, 3.0, 3.0, 6.0, 9.0, 11.0, 9.0, 17.0, 15.0, 15.0, 22.0, 24.0, 20.0, 19.0, 24.0, 27.0, 34.0, 47.0, 54.0, 65.0, 93.0, 77.0, 68.0, 44.0, 37.0, 41.0, 22.0, 32.0, 20.0, 21.0, 15.0, 20.0, 13.0, 14.0, 12.0, 6.0, 5.0, 7.0, 6.0, 2.0, 4.0, 5.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0460667610168457, -2.946803569793701, -2.8475406169891357, -2.748277425765991, -2.649014472961426, -2.5497512817382812, -2.450488328933716, -2.3512251377105713, -2.251962184906006, -2.1526989936828613, -2.053436040878296, -1.954172968864441, -1.854909896850586, -1.755646824836731, -1.656383752822876, -1.5571205615997314, -1.4578574895858765, -1.3585944175720215, -1.2593313455581665, -1.1600682735443115, -1.0608052015304565, -0.9615421295166016, -0.8622789978981018, -0.7630159258842468, -0.6637528538703918, -0.5644897818565369, -0.4652267098426819, -0.3659636080265045, -0.26670053601264954, -0.16743746399879456, -0.06817436218261719, 0.031088709831237793, 0.13035178184509277, 0.22961485385894775, 0.32887792587280273, 0.4281410276889801, 0.5274040699005127, 0.6266671419143677, 0.7259302735328674, 0.8251933455467224, 0.9244564175605774, 1.0237195491790771, 1.1229826211929321, 1.222245693206787, 1.321508765220642, 1.420771837234497, 1.520034909248352, 1.619297981262207, 1.718561053276062, 1.817824125289917, 1.917087197303772, 2.016350269317627, 2.1156134605407715, 2.214876413345337, 2.3141396045684814, 2.413402557373047, 2.5126657485961914, 2.611928939819336, 2.7111918926239014, 2.810455083847046, 2.9097180366516113, 3.008981227874756, 3.1082441806793213, 3.207507371902466, 3.3067703247070312]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 3.0, 5.0, 2.0, 4.0, 8.0, 5.0, 5.0, 7.0, 13.0, 18.0, 27.0, 27.0, 39.0, 47.0, 74.0, 141.0, 220.0, 448.0, 1120.0, 3309.0, 13377.0, 106019.0, 2637079.0, 1357452.0, 61609.0, 9032.0, 2395.0, 864.0, 365.0, 199.0, 99.0, 81.0, 62.0, 25.0, 23.0, 24.0, 16.0, 11.0, 13.0, 5.0, 11.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.423828125, -0.4080657958984375, -0.392303466796875, -0.3765411376953125, -0.36077880859375, -0.3450164794921875, -0.329254150390625, -0.3134918212890625, -0.2977294921875, -0.2819671630859375, -0.266204833984375, -0.2504425048828125, -0.23468017578125, -0.2189178466796875, -0.203155517578125, -0.1873931884765625, -0.171630859375, -0.1558685302734375, -0.140106201171875, -0.1243438720703125, -0.10858154296875, -0.0928192138671875, -0.077056884765625, -0.0612945556640625, -0.0455322265625, -0.0297698974609375, -0.014007568359375, 0.0017547607421875, 0.01751708984375, 0.0332794189453125, 0.049041748046875, 0.0648040771484375, 0.08056640625, 0.0963287353515625, 0.112091064453125, 0.1278533935546875, 0.14361572265625, 0.1593780517578125, 0.175140380859375, 0.1909027099609375, 0.2066650390625, 0.2224273681640625, 0.238189697265625, 0.2539520263671875, 0.26971435546875, 0.2854766845703125, 0.301239013671875, 0.3170013427734375, 0.332763671875, 0.3485260009765625, 0.364288330078125, 0.3800506591796875, 0.39581298828125, 0.4115753173828125, 0.427337646484375, 0.4430999755859375, 0.4588623046875, 0.4746246337890625, 0.490386962890625, 0.5061492919921875, 0.52191162109375, 0.5376739501953125, 0.553436279296875, 0.5691986083984375, 0.5849609375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 3.0, 5.0, 0.0, 1.0, 6.0, 3.0, 7.0, 5.0, 5.0, 9.0, 6.0, 13.0, 9.0, 6.0, 10.0, 15.0, 26.0, 22.0, 21.0, 26.0, 25.0, 34.0, 38.0, 40.0, 35.0, 43.0, 38.0, 47.0, 42.0, 42.0, 48.0, 43.0, 42.0, 35.0, 34.0, 26.0, 24.0, 22.0, 28.0, 13.0, 28.0, 16.0, 11.0, 10.0, 4.0, 13.0, 8.0, 9.0, 4.0, 4.0, 5.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.171875, -0.1660003662109375, -0.160125732421875, -0.1542510986328125, -0.14837646484375, -0.1425018310546875, -0.136627197265625, -0.1307525634765625, -0.1248779296875, -0.1190032958984375, -0.113128662109375, -0.1072540283203125, -0.10137939453125, -0.0955047607421875, -0.089630126953125, -0.0837554931640625, -0.077880859375, -0.0720062255859375, -0.066131591796875, -0.0602569580078125, -0.05438232421875, -0.0485076904296875, -0.042633056640625, -0.0367584228515625, -0.0308837890625, -0.0250091552734375, -0.019134521484375, -0.0132598876953125, -0.00738525390625, -0.0015106201171875, 0.004364013671875, 0.0102386474609375, 0.01611328125, 0.0219879150390625, 0.027862548828125, 0.0337371826171875, 0.03961181640625, 0.0454864501953125, 0.051361083984375, 0.0572357177734375, 0.0631103515625, 0.0689849853515625, 0.074859619140625, 0.0807342529296875, 0.08660888671875, 0.0924835205078125, 0.098358154296875, 0.1042327880859375, 0.110107421875, 0.1159820556640625, 0.121856689453125, 0.1277313232421875, 0.13360595703125, 0.1394805908203125, 0.145355224609375, 0.1512298583984375, 0.1571044921875, 0.1629791259765625, 0.168853759765625, 0.1747283935546875, 0.18060302734375, 0.1864776611328125, 0.192352294921875, 0.1982269287109375, 0.2041015625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 6.0, 8.0, 10.0, 25.0, 33.0, 83.0, 164.0, 514.0, 3489.0, 98485.0, 4058333.0, 30444.0, 2037.0, 379.0, 151.0, 48.0, 23.0, 21.0, 10.0, 12.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6884765625, -1.64447021484375, -1.6004638671875, -1.55645751953125, -1.512451171875, -1.46844482421875, -1.4244384765625, -1.38043212890625, -1.33642578125, -1.29241943359375, -1.2484130859375, -1.20440673828125, -1.160400390625, -1.11639404296875, -1.0723876953125, -1.02838134765625, -0.984375, -0.94036865234375, -0.8963623046875, -0.85235595703125, -0.808349609375, -0.76434326171875, -0.7203369140625, -0.67633056640625, -0.63232421875, -0.58831787109375, -0.5443115234375, -0.50030517578125, -0.456298828125, -0.41229248046875, -0.3682861328125, -0.32427978515625, -0.2802734375, -0.23626708984375, -0.1922607421875, -0.14825439453125, -0.104248046875, -0.06024169921875, -0.0162353515625, 0.02777099609375, 0.07177734375, 0.11578369140625, 0.1597900390625, 0.20379638671875, 0.247802734375, 0.29180908203125, 0.3358154296875, 0.37982177734375, 0.423828125, 0.46783447265625, 0.5118408203125, 0.55584716796875, 0.599853515625, 0.64385986328125, 0.6878662109375, 0.73187255859375, 0.77587890625, 0.81988525390625, 0.8638916015625, 0.90789794921875, 0.951904296875, 0.99591064453125, 1.0399169921875, 1.08392333984375, 1.1279296875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 4.0, 8.0, 11.0, 7.0, 17.0, 18.0, 27.0, 30.0, 52.0, 87.0, 119.0, 209.0, 300.0, 570.0, 806.0, 673.0, 431.0, 249.0, 146.0, 78.0, 51.0, 43.0, 36.0, 29.0, 12.0, 12.0, 12.0, 5.0, 6.0, 4.0, 2.0, 2.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.4501953125, -0.43506622314453125, -0.4199371337890625, -0.40480804443359375, -0.389678955078125, -0.37454986572265625, -0.3594207763671875, -0.34429168701171875, -0.32916259765625, -0.31403350830078125, -0.2989044189453125, -0.28377532958984375, -0.268646240234375, -0.25351715087890625, -0.2383880615234375, -0.22325897216796875, -0.2081298828125, -0.19300079345703125, -0.1778717041015625, -0.16274261474609375, -0.147613525390625, -0.13248443603515625, -0.1173553466796875, -0.10222625732421875, -0.08709716796875, -0.07196807861328125, -0.0568389892578125, -0.04170989990234375, -0.026580810546875, -0.01145172119140625, 0.0036773681640625, 0.01880645751953125, 0.033935546875, 0.04906463623046875, 0.0641937255859375, 0.07932281494140625, 0.094451904296875, 0.10958099365234375, 0.1247100830078125, 0.13983917236328125, 0.15496826171875, 0.17009735107421875, 0.1852264404296875, 0.20035552978515625, 0.215484619140625, 0.23061370849609375, 0.2457427978515625, 0.26087188720703125, 0.2760009765625, 0.29113006591796875, 0.3062591552734375, 0.32138824462890625, 0.336517333984375, 0.35164642333984375, 0.3667755126953125, 0.38190460205078125, 0.39703369140625, 0.41216278076171875, 0.4272918701171875, 0.44242095947265625, 0.457550048828125, 0.47267913818359375, 0.4878082275390625, 0.5029373168945312, 0.51806640625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 8.0, 14.0, 15.0, 50.0, 64.0, 129.0, 157.0, 187.0, 143.0, 96.0, 53.0, 28.0, 14.0, 12.0, 11.0, 6.0, 4.0, 5.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.864886283874512, -4.737573623657227, -4.610260486602783, -4.482947826385498, -4.355634689331055, -4.2283220291137695, -4.101008892059326, -3.973696231842041, -3.8463833332061768, -3.7190704345703125, -3.5917575359344482, -3.464444637298584, -3.337131977081299, -3.2098188400268555, -3.0825061798095703, -2.955193281173706, -2.827880382537842, -2.7005674839019775, -2.5732545852661133, -2.445941686630249, -2.3186287879943848, -2.1913161277770996, -2.0640032291412354, -1.936690330505371, -1.8093774318695068, -1.6820645332336426, -1.5547516345977783, -1.4274388551712036, -1.3001259565353394, -1.172813057899475, -1.0455002784729004, -0.9181873798370361, -0.7908740043640137, -0.6635611057281494, -0.5362482666969299, -0.40893539786338806, -0.2816225290298462, -0.15430963039398193, -0.02699679136276245, 0.10031604766845703, 0.2276289463043213, 0.35494181513786316, 0.48225468397140503, 0.6095675230026245, 0.7368804216384888, 0.864193320274353, 0.9915061593055725, 1.118818998336792, 1.2461318969726562, 1.3734447956085205, 1.5007576942443848, 1.6280704736709595, 1.7553833723068237, 1.882696270942688, 2.0100090503692627, 2.137321949005127, 2.264634847640991, 2.3919477462768555, 2.5192606449127197, 2.646573543548584, 2.773886203765869, 2.9011993408203125, 3.0285120010375977, 3.155824899673462, 3.283137798309326]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 6.0, 6.0, 11.0, 10.0, 10.0, 16.0, 18.0, 14.0, 25.0, 26.0, 21.0, 32.0, 35.0, 44.0, 54.0, 65.0, 49.0, 61.0, 48.0, 62.0, 46.0, 49.0, 42.0, 34.0, 34.0, 33.0, 29.0, 28.0, 27.0, 12.0, 9.0, 9.0, 8.0, 8.0, 7.0, 3.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9927042722702026, -1.9288220405578613, -1.86493980884552, -1.8010575771331787, -1.7371753454208374, -1.673293113708496, -1.6094107627868652, -1.5455286502838135, -1.4816462993621826, -1.4177640676498413, -1.3538818359375, -1.2899996042251587, -1.2261173725128174, -1.162235140800476, -1.0983529090881348, -1.034470558166504, -0.9705884456634521, -0.9067062139511108, -0.8428239822387695, -0.7789417505264282, -0.7150595188140869, -0.6511772871017456, -0.5872949957847595, -0.5234127640724182, -0.4595305323600769, -0.3956483006477356, -0.3317660689353943, -0.2678838074207306, -0.20400157570838928, -0.14011934399604797, -0.07623708248138428, -0.012354850769042969, 0.05152726173400879, 0.1154095008969307, 0.1792917400598526, 0.2431739866733551, 0.3070562183856964, 0.3709384500980377, 0.4348207116127014, 0.4987029433250427, 0.562585175037384, 0.6264674067497253, 0.6903496384620667, 0.7542319297790527, 0.818114161491394, 0.8819963932037354, 0.9458786249160767, 1.009760856628418, 1.0736430883407593, 1.1375253200531006, 1.201407551765442, 1.2652897834777832, 1.3291720151901245, 1.3930542469024658, 1.4569365978240967, 1.5208187103271484, 1.5847010612487793, 1.6485832929611206, 1.712465524673462, 1.7763477563858032, 1.8402299880981445, 1.9041122198104858, 1.9679944515228271, 2.031876802444458, 2.0957589149475098]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 6.0, 6.0, 2.0, 7.0, 9.0, 19.0, 34.0, 51.0, 93.0, 125.0, 213.0, 432.0, 841.0, 1647.0, 3894.0, 9977.0, 28955.0, 112683.0, 532098.0, 274157.0, 55371.0, 16685.0, 6159.0, 2529.0, 1244.0, 604.0, 296.0, 162.0, 94.0, 66.0, 39.0, 18.0, 9.0, 12.0, 8.0, 3.0, 8.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.52587890625, -0.5123100280761719, -0.49874114990234375, -0.4851722717285156, -0.4716033935546875, -0.4580345153808594, -0.44446563720703125, -0.4308967590332031, -0.417327880859375, -0.4037590026855469, -0.39019012451171875, -0.3766212463378906, -0.3630523681640625, -0.3494834899902344, -0.33591461181640625, -0.3223457336425781, -0.30877685546875, -0.2952079772949219, -0.28163909912109375, -0.2680702209472656, -0.2545013427734375, -0.24093246459960938, -0.22736358642578125, -0.21379470825195312, -0.200225830078125, -0.18665695190429688, -0.17308807373046875, -0.15951919555664062, -0.1459503173828125, -0.13238143920898438, -0.11881256103515625, -0.10524368286132812, -0.0916748046875, -0.07810592651367188, -0.06453704833984375, -0.050968170166015625, -0.0373992919921875, -0.023830413818359375, -0.01026153564453125, 0.003307342529296875, 0.016876220703125, 0.030445098876953125, 0.04401397705078125, 0.057582855224609375, 0.0711517333984375, 0.08472061157226562, 0.09828948974609375, 0.11185836791992188, 0.12542724609375, 0.13899612426757812, 0.15256500244140625, 0.16613388061523438, 0.1797027587890625, 0.19327163696289062, 0.20684051513671875, 0.22040939331054688, 0.233978271484375, 0.24754714965820312, 0.26111602783203125, 0.2746849060058594, 0.2882537841796875, 0.3018226623535156, 0.31539154052734375, 0.3289604187011719, 0.342529296875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 5.0, 5.0, 2.0, 7.0, 6.0, 7.0, 13.0, 16.0, 17.0, 18.0, 15.0, 31.0, 37.0, 34.0, 27.0, 30.0, 37.0, 30.0, 32.0, 58.0, 58.0, 51.0, 40.0, 44.0, 36.0, 47.0, 43.0, 35.0, 33.0, 31.0, 16.0, 20.0, 24.0, 19.0, 15.0, 12.0, 8.0, 7.0, 6.0, 6.0, 6.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.2117919921875, -0.20538902282714844, -0.19898605346679688, -0.1925830841064453, -0.18618011474609375, -0.1797771453857422, -0.17337417602539062, -0.16697120666503906, -0.1605682373046875, -0.15416526794433594, -0.14776229858398438, -0.1413593292236328, -0.13495635986328125, -0.1285533905029297, -0.12215042114257812, -0.11574745178222656, -0.109344482421875, -0.10294151306152344, -0.09653854370117188, -0.09013557434082031, -0.08373260498046875, -0.07732963562011719, -0.07092666625976562, -0.06452369689941406, -0.0581207275390625, -0.05171775817871094, -0.045314788818359375, -0.03891181945800781, -0.03250885009765625, -0.026105880737304688, -0.019702911376953125, -0.013299942016601562, -0.00689697265625, -0.0004940032958984375, 0.005908966064453125, 0.012311935424804688, 0.01871490478515625, 0.025117874145507812, 0.031520843505859375, 0.03792381286621094, 0.0443267822265625, 0.05072975158691406, 0.057132720947265625, 0.06353569030761719, 0.06993865966796875, 0.07634162902832031, 0.08274459838867188, 0.08914756774902344, 0.095550537109375, 0.10195350646972656, 0.10835647583007812, 0.11475944519042969, 0.12116241455078125, 0.1275653839111328, 0.13396835327148438, 0.14037132263183594, 0.1467742919921875, 0.15317726135253906, 0.15958023071289062, 0.1659832000732422, 0.17238616943359375, 0.1787891387939453, 0.18519210815429688, 0.19159507751464844, 0.197998046875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 6.0, 8.0, 11.0, 8.0, 12.0, 25.0, 31.0, 55.0, 68.0, 102.0, 209.0, 335.0, 695.0, 1574.0, 4411.0, 19488.0, 222266.0, 753335.0, 35421.0, 6561.0, 2026.0, 852.0, 429.0, 214.0, 135.0, 75.0, 62.0, 35.0, 31.0, 13.0, 16.0, 13.0, 6.0, 7.0, 5.0, 3.0, 3.0, 1.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.83740234375, -0.814239501953125, -0.79107666015625, -0.767913818359375, -0.7447509765625, -0.721588134765625, -0.69842529296875, -0.675262451171875, -0.652099609375, -0.628936767578125, -0.60577392578125, -0.582611083984375, -0.5594482421875, -0.536285400390625, -0.51312255859375, -0.489959716796875, -0.466796875, -0.443634033203125, -0.42047119140625, -0.397308349609375, -0.3741455078125, -0.350982666015625, -0.32781982421875, -0.304656982421875, -0.281494140625, -0.258331298828125, -0.23516845703125, -0.212005615234375, -0.1888427734375, -0.165679931640625, -0.14251708984375, -0.119354248046875, -0.09619140625, -0.073028564453125, -0.04986572265625, -0.026702880859375, -0.0035400390625, 0.019622802734375, 0.04278564453125, 0.065948486328125, 0.089111328125, 0.112274169921875, 0.13543701171875, 0.158599853515625, 0.1817626953125, 0.204925537109375, 0.22808837890625, 0.251251220703125, 0.2744140625, 0.297576904296875, 0.32073974609375, 0.343902587890625, 0.3670654296875, 0.390228271484375, 0.41339111328125, 0.436553955078125, 0.459716796875, 0.482879638671875, 0.50604248046875, 0.529205322265625, 0.5523681640625, 0.575531005859375, 0.59869384765625, 0.621856689453125, 0.64501953125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 11.0, 13.0, 10.0, 6.0, 18.0, 13.0, 23.0, 23.0, 16.0, 31.0, 37.0, 39.0, 42.0, 59.0, 40.0, 65.0, 47.0, 57.0, 41.0, 55.0, 50.0, 54.0, 38.0, 38.0, 36.0, 26.0, 21.0, 17.0, 10.0, 9.0, 8.0, 7.0, 13.0, 2.0, 8.0, 6.0, 4.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.82373046875, -0.7971115112304688, -0.7704925537109375, -0.7438735961914062, -0.717254638671875, -0.6906356811523438, -0.6640167236328125, -0.6373977661132812, -0.61077880859375, -0.5841598510742188, -0.5575408935546875, -0.5309219360351562, -0.504302978515625, -0.47768402099609375, -0.4510650634765625, -0.42444610595703125, -0.3978271484375, -0.37120819091796875, -0.3445892333984375, -0.31797027587890625, -0.291351318359375, -0.26473236083984375, -0.2381134033203125, -0.21149444580078125, -0.18487548828125, -0.15825653076171875, -0.1316375732421875, -0.10501861572265625, -0.078399658203125, -0.05178070068359375, -0.0251617431640625, 0.00145721435546875, 0.028076171875, 0.05469512939453125, 0.0813140869140625, 0.10793304443359375, 0.134552001953125, 0.16117095947265625, 0.1877899169921875, 0.21440887451171875, 0.24102783203125, 0.26764678955078125, 0.2942657470703125, 0.32088470458984375, 0.347503662109375, 0.37412261962890625, 0.4007415771484375, 0.42736053466796875, 0.4539794921875, 0.48059844970703125, 0.5072174072265625, 0.5338363647460938, 0.560455322265625, 0.5870742797851562, 0.6136932373046875, 0.6403121948242188, 0.66693115234375, 0.6935501098632812, 0.7201690673828125, 0.7467880249023438, 0.773406982421875, 0.8000259399414062, 0.8266448974609375, 0.8532638549804688, 0.8798828125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 6.0, 2.0, 4.0, 9.0, 10.0, 18.0, 22.0, 27.0, 51.0, 88.0, 183.0, 326.0, 868.0, 2487.0, 13069.0, 768339.0, 249877.0, 9566.0, 2157.0, 758.0, 333.0, 161.0, 89.0, 44.0, 21.0, 13.0, 11.0, 5.0, 4.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.341552734375, -0.3288688659667969, -0.31618499755859375, -0.3035011291503906, -0.2908172607421875, -0.2781333923339844, -0.26544952392578125, -0.2527656555175781, -0.240081787109375, -0.22739791870117188, -0.21471405029296875, -0.20203018188476562, -0.1893463134765625, -0.17666244506835938, -0.16397857666015625, -0.15129470825195312, -0.13861083984375, -0.12592697143554688, -0.11324310302734375, -0.10055923461914062, -0.0878753662109375, -0.07519149780273438, -0.06250762939453125, -0.049823760986328125, -0.037139892578125, -0.024456024169921875, -0.01177215576171875, 0.000911712646484375, 0.0135955810546875, 0.026279449462890625, 0.03896331787109375, 0.051647186279296875, 0.0643310546875, 0.07701492309570312, 0.08969879150390625, 0.10238265991210938, 0.1150665283203125, 0.12775039672851562, 0.14043426513671875, 0.15311813354492188, 0.165802001953125, 0.17848587036132812, 0.19116973876953125, 0.20385360717773438, 0.2165374755859375, 0.22922134399414062, 0.24190521240234375, 0.2545890808105469, 0.26727294921875, 0.2799568176269531, 0.29264068603515625, 0.3053245544433594, 0.3180084228515625, 0.3306922912597656, 0.34337615966796875, 0.3560600280761719, 0.368743896484375, 0.3814277648925781, 0.39411163330078125, 0.4067955017089844, 0.4194793701171875, 0.4321632385253906, 0.44484710693359375, 0.4575309753417969, 0.47021484375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 2.0, 5.0, 9.0, 13.0, 31.0, 89.0, 333.0, 362.0, 79.0, 30.0, 17.0, 8.0, 10.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.00032520294189453125, -0.0003184322267770767, -0.0003116615116596222, -0.00030489079654216766, -0.00029812008142471313, -0.0002913493663072586, -0.0002845786511898041, -0.00027780793607234955, -0.000271037220954895, -0.0002642665058374405, -0.00025749579071998596, -0.00025072507560253143, -0.0002439543604850769, -0.00023718364536762238, -0.00023041293025016785, -0.00022364221513271332, -0.0002168715000152588, -0.00021010078489780426, -0.00020333006978034973, -0.0001965593546628952, -0.00018978863954544067, -0.00018301792442798615, -0.00017624720931053162, -0.0001694764941930771, -0.00016270577907562256, -0.00015593506395816803, -0.0001491643488407135, -0.00014239363372325897, -0.00013562291860580444, -0.00012885220348834991, -0.00012208148837089539, -0.00011531077325344086, -0.00010854005813598633, -0.0001017693430185318, -9.499862790107727e-05, -8.822791278362274e-05, -8.145719766616821e-05, -7.468648254871368e-05, -6.791576743125916e-05, -6.114505231380463e-05, -5.43743371963501e-05, -4.760362207889557e-05, -4.083290696144104e-05, -3.406219184398651e-05, -2.7291476726531982e-05, -2.0520761609077454e-05, -1.3750046491622925e-05, -6.979331374168396e-06, -2.086162567138672e-07, 6.562098860740662e-06, 1.333281397819519e-05, 2.010352909564972e-05, 2.6874244213104248e-05, 3.364495933055878e-05, 4.0415674448013306e-05, 4.7186389565467834e-05, 5.395710468292236e-05, 6.072781980037689e-05, 6.749853491783142e-05, 7.426925003528595e-05, 8.103996515274048e-05, 8.781068027019501e-05, 9.458139538764954e-05, 0.00010135211050510406, 0.0001081228256225586]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 3.0, 3.0, 8.0, 10.0, 15.0, 18.0, 31.0, 54.0, 52.0, 102.0, 160.0, 307.0, 614.0, 1741.0, 6154.0, 79463.0, 926386.0, 27272.0, 3801.0, 1181.0, 500.0, 251.0, 145.0, 100.0, 63.0, 32.0, 21.0, 19.0, 17.0, 6.0, 8.0, 2.0, 9.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.34375, -0.3311767578125, -0.318603515625, -0.3060302734375, -0.29345703125, -0.2808837890625, -0.268310546875, -0.2557373046875, -0.2431640625, -0.2305908203125, -0.218017578125, -0.2054443359375, -0.19287109375, -0.1802978515625, -0.167724609375, -0.1551513671875, -0.142578125, -0.1300048828125, -0.117431640625, -0.1048583984375, -0.09228515625, -0.0797119140625, -0.067138671875, -0.0545654296875, -0.0419921875, -0.0294189453125, -0.016845703125, -0.0042724609375, 0.00830078125, 0.0208740234375, 0.033447265625, 0.0460205078125, 0.05859375, 0.0711669921875, 0.083740234375, 0.0963134765625, 0.10888671875, 0.1214599609375, 0.134033203125, 0.1466064453125, 0.1591796875, 0.1717529296875, 0.184326171875, 0.1968994140625, 0.20947265625, 0.2220458984375, 0.234619140625, 0.2471923828125, 0.259765625, 0.2723388671875, 0.284912109375, 0.2974853515625, 0.31005859375, 0.3226318359375, 0.335205078125, 0.3477783203125, 0.3603515625, 0.3729248046875, 0.385498046875, 0.3980712890625, 0.41064453125, 0.4232177734375, 0.435791015625, 0.4483642578125, 0.4609375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 6.0, 3.0, 5.0, 5.0, 13.0, 24.0, 41.0, 45.0, 114.0, 157.0, 195.0, 156.0, 83.0, 55.0, 34.0, 18.0, 14.0, 10.0, 5.0, 3.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.369140625, -0.35950279235839844, -0.3498649597167969, -0.3402271270751953, -0.33058929443359375, -0.3209514617919922, -0.3113136291503906, -0.30167579650878906, -0.2920379638671875, -0.28240013122558594, -0.2727622985839844, -0.2631244659423828, -0.25348663330078125, -0.2438488006591797, -0.23421096801757812, -0.22457313537597656, -0.214935302734375, -0.20529747009277344, -0.19565963745117188, -0.1860218048095703, -0.17638397216796875, -0.1667461395263672, -0.15710830688476562, -0.14747047424316406, -0.1378326416015625, -0.12819480895996094, -0.11855697631835938, -0.10891914367675781, -0.09928131103515625, -0.08964347839355469, -0.08000564575195312, -0.07036781311035156, -0.06072998046875, -0.05109214782714844, -0.041454315185546875, -0.03181648254394531, -0.02217864990234375, -0.012540817260742188, -0.002902984619140625, 0.0067348480224609375, 0.0163726806640625, 0.026010513305664062, 0.035648345947265625, 0.04528617858886719, 0.05492401123046875, 0.06456184387207031, 0.07419967651367188, 0.08383750915527344, 0.093475341796875, 0.10311317443847656, 0.11275100708007812, 0.12238883972167969, 0.13202667236328125, 0.1416645050048828, 0.15130233764648438, 0.16094017028808594, 0.1705780029296875, 0.18021583557128906, 0.18985366821289062, 0.1994915008544922, 0.20912933349609375, 0.2187671661376953, 0.22840499877929688, 0.23804283142089844, 0.2476806640625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 8.0, 15.0, 58.0, 157.0, 498.0, 190.0, 45.0, 19.0, 8.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.972320556640625, -10.694829940795898, -10.417340278625488, -10.139849662780762, -9.862359046936035, -9.584869384765625, -9.307378768920898, -9.029888153076172, -8.752397537231445, -8.474906921386719, -8.197417259216309, -7.919926643371582, -7.6424360275268555, -7.364945888519287, -7.087455749511719, -6.809965133666992, -6.532475471496582, -6.254985332489014, -5.977494716644287, -5.700004577636719, -5.422513961791992, -5.145023822784424, -4.8675336837768555, -4.590043067932129, -4.3125529289245605, -4.035062789916992, -3.7575721740722656, -3.4800820350646973, -3.20259165763855, -2.9251012802124023, -2.647611141204834, -2.3701207637786865, -2.0926294326782227, -1.8151390552520752, -1.5376487970352173, -1.2601585388183594, -0.9826681613922119, -0.7051777839660645, -0.42768752574920654, -0.15019726753234863, 0.12729310989379883, 0.4047834277153015, 0.6822737455368042, 0.9597640633583069, 1.2372543811798096, 1.514744758605957, 1.792235016822815, 2.069725275039673, 2.3472156524658203, 2.6247060298919678, 2.9021964073181152, 3.1796865463256836, 3.457176923751831, 3.7346673011779785, 4.012157440185547, 4.289648056030273, 4.567138195037842, 4.84462833404541, 5.122118949890137, 5.399609088897705, 5.677099227905273, 5.95458984375, 6.232079982757568, 6.509570121765137, 6.787060737609863]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 4.0, 3.0, 6.0, 7.0, 11.0, 2.0, 8.0, 14.0, 10.0, 18.0, 23.0, 16.0, 19.0, 18.0, 26.0, 30.0, 21.0, 27.0, 54.0, 64.0, 74.0, 86.0, 94.0, 55.0, 49.0, 27.0, 27.0, 22.0, 25.0, 16.0, 16.0, 19.0, 19.0, 11.0, 21.0, 10.0, 8.0, 6.0, 6.0, 5.0, 4.0, 6.0, 5.0, 4.0, 2.0, 0.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-2.8594861030578613, -2.7713756561279297, -2.683264970779419, -2.5951545238494873, -2.5070438385009766, -2.418933391571045, -2.3308229446411133, -2.2427124977111816, -2.154601812362671, -2.0664913654327393, -1.9783806800842285, -1.8902702331542969, -1.8021596670150757, -1.7140491008758545, -1.6259386539459229, -1.5378280878067017, -1.4497175216674805, -1.3616069555282593, -1.273496389389038, -1.1853859424591064, -1.0972753763198853, -1.009164810180664, -0.9210543036460876, -0.8329437971115112, -0.74483323097229, -0.6567226648330688, -0.5686121582984924, -0.48050162196159363, -0.3923910856246948, -0.304280549287796, -0.21617001295089722, -0.1280595064163208, -0.03994917869567871, 0.04816135764122009, 0.1362718939781189, 0.2243824303150177, 0.3124929666519165, 0.4006035029888153, 0.4887140393257141, 0.5768245458602905, 0.6649351119995117, 0.7530456781387329, 0.8411561846733093, 0.9292666912078857, 1.017377257347107, 1.1054878234863281, 1.1935982704162598, 1.281708836555481, 1.3698194026947021, 1.4579299688339233, 1.5460405349731445, 1.6341509819030762, 1.7222615480422974, 1.8103721141815186, 1.8984825611114502, 1.9865931272506714, 2.0747036933898926, 2.162814140319824, 2.250924825668335, 2.3390352725982666, 2.4271459579467773, 2.515256404876709, 2.6033668518066406, 2.6914772987365723, 2.779587984085083]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 3.0, 13.0, 8.0, 20.0, 22.0, 39.0, 51.0, 110.0, 126.0, 263.0, 462.0, 788.0, 1591.0, 3555.0, 9040.0, 28942.0, 136104.0, 1023603.0, 2419042.0, 469788.0, 71384.0, 18017.0, 5977.0, 2575.0, 1242.0, 623.0, 317.0, 235.0, 119.0, 72.0, 42.0, 37.0, 17.0, 23.0, 10.0, 9.0, 7.0, 3.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48486328125, -0.4693756103515625, -0.453887939453125, -0.4384002685546875, -0.42291259765625, -0.4074249267578125, -0.391937255859375, -0.3764495849609375, -0.3609619140625, -0.3454742431640625, -0.329986572265625, -0.3144989013671875, -0.29901123046875, -0.2835235595703125, -0.268035888671875, -0.2525482177734375, -0.237060546875, -0.2215728759765625, -0.206085205078125, -0.1905975341796875, -0.17510986328125, -0.1596221923828125, -0.144134521484375, -0.1286468505859375, -0.1131591796875, -0.0976715087890625, -0.082183837890625, -0.0666961669921875, -0.05120849609375, -0.0357208251953125, -0.020233154296875, -0.0047454833984375, 0.0107421875, 0.0262298583984375, 0.041717529296875, 0.0572052001953125, 0.07269287109375, 0.0881805419921875, 0.103668212890625, 0.1191558837890625, 0.1346435546875, 0.1501312255859375, 0.165618896484375, 0.1811065673828125, 0.19659423828125, 0.2120819091796875, 0.227569580078125, 0.2430572509765625, 0.258544921875, 0.2740325927734375, 0.289520263671875, 0.3050079345703125, 0.32049560546875, 0.3359832763671875, 0.351470947265625, 0.3669586181640625, 0.3824462890625, 0.3979339599609375, 0.413421630859375, 0.4289093017578125, 0.44439697265625, 0.4598846435546875, 0.475372314453125, 0.4908599853515625, 0.50634765625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 6.0, 7.0, 6.0, 16.0, 9.0, 11.0, 20.0, 19.0, 15.0, 43.0, 33.0, 35.0, 41.0, 37.0, 51.0, 59.0, 48.0, 60.0, 60.0, 62.0, 53.0, 44.0, 49.0, 38.0, 29.0, 25.0, 24.0, 28.0, 21.0, 16.0, 10.0, 10.0, 3.0, 6.0, 1.0, 5.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.281494140625, -0.2739696502685547, -0.2664451599121094, -0.25892066955566406, -0.25139617919921875, -0.24387168884277344, -0.23634719848632812, -0.2288227081298828, -0.2212982177734375, -0.2137737274169922, -0.20624923706054688, -0.19872474670410156, -0.19120025634765625, -0.18367576599121094, -0.17615127563476562, -0.1686267852783203, -0.161102294921875, -0.1535778045654297, -0.14605331420898438, -0.13852882385253906, -0.13100433349609375, -0.12347984313964844, -0.11595535278320312, -0.10843086242675781, -0.1009063720703125, -0.09338188171386719, -0.08585739135742188, -0.07833290100097656, -0.07080841064453125, -0.06328392028808594, -0.055759429931640625, -0.04823493957519531, -0.04071044921875, -0.03318595886230469, -0.025661468505859375, -0.018136978149414062, -0.01061248779296875, -0.0030879974365234375, 0.004436492919921875, 0.011960983276367188, 0.0194854736328125, 0.027009963989257812, 0.034534454345703125, 0.04205894470214844, 0.04958343505859375, 0.05710792541503906, 0.06463241577148438, 0.07215690612792969, 0.079681396484375, 0.08720588684082031, 0.09473037719726562, 0.10225486755371094, 0.10977935791015625, 0.11730384826660156, 0.12482833862304688, 0.1323528289794922, 0.1398773193359375, 0.1474018096923828, 0.15492630004882812, 0.16245079040527344, 0.16997528076171875, 0.17749977111816406, 0.18502426147460938, 0.1925487518310547, 0.2000732421875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 6.0, 4.0, 11.0, 15.0, 27.0, 59.0, 111.0, 325.0, 1256.0, 23576.0, 4160329.0, 7361.0, 791.0, 223.0, 100.0, 38.0, 26.0, 11.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.37890625, -5.24566650390625, -5.1124267578125, -4.97918701171875, -4.845947265625, -4.71270751953125, -4.5794677734375, -4.44622802734375, -4.31298828125, -4.17974853515625, -4.0465087890625, -3.91326904296875, -3.780029296875, -3.64678955078125, -3.5135498046875, -3.38031005859375, -3.2470703125, -3.11383056640625, -2.9805908203125, -2.84735107421875, -2.714111328125, -2.58087158203125, -2.4476318359375, -2.31439208984375, -2.18115234375, -2.04791259765625, -1.9146728515625, -1.78143310546875, -1.648193359375, -1.51495361328125, -1.3817138671875, -1.24847412109375, -1.115234375, -0.98199462890625, -0.8487548828125, -0.71551513671875, -0.582275390625, -0.44903564453125, -0.3157958984375, -0.18255615234375, -0.04931640625, 0.08392333984375, 0.2171630859375, 0.35040283203125, 0.483642578125, 0.61688232421875, 0.7501220703125, 0.88336181640625, 1.0166015625, 1.14984130859375, 1.2830810546875, 1.41632080078125, 1.549560546875, 1.68280029296875, 1.8160400390625, 1.94927978515625, 2.08251953125, 2.21575927734375, 2.3489990234375, 2.48223876953125, 2.615478515625, 2.74871826171875, 2.8819580078125, 3.01519775390625, 3.1484375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 1.0, 4.0, 6.0, 5.0, 16.0, 31.0, 45.0, 92.0, 155.0, 259.0, 503.0, 954.0, 968.0, 497.0, 224.0, 148.0, 59.0, 45.0, 26.0, 11.0, 11.0, 10.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.154296875, -1.1131134033203125, -1.071929931640625, -1.0307464599609375, -0.98956298828125, -0.9483795166015625, -0.907196044921875, -0.8660125732421875, -0.8248291015625, -0.7836456298828125, -0.742462158203125, -0.7012786865234375, -0.66009521484375, -0.6189117431640625, -0.577728271484375, -0.5365447998046875, -0.495361328125, -0.4541778564453125, -0.412994384765625, -0.3718109130859375, -0.33062744140625, -0.2894439697265625, -0.248260498046875, -0.2070770263671875, -0.1658935546875, -0.1247100830078125, -0.083526611328125, -0.0423431396484375, -0.00115966796875, 0.0400238037109375, 0.081207275390625, 0.1223907470703125, 0.16357421875, 0.2047576904296875, 0.245941162109375, 0.2871246337890625, 0.32830810546875, 0.3694915771484375, 0.410675048828125, 0.4518585205078125, 0.4930419921875, 0.5342254638671875, 0.575408935546875, 0.6165924072265625, 0.65777587890625, 0.6989593505859375, 0.740142822265625, 0.7813262939453125, 0.822509765625, 0.8636932373046875, 0.904876708984375, 0.9460601806640625, 0.98724365234375, 1.0284271240234375, 1.069610595703125, 1.1107940673828125, 1.1519775390625, 1.1931610107421875, 1.234344482421875, 1.2755279541015625, 1.31671142578125, 1.3578948974609375, 1.399078369140625, 1.4402618408203125, 1.4814453125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 2.0, 15.0, 50.0, 236.0, 466.0, 171.0, 41.0, 14.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.747618675231934, -11.972113609313965, -11.196608543395996, -10.421104431152344, -9.645599365234375, -8.870094299316406, -8.094589233398438, -7.319084167480469, -6.5435791015625, -5.768074035644531, -4.9925689697265625, -4.217064380645752, -3.441559314727783, -2.6660542488098145, -1.890549659729004, -1.1150445938110352, -0.3395395278930664, 0.4359654188156128, 1.211470365524292, 1.9869751930236816, 2.7624802589416504, 3.537985324859619, 4.31348991394043, 5.088994979858398, 5.864500045776367, 6.640005111694336, 7.415510177612305, 8.191015243530273, 8.966520309448242, 9.742025375366211, 10.517529487609863, 11.293034553527832, 12.068538665771484, 12.844043731689453, 13.619548797607422, 14.39505386352539, 15.17055892944336, 15.946063995361328, 16.721569061279297, 17.497074127197266, 18.272579193115234, 19.048084259033203, 19.823589324951172, 20.59909439086914, 21.37459945678711, 22.150104522705078, 22.925609588623047, 23.701114654541016, 24.47661781311035, 25.25212287902832, 26.02762794494629, 26.803133010864258, 27.578638076782227, 28.354143142700195, 29.12964630126953, 29.9051513671875, 30.68065643310547, 31.456161499023438, 32.231666564941406, 33.007171630859375, 33.782676696777344, 34.55818176269531, 35.33368682861328, 36.10919189453125, 36.88469696044922]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 1.0, 6.0, 9.0, 10.0, 9.0, 15.0, 13.0, 14.0, 17.0, 21.0, 38.0, 36.0, 41.0, 38.0, 43.0, 42.0, 61.0, 76.0, 59.0, 50.0, 47.0, 48.0, 49.0, 40.0, 33.0, 31.0, 33.0, 22.0, 20.0, 18.0, 9.0, 13.0, 11.0, 10.0, 6.0, 6.0, 6.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.924989700317383, -3.778637170791626, -3.632284641265869, -3.485931873321533, -3.3395793437957764, -3.1932268142700195, -3.0468740463256836, -2.9005215167999268, -2.75416898727417, -2.607816457748413, -2.4614639282226562, -2.3151111602783203, -2.1687586307525635, -2.0224061012268066, -1.8760534524917603, -1.7297008037567139, -1.583348274230957, -1.4369957447052002, -1.2906430959701538, -1.1442904472351074, -0.9979379177093506, -0.851585328578949, -0.7052327394485474, -0.558880090713501, -0.41252756118774414, -0.26617497205734253, -0.11982238292694092, 0.026530206203460693, 0.1728827953338623, 0.3192353844642639, 0.4655879735946655, 0.6119406223297119, 0.7582931518554688, 0.9046457409858704, 1.050998330116272, 1.1973509788513184, 1.3437035083770752, 1.490056037902832, 1.6364086866378784, 1.7827613353729248, 1.9291138648986816, 2.0754663944244385, 2.2218189239501953, 2.3681716918945312, 2.514524221420288, 2.660876750946045, 2.807229518890381, 2.9535820484161377, 3.0999345779418945, 3.2462871074676514, 3.392639636993408, 3.538992404937744, 3.685344934463501, 3.831697463989258, 3.9780502319335938, 4.12440299987793, 4.270755290985107, 4.417108058929443, 4.563460350036621, 4.709813117980957, 4.856165885925293, 5.002518177032471, 5.148870944976807, 5.295223236083984, 5.44157600402832]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 11.0, 8.0, 8.0, 7.0, 16.0, 16.0, 19.0, 34.0, 45.0, 104.0, 305.0, 1134.0, 5583.0, 46435.0, 811663.0, 166800.0, 13263.0, 2161.0, 538.0, 180.0, 73.0, 48.0, 22.0, 13.0, 16.0, 8.0, 9.0, 5.0, 9.0, 9.0, 2.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.068359375, -1.0400390625, -1.01171875, -0.9833984375, -0.955078125, -0.9267578125, -0.8984375, -0.8701171875, -0.841796875, -0.8134765625, -0.78515625, -0.7568359375, -0.728515625, -0.7001953125, -0.671875, -0.6435546875, -0.615234375, -0.5869140625, -0.55859375, -0.5302734375, -0.501953125, -0.4736328125, -0.4453125, -0.4169921875, -0.388671875, -0.3603515625, -0.33203125, -0.3037109375, -0.275390625, -0.2470703125, -0.21875, -0.1904296875, -0.162109375, -0.1337890625, -0.10546875, -0.0771484375, -0.048828125, -0.0205078125, 0.0078125, 0.0361328125, 0.064453125, 0.0927734375, 0.12109375, 0.1494140625, 0.177734375, 0.2060546875, 0.234375, 0.2626953125, 0.291015625, 0.3193359375, 0.34765625, 0.3759765625, 0.404296875, 0.4326171875, 0.4609375, 0.4892578125, 0.517578125, 0.5458984375, 0.57421875, 0.6025390625, 0.630859375, 0.6591796875, 0.6875, 0.7158203125, 0.744140625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 10.0, 12.0, 29.0, 40.0, 77.0, 96.0, 151.0, 156.0, 144.0, 122.0, 75.0, 47.0, 27.0, 11.0, 11.0, 3.0, 1.0, 7.0], "bins": [-1.677734375, -1.6464385986328125, -1.615142822265625, -1.5838470458984375, -1.55255126953125, -1.5212554931640625, -1.489959716796875, -1.4586639404296875, -1.4273681640625, -1.3960723876953125, -1.364776611328125, -1.3334808349609375, -1.30218505859375, -1.2708892822265625, -1.239593505859375, -1.2082977294921875, -1.177001953125, -1.1457061767578125, -1.114410400390625, -1.0831146240234375, -1.05181884765625, -1.0205230712890625, -0.989227294921875, -0.9579315185546875, -0.9266357421875, -0.8953399658203125, -0.864044189453125, -0.8327484130859375, -0.80145263671875, -0.7701568603515625, -0.738861083984375, -0.7075653076171875, -0.67626953125, -0.6449737548828125, -0.613677978515625, -0.5823822021484375, -0.55108642578125, -0.5197906494140625, -0.488494873046875, -0.4571990966796875, -0.4259033203125, -0.3946075439453125, -0.363311767578125, -0.3320159912109375, -0.30072021484375, -0.2694244384765625, -0.238128662109375, -0.2068328857421875, -0.175537109375, -0.1442413330078125, -0.112945556640625, -0.0816497802734375, -0.05035400390625, -0.0190582275390625, 0.012237548828125, 0.0435333251953125, 0.0748291015625, 0.1061248779296875, 0.137420654296875, 0.1687164306640625, 0.20001220703125, 0.2313079833984375, 0.262603759765625, 0.2938995361328125, 0.3251953125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 9.0, 10.0, 16.0, 25.0, 35.0, 59.0, 79.0, 178.0, 316.0, 761.0, 2056.0, 7994.0, 61268.0, 908799.0, 55750.0, 7774.0, 1943.0, 723.0, 297.0, 184.0, 105.0, 63.0, 41.0, 19.0, 18.0, 7.0, 5.0, 7.0, 6.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58544921875, -0.5624771118164062, -0.5395050048828125, -0.5165328979492188, -0.493560791015625, -0.47058868408203125, -0.4476165771484375, -0.42464447021484375, -0.40167236328125, -0.37870025634765625, -0.3557281494140625, -0.33275604248046875, -0.309783935546875, -0.28681182861328125, -0.2638397216796875, -0.24086761474609375, -0.2178955078125, -0.19492340087890625, -0.1719512939453125, -0.14897918701171875, -0.126007080078125, -0.10303497314453125, -0.0800628662109375, -0.05709075927734375, -0.03411865234375, -0.01114654541015625, 0.0118255615234375, 0.03479766845703125, 0.057769775390625, 0.08074188232421875, 0.1037139892578125, 0.12668609619140625, 0.149658203125, 0.17263031005859375, 0.1956024169921875, 0.21857452392578125, 0.241546630859375, 0.26451873779296875, 0.2874908447265625, 0.31046295166015625, 0.33343505859375, 0.35640716552734375, 0.3793792724609375, 0.40235137939453125, 0.425323486328125, 0.44829559326171875, 0.4712677001953125, 0.49423980712890625, 0.5172119140625, 0.5401840209960938, 0.5631561279296875, 0.5861282348632812, 0.609100341796875, 0.6320724487304688, 0.6550445556640625, 0.6780166625976562, 0.70098876953125, 0.7239608764648438, 0.7469329833984375, 0.7699050903320312, 0.792877197265625, 0.8158493041992188, 0.8388214111328125, 0.8617935180664062, 0.884765625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 5.0, 7.0, 6.0, 9.0, 12.0, 6.0, 11.0, 18.0, 13.0, 10.0, 27.0, 23.0, 21.0, 29.0, 44.0, 37.0, 49.0, 64.0, 65.0, 86.0, 72.0, 73.0, 52.0, 54.0, 33.0, 25.0, 27.0, 21.0, 20.0, 12.0, 9.0, 17.0, 10.0, 7.0, 5.0, 5.0, 4.0, 5.0, 1.0, 4.0, 4.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.423828125, -1.3787384033203125, -1.333648681640625, -1.2885589599609375, -1.24346923828125, -1.1983795166015625, -1.153289794921875, -1.1082000732421875, -1.0631103515625, -1.0180206298828125, -0.972930908203125, -0.9278411865234375, -0.88275146484375, -0.8376617431640625, -0.792572021484375, -0.7474822998046875, -0.702392578125, -0.6573028564453125, -0.612213134765625, -0.5671234130859375, -0.52203369140625, -0.4769439697265625, -0.431854248046875, -0.3867645263671875, -0.3416748046875, -0.2965850830078125, -0.251495361328125, -0.2064056396484375, -0.16131591796875, -0.1162261962890625, -0.071136474609375, -0.0260467529296875, 0.01904296875, 0.0641326904296875, 0.109222412109375, 0.1543121337890625, 0.19940185546875, 0.2444915771484375, 0.289581298828125, 0.3346710205078125, 0.3797607421875, 0.4248504638671875, 0.469940185546875, 0.5150299072265625, 0.56011962890625, 0.6052093505859375, 0.650299072265625, 0.6953887939453125, 0.740478515625, 0.7855682373046875, 0.830657958984375, 0.8757476806640625, 0.92083740234375, 0.9659271240234375, 1.011016845703125, 1.0561065673828125, 1.1011962890625, 1.1462860107421875, 1.191375732421875, 1.2364654541015625, 1.28155517578125, 1.3266448974609375, 1.371734619140625, 1.4168243408203125, 1.4619140625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 5.0, 8.0, 9.0, 5.0, 9.0, 16.0, 22.0, 37.0, 46.0, 89.0, 162.0, 294.0, 657.0, 1486.0, 4189.0, 16307.0, 113123.0, 854329.0, 44253.0, 8934.0, 2565.0, 1004.0, 462.0, 214.0, 120.0, 68.0, 46.0, 25.0, 17.0, 22.0, 13.0, 4.0, 3.0, 3.0, 4.0, 1.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1439208984375, -0.13916969299316406, -0.13441848754882812, -0.1296672821044922, -0.12491607666015625, -0.12016487121582031, -0.11541366577148438, -0.11066246032714844, -0.1059112548828125, -0.10116004943847656, -0.09640884399414062, -0.09165763854980469, -0.08690643310546875, -0.08215522766113281, -0.07740402221679688, -0.07265281677246094, -0.067901611328125, -0.06315040588378906, -0.058399200439453125, -0.05364799499511719, -0.04889678955078125, -0.04414558410644531, -0.039394378662109375, -0.03464317321777344, -0.0298919677734375, -0.025140762329101562, -0.020389556884765625, -0.015638351440429688, -0.01088714599609375, -0.0061359405517578125, -0.001384735107421875, 0.0033664703369140625, 0.00811767578125, 0.012868881225585938, 0.017620086669921875, 0.022371292114257812, 0.02712249755859375, 0.03187370300292969, 0.036624908447265625, 0.04137611389160156, 0.0461273193359375, 0.05087852478027344, 0.055629730224609375, 0.06038093566894531, 0.06513214111328125, 0.06988334655761719, 0.07463455200195312, 0.07938575744628906, 0.084136962890625, 0.08888816833496094, 0.09363937377929688, 0.09839057922363281, 0.10314178466796875, 0.10789299011230469, 0.11264419555664062, 0.11739540100097656, 0.1221466064453125, 0.12689781188964844, 0.13164901733398438, 0.1364002227783203, 0.14115142822265625, 0.1459026336669922, 0.15065383911132812, 0.15540504455566406, 0.16015625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 5.0, 10.0, 3.0, 10.0, 7.0, 7.0, 6.0, 13.0, 21.0, 20.0, 35.0, 30.0, 49.0, 59.0, 80.0, 115.0, 103.0, 91.0, 79.0, 63.0, 45.0, 26.0, 23.0, 15.0, 12.0, 20.0, 10.0, 6.0, 6.0, 10.0, 4.0, 6.0, 5.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.9981136322021484e-05, -2.895388752222061e-05, -2.792663872241974e-05, -2.6899389922618866e-05, -2.5872141122817993e-05, -2.484489232301712e-05, -2.3817643523216248e-05, -2.2790394723415375e-05, -2.1763145923614502e-05, -2.073589712381363e-05, -1.9708648324012756e-05, -1.8681399524211884e-05, -1.765415072441101e-05, -1.6626901924610138e-05, -1.5599653124809265e-05, -1.4572404325008392e-05, -1.354515552520752e-05, -1.2517906725406647e-05, -1.1490657925605774e-05, -1.0463409125804901e-05, -9.436160326004028e-06, -8.408911526203156e-06, -7.381662726402283e-06, -6.35441392660141e-06, -5.327165126800537e-06, -4.299916326999664e-06, -3.2726675271987915e-06, -2.2454187273979187e-06, -1.218169927597046e-06, -1.909211277961731e-07, 8.363276720046997e-07, 1.8635764718055725e-06, 2.8908252716064453e-06, 3.918074071407318e-06, 4.945322871208191e-06, 5.972571671009064e-06, 6.9998204708099365e-06, 8.02706927061081e-06, 9.054318070411682e-06, 1.0081566870212555e-05, 1.1108815670013428e-05, 1.21360644698143e-05, 1.3163313269615173e-05, 1.4190562069416046e-05, 1.5217810869216919e-05, 1.6245059669017792e-05, 1.7272308468818665e-05, 1.8299557268619537e-05, 1.932680606842041e-05, 2.0354054868221283e-05, 2.1381303668022156e-05, 2.240855246782303e-05, 2.34358012676239e-05, 2.4463050067424774e-05, 2.5490298867225647e-05, 2.651754766702652e-05, 2.7544796466827393e-05, 2.8572045266628265e-05, 2.9599294066429138e-05, 3.062654286623001e-05, 3.1653791666030884e-05, 3.2681040465831757e-05, 3.370828926563263e-05, 3.47355380654335e-05, 3.5762786865234375e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 6.0, 3.0, 13.0, 11.0, 18.0, 20.0, 41.0, 96.0, 184.0, 451.0, 1779.0, 9885.0, 168127.0, 848172.0, 16293.0, 2450.0, 614.0, 192.0, 75.0, 49.0, 27.0, 15.0, 9.0, 11.0, 6.0, 3.0, 0.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.259521484375, -0.2509040832519531, -0.24228668212890625, -0.23366928100585938, -0.2250518798828125, -0.21643447875976562, -0.20781707763671875, -0.19919967651367188, -0.190582275390625, -0.18196487426757812, -0.17334747314453125, -0.16473007202148438, -0.1561126708984375, -0.14749526977539062, -0.13887786865234375, -0.13026046752929688, -0.12164306640625, -0.11302566528320312, -0.10440826416015625, -0.09579086303710938, -0.0871734619140625, -0.07855606079101562, -0.06993865966796875, -0.061321258544921875, -0.052703857421875, -0.044086456298828125, -0.03546905517578125, -0.026851654052734375, -0.0182342529296875, -0.009616851806640625, -0.00099945068359375, 0.007617950439453125, 0.0162353515625, 0.024852752685546875, 0.03347015380859375, 0.042087554931640625, 0.0507049560546875, 0.059322357177734375, 0.06793975830078125, 0.07655715942382812, 0.085174560546875, 0.09379196166992188, 0.10240936279296875, 0.11102676391601562, 0.1196441650390625, 0.12826156616210938, 0.13687896728515625, 0.14549636840820312, 0.15411376953125, 0.16273117065429688, 0.17134857177734375, 0.17996597290039062, 0.1885833740234375, 0.19720077514648438, 0.20581817626953125, 0.21443557739257812, 0.223052978515625, 0.23167037963867188, 0.24028778076171875, 0.24890518188476562, 0.2575225830078125, 0.2661399841308594, 0.27475738525390625, 0.2833747863769531, 0.2919921875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 4.0, 4.0, 6.0, 5.0, 3.0, 5.0, 4.0, 9.0, 9.0, 25.0, 25.0, 20.0, 37.0, 41.0, 43.0, 52.0, 64.0, 83.0, 81.0, 88.0, 85.0, 60.0, 60.0, 33.0, 36.0, 34.0, 19.0, 16.0, 12.0, 7.0, 14.0, 5.0, 8.0, 4.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1654052734375, -0.16049575805664062, -0.15558624267578125, -0.15067672729492188, -0.1457672119140625, -0.14085769653320312, -0.13594818115234375, -0.13103866577148438, -0.126129150390625, -0.12121963500976562, -0.11631011962890625, -0.11140060424804688, -0.1064910888671875, -0.10158157348632812, -0.09667205810546875, -0.09176254272460938, -0.08685302734375, -0.08194351196289062, -0.07703399658203125, -0.07212448120117188, -0.0672149658203125, -0.062305450439453125, -0.05739593505859375, -0.052486419677734375, -0.047576904296875, -0.042667388916015625, -0.03775787353515625, -0.032848358154296875, -0.0279388427734375, -0.023029327392578125, -0.01811981201171875, -0.013210296630859375, -0.00830078125, -0.003391265869140625, 0.00151824951171875, 0.006427764892578125, 0.0113372802734375, 0.016246795654296875, 0.02115631103515625, 0.026065826416015625, 0.030975341796875, 0.035884857177734375, 0.04079437255859375, 0.045703887939453125, 0.0506134033203125, 0.055522918701171875, 0.06043243408203125, 0.06534194946289062, 0.07025146484375, 0.07516098022460938, 0.08007049560546875, 0.08498001098632812, 0.0898895263671875, 0.09479904174804688, 0.09970855712890625, 0.10461807250976562, 0.109527587890625, 0.11443710327148438, 0.11934661865234375, 0.12425613403320312, 0.1291656494140625, 0.13407516479492188, 0.13898468017578125, 0.14389419555664062, 0.1488037109375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 2.0, 1.0, 2.0, 4.0, 5.0, 10.0, 4.0, 18.0, 35.0, 51.0, 82.0, 327.0, 262.0, 76.0, 51.0, 30.0, 16.0, 12.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.079756736755371, -3.922390937805176, -3.7650251388549805, -3.607659339904785, -3.45029354095459, -3.2929277420043945, -3.135561943054199, -2.978196144104004, -2.8208303451538086, -2.6634645462036133, -2.506098747253418, -2.3487329483032227, -2.1913671493530273, -2.034001350402832, -1.8766355514526367, -1.7192697525024414, -1.561903953552246, -1.4045381546020508, -1.2471723556518555, -1.0898065567016602, -0.9324407577514648, -0.7750749588012695, -0.6177091598510742, -0.4603433609008789, -0.3029775619506836, -0.14561176300048828, 0.011754035949707031, 0.16911983489990234, 0.32648563385009766, 0.48385143280029297, 0.6412172317504883, 0.7985830307006836, 0.9559488296508789, 1.1133146286010742, 1.2706804275512695, 1.4280462265014648, 1.5854120254516602, 1.7427778244018555, 1.9001436233520508, 2.057509422302246, 2.2148752212524414, 2.3722410202026367, 2.529606819152832, 2.6869726181030273, 2.8443384170532227, 3.001704216003418, 3.1590700149536133, 3.3164358139038086, 3.473801612854004, 3.631167411804199, 3.7885332107543945, 3.94589900970459, 4.103264808654785, 4.2606306076049805, 4.417996406555176, 4.575362205505371, 4.732728004455566, 4.890093803405762, 5.047459602355957, 5.204825401306152, 5.362191200256348, 5.519556999206543, 5.676922798156738, 5.834288597106934, 5.991654396057129]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 7.0, 6.0, 5.0, 12.0, 6.0, 9.0, 9.0, 16.0, 12.0, 14.0, 22.0, 13.0, 21.0, 22.0, 27.0, 65.0, 95.0, 114.0, 109.0, 90.0, 84.0, 47.0, 18.0, 20.0, 23.0, 18.0, 20.0, 13.0, 12.0, 7.0, 7.0, 13.0, 5.0, 6.0, 4.0, 4.0, 1.0, 5.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-3.4178333282470703, -3.3118650913238525, -3.205897092819214, -3.099928855895996, -2.9939608573913574, -2.8879926204681396, -2.782024383544922, -2.676056385040283, -2.5700881481170654, -2.4641199111938477, -2.358151912689209, -2.252183675765991, -2.1462154388427734, -2.0402474403381348, -1.934279203414917, -1.8283110857009888, -1.7223429679870605, -1.6163748502731323, -1.510406732559204, -1.4044384956359863, -1.298470377922058, -1.1925022602081299, -1.086534023284912, -0.9805659055709839, -0.8745977878570557, -0.7686296701431274, -0.6626614928245544, -0.5566933155059814, -0.4507251977920532, -0.344757080078125, -0.238788902759552, -0.132820725440979, -0.026852846145629883, 0.07911530137062073, 0.18508344888687134, 0.29105159640312195, 0.39701974391937256, 0.5029878616333008, 0.6089560389518738, 0.7149242162704468, 0.820892333984375, 0.9268604516983032, 1.0328285694122314, 1.1387968063354492, 1.2447649240493774, 1.3507330417633057, 1.4567012786865234, 1.5626693964004517, 1.6686375141143799, 1.774605631828308, 1.8805737495422363, 1.986541986465454, 2.092510223388672, 2.1984782218933105, 2.3044464588165283, 2.410414695739746, 2.5163826942443848, 2.6223509311676025, 2.728318929672241, 2.834287166595459, 2.9402551651000977, 3.0462234020233154, 3.152191638946533, 3.258159637451172, 3.3641278743743896]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 6.0, 9.0, 6.0, 4.0, 9.0, 17.0, 11.0, 18.0, 19.0, 37.0, 35.0, 43.0, 40.0, 65.0, 139.0, 196.0, 84.0, 41.0, 39.0, 38.0, 36.0, 25.0, 13.0, 17.0, 18.0, 14.0, 7.0, 4.0, 3.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.49169921875, -0.477691650390625, -0.46368408203125, -0.449676513671875, -0.4356689453125, -0.421661376953125, -0.40765380859375, -0.393646240234375, -0.379638671875, -0.365631103515625, -0.35162353515625, -0.337615966796875, -0.3236083984375, -0.309600830078125, -0.29559326171875, -0.281585693359375, -0.267578125, -0.253570556640625, -0.23956298828125, -0.225555419921875, -0.2115478515625, -0.197540283203125, -0.18353271484375, -0.169525146484375, -0.155517578125, -0.141510009765625, -0.12750244140625, -0.113494873046875, -0.0994873046875, -0.085479736328125, -0.07147216796875, -0.057464599609375, -0.04345703125, -0.029449462890625, -0.01544189453125, -0.001434326171875, 0.0125732421875, 0.026580810546875, 0.04058837890625, 0.054595947265625, 0.068603515625, 0.082611083984375, 0.09661865234375, 0.110626220703125, 0.1246337890625, 0.138641357421875, 0.15264892578125, 0.166656494140625, 0.1806640625, 0.194671630859375, 0.20867919921875, 0.222686767578125, 0.2366943359375, 0.250701904296875, 0.26470947265625, 0.278717041015625, 0.292724609375, 0.306732177734375, 0.32073974609375, 0.334747314453125, 0.3487548828125, 0.362762451171875, 0.37677001953125, 0.390777587890625, 0.40478515625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 7.0, 4.0, 5.0, 3.0, 5.0, 1.0, 6.0, 5.0, 8.0, 6.0, 9.0, 7.0, 11.0, 26.0, 45.0, 57.0, 88.0, 162.0, 277.0, 567.0, 1209.0, 3033.0, 11080.0, 801048.0, 7553075.0, 11709.0, 3495.0, 1338.0, 585.0, 259.0, 135.0, 86.0, 60.0, 50.0, 37.0, 27.0, 19.0, 9.0, 2.0, 5.0, 12.0, 5.0, 8.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0], "bins": [-1.5678791999816895, -1.51895010471344, -1.4700210094451904, -1.4210920333862305, -1.372162938117981, -1.3232338428497314, -1.274304747581482, -1.2253756523132324, -1.1764466762542725, -1.127517580986023, -1.0785884857177734, -1.0296595096588135, -0.980730414390564, -0.9318013191223145, -0.8828722238540649, -0.8339431285858154, -0.7850140333175659, -0.7360849380493164, -0.6871559023857117, -0.6382268071174622, -0.5892977714538574, -0.5403686761856079, -0.4914395809173584, -0.4425105154514313, -0.39358144998550415, -0.344652384519577, -0.2957233190536499, -0.2467942237854004, -0.19786515831947327, -0.14893609285354614, -0.10000699758529663, -0.05107793211936951, -0.002148747444152832, 0.04678032547235489, 0.09570939838886261, 0.14463847875595093, 0.19356754422187805, 0.24249660968780518, 0.2914257049560547, 0.3403547704219818, 0.38928383588790894, 0.43821290135383606, 0.4871419668197632, 0.5360710620880127, 0.5850001573562622, 0.6339291930198669, 0.6828582882881165, 0.7317873239517212, 0.7807164192199707, 0.8296455144882202, 0.878574550151825, 0.9275036454200745, 0.9764326810836792, 1.0253617763519287, 1.0742908716201782, 1.1232199668884277, 1.1721489429473877, 1.2210780382156372, 1.2700071334838867, 1.3189361095428467, 1.3678652048110962, 1.4167943000793457, 1.4657233953475952, 1.5146524906158447, 1.5635815858840942]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 4.0, 6.0, 3.0, 13.0, 4.0, 6.0, 7.0, 5.0, 9.0, 5.0, 11.0, 7.0, 10.0, 4.0, 3.0, 1.0, 5.0, 3.0, 2.0, 1.0, 1.0], "bins": [-10.238897323608398, -10.036127090454102, -9.833356857299805, -9.630587577819824, -9.427817344665527, -9.22504711151123, -9.022276878356934, -8.819507598876953, -8.616737365722656, -8.41396713256836, -8.211196899414062, -8.008427619934082, -7.805657386779785, -7.602887153625488, -7.400116920471191, -7.197347164154053, -6.994576930999756, -6.791806697845459, -6.58903694152832, -6.386266708374023, -6.183496952056885, -5.980726718902588, -5.777956962585449, -5.575186729431152, -5.3724164962768555, -5.169646263122559, -4.96687650680542, -4.764106273651123, -4.561336517333984, -4.3585662841796875, -4.155796051025391, -3.953026294708252, -3.7502570152282715, -3.5474870204925537, -3.344717025756836, -3.141946792602539, -2.9391770362854004, -2.7364068031311035, -2.5336368083953857, -2.330866813659668, -2.12809681892395, -1.9253268241882324, -1.7225568294525146, -1.5197867155075073, -1.3170167207717896, -1.1142467260360718, -0.9114766120910645, -0.7087066173553467, -0.5059366226196289, -0.30316659808158875, -0.10039657354354858, 0.10237348079681396, 0.30514347553253174, 0.5079134702682495, 0.7106835842132568, 0.9134535789489746, 1.1162235736846924, 1.3189935684204102, 1.521763563156128, 1.7245336771011353, 1.927303671836853, 2.1300735473632812, 2.332843780517578, 2.535613775253296, 2.7383837699890137]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 4.0, 3.0, 1.0, 4.0, 6.0, 5.0, 9.0, 5.0, 24.0, 12.0, 30.0, 35.0, 44.0, 43.0, 70.0, 78.0, 64.0, 60.0, 69.0, 71.0, 73.0, 58.0, 49.0, 49.0, 34.0, 26.0, 13.0, 18.0, 10.0, 11.0, 8.0, 6.0, 6.0, 4.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3134765625, -0.3018646240234375, -0.290252685546875, -0.2786407470703125, -0.26702880859375, -0.2554168701171875, -0.243804931640625, -0.2321929931640625, -0.2205810546875, -0.2089691162109375, -0.197357177734375, -0.1857452392578125, -0.17413330078125, -0.1625213623046875, -0.150909423828125, -0.1392974853515625, -0.127685546875, -0.1160736083984375, -0.104461669921875, -0.0928497314453125, -0.08123779296875, -0.0696258544921875, -0.058013916015625, -0.0464019775390625, -0.0347900390625, -0.0231781005859375, -0.011566162109375, 4.57763671875e-05, 0.01165771484375, 0.0232696533203125, 0.034881591796875, 0.0464935302734375, 0.05810546875, 0.0697174072265625, 0.081329345703125, 0.0929412841796875, 0.10455322265625, 0.1161651611328125, 0.127777099609375, 0.1393890380859375, 0.1510009765625, 0.1626129150390625, 0.174224853515625, 0.1858367919921875, 0.19744873046875, 0.2090606689453125, 0.220672607421875, 0.2322845458984375, 0.243896484375, 0.2555084228515625, 0.267120361328125, 0.2787322998046875, 0.29034423828125, 0.3019561767578125, 0.313568115234375, 0.3251800537109375, 0.3367919921875, 0.3484039306640625, 0.360015869140625, 0.3716278076171875, 0.38323974609375, 0.3948516845703125, 0.406463623046875, 0.4180755615234375, 0.4296875]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 6.0, 10.0, 16.0, 20.0, 29.0, 39.0, 69.0, 112.0, 159.0, 238.0, 419.0, 719.0, 1420.0, 2874.0, 6284.0, 15060.0, 39028.0, 102712.0, 182009.0, 105552.0, 39658.0, 15596.0, 6461.0, 2862.0, 1368.0, 700.0, 320.0, 194.0, 113.0, 80.0, 50.0, 21.0, 22.0, 16.0, 3.0, 5.0, 4.0, 4.0, 6.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.59765625, -1.551361083984375, -1.50506591796875, -1.458770751953125, -1.4124755859375, -1.366180419921875, -1.31988525390625, -1.273590087890625, -1.227294921875, -1.180999755859375, -1.13470458984375, -1.088409423828125, -1.0421142578125, -0.995819091796875, -0.94952392578125, -0.903228759765625, -0.85693359375, -0.810638427734375, -0.76434326171875, -0.718048095703125, -0.6717529296875, -0.625457763671875, -0.57916259765625, -0.532867431640625, -0.486572265625, -0.440277099609375, -0.39398193359375, -0.347686767578125, -0.3013916015625, -0.255096435546875, -0.20880126953125, -0.162506103515625, -0.1162109375, -0.069915771484375, -0.02362060546875, 0.022674560546875, 0.0689697265625, 0.115264892578125, 0.16156005859375, 0.207855224609375, 0.254150390625, 0.300445556640625, 0.34674072265625, 0.393035888671875, 0.4393310546875, 0.485626220703125, 0.53192138671875, 0.578216552734375, 0.62451171875, 0.670806884765625, 0.71710205078125, 0.763397216796875, 0.8096923828125, 0.855987548828125, 0.90228271484375, 0.948577880859375, 0.994873046875, 1.041168212890625, 1.08746337890625, 1.133758544921875, 1.1800537109375, 1.226348876953125, 1.27264404296875, 1.318939208984375, 1.365234375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 3.0, 5.0, 8.0, 4.0, 6.0, 10.0, 6.0, 8.0, 11.0, 17.0, 16.0, 20.0, 25.0, 25.0, 45.0, 35.0, 31.0, 52.0, 50.0, 59.0, 52.0, 55.0, 60.0, 45.0, 54.0, 49.0, 34.0, 33.0, 38.0, 32.0, 23.0, 19.0, 10.0, 8.0, 12.0, 11.0, 4.0, 6.0, 3.0, 3.0, 5.0, 2.0, 3.0, 3.0, 2.0, 0.0, 3.0], "bins": [-0.27734375, -0.2700366973876953, -0.2627296447753906, -0.25542259216308594, -0.24811553955078125, -0.24080848693847656, -0.23350143432617188, -0.2261943817138672, -0.2188873291015625, -0.2115802764892578, -0.20427322387695312, -0.19696617126464844, -0.18965911865234375, -0.18235206604003906, -0.17504501342773438, -0.1677379608154297, -0.160430908203125, -0.1531238555908203, -0.14581680297851562, -0.13850975036621094, -0.13120269775390625, -0.12389564514160156, -0.11658859252929688, -0.10928153991699219, -0.1019744873046875, -0.09466743469238281, -0.08736038208007812, -0.08005332946777344, -0.07274627685546875, -0.06543922424316406, -0.058132171630859375, -0.05082511901855469, -0.04351806640625, -0.03621101379394531, -0.028903961181640625, -0.021596908569335938, -0.01428985595703125, -0.0069828033447265625, 0.000324249267578125, 0.0076313018798828125, 0.0149383544921875, 0.022245407104492188, 0.029552459716796875, 0.03685951232910156, 0.04416656494140625, 0.05147361755371094, 0.058780670166015625, 0.06608772277832031, 0.073394775390625, 0.08070182800292969, 0.08800888061523438, 0.09531593322753906, 0.10262298583984375, 0.10993003845214844, 0.11723709106445312, 0.12454414367675781, 0.1318511962890625, 0.1391582489013672, 0.14646530151367188, 0.15377235412597656, 0.16107940673828125, 0.16838645935058594, 0.17569351196289062, 0.1830005645751953, 0.1903076171875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 5.0, 8.0, 4.0, 8.0, 11.0, 12.0, 11.0, 31.0, 44.0, 76.0, 100.0, 82.0, 44.0, 23.0, 10.0, 3.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5849573612213135, -2.513430595397949, -2.441904067993164, -2.3703773021698, -2.2988505363464355, -2.2273240089416504, -2.155797243118286, -2.084270477294922, -2.0127439498901367, -1.941217303276062, -1.8696905374526978, -1.798163890838623, -1.7266372442245483, -1.6551105976104736, -1.5835838317871094, -1.5120571851730347, -1.4405304193496704, -1.3690037727355957, -1.2974770069122314, -1.2259503602981567, -1.154423713684082, -1.0828969478607178, -1.011370301246643, -0.9398436546325684, -0.8683169484138489, -0.7967902421951294, -0.7252635955810547, -0.6537368893623352, -0.5822101831436157, -0.510683536529541, -0.43915683031082153, -0.3676301836967468, -0.2961033582687378, -0.2245766818523407, -0.1530499905347824, -0.08152329921722412, -0.009996622800827026, 0.06153005361557007, 0.13305675983428955, 0.20458340644836426, 0.27611011266708374, 0.34763678908348083, 0.41916346549987793, 0.4906901717185974, 0.5622168779373169, 0.6337435245513916, 0.7052702307701111, 0.7767968773841858, 0.8483235836029053, 0.9198502898216248, 0.9913769364356995, 1.062903642654419, 1.1344302892684937, 1.2059569358825684, 1.2774837017059326, 1.3490103483200073, 1.420536994934082, 1.4920636415481567, 1.563590407371521, 1.6351170539855957, 1.7066437005996704, 1.7781703472137451, 1.8496971130371094, 1.921223759651184, 1.9927505254745483]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 5.0, 4.0, 1.0, 5.0, 6.0, 4.0, 4.0, 4.0, 4.0, 3.0, 8.0, 19.0, 28.0, 50.0, 77.0, 65.0, 59.0, 44.0, 16.0, 17.0, 15.0, 6.0, 7.0, 9.0, 5.0, 1.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0], "bins": [-1.6058992147445679, -1.5647358894348145, -1.5235724449157715, -1.482409119606018, -1.4412457942962646, -1.4000824689865112, -1.3589191436767578, -1.3177556991577148, -1.2765923738479614, -1.235429048538208, -1.194265604019165, -1.1531022787094116, -1.1119389533996582, -1.0707756280899048, -1.0296123027801514, -0.9884488582611084, -0.947285532951355, -0.9061222076416016, -0.8649588227272034, -0.8237954378128052, -0.7826321125030518, -0.7414687871932983, -0.7003054022789001, -0.659142017364502, -0.6179786920547485, -0.5768153667449951, -0.5356519818305969, -0.4944886267185211, -0.4533252716064453, -0.4121619164943695, -0.3709985613822937, -0.3298352062702179, -0.28867197036743164, -0.24750861525535583, -0.20634526014328003, -0.16518190503120422, -0.12401854991912842, -0.08285519480705261, -0.04169183969497681, -0.000528484582901001, 0.040634870529174805, 0.08179822564125061, 0.12296158075332642, 0.16412493586540222, 0.20528829097747803, 0.24645164608955383, 0.28761500120162964, 0.32877835631370544, 0.36994171142578125, 0.41110506653785706, 0.45226842164993286, 0.49343177676200867, 0.5345951318740845, 0.5757584571838379, 0.6169218420982361, 0.6580852270126343, 0.6992485523223877, 0.7404118776321411, 0.7815752625465393, 0.8227386474609375, 0.8639019727706909, 0.9050652980804443, 0.9462286829948425, 0.9873920679092407, 1.0285553932189941]}, "eval/loss": 0.32257843017578125, "eval/wer": 0.09236414121380404, "eval/runtime": 558.1846, "eval/samples_per_second": 4.733, "eval/steps_per_second": 0.593, "train/train_runtime": 26664.6603, "train/train_samples_per_second": 5.351, "train/train_steps_per_second": 0.084, "train/total_flos": 0.0, "train/train_loss": 1.6266609489166015, "_wandb": {"runtime": 27499}} \ No newline at end of file