diff --git "a/wandb/run-20220315_200222-14cfddr6/files/wandb-summary.json" "b/wandb/run-20220315_200222-14cfddr6/files/wandb-summary.json" new file mode 100644--- /dev/null +++ "b/wandb/run-20220315_200222-14cfddr6/files/wandb-summary.json" @@ -0,0 +1 @@ +{"train/loss": 5.8017, "train/learning_rate": 2.9109263657957245e-05, "train/epoch": 1.68, "train/global_step": 1500, "_runtime": 8852, "_timestamp": 1647383394, "_step": 1500, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 4.0, 2.0, 6.0, 6.0, 16.0, 11.0, 19.0, 10.0, 14.0, 15.0, 13.0, 21.0, 22.0, 25.0, 33.0, 30.0, 41.0, 40.0, 36.0, 44.0, 43.0, 51.0, 39.0, 49.0, 40.0, 36.0, 39.0, 44.0, 33.0, 32.0, 34.0, 27.0, 31.0, 18.0, 13.0, 10.0, 13.0, 10.0, 10.0, 3.0, 4.0, 8.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.82134246826172, -65.99658966064453, -64.17184448242188, -62.34709167480469, -60.522342681884766, -58.697593688964844, -56.872840881347656, -55.048091888427734, -53.22334289550781, -51.39859390258789, -49.5738410949707, -47.74909210205078, -45.92434310913086, -44.09959411621094, -42.27484130859375, -40.45009231567383, -38.62533950805664, -36.80059051513672, -34.97583770751953, -33.15108871459961, -31.326339721679688, -29.501588821411133, -27.676837921142578, -25.852088928222656, -24.0273380279541, -22.202587127685547, -20.377838134765625, -18.55308723449707, -16.728336334228516, -14.903587341308594, -13.078836441040039, -11.2540864944458, -9.429336547851562, -7.604586601257324, -5.779836177825928, -3.9550857543945312, -2.130335807800293, -0.3055858612060547, 1.5191650390625, 3.3439149856567383, 5.168664932250977, 6.993414878845215, 8.818164825439453, 10.642915725708008, 12.467665672302246, 14.292415618896484, 16.11716651916504, 17.941917419433594, 19.766666412353516, 21.59141731262207, 23.416166305541992, 25.240917205810547, 27.06566619873047, 28.890417098999023, 30.715167999267578, 32.5399169921875, 34.36466979980469, 36.18941879272461, 38.0141716003418, 39.83892059326172, 41.66366958618164, 43.48841857910156, 45.31317138671875, 47.13792037963867, 48.962669372558594]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 7.0, 5.0, 9.0, 13.0, 5.0, 14.0, 17.0, 19.0, 16.0, 24.0, 17.0, 15.0, 28.0, 28.0, 39.0, 33.0, 30.0, 27.0, 38.0, 23.0, 37.0, 32.0, 32.0, 24.0, 37.0, 26.0, 41.0, 31.0, 39.0, 23.0, 33.0, 26.0, 24.0, 24.0, 26.0, 17.0, 19.0, 12.0, 6.0, 19.0, 9.0, 10.0, 13.0, 10.0, 5.0, 4.0, 8.0, 7.0, 4.0, 0.0, 2.0], "bins": [-66.78207397460938, -64.92351531982422, -63.06496047973633, -61.20640563964844, -59.34785079956055, -57.489295959472656, -55.6307373046875, -53.77218246459961, -51.91362762451172, -50.05507278442383, -48.19651412963867, -46.33795928955078, -44.47940444946289, -42.620849609375, -40.762290954589844, -38.90373611450195, -37.0451774597168, -35.186622619628906, -33.32806396484375, -31.46950912475586, -29.61095428466797, -27.752397537231445, -25.893840789794922, -24.03528594970703, -22.176729202270508, -20.318172454833984, -18.459617614746094, -16.60106086730957, -14.742505073547363, -12.883949279785156, -11.025392532348633, -9.166836738586426, -7.308277130126953, -5.449721336364746, -3.591165065765381, -1.7326087951660156, 0.1259469985961914, 1.9845027923583984, 3.843059539794922, 5.701615333557129, 7.560171127319336, 9.418726921081543, 11.27728271484375, 13.135839462280273, 14.99439525604248, 16.852951049804688, 18.71150779724121, 20.570064544677734, 22.428619384765625, 24.28717613220215, 26.14573097229004, 28.004287719726562, 29.862842559814453, 31.721399307250977, 33.5799560546875, 35.43851089477539, 37.29706573486328, 39.15562057495117, 41.01417922973633, 42.87273406982422, 44.73128890991211, 46.58984375, 48.448402404785156, 50.30695724487305, 52.1655158996582]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 7.0, 8.0, 21.0, 20.0, 20.0, 37.0, 65.0, 75.0, 106.0, 139.0, 216.0, 287.0, 436.0, 659.0, 943.0, 1381.0, 2043.0, 2988.0, 4401.0, 6851.0, 10284.0, 16036.0, 24785.0, 39080.0, 62323.0, 101688.0, 169304.0, 290948.0, 486644.0, 700852.0, 757098.0, 590233.0, 369372.0, 215181.0, 127756.0, 77616.0, 47950.0, 30318.0, 19347.0, 12522.0, 8067.0, 5343.0, 3533.0, 2398.0, 1608.0, 1102.0, 681.0, 507.0, 331.0, 220.0, 148.0, 101.0, 77.0, 53.0, 25.0, 27.0, 17.0, 7.0, 5.0, 3.0, 4.0], "bins": [-52.6875, -51.1015625, -49.515625, -47.9296875, -46.34375, -44.7578125, -43.171875, -41.5859375, -40.0, -38.4140625, -36.828125, -35.2421875, -33.65625, -32.0703125, -30.484375, -28.8984375, -27.3125, -25.7265625, -24.140625, -22.5546875, -20.96875, -19.3828125, -17.796875, -16.2109375, -14.625, -13.0390625, -11.453125, -9.8671875, -8.28125, -6.6953125, -5.109375, -3.5234375, -1.9375, -0.3515625, 1.234375, 2.8203125, 4.40625, 5.9921875, 7.578125, 9.1640625, 10.75, 12.3359375, 13.921875, 15.5078125, 17.09375, 18.6796875, 20.265625, 21.8515625, 23.4375, 25.0234375, 26.609375, 28.1953125, 29.78125, 31.3671875, 32.953125, 34.5390625, 36.125, 37.7109375, 39.296875, 40.8828125, 42.46875, 44.0546875, 45.640625, 47.2265625, 48.8125]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 8.0, 6.0, 7.0, 12.0, 10.0, 16.0, 8.0, 12.0, 10.0, 20.0, 21.0, 20.0, 30.0, 27.0, 30.0, 37.0, 26.0, 54.0, 38.0, 49.0, 32.0, 32.0, 40.0, 38.0, 34.0, 48.0, 25.0, 28.0, 31.0, 30.0, 34.0, 28.0, 20.0, 19.0, 17.0, 17.0, 16.0, 15.0, 12.0, 7.0, 10.0, 12.0, 4.0, 5.0, 10.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-45.3125, -44.0537109375, -42.794921875, -41.5361328125, -40.27734375, -39.0185546875, -37.759765625, -36.5009765625, -35.2421875, -33.9833984375, -32.724609375, -31.4658203125, -30.20703125, -28.9482421875, -27.689453125, -26.4306640625, -25.171875, -23.9130859375, -22.654296875, -21.3955078125, -20.13671875, -18.8779296875, -17.619140625, -16.3603515625, -15.1015625, -13.8427734375, -12.583984375, -11.3251953125, -10.06640625, -8.8076171875, -7.548828125, -6.2900390625, -5.03125, -3.7724609375, -2.513671875, -1.2548828125, 0.00390625, 1.2626953125, 2.521484375, 3.7802734375, 5.0390625, 6.2978515625, 7.556640625, 8.8154296875, 10.07421875, 11.3330078125, 12.591796875, 13.8505859375, 15.109375, 16.3681640625, 17.626953125, 18.8857421875, 20.14453125, 21.4033203125, 22.662109375, 23.9208984375, 25.1796875, 26.4384765625, 27.697265625, 28.9560546875, 30.21484375, 31.4736328125, 32.732421875, 33.9912109375, 35.25]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 7.0, 10.0, 12.0, 23.0, 43.0, 63.0, 103.0, 143.0, 244.0, 378.0, 638.0, 963.0, 1537.0, 2589.0, 4285.0, 7555.0, 13001.0, 22567.0, 39255.0, 68815.0, 120517.0, 207189.0, 343073.0, 533304.0, 722572.0, 726591.0, 538395.0, 345992.0, 209379.0, 121736.0, 69282.0, 39521.0, 22661.0, 12843.0, 7596.0, 4342.0, 2680.0, 1632.0, 960.0, 654.0, 401.0, 243.0, 162.0, 109.0, 74.0, 50.0, 33.0, 24.0, 17.0, 11.0, 4.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0], "bins": [-53.46875, -51.79833984375, -50.1279296875, -48.45751953125, -46.787109375, -45.11669921875, -43.4462890625, -41.77587890625, -40.10546875, -38.43505859375, -36.7646484375, -35.09423828125, -33.423828125, -31.75341796875, -30.0830078125, -28.41259765625, -26.7421875, -25.07177734375, -23.4013671875, -21.73095703125, -20.060546875, -18.39013671875, -16.7197265625, -15.04931640625, -13.37890625, -11.70849609375, -10.0380859375, -8.36767578125, -6.697265625, -5.02685546875, -3.3564453125, -1.68603515625, -0.015625, 1.65478515625, 3.3251953125, 4.99560546875, 6.666015625, 8.33642578125, 10.0068359375, 11.67724609375, 13.34765625, 15.01806640625, 16.6884765625, 18.35888671875, 20.029296875, 21.69970703125, 23.3701171875, 25.04052734375, 26.7109375, 28.38134765625, 30.0517578125, 31.72216796875, 33.392578125, 35.06298828125, 36.7333984375, 38.40380859375, 40.07421875, 41.74462890625, 43.4150390625, 45.08544921875, 46.755859375, 48.42626953125, 50.0966796875, 51.76708984375, 53.4375]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 9.0, 5.0, 2.0, 8.0, 17.0, 10.0, 11.0, 23.0, 25.0, 30.0, 43.0, 66.0, 57.0, 95.0, 110.0, 124.0, 164.0, 198.0, 228.0, 280.0, 340.0, 318.0, 318.0, 320.0, 295.0, 241.0, 175.0, 150.0, 113.0, 90.0, 63.0, 40.0, 29.0, 29.0, 17.0, 11.0, 8.0, 10.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.375, -28.50732421875, -27.6396484375, -26.77197265625, -25.904296875, -25.03662109375, -24.1689453125, -23.30126953125, -22.43359375, -21.56591796875, -20.6982421875, -19.83056640625, -18.962890625, -18.09521484375, -17.2275390625, -16.35986328125, -15.4921875, -14.62451171875, -13.7568359375, -12.88916015625, -12.021484375, -11.15380859375, -10.2861328125, -9.41845703125, -8.55078125, -7.68310546875, -6.8154296875, -5.94775390625, -5.080078125, -4.21240234375, -3.3447265625, -2.47705078125, -1.609375, -0.74169921875, 0.1259765625, 0.99365234375, 1.861328125, 2.72900390625, 3.5966796875, 4.46435546875, 5.33203125, 6.19970703125, 7.0673828125, 7.93505859375, 8.802734375, 9.67041015625, 10.5380859375, 11.40576171875, 12.2734375, 13.14111328125, 14.0087890625, 14.87646484375, 15.744140625, 16.61181640625, 17.4794921875, 18.34716796875, 19.21484375, 20.08251953125, 20.9501953125, 21.81787109375, 22.685546875, 23.55322265625, 24.4208984375, 25.28857421875, 26.15625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 6.0, 3.0, 3.0, 4.0, 6.0, 9.0, 6.0, 15.0, 18.0, 17.0, 35.0, 35.0, 34.0, 33.0, 43.0, 35.0, 54.0, 35.0, 54.0, 50.0, 49.0, 49.0, 43.0, 42.0, 44.0, 36.0, 37.0, 26.0, 29.0, 22.0, 24.0, 25.0, 16.0, 14.0, 15.0, 16.0, 4.0, 6.0, 2.0, 4.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-55.07258605957031, -53.469810485839844, -51.867034912109375, -50.264259338378906, -48.66148376464844, -47.05870819091797, -45.4559326171875, -43.85315704345703, -42.25038146972656, -40.647605895996094, -39.044830322265625, -37.442054748535156, -35.83927917480469, -34.23650360107422, -32.63372802734375, -31.03095054626465, -29.428173065185547, -27.825397491455078, -26.22262191772461, -24.61984634399414, -23.017070770263672, -21.414295196533203, -19.8115177154541, -18.208742141723633, -16.605966567993164, -15.003190994262695, -13.400415420532227, -11.797638893127441, -10.194863319396973, -8.592087745666504, -6.989311218261719, -5.38653564453125, -3.783763885498047, -2.180988073348999, -0.5782122611999512, 1.0245637893676758, 2.6273393630981445, 4.230114936828613, 5.832891464233398, 7.435667037963867, 9.038442611694336, 10.641218185424805, 12.243993759155273, 13.846770286560059, 15.449545860290527, 17.052322387695312, 18.65509796142578, 20.25787353515625, 21.86064910888672, 23.463424682617188, 25.066200256347656, 26.668975830078125, 28.271751403808594, 29.874526977539062, 31.477304458618164, 33.080078125, 34.68285369873047, 36.28562927246094, 37.888404846191406, 39.491180419921875, 41.093955993652344, 42.69673156738281, 44.29950714111328, 45.90228271484375, 47.505062103271484]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 1.0, 7.0, 6.0, 9.0, 9.0, 10.0, 21.0, 18.0, 22.0, 33.0, 24.0, 30.0, 28.0, 33.0, 38.0, 32.0, 41.0, 37.0, 40.0, 46.0, 52.0, 46.0, 23.0, 35.0, 43.0, 34.0, 33.0, 21.0, 37.0, 38.0, 30.0, 29.0, 25.0, 13.0, 7.0, 14.0, 5.0, 11.0, 9.0, 3.0, 2.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-65.52235412597656, -63.723411560058594, -61.92446517944336, -60.12552261352539, -58.32658004760742, -56.52763366699219, -54.72869110107422, -52.92974853515625, -51.13080596923828, -49.33186340332031, -47.53291702270508, -45.73397445678711, -43.93503189086914, -42.136085510253906, -40.33714294433594, -38.53820037841797, -36.739253997802734, -34.940311431884766, -33.14136505126953, -31.342422485351562, -29.543479919433594, -27.744535446166992, -25.94559097290039, -24.146648406982422, -22.34770393371582, -20.54875946044922, -18.74981689453125, -16.95087242126465, -15.151928901672363, -13.352985382080078, -11.554040908813477, -9.755097389221191, -7.956157684326172, -6.157214164733887, -4.358270168304443, -2.559326171875, -0.7603826522827148, 1.0385608673095703, 2.837505340576172, 4.636448860168457, 6.435392379760742, 8.234335899353027, 10.033279418945312, 11.832223892211914, 13.6311674118042, 15.430110931396484, 17.229055404663086, 19.027999877929688, 20.826942443847656, 22.625886917114258, 24.424829483032227, 26.223773956298828, 28.022716522216797, 29.8216609954834, 31.62060546875, 33.41954803466797, 35.21849060058594, 37.017433166503906, 38.81637954711914, 40.61532211303711, 42.41426467895508, 44.21321105957031, 46.01215362548828, 47.81109619140625, 49.610042572021484]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 7.0, 9.0, 17.0, 22.0, 38.0, 54.0, 88.0, 130.0, 220.0, 380.0, 650.0, 1194.0, 2045.0, 3514.0, 6473.0, 11403.0, 20216.0, 34773.0, 58174.0, 93303.0, 136564.0, 169155.0, 165701.0, 129128.0, 87164.0, 54170.0, 31781.0, 18340.0, 10557.0, 5701.0, 3285.0, 1791.0, 1028.0, 581.0, 351.0, 212.0, 128.0, 79.0, 47.0, 39.0, 17.0, 11.0, 11.0, 6.0, 1.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.0, -20.362060546875, -19.72412109375, -19.086181640625, -18.4482421875, -17.810302734375, -17.17236328125, -16.534423828125, -15.896484375, -15.258544921875, -14.62060546875, -13.982666015625, -13.3447265625, -12.706787109375, -12.06884765625, -11.430908203125, -10.79296875, -10.155029296875, -9.51708984375, -8.879150390625, -8.2412109375, -7.603271484375, -6.96533203125, -6.327392578125, -5.689453125, -5.051513671875, -4.41357421875, -3.775634765625, -3.1376953125, -2.499755859375, -1.86181640625, -1.223876953125, -0.5859375, 0.052001953125, 0.68994140625, 1.327880859375, 1.9658203125, 2.603759765625, 3.24169921875, 3.879638671875, 4.517578125, 5.155517578125, 5.79345703125, 6.431396484375, 7.0693359375, 7.707275390625, 8.34521484375, 8.983154296875, 9.62109375, 10.259033203125, 10.89697265625, 11.534912109375, 12.1728515625, 12.810791015625, 13.44873046875, 14.086669921875, 14.724609375, 15.362548828125, 16.00048828125, 16.638427734375, 17.2763671875, 17.914306640625, 18.55224609375, 19.190185546875, 19.828125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 2.0, 6.0, 6.0, 10.0, 9.0, 9.0, 21.0, 19.0, 22.0, 33.0, 26.0, 28.0, 29.0, 31.0, 38.0, 31.0, 43.0, 39.0, 40.0, 44.0, 49.0, 48.0, 22.0, 35.0, 45.0, 35.0, 32.0, 22.0, 36.0, 40.0, 28.0, 29.0, 25.0, 12.0, 7.0, 15.0, 4.0, 11.0, 9.0, 3.0, 3.0, 4.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-63.9375, -62.17431640625, -60.4111328125, -58.64794921875, -56.884765625, -55.12158203125, -53.3583984375, -51.59521484375, -49.83203125, -48.06884765625, -46.3056640625, -44.54248046875, -42.779296875, -41.01611328125, -39.2529296875, -37.48974609375, -35.7265625, -33.96337890625, -32.2001953125, -30.43701171875, -28.673828125, -26.91064453125, -25.1474609375, -23.38427734375, -21.62109375, -19.85791015625, -18.0947265625, -16.33154296875, -14.568359375, -12.80517578125, -11.0419921875, -9.27880859375, -7.515625, -5.75244140625, -3.9892578125, -2.22607421875, -0.462890625, 1.30029296875, 3.0634765625, 4.82666015625, 6.58984375, 8.35302734375, 10.1162109375, 11.87939453125, 13.642578125, 15.40576171875, 17.1689453125, 18.93212890625, 20.6953125, 22.45849609375, 24.2216796875, 25.98486328125, 27.748046875, 29.51123046875, 31.2744140625, 33.03759765625, 34.80078125, 36.56396484375, 38.3271484375, 40.09033203125, 41.853515625, 43.61669921875, 45.3798828125, 47.14306640625, 48.90625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 7.0, 8.0, 9.0, 9.0, 15.0, 31.0, 52.0, 73.0, 142.0, 254.0, 587.0, 1160.0, 2405.0, 5379.0, 12267.0, 30781.0, 898491.0, 61545.0, 19832.0, 8267.0, 3806.0, 1726.0, 842.0, 396.0, 212.0, 97.0, 56.0, 35.0, 20.0, 18.0, 13.0, 9.0, 5.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-82.375, -79.935546875, -77.49609375, -75.056640625, -72.6171875, -70.177734375, -67.73828125, -65.298828125, -62.859375, -60.419921875, -57.98046875, -55.541015625, -53.1015625, -50.662109375, -48.22265625, -45.783203125, -43.34375, -40.904296875, -38.46484375, -36.025390625, -33.5859375, -31.146484375, -28.70703125, -26.267578125, -23.828125, -21.388671875, -18.94921875, -16.509765625, -14.0703125, -11.630859375, -9.19140625, -6.751953125, -4.3125, -1.873046875, 0.56640625, 3.005859375, 5.4453125, 7.884765625, 10.32421875, 12.763671875, 15.203125, 17.642578125, 20.08203125, 22.521484375, 24.9609375, 27.400390625, 29.83984375, 32.279296875, 34.71875, 37.158203125, 39.59765625, 42.037109375, 44.4765625, 46.916015625, 49.35546875, 51.794921875, 54.234375, 56.673828125, 59.11328125, 61.552734375, 63.9921875, 66.431640625, 68.87109375, 71.310546875, 73.75]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 9.0, 11.0, 6.0, 13.0, 9.0, 10.0, 14.0, 15.0, 15.0, 23.0, 30.0, 33.0, 32.0, 37.0, 36.0, 40.0, 40.0, 57.0, 46.0, 49.0, 44.0, 40.0, 40.0, 41.0, 36.0, 28.0, 38.0, 31.0, 36.0, 21.0, 23.0, 16.0, 14.0, 16.0, 11.0, 10.0, 12.0, 6.0, 4.0, 5.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-47.625, -46.291015625, -44.95703125, -43.623046875, -42.2890625, -40.955078125, -39.62109375, -38.287109375, -36.953125, -35.619140625, -34.28515625, -32.951171875, -31.6171875, -30.283203125, -28.94921875, -27.615234375, -26.28125, -24.947265625, -23.61328125, -22.279296875, -20.9453125, -19.611328125, -18.27734375, -16.943359375, -15.609375, -14.275390625, -12.94140625, -11.607421875, -10.2734375, -8.939453125, -7.60546875, -6.271484375, -4.9375, -3.603515625, -2.26953125, -0.935546875, 0.3984375, 1.732421875, 3.06640625, 4.400390625, 5.734375, 7.068359375, 8.40234375, 9.736328125, 11.0703125, 12.404296875, 13.73828125, 15.072265625, 16.40625, 17.740234375, 19.07421875, 20.408203125, 21.7421875, 23.076171875, 24.41015625, 25.744140625, 27.078125, 28.412109375, 29.74609375, 31.080078125, 32.4140625, 33.748046875, 35.08203125, 36.416015625, 37.75]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 6.0, 4.0, 3.0, 8.0, 11.0, 18.0, 11.0, 14.0, 17.0, 31.0, 34.0, 50.0, 76.0, 112.0, 168.0, 253.0, 478.0, 867.0, 1637.0, 3565.0, 1025860.0, 10088.0, 2364.0, 1168.0, 664.0, 358.0, 214.0, 145.0, 73.0, 79.0, 42.0, 37.0, 25.0, 17.0, 17.0, 14.0, 8.0, 7.0, 6.0, 6.0, 3.0, 0.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-44.71875, -43.39404296875, -42.0693359375, -40.74462890625, -39.419921875, -38.09521484375, -36.7705078125, -35.44580078125, -34.12109375, -32.79638671875, -31.4716796875, -30.14697265625, -28.822265625, -27.49755859375, -26.1728515625, -24.84814453125, -23.5234375, -22.19873046875, -20.8740234375, -19.54931640625, -18.224609375, -16.89990234375, -15.5751953125, -14.25048828125, -12.92578125, -11.60107421875, -10.2763671875, -8.95166015625, -7.626953125, -6.30224609375, -4.9775390625, -3.65283203125, -2.328125, -1.00341796875, 0.3212890625, 1.64599609375, 2.970703125, 4.29541015625, 5.6201171875, 6.94482421875, 8.26953125, 9.59423828125, 10.9189453125, 12.24365234375, 13.568359375, 14.89306640625, 16.2177734375, 17.54248046875, 18.8671875, 20.19189453125, 21.5166015625, 22.84130859375, 24.166015625, 25.49072265625, 26.8154296875, 28.14013671875, 29.46484375, 30.78955078125, 32.1142578125, 33.43896484375, 34.763671875, 36.08837890625, 37.4130859375, 38.73779296875, 40.0625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 4.0, 6.0, 6.0, 4.0, 4.0, 4.0, 29.0, 737.0, 153.0, 7.0, 4.0, 4.0, 5.0, 8.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0007038116455078125, -0.0006815791130065918, -0.0006593465805053711, -0.0006371140480041504, -0.0006148815155029297, -0.000592648983001709, -0.0005704164505004883, -0.0005481839179992676, -0.0005259513854980469, -0.0005037188529968262, -0.00048148632049560547, -0.00045925378799438477, -0.00043702125549316406, -0.00041478872299194336, -0.00039255619049072266, -0.00037032365798950195, -0.00034809112548828125, -0.00032585859298706055, -0.00030362606048583984, -0.00028139352798461914, -0.00025916099548339844, -0.00023692846298217773, -0.00021469593048095703, -0.00019246339797973633, -0.00017023086547851562, -0.00014799833297729492, -0.00012576580047607422, -0.00010353326797485352, -8.130073547363281e-05, -5.906820297241211e-05, -3.6835670471191406e-05, -1.4603137969970703e-05, 7.62939453125e-06, 2.9861927032470703e-05, 5.2094459533691406e-05, 7.432699203491211e-05, 9.655952453613281e-05, 0.00011879205703735352, 0.00014102458953857422, 0.00016325712203979492, 0.00018548965454101562, 0.00020772218704223633, 0.00022995471954345703, 0.00025218725204467773, 0.00027441978454589844, 0.00029665231704711914, 0.00031888484954833984, 0.00034111738204956055, 0.00036334991455078125, 0.00038558244705200195, 0.00040781497955322266, 0.00043004751205444336, 0.00045228004455566406, 0.00047451257705688477, 0.0004967451095581055, 0.0005189776420593262, 0.0005412101745605469, 0.0005634427070617676, 0.0005856752395629883, 0.000607907772064209, 0.0006301403045654297, 0.0006523728370666504, 0.0006746053695678711, 0.0006968379020690918, 0.0007190704345703125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 6.0, 2.0, 5.0, 13.0, 14.0, 23.0, 35.0, 40.0, 82.0, 94.0, 138.0, 169.0, 238.0, 317.0, 451.0, 588.0, 759.0, 1026.0, 1457.0, 1897.0, 2376.0, 3238.0, 4186.0, 5595.0, 7671.0, 11759.0, 41326.0, 741896.0, 170018.0, 17919.0, 8865.0, 6396.0, 5033.0, 3720.0, 2915.0, 2098.0, 1565.0, 1190.0, 897.0, 670.0, 461.0, 396.0, 280.0, 238.0, 136.0, 113.0, 88.0, 47.0, 50.0, 23.0, 22.0, 9.0, 8.0, 5.0, 4.0, 4.0, 0.0, 0.0, 1.0], "bins": [-6.0, -5.8167724609375, -5.633544921875, -5.4503173828125, -5.26708984375, -5.0838623046875, -4.900634765625, -4.7174072265625, -4.5341796875, -4.3509521484375, -4.167724609375, -3.9844970703125, -3.80126953125, -3.6180419921875, -3.434814453125, -3.2515869140625, -3.068359375, -2.8851318359375, -2.701904296875, -2.5186767578125, -2.33544921875, -2.1522216796875, -1.968994140625, -1.7857666015625, -1.6025390625, -1.4193115234375, -1.236083984375, -1.0528564453125, -0.86962890625, -0.6864013671875, -0.503173828125, -0.3199462890625, -0.13671875, 0.0465087890625, 0.229736328125, 0.4129638671875, 0.59619140625, 0.7794189453125, 0.962646484375, 1.1458740234375, 1.3291015625, 1.5123291015625, 1.695556640625, 1.8787841796875, 2.06201171875, 2.2452392578125, 2.428466796875, 2.6116943359375, 2.794921875, 2.9781494140625, 3.161376953125, 3.3446044921875, 3.52783203125, 3.7110595703125, 3.894287109375, 4.0775146484375, 4.2607421875, 4.4439697265625, 4.627197265625, 4.8104248046875, 4.99365234375, 5.1768798828125, 5.360107421875, 5.5433349609375, 5.7265625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 0.0, 5.0, 1.0, 0.0, 3.0, 4.0, 5.0, 2.0, 1.0, 1.0, 2.0, 6.0, 2.0, 1.0, 8.0, 2.0, 2.0, 13.0, 32.0, 93.0, 278.0, 349.0, 101.0, 31.0, 9.0, 4.0, 3.0, 3.0, 2.0, 5.0, 3.0, 4.0, 8.0, 3.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.732421875, -2.644439697265625, -2.55645751953125, -2.468475341796875, -2.3804931640625, -2.292510986328125, -2.20452880859375, -2.116546630859375, -2.028564453125, -1.940582275390625, -1.85260009765625, -1.764617919921875, -1.6766357421875, -1.588653564453125, -1.50067138671875, -1.412689208984375, -1.32470703125, -1.236724853515625, -1.14874267578125, -1.060760498046875, -0.9727783203125, -0.884796142578125, -0.79681396484375, -0.708831787109375, -0.620849609375, -0.532867431640625, -0.44488525390625, -0.356903076171875, -0.2689208984375, -0.180938720703125, -0.09295654296875, -0.004974365234375, 0.0830078125, 0.170989990234375, 0.25897216796875, 0.346954345703125, 0.4349365234375, 0.522918701171875, 0.61090087890625, 0.698883056640625, 0.786865234375, 0.874847412109375, 0.96282958984375, 1.050811767578125, 1.1387939453125, 1.226776123046875, 1.31475830078125, 1.402740478515625, 1.49072265625, 1.578704833984375, 1.66668701171875, 1.754669189453125, 1.8426513671875, 1.930633544921875, 2.01861572265625, 2.106597900390625, 2.194580078125, 2.282562255859375, 2.37054443359375, 2.458526611328125, 2.5465087890625, 2.634490966796875, 2.72247314453125, 2.810455322265625, 2.8984375]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 6.0, 3.0, 4.0, 1.0, 7.0, 7.0, 6.0, 11.0, 12.0, 16.0, 30.0, 29.0, 36.0, 25.0, 34.0, 42.0, 46.0, 49.0, 35.0, 49.0, 53.0, 44.0, 48.0, 43.0, 34.0, 44.0, 40.0, 33.0, 28.0, 26.0, 20.0, 24.0, 32.0, 12.0, 16.0, 19.0, 9.0, 10.0, 4.0, 5.0, 4.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-52.17606735229492, -50.65773010253906, -49.1393928527832, -47.621055603027344, -46.102718353271484, -44.584381103515625, -43.06604766845703, -41.547706604003906, -40.02937316894531, -38.51103591918945, -36.992698669433594, -35.474361419677734, -33.956024169921875, -32.437686920166016, -30.91935157775879, -29.40101432800293, -27.882675170898438, -26.364337921142578, -24.84600067138672, -23.32766342163086, -21.809326171875, -20.29098892211914, -18.772653579711914, -17.254316329956055, -15.735979080200195, -14.217641830444336, -12.699304580688477, -11.180968284606934, -9.662631034851074, -8.144293785095215, -6.625957489013672, -5.1076202392578125, -3.5892791748046875, -2.0709421634674072, -0.552605152130127, 0.9657316207885742, 2.4840688705444336, 4.002406120300293, 5.520742416381836, 7.039079666137695, 8.557416915893555, 10.075754165649414, 11.594091415405273, 13.112427711486816, 14.630764961242676, 16.14910125732422, 17.667438507080078, 19.185775756835938, 20.704113006591797, 22.222450256347656, 23.740787506103516, 25.259124755859375, 26.777462005615234, 28.295799255371094, 29.81413459777832, 31.33247184753418, 32.850807189941406, 34.369144439697266, 35.887481689453125, 37.405818939208984, 38.924156188964844, 40.4424934387207, 41.96083068847656, 43.479164123535156, 44.99750518798828]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 5.0, 5.0, 6.0, 9.0, 8.0, 10.0, 16.0, 18.0, 22.0, 32.0, 25.0, 31.0, 24.0, 36.0, 32.0, 35.0, 42.0, 34.0, 37.0, 41.0, 48.0, 45.0, 39.0, 27.0, 44.0, 35.0, 35.0, 21.0, 33.0, 41.0, 32.0, 25.0, 27.0, 22.0, 8.0, 9.0, 12.0, 7.0, 10.0, 6.0, 3.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-64.53321075439453, -62.77570343017578, -61.01819610595703, -59.26068878173828, -57.503177642822266, -55.745670318603516, -53.988162994384766, -52.230655670166016, -50.473148345947266, -48.715641021728516, -46.958133697509766, -45.20062255859375, -43.443115234375, -41.68560791015625, -39.9281005859375, -38.17059326171875, -36.4130859375, -34.65557861328125, -32.8980712890625, -31.140562057495117, -29.383054733276367, -27.625545501708984, -25.868038177490234, -24.110530853271484, -22.35301971435547, -20.59551239013672, -18.838003158569336, -17.080495834350586, -15.322988510131836, -13.56548023223877, -11.807971954345703, -10.050464630126953, -8.292957305908203, -6.535449504852295, -4.777941703796387, -3.0204334259033203, -1.262925624847412, 0.4945821762084961, 2.2520904541015625, 4.0095977783203125, 5.767106056213379, 7.524613857269287, 9.282121658325195, 11.039629936218262, 12.797138214111328, 14.554645538330078, 16.312152862548828, 18.069660186767578, 19.82716941833496, 21.58467674255371, 23.342185974121094, 25.099693298339844, 26.857200622558594, 28.614707946777344, 30.372217178344727, 32.129722595214844, 33.88723373413086, 35.64474105834961, 37.40224838256836, 39.159759521484375, 40.917266845703125, 42.674774169921875, 44.432281494140625, 46.189788818359375, 47.947296142578125]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 2.0, 7.0, 9.0, 15.0, 27.0, 47.0, 52.0, 83.0, 132.0, 199.0, 349.0, 551.0, 857.0, 1369.0, 2216.0, 3621.0, 5952.0, 9685.0, 15942.0, 26044.0, 42837.0, 66857.0, 99289.0, 133961.0, 153909.0, 146505.0, 116657.0, 82155.0, 53337.0, 33227.0, 20410.0, 12336.0, 7571.0, 4742.0, 2908.0, 1782.0, 1114.0, 678.0, 431.0, 252.0, 147.0, 114.0, 61.0, 33.0, 24.0, 20.0, 19.0, 5.0, 9.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0], "bins": [-57.375, -55.6748046875, -53.974609375, -52.2744140625, -50.57421875, -48.8740234375, -47.173828125, -45.4736328125, -43.7734375, -42.0732421875, -40.373046875, -38.6728515625, -36.97265625, -35.2724609375, -33.572265625, -31.8720703125, -30.171875, -28.4716796875, -26.771484375, -25.0712890625, -23.37109375, -21.6708984375, -19.970703125, -18.2705078125, -16.5703125, -14.8701171875, -13.169921875, -11.4697265625, -9.76953125, -8.0693359375, -6.369140625, -4.6689453125, -2.96875, -1.2685546875, 0.431640625, 2.1318359375, 3.83203125, 5.5322265625, 7.232421875, 8.9326171875, 10.6328125, 12.3330078125, 14.033203125, 15.7333984375, 17.43359375, 19.1337890625, 20.833984375, 22.5341796875, 24.234375, 25.9345703125, 27.634765625, 29.3349609375, 31.03515625, 32.7353515625, 34.435546875, 36.1357421875, 37.8359375, 39.5361328125, 41.236328125, 42.9365234375, 44.63671875, 46.3369140625, 48.037109375, 49.7373046875, 51.4375]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 2.0, 7.0, 8.0, 7.0, 10.0, 8.0, 20.0, 15.0, 21.0, 36.0, 25.0, 29.0, 28.0, 31.0, 33.0, 36.0, 37.0, 39.0, 39.0, 44.0, 46.0, 49.0, 31.0, 29.0, 42.0, 35.0, 35.0, 23.0, 34.0, 35.0, 37.0, 27.0, 25.0, 16.0, 10.0, 12.0, 10.0, 8.0, 10.0, 2.0, 4.0, 4.0, 5.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-59.28125, -57.65869140625, -56.0361328125, -54.41357421875, -52.791015625, -51.16845703125, -49.5458984375, -47.92333984375, -46.30078125, -44.67822265625, -43.0556640625, -41.43310546875, -39.810546875, -38.18798828125, -36.5654296875, -34.94287109375, -33.3203125, -31.69775390625, -30.0751953125, -28.45263671875, -26.830078125, -25.20751953125, -23.5849609375, -21.96240234375, -20.33984375, -18.71728515625, -17.0947265625, -15.47216796875, -13.849609375, -12.22705078125, -10.6044921875, -8.98193359375, -7.359375, -5.73681640625, -4.1142578125, -2.49169921875, -0.869140625, 0.75341796875, 2.3759765625, 3.99853515625, 5.62109375, 7.24365234375, 8.8662109375, 10.48876953125, 12.111328125, 13.73388671875, 15.3564453125, 16.97900390625, 18.6015625, 20.22412109375, 21.8466796875, 23.46923828125, 25.091796875, 26.71435546875, 28.3369140625, 29.95947265625, 31.58203125, 33.20458984375, 34.8271484375, 36.44970703125, 38.072265625, 39.69482421875, 41.3173828125, 42.93994140625, 44.5625]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 10.0, 8.0, 6.0, 22.0, 25.0, 44.0, 71.0, 95.0, 115.0, 207.0, 287.0, 443.0, 706.0, 1101.0, 1648.0, 2603.0, 4088.0, 6500.0, 10455.0, 16912.0, 27423.0, 44468.0, 68803.0, 101726.0, 134035.0, 152934.0, 142923.0, 114173.0, 79485.0, 51969.0, 32100.0, 19942.0, 12160.0, 7525.0, 4822.0, 3008.0, 2037.0, 1324.0, 804.0, 539.0, 342.0, 251.0, 120.0, 107.0, 69.0, 35.0, 40.0, 16.0, 12.0, 9.0, 6.0, 9.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-55.71875, -53.95947265625, -52.2001953125, -50.44091796875, -48.681640625, -46.92236328125, -45.1630859375, -43.40380859375, -41.64453125, -39.88525390625, -38.1259765625, -36.36669921875, -34.607421875, -32.84814453125, -31.0888671875, -29.32958984375, -27.5703125, -25.81103515625, -24.0517578125, -22.29248046875, -20.533203125, -18.77392578125, -17.0146484375, -15.25537109375, -13.49609375, -11.73681640625, -9.9775390625, -8.21826171875, -6.458984375, -4.69970703125, -2.9404296875, -1.18115234375, 0.578125, 2.33740234375, 4.0966796875, 5.85595703125, 7.615234375, 9.37451171875, 11.1337890625, 12.89306640625, 14.65234375, 16.41162109375, 18.1708984375, 19.93017578125, 21.689453125, 23.44873046875, 25.2080078125, 26.96728515625, 28.7265625, 30.48583984375, 32.2451171875, 34.00439453125, 35.763671875, 37.52294921875, 39.2822265625, 41.04150390625, 42.80078125, 44.56005859375, 46.3193359375, 48.07861328125, 49.837890625, 51.59716796875, 53.3564453125, 55.11572265625, 56.875]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 7.0, 6.0, 12.0, 11.0, 12.0, 20.0, 22.0, 21.0, 15.0, 30.0, 29.0, 34.0, 28.0, 32.0, 38.0, 43.0, 49.0, 36.0, 49.0, 55.0, 50.0, 41.0, 30.0, 36.0, 31.0, 38.0, 35.0, 27.0, 30.0, 26.0, 22.0, 22.0, 16.0, 12.0, 6.0, 9.0, 3.0, 3.0, 10.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-38.875, -37.71533203125, -36.5556640625, -35.39599609375, -34.236328125, -33.07666015625, -31.9169921875, -30.75732421875, -29.59765625, -28.43798828125, -27.2783203125, -26.11865234375, -24.958984375, -23.79931640625, -22.6396484375, -21.47998046875, -20.3203125, -19.16064453125, -18.0009765625, -16.84130859375, -15.681640625, -14.52197265625, -13.3623046875, -12.20263671875, -11.04296875, -9.88330078125, -8.7236328125, -7.56396484375, -6.404296875, -5.24462890625, -4.0849609375, -2.92529296875, -1.765625, -0.60595703125, 0.5537109375, 1.71337890625, 2.873046875, 4.03271484375, 5.1923828125, 6.35205078125, 7.51171875, 8.67138671875, 9.8310546875, 10.99072265625, 12.150390625, 13.31005859375, 14.4697265625, 15.62939453125, 16.7890625, 17.94873046875, 19.1083984375, 20.26806640625, 21.427734375, 22.58740234375, 23.7470703125, 24.90673828125, 26.06640625, 27.22607421875, 28.3857421875, 29.54541015625, 30.705078125, 31.86474609375, 33.0244140625, 34.18408203125, 35.34375]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 5.0, 4.0, 9.0, 11.0, 16.0, 15.0, 43.0, 50.0, 57.0, 95.0, 149.0, 235.0, 395.0, 594.0, 920.0, 1438.0, 2275.0, 3565.0, 5956.0, 10018.0, 16468.0, 28210.0, 45877.0, 72910.0, 107595.0, 140918.0, 155952.0, 143359.0, 111661.0, 76942.0, 48418.0, 29496.0, 17675.0, 10565.0, 6259.0, 3933.0, 2380.0, 1440.0, 904.0, 580.0, 405.0, 232.0, 187.0, 119.0, 69.0, 55.0, 39.0, 29.0, 13.0, 13.0, 6.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.859375, -8.57861328125, -8.2978515625, -8.01708984375, -7.736328125, -7.45556640625, -7.1748046875, -6.89404296875, -6.61328125, -6.33251953125, -6.0517578125, -5.77099609375, -5.490234375, -5.20947265625, -4.9287109375, -4.64794921875, -4.3671875, -4.08642578125, -3.8056640625, -3.52490234375, -3.244140625, -2.96337890625, -2.6826171875, -2.40185546875, -2.12109375, -1.84033203125, -1.5595703125, -1.27880859375, -0.998046875, -0.71728515625, -0.4365234375, -0.15576171875, 0.125, 0.40576171875, 0.6865234375, 0.96728515625, 1.248046875, 1.52880859375, 1.8095703125, 2.09033203125, 2.37109375, 2.65185546875, 2.9326171875, 3.21337890625, 3.494140625, 3.77490234375, 4.0556640625, 4.33642578125, 4.6171875, 4.89794921875, 5.1787109375, 5.45947265625, 5.740234375, 6.02099609375, 6.3017578125, 6.58251953125, 6.86328125, 7.14404296875, 7.4248046875, 7.70556640625, 7.986328125, 8.26708984375, 8.5478515625, 8.82861328125, 9.109375]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 3.0, 6.0, 2.0, 11.0, 5.0, 8.0, 7.0, 16.0, 14.0, 27.0, 30.0, 22.0, 35.0, 30.0, 55.0, 35.0, 46.0, 37.0, 56.0, 65.0, 61.0, 52.0, 54.0, 55.0, 45.0, 45.0, 37.0, 28.0, 18.0, 18.0, 22.0, 9.0, 12.0, 13.0, 3.0, 2.0, 5.0, 3.0, 1.0, 2.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0008630752563476562, -0.0008341819047927856, -0.000805288553237915, -0.0007763952016830444, -0.0007475018501281738, -0.0007186084985733032, -0.0006897151470184326, -0.000660821795463562, -0.0006319284439086914, -0.0006030350923538208, -0.0005741417407989502, -0.0005452483892440796, -0.000516355037689209, -0.0004874616861343384, -0.0004585683345794678, -0.00042967498302459717, -0.00040078163146972656, -0.00037188827991485596, -0.00034299492835998535, -0.00031410157680511475, -0.00028520822525024414, -0.00025631487369537354, -0.00022742152214050293, -0.00019852817058563232, -0.00016963481903076172, -0.0001407414674758911, -0.00011184811592102051, -8.29547643661499e-05, -5.40614128112793e-05, -2.516806125640869e-05, 3.725290298461914e-06, 3.261864185333252e-05, 6.151199340820312e-05, 9.040534496307373e-05, 0.00011929869651794434, 0.00014819204807281494, 0.00017708539962768555, 0.00020597875118255615, 0.00023487210273742676, 0.00026376545429229736, 0.00029265880584716797, 0.0003215521574020386, 0.0003504455089569092, 0.0003793388605117798, 0.0004082322120666504, 0.000437125563621521, 0.0004660189151763916, 0.0004949122667312622, 0.0005238056182861328, 0.0005526989698410034, 0.000581592321395874, 0.0006104856729507446, 0.0006393790245056152, 0.0006682723760604858, 0.0006971657276153564, 0.000726059079170227, 0.0007549524307250977, 0.0007838457822799683, 0.0008127391338348389, 0.0008416324853897095, 0.0008705258369445801, 0.0008994191884994507, 0.0009283125400543213, 0.0009572058916091919, 0.0009860992431640625]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 5.0, 5.0, 12.0, 18.0, 20.0, 21.0, 45.0, 54.0, 80.0, 151.0, 242.0, 314.0, 471.0, 766.0, 1087.0, 1821.0, 2912.0, 4685.0, 7796.0, 12779.0, 21277.0, 34612.0, 55384.0, 84594.0, 117943.0, 144480.0, 150322.0, 131099.0, 98778.0, 67036.0, 42352.0, 26174.0, 16128.0, 9493.0, 5774.0, 3579.0, 2318.0, 1412.0, 919.0, 541.0, 362.0, 244.0, 152.0, 96.0, 69.0, 63.0, 24.0, 23.0, 10.0, 9.0, 3.0, 7.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.453125, -8.17333984375, -7.8935546875, -7.61376953125, -7.333984375, -7.05419921875, -6.7744140625, -6.49462890625, -6.21484375, -5.93505859375, -5.6552734375, -5.37548828125, -5.095703125, -4.81591796875, -4.5361328125, -4.25634765625, -3.9765625, -3.69677734375, -3.4169921875, -3.13720703125, -2.857421875, -2.57763671875, -2.2978515625, -2.01806640625, -1.73828125, -1.45849609375, -1.1787109375, -0.89892578125, -0.619140625, -0.33935546875, -0.0595703125, 0.22021484375, 0.5, 0.77978515625, 1.0595703125, 1.33935546875, 1.619140625, 1.89892578125, 2.1787109375, 2.45849609375, 2.73828125, 3.01806640625, 3.2978515625, 3.57763671875, 3.857421875, 4.13720703125, 4.4169921875, 4.69677734375, 4.9765625, 5.25634765625, 5.5361328125, 5.81591796875, 6.095703125, 6.37548828125, 6.6552734375, 6.93505859375, 7.21484375, 7.49462890625, 7.7744140625, 8.05419921875, 8.333984375, 8.61376953125, 8.8935546875, 9.17333984375, 9.453125]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 6.0, 6.0, 2.0, 7.0, 9.0, 14.0, 11.0, 20.0, 21.0, 26.0, 21.0, 37.0, 47.0, 43.0, 30.0, 45.0, 61.0, 48.0, 52.0, 46.0, 51.0, 55.0, 55.0, 49.0, 22.0, 39.0, 37.0, 21.0, 25.0, 14.0, 16.0, 15.0, 16.0, 9.0, 5.0, 2.0, 6.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.55078125, -3.42864990234375, -3.3065185546875, -3.18438720703125, -3.062255859375, -2.94012451171875, -2.8179931640625, -2.69586181640625, -2.57373046875, -2.45159912109375, -2.3294677734375, -2.20733642578125, -2.085205078125, -1.96307373046875, -1.8409423828125, -1.71881103515625, -1.5966796875, -1.47454833984375, -1.3524169921875, -1.23028564453125, -1.108154296875, -0.98602294921875, -0.8638916015625, -0.74176025390625, -0.61962890625, -0.49749755859375, -0.3753662109375, -0.25323486328125, -0.131103515625, -0.00897216796875, 0.1131591796875, 0.23529052734375, 0.357421875, 0.47955322265625, 0.6016845703125, 0.72381591796875, 0.845947265625, 0.96807861328125, 1.0902099609375, 1.21234130859375, 1.33447265625, 1.45660400390625, 1.5787353515625, 1.70086669921875, 1.822998046875, 1.94512939453125, 2.0672607421875, 2.18939208984375, 2.3115234375, 2.43365478515625, 2.5557861328125, 2.67791748046875, 2.800048828125, 2.92218017578125, 3.0443115234375, 3.16644287109375, 3.28857421875, 3.41070556640625, 3.5328369140625, 3.65496826171875, 3.777099609375, 3.89923095703125, 4.0213623046875, 4.14349365234375, 4.265625]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 4.0, 5.0, 2.0, 4.0, 5.0, 6.0, 10.0, 21.0, 15.0, 23.0, 21.0, 38.0, 40.0, 44.0, 47.0, 40.0, 53.0, 51.0, 60.0, 48.0, 54.0, 46.0, 56.0, 43.0, 35.0, 34.0, 25.0, 25.0, 28.0, 23.0, 22.0, 22.0, 11.0, 9.0, 11.0, 10.0, 5.0, 6.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-56.57524871826172, -54.92955780029297, -53.283870697021484, -51.638179779052734, -49.99249267578125, -48.3468017578125, -46.70111083984375, -45.055423736572266, -43.40973663330078, -41.76404571533203, -40.11835861206055, -38.4726676940918, -36.82698059082031, -35.18128967285156, -33.53559875488281, -31.889911651611328, -30.244220733642578, -28.59853172302246, -26.952842712402344, -25.307151794433594, -23.66146469116211, -22.01577377319336, -20.370084762573242, -18.724395751953125, -17.078706741333008, -15.43301773071289, -13.787328720092773, -12.14163875579834, -10.495949745178223, -8.850260734558105, -7.204570770263672, -5.558881759643555, -3.9131927490234375, -2.267503499984741, -0.6218142509460449, 1.0238752365112305, 2.6695642471313477, 4.315253257751465, 5.960943222045898, 7.606632232666016, 9.252321243286133, 10.89801025390625, 12.543699264526367, 14.1893892288208, 15.835078239440918, 17.48076629638672, 19.12645721435547, 20.772146224975586, 22.417835235595703, 24.06352424621582, 25.709213256835938, 27.354904174804688, 29.000591278076172, 30.646282196044922, 32.291969299316406, 33.937660217285156, 35.583351135253906, 37.229042053222656, 38.87472915649414, 40.52042007446289, 42.166107177734375, 43.811798095703125, 45.457489013671875, 47.10317611694336, 48.748863220214844]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 6.0, 7.0, 5.0, 8.0, 13.0, 9.0, 21.0, 15.0, 19.0, 21.0, 23.0, 22.0, 28.0, 45.0, 32.0, 38.0, 46.0, 41.0, 33.0, 35.0, 38.0, 43.0, 37.0, 41.0, 35.0, 33.0, 26.0, 29.0, 34.0, 31.0, 28.0, 22.0, 27.0, 21.0, 17.0, 15.0, 7.0, 15.0, 3.0, 8.0, 3.0, 6.0, 6.0, 11.0, 4.0, 0.0, 2.0], "bins": [-68.23397064208984, -66.43486022949219, -64.6357421875, -62.83662796020508, -61.037513732910156, -59.238399505615234, -57.43928527832031, -55.64017105102539, -53.84105682373047, -52.04194259643555, -50.242828369140625, -48.4437141418457, -46.64459991455078, -44.84548568725586, -43.04637145996094, -41.247257232666016, -39.448143005371094, -37.64902877807617, -35.84991455078125, -34.05080032348633, -32.251686096191406, -30.452571868896484, -28.653457641601562, -26.85434341430664, -25.05522918701172, -23.256114959716797, -21.457000732421875, -19.657886505126953, -17.85877227783203, -16.05965805053711, -14.260543823242188, -12.461429595947266, -10.662311553955078, -8.863197326660156, -7.064083099365234, -5.2649688720703125, -3.4658546447753906, -1.6667404174804688, 0.13237380981445312, 1.931488037109375, 3.730602264404297, 5.529716491699219, 7.328830718994141, 9.127944946289062, 10.927059173583984, 12.726173400878906, 14.525287628173828, 16.32440185546875, 18.123516082763672, 19.922630310058594, 21.721744537353516, 23.520858764648438, 25.31997299194336, 27.11908721923828, 28.918201446533203, 30.717315673828125, 32.51642990112305, 34.31554412841797, 36.11465835571289, 37.91377258300781, 39.712886810302734, 41.512001037597656, 43.31111526489258, 45.1102294921875, 46.90934371948242]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 7.0, 8.0, 8.0, 23.0, 25.0, 37.0, 72.0, 98.0, 187.0, 260.0, 437.0, 675.0, 1204.0, 1892.0, 3176.0, 5225.0, 8844.0, 14818.0, 25631.0, 44137.0, 76910.0, 137416.0, 248990.0, 446291.0, 693476.0, 819603.0, 682336.0, 432085.0, 240646.0, 132440.0, 74672.0, 42597.0, 24514.0, 14330.0, 8486.0, 5067.0, 3049.0, 1888.0, 1084.0, 645.0, 338.0, 237.0, 150.0, 96.0, 62.0, 39.0, 27.0, 17.0, 14.0, 8.0, 5.0, 2.0, 1.0, 2.0, 2.0, 3.0], "bins": [-52.6875, -51.11328125, -49.5390625, -47.96484375, -46.390625, -44.81640625, -43.2421875, -41.66796875, -40.09375, -38.51953125, -36.9453125, -35.37109375, -33.796875, -32.22265625, -30.6484375, -29.07421875, -27.5, -25.92578125, -24.3515625, -22.77734375, -21.203125, -19.62890625, -18.0546875, -16.48046875, -14.90625, -13.33203125, -11.7578125, -10.18359375, -8.609375, -7.03515625, -5.4609375, -3.88671875, -2.3125, -0.73828125, 0.8359375, 2.41015625, 3.984375, 5.55859375, 7.1328125, 8.70703125, 10.28125, 11.85546875, 13.4296875, 15.00390625, 16.578125, 18.15234375, 19.7265625, 21.30078125, 22.875, 24.44921875, 26.0234375, 27.59765625, 29.171875, 30.74609375, 32.3203125, 33.89453125, 35.46875, 37.04296875, 38.6171875, 40.19140625, 41.765625, 43.33984375, 44.9140625, 46.48828125, 48.0625]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 7.0, 10.0, 4.0, 5.0, 13.0, 16.0, 15.0, 18.0, 23.0, 12.0, 31.0, 19.0, 33.0, 38.0, 42.0, 42.0, 42.0, 35.0, 36.0, 30.0, 42.0, 38.0, 37.0, 45.0, 37.0, 31.0, 30.0, 28.0, 36.0, 30.0, 20.0, 31.0, 23.0, 17.0, 21.0, 10.0, 7.0, 13.0, 5.0, 7.0, 3.0, 7.0, 8.0, 7.0, 4.0, 0.0, 2.0], "bins": [-51.34375, -49.982421875, -48.62109375, -47.259765625, -45.8984375, -44.537109375, -43.17578125, -41.814453125, -40.453125, -39.091796875, -37.73046875, -36.369140625, -35.0078125, -33.646484375, -32.28515625, -30.923828125, -29.5625, -28.201171875, -26.83984375, -25.478515625, -24.1171875, -22.755859375, -21.39453125, -20.033203125, -18.671875, -17.310546875, -15.94921875, -14.587890625, -13.2265625, -11.865234375, -10.50390625, -9.142578125, -7.78125, -6.419921875, -5.05859375, -3.697265625, -2.3359375, -0.974609375, 0.38671875, 1.748046875, 3.109375, 4.470703125, 5.83203125, 7.193359375, 8.5546875, 9.916015625, 11.27734375, 12.638671875, 14.0, 15.361328125, 16.72265625, 18.083984375, 19.4453125, 20.806640625, 22.16796875, 23.529296875, 24.890625, 26.251953125, 27.61328125, 28.974609375, 30.3359375, 31.697265625, 33.05859375, 34.419921875, 35.78125]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 7.0, 14.0, 27.0, 44.0, 86.0, 133.0, 194.0, 300.0, 453.0, 772.0, 1274.0, 1880.0, 3036.0, 4875.0, 7985.0, 12791.0, 20976.0, 34567.0, 55912.0, 90119.0, 143555.0, 221060.0, 325174.0, 443255.0, 542526.0, 572933.0, 513131.0, 401752.0, 283977.0, 190072.0, 121504.0, 76435.0, 46671.0, 29185.0, 18160.0, 11052.0, 6761.0, 4246.0, 2707.0, 1616.0, 1060.0, 736.0, 452.0, 301.0, 182.0, 114.0, 75.0, 53.0, 34.0, 19.0, 15.0, 10.0, 8.0, 3.0, 2.0, 3.0, 2.0], "bins": [-37.40625, -36.2490234375, -35.091796875, -33.9345703125, -32.77734375, -31.6201171875, -30.462890625, -29.3056640625, -28.1484375, -26.9912109375, -25.833984375, -24.6767578125, -23.51953125, -22.3623046875, -21.205078125, -20.0478515625, -18.890625, -17.7333984375, -16.576171875, -15.4189453125, -14.26171875, -13.1044921875, -11.947265625, -10.7900390625, -9.6328125, -8.4755859375, -7.318359375, -6.1611328125, -5.00390625, -3.8466796875, -2.689453125, -1.5322265625, -0.375, 0.7822265625, 1.939453125, 3.0966796875, 4.25390625, 5.4111328125, 6.568359375, 7.7255859375, 8.8828125, 10.0400390625, 11.197265625, 12.3544921875, 13.51171875, 14.6689453125, 15.826171875, 16.9833984375, 18.140625, 19.2978515625, 20.455078125, 21.6123046875, 22.76953125, 23.9267578125, 25.083984375, 26.2412109375, 27.3984375, 28.5556640625, 29.712890625, 30.8701171875, 32.02734375, 33.1845703125, 34.341796875, 35.4990234375, 36.65625]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 7.0, 11.0, 9.0, 5.0, 8.0, 16.0, 17.0, 15.0, 25.0, 28.0, 40.0, 50.0, 55.0, 77.0, 74.0, 83.0, 125.0, 153.0, 162.0, 163.0, 202.0, 224.0, 250.0, 233.0, 245.0, 214.0, 230.0, 220.0, 202.0, 160.0, 150.0, 127.0, 114.0, 82.0, 63.0, 56.0, 35.0, 35.0, 30.0, 25.0, 19.0, 14.0, 14.0, 4.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.71875, -22.068115234375, -21.41748046875, -20.766845703125, -20.1162109375, -19.465576171875, -18.81494140625, -18.164306640625, -17.513671875, -16.863037109375, -16.21240234375, -15.561767578125, -14.9111328125, -14.260498046875, -13.60986328125, -12.959228515625, -12.30859375, -11.657958984375, -11.00732421875, -10.356689453125, -9.7060546875, -9.055419921875, -8.40478515625, -7.754150390625, -7.103515625, -6.452880859375, -5.80224609375, -5.151611328125, -4.5009765625, -3.850341796875, -3.19970703125, -2.549072265625, -1.8984375, -1.247802734375, -0.59716796875, 0.053466796875, 0.7041015625, 1.354736328125, 2.00537109375, 2.656005859375, 3.306640625, 3.957275390625, 4.60791015625, 5.258544921875, 5.9091796875, 6.559814453125, 7.21044921875, 7.861083984375, 8.51171875, 9.162353515625, 9.81298828125, 10.463623046875, 11.1142578125, 11.764892578125, 12.41552734375, 13.066162109375, 13.716796875, 14.367431640625, 15.01806640625, 15.668701171875, 16.3193359375, 16.969970703125, 17.62060546875, 18.271240234375, 18.921875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 6.0, 6.0, 8.0, 6.0, 15.0, 14.0, 12.0, 22.0, 32.0, 25.0, 29.0, 41.0, 57.0, 50.0, 43.0, 51.0, 51.0, 57.0, 64.0, 70.0, 46.0, 39.0, 45.0, 38.0, 31.0, 20.0, 29.0, 21.0, 13.0, 19.0, 13.0, 9.0, 6.0, 8.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.83911895751953, -48.321170806884766, -46.80322265625, -45.285274505615234, -43.76732635498047, -42.24938201904297, -40.7314338684082, -39.21348571777344, -37.69553756713867, -36.177589416503906, -34.65964126586914, -33.141693115234375, -31.623746871948242, -30.105798721313477, -28.587852478027344, -27.069904327392578, -25.551956176757812, -24.034008026123047, -22.51605987548828, -20.99811363220215, -19.480165481567383, -17.962217330932617, -16.444271087646484, -14.926322937011719, -13.408374786376953, -11.890426635742188, -10.372479438781738, -8.854532241821289, -7.336584091186523, -5.818636417388916, -4.300688743591309, -2.7827415466308594, -1.2647972106933594, 0.25315046310424805, 1.7710981369018555, 3.289045810699463, 4.80699348449707, 6.324941158294678, 7.842888832092285, 9.360836029052734, 10.8787841796875, 12.396732330322266, 13.914679527282715, 15.432626724243164, 16.95057487487793, 18.468523025512695, 19.986469268798828, 21.504417419433594, 23.02236557006836, 24.540313720703125, 26.05826187133789, 27.576208114624023, 29.09415626525879, 30.612104415893555, 32.13005065917969, 33.64799880981445, 35.16594696044922, 36.683895111083984, 38.20184326171875, 39.719791412353516, 41.23773956298828, 42.75568389892578, 44.27363204956055, 45.79158020019531, 47.30952835083008]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 4.0, 8.0, 16.0, 12.0, 5.0, 15.0, 19.0, 21.0, 24.0, 21.0, 32.0, 34.0, 34.0, 39.0, 39.0, 38.0, 39.0, 49.0, 42.0, 41.0, 31.0, 34.0, 45.0, 35.0, 52.0, 28.0, 24.0, 24.0, 33.0, 30.0, 21.0, 18.0, 18.0, 18.0, 15.0, 14.0, 6.0, 9.0, 4.0, 3.0, 4.0, 3.0, 0.0, 3.0, 0.0, 1.0, 3.0], "bins": [-59.58509826660156, -57.944766998291016, -56.30443572998047, -54.664100646972656, -53.02376937866211, -51.38343811035156, -49.743106842041016, -48.10277557373047, -46.46244430541992, -44.822113037109375, -43.18178176879883, -41.54145050048828, -39.90111541748047, -38.26078414916992, -36.620452880859375, -34.98012161254883, -33.33979034423828, -31.699459075927734, -30.059125900268555, -28.418794631958008, -26.77846336364746, -25.13813018798828, -23.497798919677734, -21.857467651367188, -20.217132568359375, -18.576801300048828, -16.93646812438965, -15.296136856079102, -13.655805587768555, -12.015473365783691, -10.375141143798828, -8.734809875488281, -7.094478607177734, -5.454146862030029, -3.813814878463745, -2.173482894897461, -0.5331511497497559, 1.1071805953979492, 2.7475128173828125, 4.387844085693359, 6.028176307678223, 7.668508052825928, 9.308839797973633, 10.949172019958496, 12.58950424194336, 14.229835510253906, 15.87016773223877, 17.510498046875, 19.15083122253418, 20.791162490844727, 22.431495666503906, 24.071826934814453, 25.712158203125, 27.352489471435547, 28.992822647094727, 30.633153915405273, 32.27348709106445, 33.913818359375, 35.55414962768555, 37.194480895996094, 38.834815979003906, 40.47514724731445, 42.115478515625, 43.75580978393555, 45.396141052246094]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 8.0, 12.0, 7.0, 29.0, 35.0, 61.0, 82.0, 118.0, 200.0, 295.0, 411.0, 656.0, 1053.0, 1512.0, 2458.0, 3635.0, 5817.0, 8788.0, 14130.0, 22258.0, 33676.0, 50706.0, 72776.0, 100467.0, 125474.0, 136267.0, 128067.0, 104875.0, 78184.0, 54258.0, 36000.0, 23585.0, 15091.0, 9794.0, 6253.0, 4066.0, 2624.0, 1728.0, 1070.0, 730.0, 457.0, 298.0, 184.0, 123.0, 85.0, 50.0, 40.0, 27.0, 13.0, 10.0, 10.0, 3.0, 5.0, 5.0, 0.0, 1.0], "bins": [-15.1328125, -14.6822509765625, -14.231689453125, -13.7811279296875, -13.33056640625, -12.8800048828125, -12.429443359375, -11.9788818359375, -11.5283203125, -11.0777587890625, -10.627197265625, -10.1766357421875, -9.72607421875, -9.2755126953125, -8.824951171875, -8.3743896484375, -7.923828125, -7.4732666015625, -7.022705078125, -6.5721435546875, -6.12158203125, -5.6710205078125, -5.220458984375, -4.7698974609375, -4.3193359375, -3.8687744140625, -3.418212890625, -2.9676513671875, -2.51708984375, -2.0665283203125, -1.615966796875, -1.1654052734375, -0.71484375, -0.2642822265625, 0.186279296875, 0.6368408203125, 1.08740234375, 1.5379638671875, 1.988525390625, 2.4390869140625, 2.8896484375, 3.3402099609375, 3.790771484375, 4.2413330078125, 4.69189453125, 5.1424560546875, 5.593017578125, 6.0435791015625, 6.494140625, 6.9447021484375, 7.395263671875, 7.8458251953125, 8.29638671875, 8.7469482421875, 9.197509765625, 9.6480712890625, 10.0986328125, 10.5491943359375, 10.999755859375, 11.4503173828125, 11.90087890625, 12.3514404296875, 12.802001953125, 13.2525634765625, 13.703125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 4.0, 7.0, 16.0, 12.0, 5.0, 13.0, 22.0, 19.0, 25.0, 22.0, 34.0, 26.0, 36.0, 41.0, 39.0, 38.0, 38.0, 49.0, 43.0, 41.0, 29.0, 38.0, 44.0, 36.0, 45.0, 34.0, 26.0, 22.0, 30.0, 30.0, 25.0, 16.0, 19.0, 18.0, 14.0, 16.0, 7.0, 8.0, 4.0, 3.0, 3.0, 4.0, 0.0, 3.0, 0.0, 2.0, 2.0], "bins": [-58.375, -56.77392578125, -55.1728515625, -53.57177734375, -51.970703125, -50.36962890625, -48.7685546875, -47.16748046875, -45.56640625, -43.96533203125, -42.3642578125, -40.76318359375, -39.162109375, -37.56103515625, -35.9599609375, -34.35888671875, -32.7578125, -31.15673828125, -29.5556640625, -27.95458984375, -26.353515625, -24.75244140625, -23.1513671875, -21.55029296875, -19.94921875, -18.34814453125, -16.7470703125, -15.14599609375, -13.544921875, -11.94384765625, -10.3427734375, -8.74169921875, -7.140625, -5.53955078125, -3.9384765625, -2.33740234375, -0.736328125, 0.86474609375, 2.4658203125, 4.06689453125, 5.66796875, 7.26904296875, 8.8701171875, 10.47119140625, 12.072265625, 13.67333984375, 15.2744140625, 16.87548828125, 18.4765625, 20.07763671875, 21.6787109375, 23.27978515625, 24.880859375, 26.48193359375, 28.0830078125, 29.68408203125, 31.28515625, 32.88623046875, 34.4873046875, 36.08837890625, 37.689453125, 39.29052734375, 40.8916015625, 42.49267578125, 44.09375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 7.0, 8.0, 15.0, 10.0, 20.0, 23.0, 44.0, 62.0, 84.0, 119.0, 168.0, 232.0, 353.0, 521.0, 765.0, 1171.0, 1642.0, 2499.0, 3737.0, 5749.0, 8789.0, 13718.0, 24220.0, 56642.0, 850413.0, 30959.0, 16562.0, 10088.0, 6526.0, 4392.0, 2951.0, 1900.0, 1306.0, 899.0, 626.0, 451.0, 274.0, 180.0, 128.0, 92.0, 63.0, 54.0, 33.0, 22.0, 15.0, 4.0, 9.0, 3.0, 3.0, 4.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-32.21875, -31.15087890625, -30.0830078125, -29.01513671875, -27.947265625, -26.87939453125, -25.8115234375, -24.74365234375, -23.67578125, -22.60791015625, -21.5400390625, -20.47216796875, -19.404296875, -18.33642578125, -17.2685546875, -16.20068359375, -15.1328125, -14.06494140625, -12.9970703125, -11.92919921875, -10.861328125, -9.79345703125, -8.7255859375, -7.65771484375, -6.58984375, -5.52197265625, -4.4541015625, -3.38623046875, -2.318359375, -1.25048828125, -0.1826171875, 0.88525390625, 1.953125, 3.02099609375, 4.0888671875, 5.15673828125, 6.224609375, 7.29248046875, 8.3603515625, 9.42822265625, 10.49609375, 11.56396484375, 12.6318359375, 13.69970703125, 14.767578125, 15.83544921875, 16.9033203125, 17.97119140625, 19.0390625, 20.10693359375, 21.1748046875, 22.24267578125, 23.310546875, 24.37841796875, 25.4462890625, 26.51416015625, 27.58203125, 28.64990234375, 29.7177734375, 30.78564453125, 31.853515625, 32.92138671875, 33.9892578125, 35.05712890625, 36.125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 8.0, 13.0, 10.0, 9.0, 14.0, 12.0, 22.0, 18.0, 24.0, 19.0, 21.0, 33.0, 32.0, 24.0, 33.0, 31.0, 27.0, 36.0, 30.0, 35.0, 34.0, 35.0, 43.0, 31.0, 32.0, 29.0, 30.0, 24.0, 29.0, 33.0, 23.0, 22.0, 24.0, 20.0, 16.0, 18.0, 14.0, 16.0, 10.0, 11.0, 9.0, 8.0, 7.0, 6.0, 8.0, 3.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-30.140625, -29.211669921875, -28.28271484375, -27.353759765625, -26.4248046875, -25.495849609375, -24.56689453125, -23.637939453125, -22.708984375, -21.780029296875, -20.85107421875, -19.922119140625, -18.9931640625, -18.064208984375, -17.13525390625, -16.206298828125, -15.27734375, -14.348388671875, -13.41943359375, -12.490478515625, -11.5615234375, -10.632568359375, -9.70361328125, -8.774658203125, -7.845703125, -6.916748046875, -5.98779296875, -5.058837890625, -4.1298828125, -3.200927734375, -2.27197265625, -1.343017578125, -0.4140625, 0.514892578125, 1.44384765625, 2.372802734375, 3.3017578125, 4.230712890625, 5.15966796875, 6.088623046875, 7.017578125, 7.946533203125, 8.87548828125, 9.804443359375, 10.7333984375, 11.662353515625, 12.59130859375, 13.520263671875, 14.44921875, 15.378173828125, 16.30712890625, 17.236083984375, 18.1650390625, 19.093994140625, 20.02294921875, 20.951904296875, 21.880859375, 22.809814453125, 23.73876953125, 24.667724609375, 25.5966796875, 26.525634765625, 27.45458984375, 28.383544921875, 29.3125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 8.0, 8.0, 15.0, 11.0, 24.0, 33.0, 59.0, 62.0, 108.0, 121.0, 190.0, 278.0, 435.0, 639.0, 1112.0, 1895.0, 3410.0, 6999.0, 15107.0, 41342.0, 899694.0, 44858.0, 16423.0, 7185.0, 3433.0, 1909.0, 1157.0, 667.0, 447.0, 295.0, 191.0, 129.0, 96.0, 56.0, 48.0, 32.0, 22.0, 23.0, 8.0, 10.0, 9.0, 3.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7529296875, -1.6990509033203125, -1.645172119140625, -1.5912933349609375, -1.53741455078125, -1.4835357666015625, -1.429656982421875, -1.3757781982421875, -1.3218994140625, -1.2680206298828125, -1.214141845703125, -1.1602630615234375, -1.10638427734375, -1.0525054931640625, -0.998626708984375, -0.9447479248046875, -0.890869140625, -0.8369903564453125, -0.783111572265625, -0.7292327880859375, -0.67535400390625, -0.6214752197265625, -0.567596435546875, -0.5137176513671875, -0.4598388671875, -0.4059600830078125, -0.352081298828125, -0.2982025146484375, -0.24432373046875, -0.1904449462890625, -0.136566162109375, -0.0826873779296875, -0.02880859375, 0.0250701904296875, 0.078948974609375, 0.1328277587890625, 0.18670654296875, 0.2405853271484375, 0.294464111328125, 0.3483428955078125, 0.4022216796875, 0.4561004638671875, 0.509979248046875, 0.5638580322265625, 0.61773681640625, 0.6716156005859375, 0.725494384765625, 0.7793731689453125, 0.833251953125, 0.8871307373046875, 0.941009521484375, 0.9948883056640625, 1.04876708984375, 1.1026458740234375, 1.156524658203125, 1.2104034423828125, 1.2642822265625, 1.3181610107421875, 1.372039794921875, 1.4259185791015625, 1.47979736328125, 1.5336761474609375, 1.587554931640625, 1.6414337158203125, 1.6953125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 3.0, 3.0, 3.0, 12.0, 11.0, 11.0, 19.0, 22.0, 29.0, 41.0, 46.0, 54.0, 76.0, 79.0, 93.0, 94.0, 73.0, 63.0, 66.0, 43.0, 44.0, 27.0, 21.0, 18.0, 12.0, 8.0, 11.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3855438232421875e-05, -3.254786133766174e-05, -3.124028444290161e-05, -2.993270754814148e-05, -2.8625130653381348e-05, -2.7317553758621216e-05, -2.6009976863861084e-05, -2.4702399969100952e-05, -2.339482307434082e-05, -2.208724617958069e-05, -2.0779669284820557e-05, -1.9472092390060425e-05, -1.8164515495300293e-05, -1.685693860054016e-05, -1.554936170578003e-05, -1.4241784811019897e-05, -1.2934207916259766e-05, -1.1626631021499634e-05, -1.0319054126739502e-05, -9.01147723197937e-06, -7.703900337219238e-06, -6.3963234424591064e-06, -5.088746547698975e-06, -3.7811696529388428e-06, -2.473592758178711e-06, -1.166015863418579e-06, 1.4156103134155273e-07, 1.4491379261016846e-06, 2.7567148208618164e-06, 4.064291715621948e-06, 5.37186861038208e-06, 6.679445505142212e-06, 7.987022399902344e-06, 9.294599294662476e-06, 1.0602176189422607e-05, 1.190975308418274e-05, 1.3217329978942871e-05, 1.4524906873703003e-05, 1.5832483768463135e-05, 1.7140060663223267e-05, 1.84476375579834e-05, 1.975521445274353e-05, 2.1062791347503662e-05, 2.2370368242263794e-05, 2.3677945137023926e-05, 2.4985522031784058e-05, 2.629309892654419e-05, 2.760067582130432e-05, 2.8908252716064453e-05, 3.0215829610824585e-05, 3.152340650558472e-05, 3.283098340034485e-05, 3.413856029510498e-05, 3.544613718986511e-05, 3.6753714084625244e-05, 3.8061290979385376e-05, 3.936886787414551e-05, 4.067644476890564e-05, 4.198402166366577e-05, 4.32915985584259e-05, 4.4599175453186035e-05, 4.590675234794617e-05, 4.72143292427063e-05, 4.852190613746643e-05, 4.982948303222656e-05]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 7.0, 3.0, 4.0, 6.0, 9.0, 16.0, 19.0, 50.0, 74.0, 94.0, 166.0, 236.0, 359.0, 567.0, 890.0, 1418.0, 2154.0, 3379.0, 5439.0, 8561.0, 14081.0, 23104.0, 37344.0, 63746.0, 110637.0, 191145.0, 227123.0, 148109.0, 83402.0, 49273.0, 29517.0, 17983.0, 10926.0, 6790.0, 4253.0, 2776.0, 1721.0, 1122.0, 716.0, 484.0, 309.0, 192.0, 107.0, 81.0, 74.0, 44.0, 20.0, 12.0, 10.0, 7.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69677734375, -0.6712112426757812, -0.6456451416015625, -0.6200790405273438, -0.594512939453125, -0.5689468383789062, -0.5433807373046875, -0.5178146362304688, -0.49224853515625, -0.46668243408203125, -0.4411163330078125, -0.41555023193359375, -0.389984130859375, -0.36441802978515625, -0.3388519287109375, -0.31328582763671875, -0.2877197265625, -0.26215362548828125, -0.2365875244140625, -0.21102142333984375, -0.185455322265625, -0.15988922119140625, -0.1343231201171875, -0.10875701904296875, -0.08319091796875, -0.05762481689453125, -0.0320587158203125, -0.00649261474609375, 0.019073486328125, 0.04463958740234375, 0.0702056884765625, 0.09577178955078125, 0.121337890625, 0.14690399169921875, 0.1724700927734375, 0.19803619384765625, 0.223602294921875, 0.24916839599609375, 0.2747344970703125, 0.30030059814453125, 0.32586669921875, 0.35143280029296875, 0.3769989013671875, 0.40256500244140625, 0.428131103515625, 0.45369720458984375, 0.4792633056640625, 0.5048294067382812, 0.5303955078125, 0.5559616088867188, 0.5815277099609375, 0.6070938110351562, 0.632659912109375, 0.6582260131835938, 0.6837921142578125, 0.7093582153320312, 0.73492431640625, 0.7604904174804688, 0.7860565185546875, 0.8116226196289062, 0.837188720703125, 0.8627548217773438, 0.8883209228515625, 0.9138870239257812, 0.939453125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 10.0, 4.0, 2.0, 8.0, 7.0, 10.0, 3.0, 10.0, 10.0, 8.0, 11.0, 15.0, 16.0, 24.0, 22.0, 22.0, 25.0, 40.0, 54.0, 42.0, 60.0, 50.0, 81.0, 62.0, 46.0, 56.0, 38.0, 40.0, 28.0, 37.0, 22.0, 22.0, 19.0, 15.0, 10.0, 8.0, 7.0, 7.0, 6.0, 7.0, 7.0, 7.0, 9.0, 4.0, 2.0, 8.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0], "bins": [-0.404296875, -0.39261627197265625, -0.3809356689453125, -0.36925506591796875, -0.357574462890625, -0.34589385986328125, -0.3342132568359375, -0.32253265380859375, -0.31085205078125, -0.29917144775390625, -0.2874908447265625, -0.27581024169921875, -0.264129638671875, -0.25244903564453125, -0.2407684326171875, -0.22908782958984375, -0.2174072265625, -0.20572662353515625, -0.1940460205078125, -0.18236541748046875, -0.170684814453125, -0.15900421142578125, -0.1473236083984375, -0.13564300537109375, -0.12396240234375, -0.11228179931640625, -0.1006011962890625, -0.08892059326171875, -0.077239990234375, -0.06555938720703125, -0.0538787841796875, -0.04219818115234375, -0.030517578125, -0.01883697509765625, -0.0071563720703125, 0.00452423095703125, 0.016204833984375, 0.02788543701171875, 0.0395660400390625, 0.05124664306640625, 0.06292724609375, 0.07460784912109375, 0.0862884521484375, 0.09796905517578125, 0.109649658203125, 0.12133026123046875, 0.1330108642578125, 0.14469146728515625, 0.1563720703125, 0.16805267333984375, 0.1797332763671875, 0.19141387939453125, 0.203094482421875, 0.21477508544921875, 0.2264556884765625, 0.23813629150390625, 0.24981689453125, 0.26149749755859375, 0.2731781005859375, 0.28485870361328125, 0.296539306640625, 0.30821990966796875, 0.3199005126953125, 0.33158111572265625, 0.34326171875]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 6.0, 2.0, 4.0, 11.0, 8.0, 16.0, 12.0, 30.0, 17.0, 33.0, 31.0, 37.0, 41.0, 50.0, 56.0, 50.0, 48.0, 54.0, 70.0, 69.0, 56.0, 45.0, 31.0, 42.0, 37.0, 22.0, 28.0, 20.0, 15.0, 16.0, 21.0, 10.0, 4.0, 6.0, 7.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.96330261230469, -49.454952239990234, -47.94660186767578, -46.43824768066406, -44.92989730834961, -43.421546936035156, -41.9131965637207, -40.40484619140625, -38.89649200439453, -37.38814163208008, -35.879791259765625, -34.371437072753906, -32.86308670043945, -31.354736328125, -29.846385955810547, -28.33803367614746, -26.829683303833008, -25.321332931518555, -23.81298065185547, -22.304630279541016, -20.79627799987793, -19.287927627563477, -17.77957534790039, -16.271224975585938, -14.762873649597168, -13.254522323608398, -11.746170997619629, -10.23781967163086, -8.729469299316406, -7.2211174964904785, -5.712766647338867, -4.204415321350098, -2.696063995361328, -1.1877127885818481, 0.32063841819763184, 1.8289895057678223, 3.337340831756592, 4.845692157745361, 6.354043006896973, 7.862394332885742, 9.370745658874512, 10.879096984863281, 12.38744831085205, 13.89579963684082, 15.404150009155273, 16.91250228881836, 18.420852661132812, 19.929203033447266, 21.43755531311035, 22.945905685424805, 24.45425796508789, 25.962608337402344, 27.47096061706543, 28.979310989379883, 30.48766326904297, 31.996013641357422, 33.504364013671875, 35.01271438598633, 36.52106475830078, 38.0294189453125, 39.53776931762695, 41.046119689941406, 42.55447006225586, 44.06282043457031, 45.57117462158203]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 4.0, 8.0, 13.0, 15.0, 4.0, 12.0, 21.0, 21.0, 25.0, 20.0, 33.0, 32.0, 33.0, 39.0, 44.0, 36.0, 43.0, 42.0, 46.0, 36.0, 32.0, 40.0, 46.0, 30.0, 47.0, 33.0, 25.0, 23.0, 29.0, 31.0, 24.0, 23.0, 12.0, 18.0, 15.0, 15.0, 8.0, 8.0, 5.0, 2.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 3.0], "bins": [-57.942623138427734, -56.35280227661133, -54.76298522949219, -53.17316436767578, -51.583343505859375, -49.993526458740234, -48.40370559692383, -46.81388854980469, -45.22406768798828, -43.634246826171875, -42.044429779052734, -40.45460891723633, -38.86479187011719, -37.27497100830078, -35.685150146484375, -34.09532928466797, -32.50551223754883, -30.915693283081055, -29.32587432861328, -27.736053466796875, -26.1462345123291, -24.556415557861328, -22.966594696044922, -21.37677574157715, -19.786956787109375, -18.1971378326416, -16.607318878173828, -15.017498016357422, -13.427679061889648, -11.837860107421875, -10.248040199279785, -8.658220291137695, -7.068397521972656, -5.478578090667725, -3.888758659362793, -2.2989392280578613, -0.7091197967529297, 0.880699634552002, 2.4705190658569336, 4.060338973999023, 5.650157928466797, 7.2399773597717285, 8.82979679107666, 10.41961669921875, 12.009435653686523, 13.599254608154297, 15.189074516296387, 16.778894424438477, 18.36871337890625, 19.958532333374023, 21.548351287841797, 23.138172149658203, 24.727991104125977, 26.31781005859375, 27.907630920410156, 29.49744987487793, 31.087268829345703, 32.67708969116211, 34.26690673828125, 35.856727600097656, 37.44654846191406, 39.0363655090332, 40.62618637084961, 42.21600341796875, 43.805824279785156]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 7.0, 7.0, 20.0, 27.0, 44.0, 62.0, 83.0, 132.0, 169.0, 270.0, 404.0, 649.0, 1035.0, 1587.0, 2292.0, 3714.0, 5837.0, 9030.0, 14179.0, 22484.0, 34600.0, 52039.0, 75911.0, 101804.0, 124383.0, 133668.0, 126089.0, 104678.0, 77958.0, 54831.0, 35964.0, 23527.0, 14638.0, 9513.0, 5837.0, 3852.0, 2551.0, 1627.0, 1026.0, 705.0, 464.0, 279.0, 176.0, 131.0, 89.0, 56.0, 35.0, 34.0, 19.0, 20.0, 10.0, 4.0, 6.0, 4.0, 2.0], "bins": [-41.71875, -40.51123046875, -39.3037109375, -38.09619140625, -36.888671875, -35.68115234375, -34.4736328125, -33.26611328125, -32.05859375, -30.85107421875, -29.6435546875, -28.43603515625, -27.228515625, -26.02099609375, -24.8134765625, -23.60595703125, -22.3984375, -21.19091796875, -19.9833984375, -18.77587890625, -17.568359375, -16.36083984375, -15.1533203125, -13.94580078125, -12.73828125, -11.53076171875, -10.3232421875, -9.11572265625, -7.908203125, -6.70068359375, -5.4931640625, -4.28564453125, -3.078125, -1.87060546875, -0.6630859375, 0.54443359375, 1.751953125, 2.95947265625, 4.1669921875, 5.37451171875, 6.58203125, 7.78955078125, 8.9970703125, 10.20458984375, 11.412109375, 12.61962890625, 13.8271484375, 15.03466796875, 16.2421875, 17.44970703125, 18.6572265625, 19.86474609375, 21.072265625, 22.27978515625, 23.4873046875, 24.69482421875, 25.90234375, 27.10986328125, 28.3173828125, 29.52490234375, 30.732421875, 31.93994140625, 33.1474609375, 34.35498046875, 35.5625]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 4.0, 8.0, 16.0, 13.0, 5.0, 13.0, 19.0, 19.0, 27.0, 19.0, 36.0, 31.0, 34.0, 40.0, 41.0, 38.0, 41.0, 43.0, 50.0, 34.0, 32.0, 41.0, 40.0, 35.0, 41.0, 39.0, 23.0, 24.0, 28.0, 33.0, 20.0, 26.0, 11.0, 17.0, 16.0, 14.0, 9.0, 6.0, 6.0, 2.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0], "bins": [-54.75, -53.24560546875, -51.7412109375, -50.23681640625, -48.732421875, -47.22802734375, -45.7236328125, -44.21923828125, -42.71484375, -41.21044921875, -39.7060546875, -38.20166015625, -36.697265625, -35.19287109375, -33.6884765625, -32.18408203125, -30.6796875, -29.17529296875, -27.6708984375, -26.16650390625, -24.662109375, -23.15771484375, -21.6533203125, -20.14892578125, -18.64453125, -17.14013671875, -15.6357421875, -14.13134765625, -12.626953125, -11.12255859375, -9.6181640625, -8.11376953125, -6.609375, -5.10498046875, -3.6005859375, -2.09619140625, -0.591796875, 0.91259765625, 2.4169921875, 3.92138671875, 5.42578125, 6.93017578125, 8.4345703125, 9.93896484375, 11.443359375, 12.94775390625, 14.4521484375, 15.95654296875, 17.4609375, 18.96533203125, 20.4697265625, 21.97412109375, 23.478515625, 24.98291015625, 26.4873046875, 27.99169921875, 29.49609375, 31.00048828125, 32.5048828125, 34.00927734375, 35.513671875, 37.01806640625, 38.5224609375, 40.02685546875, 41.53125]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 6.0, 7.0, 15.0, 17.0, 36.0, 49.0, 46.0, 72.0, 130.0, 160.0, 288.0, 345.0, 629.0, 869.0, 1309.0, 1871.0, 2797.0, 4209.0, 6549.0, 9700.0, 14888.0, 22429.0, 33699.0, 49842.0, 71578.0, 95307.0, 117229.0, 127481.0, 122679.0, 105637.0, 81587.0, 58145.0, 39928.0, 26661.0, 17700.0, 11516.0, 7771.0, 5123.0, 3383.0, 2165.0, 1447.0, 1059.0, 715.0, 487.0, 334.0, 220.0, 131.0, 104.0, 74.0, 58.0, 31.0, 17.0, 17.0, 9.0, 6.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-35.28125, -34.09375, -32.90625, -31.71875, -30.53125, -29.34375, -28.15625, -26.96875, -25.78125, -24.59375, -23.40625, -22.21875, -21.03125, -19.84375, -18.65625, -17.46875, -16.28125, -15.09375, -13.90625, -12.71875, -11.53125, -10.34375, -9.15625, -7.96875, -6.78125, -5.59375, -4.40625, -3.21875, -2.03125, -0.84375, 0.34375, 1.53125, 2.71875, 3.90625, 5.09375, 6.28125, 7.46875, 8.65625, 9.84375, 11.03125, 12.21875, 13.40625, 14.59375, 15.78125, 16.96875, 18.15625, 19.34375, 20.53125, 21.71875, 22.90625, 24.09375, 25.28125, 26.46875, 27.65625, 28.84375, 30.03125, 31.21875, 32.40625, 33.59375, 34.78125, 35.96875, 37.15625, 38.34375, 39.53125, 40.71875]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 9.0, 9.0, 13.0, 11.0, 14.0, 19.0, 11.0, 26.0, 14.0, 23.0, 28.0, 41.0, 37.0, 33.0, 39.0, 36.0, 34.0, 45.0, 31.0, 39.0, 33.0, 52.0, 47.0, 36.0, 31.0, 40.0, 39.0, 26.0, 23.0, 21.0, 22.0, 13.0, 16.0, 16.0, 18.0, 19.0, 8.0, 8.0, 4.0, 10.0, 4.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-29.640625, -28.70703125, -27.7734375, -26.83984375, -25.90625, -24.97265625, -24.0390625, -23.10546875, -22.171875, -21.23828125, -20.3046875, -19.37109375, -18.4375, -17.50390625, -16.5703125, -15.63671875, -14.703125, -13.76953125, -12.8359375, -11.90234375, -10.96875, -10.03515625, -9.1015625, -8.16796875, -7.234375, -6.30078125, -5.3671875, -4.43359375, -3.5, -2.56640625, -1.6328125, -0.69921875, 0.234375, 1.16796875, 2.1015625, 3.03515625, 3.96875, 4.90234375, 5.8359375, 6.76953125, 7.703125, 8.63671875, 9.5703125, 10.50390625, 11.4375, 12.37109375, 13.3046875, 14.23828125, 15.171875, 16.10546875, 17.0390625, 17.97265625, 18.90625, 19.83984375, 20.7734375, 21.70703125, 22.640625, 23.57421875, 24.5078125, 25.44140625, 26.375, 27.30859375, 28.2421875, 29.17578125, 30.109375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 7.0, 3.0, 7.0, 7.0, 12.0, 14.0, 26.0, 34.0, 54.0, 72.0, 100.0, 150.0, 229.0, 363.0, 540.0, 822.0, 1278.0, 1961.0, 2930.0, 4632.0, 7421.0, 11748.0, 18313.0, 28136.0, 41884.0, 61656.0, 84705.0, 108010.0, 123663.0, 127316.0, 115326.0, 94181.0, 69764.0, 49330.0, 33121.0, 21834.0, 14144.0, 8886.0, 5638.0, 3650.0, 2274.0, 1505.0, 937.0, 646.0, 415.0, 281.0, 176.0, 120.0, 95.0, 51.0, 24.0, 27.0, 15.0, 10.0, 10.0, 7.0, 4.0, 2.0, 2.0, 2.0, 2.0], "bins": [-6.63671875, -6.43060302734375, -6.2244873046875, -6.01837158203125, -5.812255859375, -5.60614013671875, -5.4000244140625, -5.19390869140625, -4.98779296875, -4.78167724609375, -4.5755615234375, -4.36944580078125, -4.163330078125, -3.95721435546875, -3.7510986328125, -3.54498291015625, -3.3388671875, -3.13275146484375, -2.9266357421875, -2.72052001953125, -2.514404296875, -2.30828857421875, -2.1021728515625, -1.89605712890625, -1.68994140625, -1.48382568359375, -1.2777099609375, -1.07159423828125, -0.865478515625, -0.65936279296875, -0.4532470703125, -0.24713134765625, -0.041015625, 0.16510009765625, 0.3712158203125, 0.57733154296875, 0.783447265625, 0.98956298828125, 1.1956787109375, 1.40179443359375, 1.60791015625, 1.81402587890625, 2.0201416015625, 2.22625732421875, 2.432373046875, 2.63848876953125, 2.8446044921875, 3.05072021484375, 3.2568359375, 3.46295166015625, 3.6690673828125, 3.87518310546875, 4.081298828125, 4.28741455078125, 4.4935302734375, 4.69964599609375, 4.90576171875, 5.11187744140625, 5.3179931640625, 5.52410888671875, 5.730224609375, 5.93634033203125, 6.1424560546875, 6.34857177734375, 6.5546875]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 3.0, 6.0, 2.0, 3.0, 7.0, 10.0, 13.0, 18.0, 20.0, 17.0, 35.0, 23.0, 45.0, 39.0, 42.0, 47.0, 60.0, 47.0, 46.0, 63.0, 82.0, 56.0, 46.0, 47.0, 43.0, 38.0, 26.0, 30.0, 15.0, 22.0, 8.0, 13.0, 4.0, 4.0, 4.0, 6.0, 4.0, 3.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009012222290039062, -0.0008741244673728943, -0.0008470267057418823, -0.0008199289441108704, -0.0007928311824798584, -0.0007657334208488464, -0.0007386356592178345, -0.0007115378975868225, -0.0006844401359558105, -0.0006573423743247986, -0.0006302446126937866, -0.0006031468510627747, -0.0005760490894317627, -0.0005489513278007507, -0.0005218535661697388, -0.0004947558045387268, -0.00046765804290771484, -0.0004405602812767029, -0.0004134625196456909, -0.00038636475801467896, -0.000359266996383667, -0.00033216923475265503, -0.00030507147312164307, -0.0002779737114906311, -0.00025087594985961914, -0.00022377818822860718, -0.00019668042659759521, -0.00016958266496658325, -0.0001424849033355713, -0.00011538714170455933, -8.828938007354736e-05, -6.11916184425354e-05, -3.409385681152344e-05, -6.996095180511475e-06, 2.0101666450500488e-05, 4.719942808151245e-05, 7.429718971252441e-05, 0.00010139495134353638, 0.00012849271297454834, 0.0001555904746055603, 0.00018268823623657227, 0.00020978599786758423, 0.0002368837594985962, 0.00026398152112960815, 0.0002910792827606201, 0.0003181770443916321, 0.00034527480602264404, 0.000372372567653656, 0.00039947032928466797, 0.00042656809091567993, 0.0004536658525466919, 0.00048076361417770386, 0.0005078613758087158, 0.0005349591374397278, 0.0005620568990707397, 0.0005891546607017517, 0.0006162524223327637, 0.0006433501839637756, 0.0006704479455947876, 0.0006975457072257996, 0.0007246434688568115, 0.0007517412304878235, 0.0007788389921188354, 0.0008059367537498474, 0.0008330345153808594]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 6.0, 5.0, 17.0, 18.0, 23.0, 51.0, 82.0, 118.0, 157.0, 250.0, 462.0, 680.0, 1123.0, 1953.0, 3363.0, 5587.0, 10047.0, 17588.0, 31878.0, 56158.0, 93240.0, 138992.0, 172828.0, 170935.0, 133233.0, 88169.0, 52501.0, 30075.0, 16745.0, 9147.0, 5227.0, 3184.0, 1832.0, 1064.0, 695.0, 399.0, 276.0, 171.0, 105.0, 60.0, 32.0, 27.0, 25.0, 11.0, 9.0, 3.0, 8.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3671875, -9.064453125, -8.76171875, -8.458984375, -8.15625, -7.853515625, -7.55078125, -7.248046875, -6.9453125, -6.642578125, -6.33984375, -6.037109375, -5.734375, -5.431640625, -5.12890625, -4.826171875, -4.5234375, -4.220703125, -3.91796875, -3.615234375, -3.3125, -3.009765625, -2.70703125, -2.404296875, -2.1015625, -1.798828125, -1.49609375, -1.193359375, -0.890625, -0.587890625, -0.28515625, 0.017578125, 0.3203125, 0.623046875, 0.92578125, 1.228515625, 1.53125, 1.833984375, 2.13671875, 2.439453125, 2.7421875, 3.044921875, 3.34765625, 3.650390625, 3.953125, 4.255859375, 4.55859375, 4.861328125, 5.1640625, 5.466796875, 5.76953125, 6.072265625, 6.375, 6.677734375, 6.98046875, 7.283203125, 7.5859375, 7.888671875, 8.19140625, 8.494140625, 8.796875, 9.099609375, 9.40234375, 9.705078125, 10.0078125]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 1.0, 1.0, 6.0, 8.0, 6.0, 7.0, 4.0, 6.0, 7.0, 11.0, 19.0, 28.0, 30.0, 28.0, 35.0, 47.0, 57.0, 39.0, 61.0, 54.0, 64.0, 68.0, 72.0, 50.0, 41.0, 45.0, 33.0, 26.0, 31.0, 26.0, 19.0, 14.0, 15.0, 8.0, 11.0, 4.0, 5.0, 7.0, 3.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.20703125, -5.065460205078125, -4.92388916015625, -4.782318115234375, -4.6407470703125, -4.499176025390625, -4.35760498046875, -4.216033935546875, -4.074462890625, -3.932891845703125, -3.79132080078125, -3.649749755859375, -3.5081787109375, -3.366607666015625, -3.22503662109375, -3.083465576171875, -2.94189453125, -2.800323486328125, -2.65875244140625, -2.517181396484375, -2.3756103515625, -2.234039306640625, -2.09246826171875, -1.950897216796875, -1.809326171875, -1.667755126953125, -1.52618408203125, -1.384613037109375, -1.2430419921875, -1.101470947265625, -0.95989990234375, -0.818328857421875, -0.6767578125, -0.535186767578125, -0.39361572265625, -0.252044677734375, -0.1104736328125, 0.031097412109375, 0.17266845703125, 0.314239501953125, 0.455810546875, 0.597381591796875, 0.73895263671875, 0.880523681640625, 1.0220947265625, 1.163665771484375, 1.30523681640625, 1.446807861328125, 1.58837890625, 1.729949951171875, 1.87152099609375, 2.013092041015625, 2.1546630859375, 2.296234130859375, 2.43780517578125, 2.579376220703125, 2.720947265625, 2.862518310546875, 3.00408935546875, 3.145660400390625, 3.2872314453125, 3.428802490234375, 3.57037353515625, 3.711944580078125, 3.853515625]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 4.0, 3.0, 7.0, 6.0, 7.0, 22.0, 12.0, 25.0, 26.0, 39.0, 27.0, 34.0, 43.0, 52.0, 42.0, 53.0, 53.0, 60.0, 56.0, 56.0, 55.0, 52.0, 47.0, 33.0, 36.0, 30.0, 25.0, 16.0, 21.0, 14.0, 14.0, 13.0, 3.0, 10.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.25482940673828, -47.789588928222656, -46.3243522644043, -44.85911178588867, -43.39387512207031, -41.92863464355469, -40.46339797973633, -38.9981575012207, -37.532920837402344, -36.06768035888672, -34.60244369506836, -33.137203216552734, -31.671966552734375, -30.206727981567383, -28.74148941040039, -27.276248931884766, -25.811010360717773, -24.34577178955078, -22.88053321838379, -21.415294647216797, -19.950056076049805, -18.484817504882812, -17.019577026367188, -15.554339408874512, -14.08910083770752, -12.623862266540527, -11.158623695373535, -9.693384170532227, -8.228145599365234, -6.7629075050354, -5.29766845703125, -3.832429885864258, -2.3671913146972656, -0.9019526243209839, 0.5632860660552979, 2.028524875640869, 3.4937634468078613, 4.9590020179748535, 6.424241065979004, 7.889479637145996, 9.354718208312988, 10.81995677947998, 12.285195350646973, 13.750434875488281, 15.215673446655273, 16.680912017822266, 18.146150588989258, 19.61138916015625, 21.076627731323242, 22.541866302490234, 24.007104873657227, 25.47234344482422, 26.93758201599121, 28.402820587158203, 29.868061065673828, 31.333297729492188, 32.79853820800781, 34.26377868652344, 35.7290153503418, 37.19425582885742, 38.65949249267578, 40.124732971191406, 41.589969635009766, 43.05521011352539, 44.52044677734375]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 9.0, 4.0, 4.0, 7.0, 13.0, 10.0, 14.0, 19.0, 26.0, 29.0, 25.0, 33.0, 33.0, 36.0, 39.0, 51.0, 53.0, 44.0, 48.0, 48.0, 39.0, 42.0, 35.0, 43.0, 46.0, 35.0, 33.0, 25.0, 14.0, 27.0, 31.0, 23.0, 21.0, 12.0, 7.0, 9.0, 8.0, 6.0, 2.0, 0.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.95924377441406, -58.156410217285156, -56.35357666015625, -54.550743103027344, -52.74790573120117, -50.945072174072266, -49.14223861694336, -47.33940505981445, -45.53656768798828, -43.733734130859375, -41.93090057373047, -40.12806701660156, -38.32522964477539, -36.522396087646484, -34.71956253051758, -32.91672897338867, -31.113895416259766, -29.31106185913086, -27.50822639465332, -25.705392837524414, -23.902557373046875, -22.09972381591797, -20.296890258789062, -18.494056701660156, -16.691221237182617, -14.888386726379395, -13.085552215576172, -11.282718658447266, -9.479884147644043, -7.67704963684082, -5.874216079711914, -4.071381568908691, -2.2685470581054688, -0.4657127857208252, 1.3371214866638184, 3.139955520629883, 4.9427900314331055, 6.745624542236328, 8.548458099365234, 10.351292610168457, 12.15412712097168, 13.956961631774902, 15.759796142578125, 17.56262969970703, 19.365463256835938, 21.168298721313477, 22.971132278442383, 24.773967742919922, 26.576801300048828, 28.379634857177734, 30.182470321655273, 31.98530387878418, 33.78813934326172, 35.590972900390625, 37.39380645751953, 39.19664001464844, 40.999473571777344, 42.80230712890625, 44.605140686035156, 46.40797424316406, 48.210811614990234, 50.01364517211914, 51.81647872924805, 53.61931228637695, 55.422149658203125]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 5.0, 6.0, 9.0, 13.0, 13.0, 42.0, 53.0, 68.0, 109.0, 146.0, 256.0, 360.0, 585.0, 905.0, 1396.0, 2219.0, 3258.0, 5370.0, 8649.0, 14392.0, 23287.0, 39274.0, 66460.0, 114285.0, 195265.0, 333300.0, 521730.0, 686961.0, 707264.0, 563967.0, 370051.0, 220957.0, 128399.0, 74421.0, 43857.0, 26276.0, 15745.0, 9562.0, 5862.0, 3530.0, 2254.0, 1419.0, 853.0, 532.0, 358.0, 214.0, 124.0, 74.0, 56.0, 33.0, 30.0, 13.0, 11.0, 6.0, 5.0, 2.0, 1.0, 1.0], "bins": [-41.53125, -40.3134765625, -39.095703125, -37.8779296875, -36.66015625, -35.4423828125, -34.224609375, -33.0068359375, -31.7890625, -30.5712890625, -29.353515625, -28.1357421875, -26.91796875, -25.7001953125, -24.482421875, -23.2646484375, -22.046875, -20.8291015625, -19.611328125, -18.3935546875, -17.17578125, -15.9580078125, -14.740234375, -13.5224609375, -12.3046875, -11.0869140625, -9.869140625, -8.6513671875, -7.43359375, -6.2158203125, -4.998046875, -3.7802734375, -2.5625, -1.3447265625, -0.126953125, 1.0908203125, 2.30859375, 3.5263671875, 4.744140625, 5.9619140625, 7.1796875, 8.3974609375, 9.615234375, 10.8330078125, 12.05078125, 13.2685546875, 14.486328125, 15.7041015625, 16.921875, 18.1396484375, 19.357421875, 20.5751953125, 21.79296875, 23.0107421875, 24.228515625, 25.4462890625, 26.6640625, 27.8818359375, 29.099609375, 30.3173828125, 31.53515625, 32.7529296875, 33.970703125, 35.1884765625, 36.40625]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 8.0, 4.0, 4.0, 10.0, 12.0, 9.0, 14.0, 21.0, 24.0, 25.0, 29.0, 34.0, 35.0, 30.0, 42.0, 50.0, 54.0, 48.0, 43.0, 54.0, 37.0, 40.0, 39.0, 39.0, 47.0, 28.0, 41.0, 24.0, 14.0, 28.0, 30.0, 22.0, 19.0, 14.0, 6.0, 10.0, 8.0, 6.0, 1.0, 0.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.1875, -44.8017578125, -43.416015625, -42.0302734375, -40.64453125, -39.2587890625, -37.873046875, -36.4873046875, -35.1015625, -33.7158203125, -32.330078125, -30.9443359375, -29.55859375, -28.1728515625, -26.787109375, -25.4013671875, -24.015625, -22.6298828125, -21.244140625, -19.8583984375, -18.47265625, -17.0869140625, -15.701171875, -14.3154296875, -12.9296875, -11.5439453125, -10.158203125, -8.7724609375, -7.38671875, -6.0009765625, -4.615234375, -3.2294921875, -1.84375, -0.4580078125, 0.927734375, 2.3134765625, 3.69921875, 5.0849609375, 6.470703125, 7.8564453125, 9.2421875, 10.6279296875, 12.013671875, 13.3994140625, 14.78515625, 16.1708984375, 17.556640625, 18.9423828125, 20.328125, 21.7138671875, 23.099609375, 24.4853515625, 25.87109375, 27.2568359375, 28.642578125, 30.0283203125, 31.4140625, 32.7998046875, 34.185546875, 35.5712890625, 36.95703125, 38.3427734375, 39.728515625, 41.1142578125, 42.5]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 8.0, 6.0, 16.0, 45.0, 51.0, 89.0, 154.0, 219.0, 336.0, 611.0, 1005.0, 1549.0, 2703.0, 4585.0, 7788.0, 13283.0, 22218.0, 37890.0, 63856.0, 105086.0, 168805.0, 261796.0, 377708.0, 493028.0, 570139.0, 563025.0, 481056.0, 361226.0, 249173.0, 160041.0, 99552.0, 59669.0, 35515.0, 21228.0, 12522.0, 7424.0, 4326.0, 2580.0, 1586.0, 912.0, 559.0, 355.0, 232.0, 121.0, 86.0, 44.0, 36.0, 20.0, 14.0, 6.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-31.9375, -30.9052734375, -29.873046875, -28.8408203125, -27.80859375, -26.7763671875, -25.744140625, -24.7119140625, -23.6796875, -22.6474609375, -21.615234375, -20.5830078125, -19.55078125, -18.5185546875, -17.486328125, -16.4541015625, -15.421875, -14.3896484375, -13.357421875, -12.3251953125, -11.29296875, -10.2607421875, -9.228515625, -8.1962890625, -7.1640625, -6.1318359375, -5.099609375, -4.0673828125, -3.03515625, -2.0029296875, -0.970703125, 0.0615234375, 1.09375, 2.1259765625, 3.158203125, 4.1904296875, 5.22265625, 6.2548828125, 7.287109375, 8.3193359375, 9.3515625, 10.3837890625, 11.416015625, 12.4482421875, 13.48046875, 14.5126953125, 15.544921875, 16.5771484375, 17.609375, 18.6416015625, 19.673828125, 20.7060546875, 21.73828125, 22.7705078125, 23.802734375, 24.8349609375, 25.8671875, 26.8994140625, 27.931640625, 28.9638671875, 29.99609375, 31.0283203125, 32.060546875, 33.0927734375, 34.125]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 4.0, 5.0, 7.0, 7.0, 6.0, 10.0, 14.0, 14.0, 24.0, 43.0, 44.0, 40.0, 67.0, 65.0, 76.0, 122.0, 108.0, 139.0, 160.0, 199.0, 190.0, 202.0, 241.0, 228.0, 257.0, 261.0, 224.0, 217.0, 172.0, 152.0, 141.0, 103.0, 135.0, 79.0, 58.0, 53.0, 46.0, 43.0, 22.0, 31.0, 14.0, 15.0, 12.0, 6.0, 11.0, 7.0, 3.0, 4.0, 2.0, 3.0, 2.0], "bins": [-21.71875, -21.143310546875, -20.56787109375, -19.992431640625, -19.4169921875, -18.841552734375, -18.26611328125, -17.690673828125, -17.115234375, -16.539794921875, -15.96435546875, -15.388916015625, -14.8134765625, -14.238037109375, -13.66259765625, -13.087158203125, -12.51171875, -11.936279296875, -11.36083984375, -10.785400390625, -10.2099609375, -9.634521484375, -9.05908203125, -8.483642578125, -7.908203125, -7.332763671875, -6.75732421875, -6.181884765625, -5.6064453125, -5.031005859375, -4.45556640625, -3.880126953125, -3.3046875, -2.729248046875, -2.15380859375, -1.578369140625, -1.0029296875, -0.427490234375, 0.14794921875, 0.723388671875, 1.298828125, 1.874267578125, 2.44970703125, 3.025146484375, 3.6005859375, 4.176025390625, 4.75146484375, 5.326904296875, 5.90234375, 6.477783203125, 7.05322265625, 7.628662109375, 8.2041015625, 8.779541015625, 9.35498046875, 9.930419921875, 10.505859375, 11.081298828125, 11.65673828125, 12.232177734375, 12.8076171875, 13.383056640625, 13.95849609375, 14.533935546875, 15.109375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 6.0, 4.0, 6.0, 9.0, 12.0, 10.0, 21.0, 29.0, 21.0, 43.0, 47.0, 48.0, 51.0, 61.0, 51.0, 66.0, 62.0, 55.0, 60.0, 58.0, 44.0, 42.0, 37.0, 25.0, 34.0, 25.0, 25.0, 20.0, 13.0, 4.0, 3.0, 6.0, 5.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.56143569946289, -36.11040115356445, -34.659366607666016, -33.20833206176758, -31.75729751586914, -30.306262969970703, -28.8552303314209, -27.40419578552246, -25.953161239624023, -24.502126693725586, -23.05109214782715, -21.600059509277344, -20.149024963378906, -18.69799041748047, -17.24695587158203, -15.795921325683594, -14.344886779785156, -12.893852233886719, -11.442817687988281, -9.99178409576416, -8.540749549865723, -7.089715003967285, -5.638681411743164, -4.187646865844727, -2.736612319946289, -1.2855780124664307, 0.16545629501342773, 1.616490364074707, 3.0675249099731445, 4.518559455871582, 5.969593048095703, 7.420627593994141, 8.871665954589844, 10.322700500488281, 11.773735046386719, 13.22476863861084, 14.675803184509277, 16.12683868408203, 17.577871322631836, 19.028905868530273, 20.47994041442871, 21.93097496032715, 23.382009506225586, 24.83304214477539, 26.284076690673828, 27.735111236572266, 29.186145782470703, 30.63718032836914, 32.08821487426758, 33.539249420166016, 34.99028396606445, 36.44131851196289, 37.89235305786133, 39.343387603759766, 40.79441833496094, 42.245452880859375, 43.69648742675781, 45.14752197265625, 46.59855651855469, 48.049591064453125, 49.50062561035156, 50.95166015625, 52.40269470214844, 53.853729248046875, 55.30476379394531]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 6.0, 3.0, 8.0, 8.0, 16.0, 20.0, 22.0, 16.0, 26.0, 23.0, 21.0, 33.0, 39.0, 29.0, 38.0, 41.0, 40.0, 44.0, 52.0, 51.0, 40.0, 42.0, 38.0, 49.0, 34.0, 35.0, 32.0, 26.0, 22.0, 21.0, 24.0, 34.0, 12.0, 9.0, 18.0, 5.0, 9.0, 1.0, 3.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-48.4610481262207, -46.99444580078125, -45.5278434753418, -44.061241149902344, -42.594642639160156, -41.1280403137207, -39.66143798828125, -38.1948356628418, -36.728233337402344, -35.26163101196289, -33.79502868652344, -32.32843017578125, -30.861827850341797, -29.395225524902344, -27.92862319946289, -26.462020874023438, -24.99542236328125, -23.528820037841797, -22.062219619750977, -20.595617294311523, -19.129016876220703, -17.66241455078125, -16.195812225341797, -14.72921085357666, -13.262609481811523, -11.796008110046387, -10.32940673828125, -8.862804412841797, -7.39620304107666, -5.929601669311523, -4.46299934387207, -2.9963979721069336, -1.5297927856445312, -0.06319117546081543, 1.4034104347229004, 2.8700122833251953, 4.336613655090332, 5.803215026855469, 7.269817352294922, 8.736418724060059, 10.203020095825195, 11.669621467590332, 13.136222839355469, 14.602825164794922, 16.069427490234375, 17.536027908325195, 19.00263023376465, 20.46923065185547, 21.935832977294922, 23.402435302734375, 24.869035720825195, 26.33563804626465, 27.80223846435547, 29.268840789794922, 30.735443115234375, 32.20204544067383, 33.66864776611328, 35.135250091552734, 36.60185241699219, 38.068450927734375, 39.53505325317383, 41.00165557861328, 42.468257904052734, 43.93486022949219, 45.401458740234375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 2.0, 5.0, 5.0, 9.0, 24.0, 27.0, 44.0, 80.0, 108.0, 205.0, 342.0, 528.0, 897.0, 1408.0, 2343.0, 4062.0, 6646.0, 11563.0, 19122.0, 32131.0, 51831.0, 81898.0, 119746.0, 152025.0, 159953.0, 137028.0, 99463.0, 65367.0, 40784.0, 24629.0, 14600.0, 8797.0, 5223.0, 3071.0, 1837.0, 1075.0, 657.0, 402.0, 224.0, 157.0, 92.0, 60.0, 44.0, 15.0, 14.0, 4.0, 8.0, 5.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.5234375, -13.090576171875, -12.65771484375, -12.224853515625, -11.7919921875, -11.359130859375, -10.92626953125, -10.493408203125, -10.060546875, -9.627685546875, -9.19482421875, -8.761962890625, -8.3291015625, -7.896240234375, -7.46337890625, -7.030517578125, -6.59765625, -6.164794921875, -5.73193359375, -5.299072265625, -4.8662109375, -4.433349609375, -4.00048828125, -3.567626953125, -3.134765625, -2.701904296875, -2.26904296875, -1.836181640625, -1.4033203125, -0.970458984375, -0.53759765625, -0.104736328125, 0.328125, 0.760986328125, 1.19384765625, 1.626708984375, 2.0595703125, 2.492431640625, 2.92529296875, 3.358154296875, 3.791015625, 4.223876953125, 4.65673828125, 5.089599609375, 5.5224609375, 5.955322265625, 6.38818359375, 6.821044921875, 7.25390625, 7.686767578125, 8.11962890625, 8.552490234375, 8.9853515625, 9.418212890625, 9.85107421875, 10.283935546875, 10.716796875, 11.149658203125, 11.58251953125, 12.015380859375, 12.4482421875, 12.881103515625, 13.31396484375, 13.746826171875, 14.1796875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 2.0, 2.0, 4.0, 4.0, 6.0, 7.0, 9.0, 20.0, 16.0, 23.0, 18.0, 24.0, 24.0, 25.0, 29.0, 38.0, 27.0, 41.0, 46.0, 34.0, 48.0, 52.0, 48.0, 43.0, 44.0, 39.0, 47.0, 31.0, 36.0, 34.0, 22.0, 22.0, 21.0, 29.0, 26.0, 12.0, 11.0, 15.0, 7.0, 8.0, 1.0, 2.0, 5.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-47.4375, -45.99609375, -44.5546875, -43.11328125, -41.671875, -40.23046875, -38.7890625, -37.34765625, -35.90625, -34.46484375, -33.0234375, -31.58203125, -30.140625, -28.69921875, -27.2578125, -25.81640625, -24.375, -22.93359375, -21.4921875, -20.05078125, -18.609375, -17.16796875, -15.7265625, -14.28515625, -12.84375, -11.40234375, -9.9609375, -8.51953125, -7.078125, -5.63671875, -4.1953125, -2.75390625, -1.3125, 0.12890625, 1.5703125, 3.01171875, 4.453125, 5.89453125, 7.3359375, 8.77734375, 10.21875, 11.66015625, 13.1015625, 14.54296875, 15.984375, 17.42578125, 18.8671875, 20.30859375, 21.75, 23.19140625, 24.6328125, 26.07421875, 27.515625, 28.95703125, 30.3984375, 31.83984375, 33.28125, 34.72265625, 36.1640625, 37.60546875, 39.046875, 40.48828125, 41.9296875, 43.37109375, 44.8125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 5.0, 9.0, 9.0, 11.0, 14.0, 24.0, 36.0, 55.0, 78.0, 130.0, 197.0, 310.0, 439.0, 725.0, 1175.0, 1844.0, 2869.0, 4370.0, 7260.0, 11700.0, 20378.0, 44779.0, 865793.0, 38897.0, 18256.0, 11023.0, 6776.0, 4132.0, 2630.0, 1626.0, 1069.0, 658.0, 431.0, 289.0, 193.0, 119.0, 86.0, 61.0, 34.0, 27.0, 14.0, 8.0, 6.0, 5.0, 2.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.96875, -33.952880859375, -32.93701171875, -31.921142578125, -30.9052734375, -29.889404296875, -28.87353515625, -27.857666015625, -26.841796875, -25.825927734375, -24.81005859375, -23.794189453125, -22.7783203125, -21.762451171875, -20.74658203125, -19.730712890625, -18.71484375, -17.698974609375, -16.68310546875, -15.667236328125, -14.6513671875, -13.635498046875, -12.61962890625, -11.603759765625, -10.587890625, -9.572021484375, -8.55615234375, -7.540283203125, -6.5244140625, -5.508544921875, -4.49267578125, -3.476806640625, -2.4609375, -1.445068359375, -0.42919921875, 0.586669921875, 1.6025390625, 2.618408203125, 3.63427734375, 4.650146484375, 5.666015625, 6.681884765625, 7.69775390625, 8.713623046875, 9.7294921875, 10.745361328125, 11.76123046875, 12.777099609375, 13.79296875, 14.808837890625, 15.82470703125, 16.840576171875, 17.8564453125, 18.872314453125, 19.88818359375, 20.904052734375, 21.919921875, 22.935791015625, 23.95166015625, 24.967529296875, 25.9833984375, 26.999267578125, 28.01513671875, 29.031005859375, 30.046875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 6.0, 8.0, 1.0, 1.0, 8.0, 13.0, 10.0, 14.0, 16.0, 14.0, 21.0, 27.0, 17.0, 18.0, 25.0, 35.0, 34.0, 41.0, 28.0, 43.0, 43.0, 38.0, 42.0, 40.0, 44.0, 46.0, 30.0, 44.0, 25.0, 32.0, 31.0, 31.0, 29.0, 21.0, 27.0, 20.0, 15.0, 11.0, 10.0, 8.0, 14.0, 6.0, 3.0, 7.0, 4.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.390625, -24.461669921875, -23.53271484375, -22.603759765625, -21.6748046875, -20.745849609375, -19.81689453125, -18.887939453125, -17.958984375, -17.030029296875, -16.10107421875, -15.172119140625, -14.2431640625, -13.314208984375, -12.38525390625, -11.456298828125, -10.52734375, -9.598388671875, -8.66943359375, -7.740478515625, -6.8115234375, -5.882568359375, -4.95361328125, -4.024658203125, -3.095703125, -2.166748046875, -1.23779296875, -0.308837890625, 0.6201171875, 1.549072265625, 2.47802734375, 3.406982421875, 4.3359375, 5.264892578125, 6.19384765625, 7.122802734375, 8.0517578125, 8.980712890625, 9.90966796875, 10.838623046875, 11.767578125, 12.696533203125, 13.62548828125, 14.554443359375, 15.4833984375, 16.412353515625, 17.34130859375, 18.270263671875, 19.19921875, 20.128173828125, 21.05712890625, 21.986083984375, 22.9150390625, 23.843994140625, 24.77294921875, 25.701904296875, 26.630859375, 27.559814453125, 28.48876953125, 29.417724609375, 30.3466796875, 31.275634765625, 32.20458984375, 33.133544921875, 34.0625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 5.0, 5.0, 13.0, 17.0, 13.0, 23.0, 27.0, 70.0, 77.0, 97.0, 161.0, 258.0, 413.0, 596.0, 1006.0, 1743.0, 3253.0, 6485.0, 14478.0, 38888.0, 902275.0, 46548.0, 16354.0, 7347.0, 3500.0, 1938.0, 1038.0, 649.0, 405.0, 305.0, 155.0, 129.0, 85.0, 63.0, 39.0, 30.0, 14.0, 18.0, 10.0, 10.0, 7.0, 2.0, 1.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4931640625, -1.4409027099609375, -1.388641357421875, -1.3363800048828125, -1.28411865234375, -1.2318572998046875, -1.179595947265625, -1.1273345947265625, -1.0750732421875, -1.0228118896484375, -0.970550537109375, -0.9182891845703125, -0.86602783203125, -0.8137664794921875, -0.761505126953125, -0.7092437744140625, -0.656982421875, -0.6047210693359375, -0.552459716796875, -0.5001983642578125, -0.44793701171875, -0.3956756591796875, -0.343414306640625, -0.2911529541015625, -0.2388916015625, -0.1866302490234375, -0.134368896484375, -0.0821075439453125, -0.02984619140625, 0.0224151611328125, 0.074676513671875, 0.1269378662109375, 0.17919921875, 0.2314605712890625, 0.283721923828125, 0.3359832763671875, 0.38824462890625, 0.4405059814453125, 0.492767333984375, 0.5450286865234375, 0.5972900390625, 0.6495513916015625, 0.701812744140625, 0.7540740966796875, 0.80633544921875, 0.8585968017578125, 0.910858154296875, 0.9631195068359375, 1.015380859375, 1.0676422119140625, 1.119903564453125, 1.1721649169921875, 1.22442626953125, 1.2766876220703125, 1.328948974609375, 1.3812103271484375, 1.4334716796875, 1.4857330322265625, 1.537994384765625, 1.5902557373046875, 1.64251708984375, 1.6947784423828125, 1.747039794921875, 1.7993011474609375, 1.8515625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 8.0, 12.0, 15.0, 23.0, 18.0, 31.0, 40.0, 51.0, 61.0, 81.0, 97.0, 100.0, 94.0, 85.0, 55.0, 54.0, 58.0, 32.0, 27.0, 14.0, 11.0, 11.0, 4.0, 4.0, 6.0, 4.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.094839096069336e-05, -3.964453935623169e-05, -3.834068775177002e-05, -3.703683614730835e-05, -3.573298454284668e-05, -3.442913293838501e-05, -3.312528133392334e-05, -3.182142972946167e-05, -3.0517578125e-05, -2.921372652053833e-05, -2.790987491607666e-05, -2.660602331161499e-05, -2.530217170715332e-05, -2.399832010269165e-05, -2.269446849822998e-05, -2.139061689376831e-05, -2.008676528930664e-05, -1.878291368484497e-05, -1.74790620803833e-05, -1.617521047592163e-05, -1.4871358871459961e-05, -1.3567507266998291e-05, -1.2263655662536621e-05, -1.0959804058074951e-05, -9.655952453613281e-06, -8.352100849151611e-06, -7.048249244689941e-06, -5.7443976402282715e-06, -4.4405460357666016e-06, -3.1366944313049316e-06, -1.8328428268432617e-06, -5.289912223815918e-07, 7.748603820800781e-07, 2.078711986541748e-06, 3.382563591003418e-06, 4.686415195465088e-06, 5.990266799926758e-06, 7.294118404388428e-06, 8.597970008850098e-06, 9.901821613311768e-06, 1.1205673217773438e-05, 1.2509524822235107e-05, 1.3813376426696777e-05, 1.5117228031158447e-05, 1.6421079635620117e-05, 1.7724931240081787e-05, 1.9028782844543457e-05, 2.0332634449005127e-05, 2.1636486053466797e-05, 2.2940337657928467e-05, 2.4244189262390137e-05, 2.5548040866851807e-05, 2.6851892471313477e-05, 2.8155744075775146e-05, 2.9459595680236816e-05, 3.0763447284698486e-05, 3.2067298889160156e-05, 3.3371150493621826e-05, 3.4675002098083496e-05, 3.5978853702545166e-05, 3.7282705307006836e-05, 3.8586556911468506e-05, 3.9890408515930176e-05, 4.1194260120391846e-05, 4.2498111724853516e-05]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 8.0, 6.0, 21.0, 27.0, 45.0, 43.0, 71.0, 128.0, 193.0, 280.0, 398.0, 611.0, 981.0, 1428.0, 2172.0, 3281.0, 5195.0, 7875.0, 11963.0, 18333.0, 28705.0, 44873.0, 71100.0, 115924.0, 179768.0, 193263.0, 134834.0, 82225.0, 51181.0, 32739.0, 21089.0, 13784.0, 8914.0, 5883.0, 3780.0, 2617.0, 1644.0, 1059.0, 718.0, 443.0, 354.0, 204.0, 160.0, 80.0, 56.0, 30.0, 30.0, 18.0, 12.0, 5.0, 3.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.62841796875, -0.608245849609375, -0.58807373046875, -0.567901611328125, -0.5477294921875, -0.527557373046875, -0.50738525390625, -0.487213134765625, -0.467041015625, -0.446868896484375, -0.42669677734375, -0.406524658203125, -0.3863525390625, -0.366180419921875, -0.34600830078125, -0.325836181640625, -0.3056640625, -0.285491943359375, -0.26531982421875, -0.245147705078125, -0.2249755859375, -0.204803466796875, -0.18463134765625, -0.164459228515625, -0.144287109375, -0.124114990234375, -0.10394287109375, -0.083770751953125, -0.0635986328125, -0.043426513671875, -0.02325439453125, -0.003082275390625, 0.01708984375, 0.037261962890625, 0.05743408203125, 0.077606201171875, 0.0977783203125, 0.117950439453125, 0.13812255859375, 0.158294677734375, 0.178466796875, 0.198638916015625, 0.21881103515625, 0.238983154296875, 0.2591552734375, 0.279327392578125, 0.29949951171875, 0.319671630859375, 0.33984375, 0.360015869140625, 0.38018798828125, 0.400360107421875, 0.4205322265625, 0.440704345703125, 0.46087646484375, 0.481048583984375, 0.501220703125, 0.521392822265625, 0.54156494140625, 0.561737060546875, 0.5819091796875, 0.602081298828125, 0.62225341796875, 0.642425537109375, 0.66259765625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 4.0, 3.0, 7.0, 14.0, 3.0, 12.0, 9.0, 18.0, 19.0, 15.0, 23.0, 37.0, 37.0, 38.0, 60.0, 80.0, 64.0, 89.0, 85.0, 72.0, 52.0, 47.0, 32.0, 36.0, 30.0, 19.0, 14.0, 8.0, 10.0, 13.0, 9.0, 7.0, 6.0, 5.0, 3.0, 5.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.256591796875, -0.24812698364257812, -0.23966217041015625, -0.23119735717773438, -0.2227325439453125, -0.21426773071289062, -0.20580291748046875, -0.19733810424804688, -0.188873291015625, -0.18040847778320312, -0.17194366455078125, -0.16347885131835938, -0.1550140380859375, -0.14654922485351562, -0.13808441162109375, -0.12961959838867188, -0.12115478515625, -0.11268997192382812, -0.10422515869140625, -0.09576034545898438, -0.0872955322265625, -0.07883071899414062, -0.07036590576171875, -0.061901092529296875, -0.053436279296875, -0.044971466064453125, -0.03650665283203125, -0.028041839599609375, -0.0195770263671875, -0.011112213134765625, -0.00264739990234375, 0.005817413330078125, 0.0142822265625, 0.022747039794921875, 0.03121185302734375, 0.039676666259765625, 0.0481414794921875, 0.056606292724609375, 0.06507110595703125, 0.07353591918945312, 0.082000732421875, 0.09046554565429688, 0.09893035888671875, 0.10739517211914062, 0.1158599853515625, 0.12432479858398438, 0.13278961181640625, 0.14125442504882812, 0.14971923828125, 0.15818405151367188, 0.16664886474609375, 0.17511367797851562, 0.1835784912109375, 0.19204330444335938, 0.20050811767578125, 0.20897293090820312, 0.217437744140625, 0.22590255737304688, 0.23436737060546875, 0.24283218383789062, 0.2512969970703125, 0.2597618103027344, 0.26822662353515625, 0.2766914367675781, 0.28515625]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 6.0, 4.0, 3.0, 17.0, 8.0, 11.0, 25.0, 37.0, 22.0, 46.0, 53.0, 55.0, 61.0, 62.0, 60.0, 54.0, 60.0, 65.0, 67.0, 44.0, 52.0, 32.0, 31.0, 33.0, 25.0, 27.0, 17.0, 9.0, 5.0, 7.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.71311950683594, -37.211341857910156, -35.709564208984375, -34.207786560058594, -32.70600891113281, -31.2042293548584, -29.702449798583984, -28.200672149658203, -26.698894500732422, -25.19711685180664, -23.69533920288086, -22.193559646606445, -20.691781997680664, -19.190004348754883, -17.68822479248047, -16.186447143554688, -14.684669494628906, -13.182891845703125, -11.681113243103027, -10.17933464050293, -8.677556991577148, -7.175778865814209, -5.6740007400512695, -4.172222137451172, -2.6704444885253906, -1.1686663627624512, 0.3331117630004883, 1.8348898887634277, 3.336668014526367, 4.838446140289307, 6.340224266052246, 7.842002868652344, 9.34377670288086, 10.84555435180664, 12.347332954406738, 13.849111557006836, 15.350889205932617, 16.8526668548584, 18.354446411132812, 19.856224060058594, 21.358001708984375, 22.859779357910156, 24.361557006835938, 25.86333656311035, 27.365114212036133, 28.866891860961914, 30.368671417236328, 31.87044906616211, 33.37222671508789, 34.87400436401367, 36.37578201293945, 37.877559661865234, 39.37934112548828, 40.88111877441406, 42.382896423339844, 43.884674072265625, 45.386451721191406, 46.88822937011719, 48.39000701904297, 49.89178466796875, 51.39356231689453, 52.89534378051758, 54.39712142944336, 55.89889907836914, 57.40067672729492]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 2.0, 2.0, 4.0, 4.0, 5.0, 8.0, 8.0, 21.0, 17.0, 22.0, 17.0, 25.0, 24.0, 24.0, 29.0, 38.0, 27.0, 41.0, 47.0, 35.0, 46.0, 52.0, 50.0, 40.0, 44.0, 39.0, 47.0, 33.0, 36.0, 33.0, 23.0, 21.0, 22.0, 29.0, 26.0, 14.0, 8.0, 16.0, 7.0, 8.0, 1.0, 2.0, 5.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-47.40702819824219, -45.967430114746094, -44.527835845947266, -43.08823776245117, -41.648643493652344, -40.20904541015625, -38.769447326660156, -37.32984924316406, -35.890254974365234, -34.45065689086914, -33.01106262207031, -31.57146453857422, -30.131868362426758, -28.692272186279297, -27.252674102783203, -25.813077926635742, -24.37348175048828, -22.93388557434082, -21.49428939819336, -20.054691314697266, -18.615095138549805, -17.175498962402344, -15.735901832580566, -14.296304702758789, -12.856708526611328, -11.417112350463867, -9.97751522064209, -8.537918090820312, -7.098321914672852, -5.658725261688232, -4.219128608703613, -2.779531478881836, -1.3399391174316406, 0.09965753555297852, 1.5392541885375977, 2.978850841522217, 4.418447494506836, 5.858044147491455, 7.297640800476074, 8.737237930297852, 10.176834106445312, 11.616430282592773, 13.05602741241455, 14.495624542236328, 15.935220718383789, 17.37481689453125, 18.814414978027344, 20.254011154174805, 21.693607330322266, 23.133203506469727, 24.572799682617188, 26.01239776611328, 27.451993942260742, 28.891590118408203, 30.331188201904297, 31.770784378051758, 33.21038055419922, 34.64997863769531, 36.08957290649414, 37.529170989990234, 38.96876525878906, 40.408363342285156, 41.84796142578125, 43.287559509277344, 44.72715377807617]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 5.0, 8.0, 10.0, 7.0, 9.0, 22.0, 32.0, 35.0, 48.0, 86.0, 119.0, 166.0, 235.0, 407.0, 565.0, 942.0, 1487.0, 2305.0, 3871.0, 5895.0, 10159.0, 16430.0, 26678.0, 42138.0, 63889.0, 90796.0, 118850.0, 137993.0, 137213.0, 119153.0, 91657.0, 64366.0, 42352.0, 26753.0, 16806.0, 10375.0, 6377.0, 3911.0, 2291.0, 1433.0, 875.0, 583.0, 397.0, 261.0, 192.0, 121.0, 80.0, 58.0, 40.0, 35.0, 10.0, 12.0, 10.0, 5.0, 7.0, 4.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-32.875, -31.81494140625, -30.7548828125, -29.69482421875, -28.634765625, -27.57470703125, -26.5146484375, -25.45458984375, -24.39453125, -23.33447265625, -22.2744140625, -21.21435546875, -20.154296875, -19.09423828125, -18.0341796875, -16.97412109375, -15.9140625, -14.85400390625, -13.7939453125, -12.73388671875, -11.673828125, -10.61376953125, -9.5537109375, -8.49365234375, -7.43359375, -6.37353515625, -5.3134765625, -4.25341796875, -3.193359375, -2.13330078125, -1.0732421875, -0.01318359375, 1.046875, 2.10693359375, 3.1669921875, 4.22705078125, 5.287109375, 6.34716796875, 7.4072265625, 8.46728515625, 9.52734375, 10.58740234375, 11.6474609375, 12.70751953125, 13.767578125, 14.82763671875, 15.8876953125, 16.94775390625, 18.0078125, 19.06787109375, 20.1279296875, 21.18798828125, 22.248046875, 23.30810546875, 24.3681640625, 25.42822265625, 26.48828125, 27.54833984375, 28.6083984375, 29.66845703125, 30.728515625, 31.78857421875, 32.8486328125, 33.90869140625, 34.96875]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 4.0, 1.0, 3.0, 2.0, 5.0, 3.0, 7.0, 7.0, 10.0, 18.0, 19.0, 20.0, 20.0, 23.0, 23.0, 25.0, 28.0, 38.0, 30.0, 39.0, 44.0, 38.0, 50.0, 51.0, 51.0, 41.0, 38.0, 43.0, 48.0, 31.0, 35.0, 35.0, 23.0, 19.0, 24.0, 31.0, 22.0, 12.0, 9.0, 15.0, 9.0, 6.0, 1.0, 3.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-45.5, -44.115234375, -42.73046875, -41.345703125, -39.9609375, -38.576171875, -37.19140625, -35.806640625, -34.421875, -33.037109375, -31.65234375, -30.267578125, -28.8828125, -27.498046875, -26.11328125, -24.728515625, -23.34375, -21.958984375, -20.57421875, -19.189453125, -17.8046875, -16.419921875, -15.03515625, -13.650390625, -12.265625, -10.880859375, -9.49609375, -8.111328125, -6.7265625, -5.341796875, -3.95703125, -2.572265625, -1.1875, 0.197265625, 1.58203125, 2.966796875, 4.3515625, 5.736328125, 7.12109375, 8.505859375, 9.890625, 11.275390625, 12.66015625, 14.044921875, 15.4296875, 16.814453125, 18.19921875, 19.583984375, 20.96875, 22.353515625, 23.73828125, 25.123046875, 26.5078125, 27.892578125, 29.27734375, 30.662109375, 32.046875, 33.431640625, 34.81640625, 36.201171875, 37.5859375, 38.970703125, 40.35546875, 41.740234375, 43.125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [4.0, 4.0, 6.0, 9.0, 14.0, 22.0, 29.0, 29.0, 59.0, 73.0, 97.0, 135.0, 207.0, 305.0, 425.0, 627.0, 903.0, 1385.0, 2101.0, 3037.0, 4643.0, 6909.0, 10535.0, 16413.0, 25373.0, 38371.0, 55711.0, 77814.0, 100566.0, 118583.0, 124739.0, 117067.0, 99288.0, 77039.0, 55018.0, 38190.0, 24893.0, 16511.0, 10569.0, 7040.0, 4578.0, 2991.0, 1976.0, 1311.0, 949.0, 645.0, 420.0, 322.0, 199.0, 141.0, 86.0, 57.0, 55.0, 33.0, 19.0, 18.0, 13.0, 9.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-30.046875, -29.061279296875, -28.07568359375, -27.090087890625, -26.1044921875, -25.118896484375, -24.13330078125, -23.147705078125, -22.162109375, -21.176513671875, -20.19091796875, -19.205322265625, -18.2197265625, -17.234130859375, -16.24853515625, -15.262939453125, -14.27734375, -13.291748046875, -12.30615234375, -11.320556640625, -10.3349609375, -9.349365234375, -8.36376953125, -7.378173828125, -6.392578125, -5.406982421875, -4.42138671875, -3.435791015625, -2.4501953125, -1.464599609375, -0.47900390625, 0.506591796875, 1.4921875, 2.477783203125, 3.46337890625, 4.448974609375, 5.4345703125, 6.420166015625, 7.40576171875, 8.391357421875, 9.376953125, 10.362548828125, 11.34814453125, 12.333740234375, 13.3193359375, 14.304931640625, 15.29052734375, 16.276123046875, 17.26171875, 18.247314453125, 19.23291015625, 20.218505859375, 21.2041015625, 22.189697265625, 23.17529296875, 24.160888671875, 25.146484375, 26.132080078125, 27.11767578125, 28.103271484375, 29.0888671875, 30.074462890625, 31.06005859375, 32.045654296875, 33.03125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 5.0, 3.0, 5.0, 10.0, 10.0, 15.0, 9.0, 11.0, 17.0, 21.0, 20.0, 26.0, 33.0, 24.0, 25.0, 34.0, 39.0, 28.0, 22.0, 38.0, 35.0, 44.0, 40.0, 47.0, 43.0, 38.0, 39.0, 40.0, 32.0, 27.0, 35.0, 20.0, 21.0, 16.0, 24.0, 21.0, 20.0, 9.0, 6.0, 8.0, 6.0, 4.0, 12.0, 6.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0], "bins": [-24.359375, -23.59912109375, -22.8388671875, -22.07861328125, -21.318359375, -20.55810546875, -19.7978515625, -19.03759765625, -18.27734375, -17.51708984375, -16.7568359375, -15.99658203125, -15.236328125, -14.47607421875, -13.7158203125, -12.95556640625, -12.1953125, -11.43505859375, -10.6748046875, -9.91455078125, -9.154296875, -8.39404296875, -7.6337890625, -6.87353515625, -6.11328125, -5.35302734375, -4.5927734375, -3.83251953125, -3.072265625, -2.31201171875, -1.5517578125, -0.79150390625, -0.03125, 0.72900390625, 1.4892578125, 2.24951171875, 3.009765625, 3.77001953125, 4.5302734375, 5.29052734375, 6.05078125, 6.81103515625, 7.5712890625, 8.33154296875, 9.091796875, 9.85205078125, 10.6123046875, 11.37255859375, 12.1328125, 12.89306640625, 13.6533203125, 14.41357421875, 15.173828125, 15.93408203125, 16.6943359375, 17.45458984375, 18.21484375, 18.97509765625, 19.7353515625, 20.49560546875, 21.255859375, 22.01611328125, 22.7763671875, 23.53662109375, 24.296875]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 3.0, 8.0, 12.0, 15.0, 15.0, 32.0, 33.0, 41.0, 60.0, 87.0, 124.0, 161.0, 271.0, 407.0, 636.0, 958.0, 1557.0, 2540.0, 4067.0, 6810.0, 11431.0, 19141.0, 31052.0, 49783.0, 74882.0, 104293.0, 129253.0, 141534.0, 133419.0, 110411.0, 81473.0, 54805.0, 35016.0, 21350.0, 12851.0, 7713.0, 4721.0, 2746.0, 1688.0, 1084.0, 666.0, 433.0, 343.0, 179.0, 148.0, 84.0, 70.0, 51.0, 31.0, 27.0, 8.0, 14.0, 5.0, 6.0, 8.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0], "bins": [-6.90234375, -6.6768798828125, -6.451416015625, -6.2259521484375, -6.00048828125, -5.7750244140625, -5.549560546875, -5.3240966796875, -5.0986328125, -4.8731689453125, -4.647705078125, -4.4222412109375, -4.19677734375, -3.9713134765625, -3.745849609375, -3.5203857421875, -3.294921875, -3.0694580078125, -2.843994140625, -2.6185302734375, -2.39306640625, -2.1676025390625, -1.942138671875, -1.7166748046875, -1.4912109375, -1.2657470703125, -1.040283203125, -0.8148193359375, -0.58935546875, -0.3638916015625, -0.138427734375, 0.0870361328125, 0.3125, 0.5379638671875, 0.763427734375, 0.9888916015625, 1.21435546875, 1.4398193359375, 1.665283203125, 1.8907470703125, 2.1162109375, 2.3416748046875, 2.567138671875, 2.7926025390625, 3.01806640625, 3.2435302734375, 3.468994140625, 3.6944580078125, 3.919921875, 4.1453857421875, 4.370849609375, 4.5963134765625, 4.82177734375, 5.0472412109375, 5.272705078125, 5.4981689453125, 5.7236328125, 5.9490966796875, 6.174560546875, 6.4000244140625, 6.62548828125, 6.8509521484375, 7.076416015625, 7.3018798828125, 7.52734375]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 3.0, 5.0, 4.0, 6.0, 2.0, 4.0, 9.0, 11.0, 11.0, 19.0, 21.0, 24.0, 30.0, 25.0, 25.0, 28.0, 35.0, 39.0, 48.0, 47.0, 50.0, 44.0, 55.0, 60.0, 37.0, 41.0, 39.0, 40.0, 46.0, 33.0, 29.0, 22.0, 24.0, 13.0, 13.0, 8.0, 9.0, 10.0, 6.0, 5.0, 6.0, 4.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0006771087646484375, -0.0006559714674949646, -0.0006348341703414917, -0.0006136968731880188, -0.0005925595760345459, -0.000571422278881073, -0.0005502849817276001, -0.0005291476845741272, -0.0005080103874206543, -0.0004868730902671814, -0.0004657357931137085, -0.0004445984959602356, -0.0004234611988067627, -0.0004023239016532898, -0.0003811866044998169, -0.000360049307346344, -0.0003389120101928711, -0.0003177747130393982, -0.0002966374158859253, -0.0002755001187324524, -0.0002543628215789795, -0.0002332255244255066, -0.0002120882272720337, -0.0001909509301185608, -0.0001698136329650879, -0.000148676335811615, -0.0001275390386581421, -0.00010640174150466919, -8.526444435119629e-05, -6.412714719772339e-05, -4.298985004425049e-05, -2.1852552890777588e-05, -7.152557373046875e-07, 2.0422041416168213e-05, 4.155933856964111e-05, 6.269663572311401e-05, 8.383393287658691e-05, 0.00010497123003005981, 0.00012610852718353271, 0.00014724582433700562, 0.00016838312149047852, 0.00018952041864395142, 0.00021065771579742432, 0.00023179501295089722, 0.0002529323101043701, 0.000274069607257843, 0.0002952069044113159, 0.0003163442015647888, 0.0003374814987182617, 0.0003586187958717346, 0.0003797560930252075, 0.0004008933901786804, 0.0004220306873321533, 0.0004431679844856262, 0.0004643052816390991, 0.000485442578792572, 0.0005065798759460449, 0.0005277171730995178, 0.0005488544702529907, 0.0005699917674064636, 0.0005911290645599365, 0.0006122663617134094, 0.0006334036588668823, 0.0006545409560203552, 0.0006756782531738281]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 8.0, 4.0, 14.0, 13.0, 34.0, 50.0, 67.0, 131.0, 146.0, 239.0, 413.0, 629.0, 930.0, 1336.0, 2094.0, 3351.0, 5213.0, 8323.0, 12956.0, 20083.0, 30864.0, 46514.0, 66941.0, 91662.0, 114270.0, 128104.0, 127583.0, 111225.0, 87359.0, 63217.0, 43649.0, 28910.0, 18839.0, 11997.0, 7699.0, 4885.0, 3141.0, 1968.0, 1325.0, 853.0, 509.0, 340.0, 236.0, 141.0, 106.0, 61.0, 52.0, 25.0, 23.0, 9.0, 7.0, 10.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-7.03515625, -6.81475830078125, -6.5943603515625, -6.37396240234375, -6.153564453125, -5.93316650390625, -5.7127685546875, -5.49237060546875, -5.27197265625, -5.05157470703125, -4.8311767578125, -4.61077880859375, -4.390380859375, -4.16998291015625, -3.9495849609375, -3.72918701171875, -3.5087890625, -3.28839111328125, -3.0679931640625, -2.84759521484375, -2.627197265625, -2.40679931640625, -2.1864013671875, -1.96600341796875, -1.74560546875, -1.52520751953125, -1.3048095703125, -1.08441162109375, -0.864013671875, -0.64361572265625, -0.4232177734375, -0.20281982421875, 0.017578125, 0.23797607421875, 0.4583740234375, 0.67877197265625, 0.899169921875, 1.11956787109375, 1.3399658203125, 1.56036376953125, 1.78076171875, 2.00115966796875, 2.2215576171875, 2.44195556640625, 2.662353515625, 2.88275146484375, 3.1031494140625, 3.32354736328125, 3.5439453125, 3.76434326171875, 3.9847412109375, 4.20513916015625, 4.425537109375, 4.64593505859375, 4.8663330078125, 5.08673095703125, 5.30712890625, 5.52752685546875, 5.7479248046875, 5.96832275390625, 6.188720703125, 6.40911865234375, 6.6295166015625, 6.84991455078125, 7.0703125]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 2.0, 3.0, 7.0, 6.0, 9.0, 9.0, 20.0, 14.0, 25.0, 27.0, 40.0, 35.0, 57.0, 68.0, 49.0, 63.0, 73.0, 73.0, 64.0, 57.0, 48.0, 35.0, 40.0, 29.0, 29.0, 28.0, 28.0, 17.0, 13.0, 6.0, 12.0, 4.0, 5.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1171875, -3.98876953125, -3.8603515625, -3.73193359375, -3.603515625, -3.47509765625, -3.3466796875, -3.21826171875, -3.08984375, -2.96142578125, -2.8330078125, -2.70458984375, -2.576171875, -2.44775390625, -2.3193359375, -2.19091796875, -2.0625, -1.93408203125, -1.8056640625, -1.67724609375, -1.548828125, -1.42041015625, -1.2919921875, -1.16357421875, -1.03515625, -0.90673828125, -0.7783203125, -0.64990234375, -0.521484375, -0.39306640625, -0.2646484375, -0.13623046875, -0.0078125, 0.12060546875, 0.2490234375, 0.37744140625, 0.505859375, 0.63427734375, 0.7626953125, 0.89111328125, 1.01953125, 1.14794921875, 1.2763671875, 1.40478515625, 1.533203125, 1.66162109375, 1.7900390625, 1.91845703125, 2.046875, 2.17529296875, 2.3037109375, 2.43212890625, 2.560546875, 2.68896484375, 2.8173828125, 2.94580078125, 3.07421875, 3.20263671875, 3.3310546875, 3.45947265625, 3.587890625, 3.71630859375, 3.8447265625, 3.97314453125, 4.1015625]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 3.0, 5.0, 6.0, 7.0, 6.0, 9.0, 13.0, 19.0, 28.0, 19.0, 32.0, 38.0, 40.0, 37.0, 40.0, 65.0, 57.0, 55.0, 50.0, 46.0, 49.0, 53.0, 48.0, 42.0, 31.0, 23.0, 29.0, 26.0, 31.0, 29.0, 13.0, 22.0, 6.0, 6.0, 9.0, 1.0, 4.0, 5.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.259735107421875, -32.01853942871094, -30.777347564697266, -29.53615379333496, -28.294960021972656, -27.05376625061035, -25.812572479248047, -24.57137680053711, -23.330184936523438, -22.088991165161133, -20.847797393798828, -19.606603622436523, -18.36540985107422, -17.124216079711914, -15.883021354675293, -14.641827583312988, -13.400632858276367, -12.159439086914062, -10.918245315551758, -9.677051544189453, -8.435857772827148, -7.1946635246276855, -5.953469276428223, -4.712275505065918, -3.4710817337036133, -2.2298879623413086, -0.9886939525604248, 0.252500057220459, 1.4936938285827637, 2.7348875999450684, 3.9760818481445312, 5.217275619506836, 6.458469390869141, 7.699663162231445, 8.94085693359375, 10.182050704956055, 11.42324447631836, 12.664438247680664, 13.905632972717285, 15.14682674407959, 16.388019561767578, 17.629213333129883, 18.870407104492188, 20.111600875854492, 21.352794647216797, 22.5939884185791, 23.835182189941406, 25.076377868652344, 26.31757164001465, 27.558765411376953, 28.799959182739258, 30.041152954101562, 31.282346725463867, 32.52354049682617, 33.76473617553711, 35.00592803955078, 36.24712371826172, 37.488319396972656, 38.72951126098633, 39.970706939697266, 41.21189880371094, 42.453094482421875, 43.69428634643555, 44.935482025146484, 46.176673889160156]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 3.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 5.0, 6.0, 3.0, 11.0, 12.0, 17.0, 17.0, 17.0, 14.0, 17.0, 28.0, 22.0, 29.0, 35.0, 31.0, 31.0, 39.0, 40.0, 44.0, 33.0, 50.0, 43.0, 43.0, 35.0, 41.0, 36.0, 33.0, 32.0, 35.0, 24.0, 27.0, 24.0, 24.0, 16.0, 15.0, 17.0, 13.0, 9.0, 7.0, 10.0, 5.0, 3.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-42.88664245605469, -41.53130340576172, -40.175960540771484, -38.820621490478516, -37.46527862548828, -36.10993957519531, -34.754600524902344, -33.399261474609375, -32.04391860961914, -30.68857765197754, -29.333236694335938, -27.97789764404297, -26.622556686401367, -25.267215728759766, -23.911876678466797, -22.556535720825195, -21.201194763183594, -19.845853805541992, -18.49051284790039, -17.135173797607422, -15.77983283996582, -14.424491882324219, -13.069151878356934, -11.713811874389648, -10.358470916748047, -9.003129959106445, -7.64778995513916, -6.292449474334717, -4.937108993530273, -3.58176851272583, -2.2264280319213867, -0.8710880279541016, 0.4842491149902344, 1.8395895957946777, 3.194930076599121, 4.5502705574035645, 5.905611038208008, 7.260951519012451, 8.616291999816895, 9.97163200378418, 11.326972961425781, 12.682313919067383, 14.037653923034668, 15.392993927001953, 16.748334884643555, 18.103675842285156, 19.459014892578125, 20.814355850219727, 22.169696807861328, 23.52503776550293, 24.88037872314453, 26.2357177734375, 27.5910587310791, 28.946399688720703, 30.301738739013672, 31.657079696655273, 33.012420654296875, 34.367759704589844, 35.72310256958008, 37.07844161987305, 38.43378448486328, 39.78912353515625, 41.14446258544922, 42.49980163574219, 43.85514450073242]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 3.0, 10.0, 15.0, 17.0, 29.0, 53.0, 69.0, 113.0, 175.0, 284.0, 425.0, 642.0, 1010.0, 1542.0, 2388.0, 3654.0, 5613.0, 8491.0, 13438.0, 20937.0, 33806.0, 53299.0, 86000.0, 137167.0, 217500.0, 332693.0, 472661.0, 585277.0, 606504.0, 523858.0, 388892.0, 259744.0, 165460.0, 102679.0, 63817.0, 39642.0, 24788.0, 15196.0, 9648.0, 6234.0, 3820.0, 2428.0, 1568.0, 998.0, 642.0, 401.0, 248.0, 150.0, 95.0, 71.0, 40.0, 20.0, 18.0, 5.0, 12.0, 1.0, 4.0, 2.0, 0.0, 1.0], "bins": [-29.984375, -29.052734375, -28.12109375, -27.189453125, -26.2578125, -25.326171875, -24.39453125, -23.462890625, -22.53125, -21.599609375, -20.66796875, -19.736328125, -18.8046875, -17.873046875, -16.94140625, -16.009765625, -15.078125, -14.146484375, -13.21484375, -12.283203125, -11.3515625, -10.419921875, -9.48828125, -8.556640625, -7.625, -6.693359375, -5.76171875, -4.830078125, -3.8984375, -2.966796875, -2.03515625, -1.103515625, -0.171875, 0.759765625, 1.69140625, 2.623046875, 3.5546875, 4.486328125, 5.41796875, 6.349609375, 7.28125, 8.212890625, 9.14453125, 10.076171875, 11.0078125, 11.939453125, 12.87109375, 13.802734375, 14.734375, 15.666015625, 16.59765625, 17.529296875, 18.4609375, 19.392578125, 20.32421875, 21.255859375, 22.1875, 23.119140625, 24.05078125, 24.982421875, 25.9140625, 26.845703125, 27.77734375, 28.708984375, 29.640625]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 2.0, 8.0, 5.0, 10.0, 13.0, 11.0, 22.0, 14.0, 16.0, 15.0, 30.0, 22.0, 28.0, 38.0, 25.0, 34.0, 37.0, 38.0, 40.0, 40.0, 45.0, 46.0, 41.0, 36.0, 39.0, 33.0, 33.0, 37.0, 32.0, 28.0, 28.0, 20.0, 26.0, 16.0, 15.0, 16.0, 17.0, 8.0, 8.0, 9.0, 7.0, 3.0, 5.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-33.1875, -32.14453125, -31.1015625, -30.05859375, -29.015625, -27.97265625, -26.9296875, -25.88671875, -24.84375, -23.80078125, -22.7578125, -21.71484375, -20.671875, -19.62890625, -18.5859375, -17.54296875, -16.5, -15.45703125, -14.4140625, -13.37109375, -12.328125, -11.28515625, -10.2421875, -9.19921875, -8.15625, -7.11328125, -6.0703125, -5.02734375, -3.984375, -2.94140625, -1.8984375, -0.85546875, 0.1875, 1.23046875, 2.2734375, 3.31640625, 4.359375, 5.40234375, 6.4453125, 7.48828125, 8.53125, 9.57421875, 10.6171875, 11.66015625, 12.703125, 13.74609375, 14.7890625, 15.83203125, 16.875, 17.91796875, 18.9609375, 20.00390625, 21.046875, 22.08984375, 23.1328125, 24.17578125, 25.21875, 26.26171875, 27.3046875, 28.34765625, 29.390625, 30.43359375, 31.4765625, 32.51953125, 33.5625]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 4.0, 3.0, 4.0, 11.0, 23.0, 24.0, 56.0, 72.0, 133.0, 208.0, 289.0, 520.0, 831.0, 1426.0, 2305.0, 3776.0, 6092.0, 10012.0, 16754.0, 27136.0, 45330.0, 71511.0, 113021.0, 173342.0, 254386.0, 347508.0, 439008.0, 504316.0, 514097.0, 464452.0, 378060.0, 279644.0, 194969.0, 129182.0, 82541.0, 52013.0, 32010.0, 19443.0, 11754.0, 6977.0, 4274.0, 2614.0, 1585.0, 974.0, 593.0, 374.0, 245.0, 162.0, 83.0, 68.0, 37.0, 13.0, 12.0, 11.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0], "bins": [-26.765625, -25.93310546875, -25.1005859375, -24.26806640625, -23.435546875, -22.60302734375, -21.7705078125, -20.93798828125, -20.10546875, -19.27294921875, -18.4404296875, -17.60791015625, -16.775390625, -15.94287109375, -15.1103515625, -14.27783203125, -13.4453125, -12.61279296875, -11.7802734375, -10.94775390625, -10.115234375, -9.28271484375, -8.4501953125, -7.61767578125, -6.78515625, -5.95263671875, -5.1201171875, -4.28759765625, -3.455078125, -2.62255859375, -1.7900390625, -0.95751953125, -0.125, 0.70751953125, 1.5400390625, 2.37255859375, 3.205078125, 4.03759765625, 4.8701171875, 5.70263671875, 6.53515625, 7.36767578125, 8.2001953125, 9.03271484375, 9.865234375, 10.69775390625, 11.5302734375, 12.36279296875, 13.1953125, 14.02783203125, 14.8603515625, 15.69287109375, 16.525390625, 17.35791015625, 18.1904296875, 19.02294921875, 19.85546875, 20.68798828125, 21.5205078125, 22.35302734375, 23.185546875, 24.01806640625, 24.8505859375, 25.68310546875, 26.515625]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 5.0, 5.0, 7.0, 6.0, 9.0, 21.0, 16.0, 25.0, 39.0, 34.0, 36.0, 60.0, 78.0, 86.0, 100.0, 115.0, 127.0, 146.0, 177.0, 177.0, 214.0, 229.0, 231.0, 225.0, 230.0, 198.0, 199.0, 191.0, 165.0, 164.0, 131.0, 114.0, 94.0, 88.0, 70.0, 54.0, 55.0, 34.0, 29.0, 19.0, 31.0, 10.0, 3.0, 9.0, 7.0, 6.0, 5.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.1015625, -14.61572265625, -14.1298828125, -13.64404296875, -13.158203125, -12.67236328125, -12.1865234375, -11.70068359375, -11.21484375, -10.72900390625, -10.2431640625, -9.75732421875, -9.271484375, -8.78564453125, -8.2998046875, -7.81396484375, -7.328125, -6.84228515625, -6.3564453125, -5.87060546875, -5.384765625, -4.89892578125, -4.4130859375, -3.92724609375, -3.44140625, -2.95556640625, -2.4697265625, -1.98388671875, -1.498046875, -1.01220703125, -0.5263671875, -0.04052734375, 0.4453125, 0.93115234375, 1.4169921875, 1.90283203125, 2.388671875, 2.87451171875, 3.3603515625, 3.84619140625, 4.33203125, 4.81787109375, 5.3037109375, 5.78955078125, 6.275390625, 6.76123046875, 7.2470703125, 7.73291015625, 8.21875, 8.70458984375, 9.1904296875, 9.67626953125, 10.162109375, 10.64794921875, 11.1337890625, 11.61962890625, 12.10546875, 12.59130859375, 13.0771484375, 13.56298828125, 14.048828125, 14.53466796875, 15.0205078125, 15.50634765625, 15.9921875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 3.0, 5.0, 10.0, 12.0, 9.0, 13.0, 12.0, 16.0, 30.0, 32.0, 38.0, 31.0, 39.0, 41.0, 57.0, 55.0, 37.0, 55.0, 50.0, 63.0, 47.0, 37.0, 38.0, 37.0, 42.0, 33.0, 28.0, 25.0, 14.0, 20.0, 17.0, 15.0, 8.0, 9.0, 8.0, 6.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.20675277709961, -27.105480194091797, -26.004207611083984, -24.902935028076172, -23.80166244506836, -22.700389862060547, -21.599117279052734, -20.497844696044922, -19.39657211303711, -18.295299530029297, -17.194026947021484, -16.092754364013672, -14.99148178100586, -13.890209197998047, -12.788935661315918, -11.687663078308105, -10.586389541625977, -9.485116958618164, -8.383844375610352, -7.282571315765381, -6.181298732757568, -5.080026149749756, -3.978753089904785, -2.8774805068969727, -1.7762079238891602, -0.6749352216720581, 0.42633748054504395, 1.5276103019714355, 2.628882884979248, 3.7301554679870605, 4.831428527832031, 5.932701110839844, 7.033973693847656, 8.135246276855469, 9.236518859863281, 10.337791442871094, 11.439064025878906, 12.540336608886719, 13.641610145568848, 14.74288272857666, 15.844155311584473, 16.9454288482666, 18.046701431274414, 19.147974014282227, 20.24924659729004, 21.35051918029785, 22.451791763305664, 23.553064346313477, 24.65433692932129, 25.7556095123291, 26.856882095336914, 27.958154678344727, 29.05942726135254, 30.16069984436035, 31.261974334716797, 32.36324691772461, 33.46451950073242, 34.565792083740234, 35.66706466674805, 36.76833724975586, 37.86960983276367, 38.970882415771484, 40.0721549987793, 41.17342758178711, 42.27470016479492]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 4.0, 2.0, 6.0, 8.0, 10.0, 11.0, 11.0, 5.0, 17.0, 16.0, 20.0, 28.0, 23.0, 31.0, 29.0, 30.0, 31.0, 39.0, 46.0, 30.0, 31.0, 40.0, 37.0, 47.0, 46.0, 53.0, 47.0, 37.0, 29.0, 27.0, 35.0, 24.0, 22.0, 22.0, 21.0, 22.0, 15.0, 15.0, 9.0, 10.0, 7.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-40.44240951538086, -39.20189666748047, -37.96138381958008, -36.72086715698242, -35.48035430908203, -34.23984146118164, -32.99932861328125, -31.75881576538086, -30.518301010131836, -29.277788162231445, -28.037273406982422, -26.79676055908203, -25.55624771118164, -24.315732955932617, -23.075220108032227, -21.834705352783203, -20.594192504882812, -19.353679656982422, -18.1131649017334, -16.872652053833008, -15.6321382522583, -14.391624450683594, -13.151111602783203, -11.910597801208496, -10.670083999633789, -9.429570198059082, -8.189056396484375, -6.948543548583984, -5.708029747009277, -4.46751594543457, -3.2270026206970215, -1.9864892959594727, -0.7459716796875, 0.49454188346862793, 1.7350554466247559, 2.975569009780884, 4.216082572937012, 5.456596374511719, 6.697109699249268, 7.937623023986816, 9.178136825561523, 10.41865062713623, 11.659164428710938, 12.899677276611328, 14.140191078186035, 15.380704879760742, 16.621217727661133, 17.861732482910156, 19.102245330810547, 20.342758178710938, 21.58327293395996, 22.82378578186035, 24.064300537109375, 25.304813385009766, 26.545326232910156, 27.785839080810547, 29.02635383605957, 30.26686668395996, 31.507381439208984, 32.747894287109375, 33.988407135009766, 35.228919982910156, 36.46943664550781, 37.7099494934082, 38.950462341308594]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 3.0, 9.0, 11.0, 15.0, 26.0, 32.0, 59.0, 105.0, 119.0, 211.0, 291.0, 460.0, 770.0, 1119.0, 1917.0, 2830.0, 4555.0, 7071.0, 11550.0, 17742.0, 27648.0, 42298.0, 61391.0, 86292.0, 110955.0, 129154.0, 130617.0, 116505.0, 92703.0, 68433.0, 46808.0, 31248.0, 20308.0, 12930.0, 8264.0, 5171.0, 3283.0, 2036.0, 1316.0, 837.0, 502.0, 346.0, 227.0, 135.0, 86.0, 66.0, 44.0, 21.0, 20.0, 13.0, 5.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.34375, -9.0230712890625, -8.702392578125, -8.3817138671875, -8.06103515625, -7.7403564453125, -7.419677734375, -7.0989990234375, -6.7783203125, -6.4576416015625, -6.136962890625, -5.8162841796875, -5.49560546875, -5.1749267578125, -4.854248046875, -4.5335693359375, -4.212890625, -3.8922119140625, -3.571533203125, -3.2508544921875, -2.93017578125, -2.6094970703125, -2.288818359375, -1.9681396484375, -1.6474609375, -1.3267822265625, -1.006103515625, -0.6854248046875, -0.36474609375, -0.0440673828125, 0.276611328125, 0.5972900390625, 0.91796875, 1.2386474609375, 1.559326171875, 1.8800048828125, 2.20068359375, 2.5213623046875, 2.842041015625, 3.1627197265625, 3.4833984375, 3.8040771484375, 4.124755859375, 4.4454345703125, 4.76611328125, 5.0867919921875, 5.407470703125, 5.7281494140625, 6.048828125, 6.3695068359375, 6.690185546875, 7.0108642578125, 7.33154296875, 7.6522216796875, 7.972900390625, 8.2935791015625, 8.6142578125, 8.9349365234375, 9.255615234375, 9.5762939453125, 9.89697265625, 10.2176513671875, 10.538330078125, 10.8590087890625, 11.1796875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 4.0, 1.0, 7.0, 8.0, 9.0, 11.0, 10.0, 7.0, 18.0, 14.0, 21.0, 25.0, 24.0, 33.0, 29.0, 30.0, 29.0, 44.0, 40.0, 33.0, 31.0, 38.0, 37.0, 49.0, 50.0, 48.0, 44.0, 41.0, 28.0, 25.0, 31.0, 29.0, 23.0, 22.0, 20.0, 22.0, 15.0, 16.0, 9.0, 11.0, 5.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-39.40625, -38.189453125, -36.97265625, -35.755859375, -34.5390625, -33.322265625, -32.10546875, -30.888671875, -29.671875, -28.455078125, -27.23828125, -26.021484375, -24.8046875, -23.587890625, -22.37109375, -21.154296875, -19.9375, -18.720703125, -17.50390625, -16.287109375, -15.0703125, -13.853515625, -12.63671875, -11.419921875, -10.203125, -8.986328125, -7.76953125, -6.552734375, -5.3359375, -4.119140625, -2.90234375, -1.685546875, -0.46875, 0.748046875, 1.96484375, 3.181640625, 4.3984375, 5.615234375, 6.83203125, 8.048828125, 9.265625, 10.482421875, 11.69921875, 12.916015625, 14.1328125, 15.349609375, 16.56640625, 17.783203125, 19.0, 20.216796875, 21.43359375, 22.650390625, 23.8671875, 25.083984375, 26.30078125, 27.517578125, 28.734375, 29.951171875, 31.16796875, 32.384765625, 33.6015625, 34.818359375, 36.03515625, 37.251953125, 38.46875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 6.0, 6.0, 11.0, 6.0, 19.0, 24.0, 36.0, 65.0, 81.0, 142.0, 190.0, 237.0, 430.0, 637.0, 960.0, 1604.0, 2443.0, 3798.0, 5949.0, 9457.0, 15342.0, 28820.0, 836484.0, 77704.0, 25681.0, 14084.0, 8747.0, 5635.0, 3525.0, 2245.0, 1446.0, 954.0, 624.0, 404.0, 231.0, 169.0, 124.0, 81.0, 44.0, 32.0, 28.0, 20.0, 13.0, 5.0, 5.0, 3.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-27.359375, -26.50244140625, -25.6455078125, -24.78857421875, -23.931640625, -23.07470703125, -22.2177734375, -21.36083984375, -20.50390625, -19.64697265625, -18.7900390625, -17.93310546875, -17.076171875, -16.21923828125, -15.3623046875, -14.50537109375, -13.6484375, -12.79150390625, -11.9345703125, -11.07763671875, -10.220703125, -9.36376953125, -8.5068359375, -7.64990234375, -6.79296875, -5.93603515625, -5.0791015625, -4.22216796875, -3.365234375, -2.50830078125, -1.6513671875, -0.79443359375, 0.0625, 0.91943359375, 1.7763671875, 2.63330078125, 3.490234375, 4.34716796875, 5.2041015625, 6.06103515625, 6.91796875, 7.77490234375, 8.6318359375, 9.48876953125, 10.345703125, 11.20263671875, 12.0595703125, 12.91650390625, 13.7734375, 14.63037109375, 15.4873046875, 16.34423828125, 17.201171875, 18.05810546875, 18.9150390625, 19.77197265625, 20.62890625, 21.48583984375, 22.3427734375, 23.19970703125, 24.056640625, 24.91357421875, 25.7705078125, 26.62744140625, 27.484375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 1.0, 0.0, 3.0, 3.0, 8.0, 5.0, 9.0, 4.0, 10.0, 11.0, 15.0, 20.0, 22.0, 17.0, 20.0, 30.0, 37.0, 44.0, 28.0, 39.0, 39.0, 48.0, 46.0, 46.0, 50.0, 43.0, 58.0, 49.0, 36.0, 32.0, 30.0, 38.0, 21.0, 27.0, 18.0, 20.0, 22.0, 18.0, 9.0, 7.0, 6.0, 8.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-28.984375, -28.09228515625, -27.2001953125, -26.30810546875, -25.416015625, -24.52392578125, -23.6318359375, -22.73974609375, -21.84765625, -20.95556640625, -20.0634765625, -19.17138671875, -18.279296875, -17.38720703125, -16.4951171875, -15.60302734375, -14.7109375, -13.81884765625, -12.9267578125, -12.03466796875, -11.142578125, -10.25048828125, -9.3583984375, -8.46630859375, -7.57421875, -6.68212890625, -5.7900390625, -4.89794921875, -4.005859375, -3.11376953125, -2.2216796875, -1.32958984375, -0.4375, 0.45458984375, 1.3466796875, 2.23876953125, 3.130859375, 4.02294921875, 4.9150390625, 5.80712890625, 6.69921875, 7.59130859375, 8.4833984375, 9.37548828125, 10.267578125, 11.15966796875, 12.0517578125, 12.94384765625, 13.8359375, 14.72802734375, 15.6201171875, 16.51220703125, 17.404296875, 18.29638671875, 19.1884765625, 20.08056640625, 20.97265625, 21.86474609375, 22.7568359375, 23.64892578125, 24.541015625, 25.43310546875, 26.3251953125, 27.21728515625, 28.109375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 14.0, 13.0, 17.0, 15.0, 25.0, 22.0, 53.0, 96.0, 99.0, 139.0, 232.0, 285.0, 454.0, 736.0, 1168.0, 1944.0, 3438.0, 6938.0, 15476.0, 42834.0, 903631.0, 40653.0, 15027.0, 6632.0, 3421.0, 1929.0, 1119.0, 695.0, 442.0, 316.0, 198.0, 144.0, 98.0, 74.0, 47.0, 47.0, 20.0, 22.0, 13.0, 11.0, 4.0, 4.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.56640625, -1.5166473388671875, -1.466888427734375, -1.4171295166015625, -1.36737060546875, -1.3176116943359375, -1.267852783203125, -1.2180938720703125, -1.1683349609375, -1.1185760498046875, -1.068817138671875, -1.0190582275390625, -0.96929931640625, -0.9195404052734375, -0.869781494140625, -0.8200225830078125, -0.770263671875, -0.7205047607421875, -0.670745849609375, -0.6209869384765625, -0.57122802734375, -0.5214691162109375, -0.471710205078125, -0.4219512939453125, -0.3721923828125, -0.3224334716796875, -0.272674560546875, -0.2229156494140625, -0.17315673828125, -0.1233978271484375, -0.073638916015625, -0.0238800048828125, 0.02587890625, 0.0756378173828125, 0.125396728515625, 0.1751556396484375, 0.22491455078125, 0.2746734619140625, 0.324432373046875, 0.3741912841796875, 0.4239501953125, 0.4737091064453125, 0.523468017578125, 0.5732269287109375, 0.62298583984375, 0.6727447509765625, 0.722503662109375, 0.7722625732421875, 0.822021484375, 0.8717803955078125, 0.921539306640625, 0.9712982177734375, 1.02105712890625, 1.0708160400390625, 1.120574951171875, 1.1703338623046875, 1.2200927734375, 1.2698516845703125, 1.319610595703125, 1.3693695068359375, 1.41912841796875, 1.4688873291015625, 1.518646240234375, 1.5684051513671875, 1.6181640625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 7.0, 3.0, 3.0, 10.0, 7.0, 13.0, 13.0, 18.0, 24.0, 38.0, 45.0, 46.0, 55.0, 43.0, 73.0, 51.0, 62.0, 58.0, 49.0, 61.0, 47.0, 57.0, 39.0, 37.0, 31.0, 18.0, 21.0, 15.0, 10.0, 13.0, 10.0, 8.0, 4.0, 4.0, 1.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3543834686279297e-05, -2.2757798433303833e-05, -2.197176218032837e-05, -2.1185725927352905e-05, -2.039968967437744e-05, -1.9613653421401978e-05, -1.8827617168426514e-05, -1.804158091545105e-05, -1.7255544662475586e-05, -1.6469508409500122e-05, -1.5683472156524658e-05, -1.4897435903549194e-05, -1.411139965057373e-05, -1.3325363397598267e-05, -1.2539327144622803e-05, -1.1753290891647339e-05, -1.0967254638671875e-05, -1.0181218385696411e-05, -9.395182132720947e-06, -8.609145879745483e-06, -7.82310962677002e-06, -7.037073373794556e-06, -6.251037120819092e-06, -5.465000867843628e-06, -4.678964614868164e-06, -3.8929283618927e-06, -3.1068921089172363e-06, -2.3208558559417725e-06, -1.5348196029663086e-06, -7.487833499908447e-07, 3.725290298461914e-08, 8.23289155960083e-07, 1.6093254089355469e-06, 2.3953616619110107e-06, 3.1813979148864746e-06, 3.9674341678619385e-06, 4.753470420837402e-06, 5.539506673812866e-06, 6.32554292678833e-06, 7.111579179763794e-06, 7.897615432739258e-06, 8.683651685714722e-06, 9.469687938690186e-06, 1.025572419166565e-05, 1.1041760444641113e-05, 1.1827796697616577e-05, 1.2613832950592041e-05, 1.3399869203567505e-05, 1.4185905456542969e-05, 1.4971941709518433e-05, 1.5757977962493896e-05, 1.654401421546936e-05, 1.7330050468444824e-05, 1.8116086721420288e-05, 1.8902122974395752e-05, 1.9688159227371216e-05, 2.047419548034668e-05, 2.1260231733322144e-05, 2.2046267986297607e-05, 2.283230423927307e-05, 2.3618340492248535e-05, 2.4404376745224e-05, 2.5190412998199463e-05, 2.5976449251174927e-05, 2.676248550415039e-05]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 2.0, 11.0, 6.0, 16.0, 20.0, 26.0, 34.0, 58.0, 63.0, 125.0, 141.0, 230.0, 352.0, 574.0, 818.0, 1311.0, 1966.0, 3145.0, 4897.0, 7862.0, 12652.0, 20179.0, 33092.0, 55302.0, 94959.0, 162723.0, 218004.0, 173739.0, 103082.0, 59615.0, 35129.0, 21787.0, 13411.0, 8387.0, 5388.0, 3308.0, 2195.0, 1324.0, 950.0, 536.0, 357.0, 248.0, 171.0, 108.0, 82.0, 50.0, 49.0, 29.0, 16.0, 11.0, 9.0, 6.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.59521484375, -0.57574462890625, -0.5562744140625, -0.53680419921875, -0.517333984375, -0.49786376953125, -0.4783935546875, -0.45892333984375, -0.439453125, -0.41998291015625, -0.4005126953125, -0.38104248046875, -0.361572265625, -0.34210205078125, -0.3226318359375, -0.30316162109375, -0.28369140625, -0.26422119140625, -0.2447509765625, -0.22528076171875, -0.205810546875, -0.18634033203125, -0.1668701171875, -0.14739990234375, -0.1279296875, -0.10845947265625, -0.0889892578125, -0.06951904296875, -0.050048828125, -0.03057861328125, -0.0111083984375, 0.00836181640625, 0.02783203125, 0.04730224609375, 0.0667724609375, 0.08624267578125, 0.105712890625, 0.12518310546875, 0.1446533203125, 0.16412353515625, 0.18359375, 0.20306396484375, 0.2225341796875, 0.24200439453125, 0.261474609375, 0.28094482421875, 0.3004150390625, 0.31988525390625, 0.33935546875, 0.35882568359375, 0.3782958984375, 0.39776611328125, 0.417236328125, 0.43670654296875, 0.4561767578125, 0.47564697265625, 0.4951171875, 0.51458740234375, 0.5340576171875, 0.55352783203125, 0.572998046875, 0.59246826171875, 0.6119384765625, 0.63140869140625, 0.65087890625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 5.0, 5.0, 5.0, 7.0, 4.0, 11.0, 15.0, 14.0, 16.0, 17.0, 16.0, 32.0, 34.0, 47.0, 53.0, 74.0, 70.0, 69.0, 66.0, 78.0, 66.0, 46.0, 47.0, 35.0, 32.0, 33.0, 16.0, 20.0, 14.0, 12.0, 9.0, 7.0, 8.0, 1.0, 4.0, 3.0, 3.0, 0.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.22412109375, -0.21709251403808594, -0.21006393432617188, -0.2030353546142578, -0.19600677490234375, -0.1889781951904297, -0.18194961547851562, -0.17492103576660156, -0.1678924560546875, -0.16086387634277344, -0.15383529663085938, -0.1468067169189453, -0.13977813720703125, -0.1327495574951172, -0.12572097778320312, -0.11869239807128906, -0.111663818359375, -0.10463523864746094, -0.09760665893554688, -0.09057807922363281, -0.08354949951171875, -0.07652091979980469, -0.06949234008789062, -0.06246376037597656, -0.0554351806640625, -0.04840660095214844, -0.041378021240234375, -0.03434944152832031, -0.02732086181640625, -0.020292282104492188, -0.013263702392578125, -0.0062351226806640625, 0.00079345703125, 0.007822036743164062, 0.014850616455078125, 0.021879196166992188, 0.02890777587890625, 0.03593635559082031, 0.042964935302734375, 0.04999351501464844, 0.0570220947265625, 0.06405067443847656, 0.07107925415039062, 0.07810783386230469, 0.08513641357421875, 0.09216499328613281, 0.09919357299804688, 0.10622215270996094, 0.113250732421875, 0.12027931213378906, 0.12730789184570312, 0.1343364715576172, 0.14136505126953125, 0.1483936309814453, 0.15542221069335938, 0.16245079040527344, 0.1694793701171875, 0.17650794982910156, 0.18353652954101562, 0.1905651092529297, 0.19759368896484375, 0.2046222686767578, 0.21165084838867188, 0.21867942810058594, 0.2257080078125]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 6.0, 2.0, 5.0, 5.0, 10.0, 14.0, 11.0, 16.0, 15.0, 19.0, 40.0, 29.0, 39.0, 40.0, 39.0, 53.0, 49.0, 48.0, 43.0, 56.0, 44.0, 58.0, 37.0, 48.0, 28.0, 55.0, 35.0, 20.0, 25.0, 24.0, 18.0, 20.0, 9.0, 11.0, 5.0, 9.0, 2.0, 9.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.44515037536621, -26.37285614013672, -25.30056381225586, -24.228269577026367, -23.155975341796875, -22.083681106567383, -21.01138687133789, -19.93909454345703, -18.86680030822754, -17.794506072998047, -16.722213745117188, -15.649919509887695, -14.577625274658203, -13.505331039428711, -12.433037757873535, -11.36074447631836, -10.288450241088867, -9.216156005859375, -8.1438627243042, -7.071568965911865, -5.999275207519531, -4.926981449127197, -3.8546876907348633, -2.7823939323425293, -1.7101001739501953, -0.6378064155578613, 0.43448734283447266, 1.5067811012268066, 2.5790748596191406, 3.6513686180114746, 4.723662376403809, 5.795956134796143, 6.868247985839844, 7.940541744232178, 9.012835502624512, 10.085128784179688, 11.15742301940918, 12.229717254638672, 13.302010536193848, 14.374303817749023, 15.446598052978516, 16.518892288208008, 17.5911865234375, 18.66347885131836, 19.73577308654785, 20.808067321777344, 21.880359649658203, 22.952653884887695, 24.024948120117188, 25.09724235534668, 26.169536590576172, 27.24182891845703, 28.314123153686523, 29.386417388916016, 30.458709716796875, 31.531003952026367, 32.60329818725586, 33.67559051513672, 34.747886657714844, 35.8201789855957, 36.89247131347656, 37.96476745605469, 39.03705978393555, 40.10935592651367, 41.18164825439453]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 7.0, 8.0, 10.0, 10.0, 11.0, 7.0, 17.0, 15.0, 20.0, 28.0, 22.0, 32.0, 29.0, 32.0, 30.0, 43.0, 40.0, 33.0, 30.0, 38.0, 38.0, 49.0, 48.0, 48.0, 44.0, 42.0, 28.0, 24.0, 33.0, 27.0, 24.0, 21.0, 20.0, 22.0, 16.0, 15.0, 8.0, 12.0, 5.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-39.309913635253906, -38.09489440917969, -36.879878997802734, -35.664859771728516, -34.44984436035156, -33.234825134277344, -32.01980972290039, -30.804790496826172, -29.589773178100586, -28.374755859375, -27.159738540649414, -25.944721221923828, -24.72970199584961, -23.514686584472656, -22.299667358398438, -21.08465003967285, -19.869632720947266, -18.65461540222168, -17.439598083496094, -16.224580764770508, -15.009562492370605, -13.79454517364502, -12.579526901245117, -11.364509582519531, -10.149492263793945, -8.93447494506836, -7.719457149505615, -6.504439353942871, -5.289422035217285, -4.074404716491699, -2.859386920928955, -1.644369125366211, -0.429351806640625, 0.78566575050354, 2.000683307647705, 3.21570086479187, 4.430718421936035, 5.645735740661621, 6.860753536224365, 8.07577133178711, 9.290788650512695, 10.505805969238281, 11.720823287963867, 12.93584156036377, 14.150858879089355, 15.365876197814941, 16.580894470214844, 17.79591178894043, 19.010929107666016, 20.2259464263916, 21.440963745117188, 22.655981063842773, 23.87099838256836, 25.086017608642578, 26.301034927368164, 27.51605224609375, 28.731069564819336, 29.946086883544922, 31.161104202270508, 32.376121520996094, 33.59114074707031, 34.806156158447266, 36.021175384521484, 37.23619079589844, 38.451210021972656]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 5.0, 11.0, 16.0, 19.0, 34.0, 51.0, 79.0, 118.0, 182.0, 254.0, 403.0, 646.0, 1050.0, 1631.0, 2610.0, 4321.0, 6974.0, 11591.0, 18616.0, 29403.0, 44946.0, 65647.0, 90510.0, 113146.0, 127503.0, 128154.0, 114129.0, 92081.0, 67282.0, 46520.0, 30328.0, 19027.0, 12035.0, 7356.0, 4549.0, 2800.0, 1676.0, 1044.0, 626.0, 404.0, 310.0, 160.0, 99.0, 64.0, 53.0, 37.0, 18.0, 20.0, 6.0, 6.0, 5.0, 2.0, 3.0, 4.0, 0.0, 2.0], "bins": [-29.40625, -28.51611328125, -27.6259765625, -26.73583984375, -25.845703125, -24.95556640625, -24.0654296875, -23.17529296875, -22.28515625, -21.39501953125, -20.5048828125, -19.61474609375, -18.724609375, -17.83447265625, -16.9443359375, -16.05419921875, -15.1640625, -14.27392578125, -13.3837890625, -12.49365234375, -11.603515625, -10.71337890625, -9.8232421875, -8.93310546875, -8.04296875, -7.15283203125, -6.2626953125, -5.37255859375, -4.482421875, -3.59228515625, -2.7021484375, -1.81201171875, -0.921875, -0.03173828125, 0.8583984375, 1.74853515625, 2.638671875, 3.52880859375, 4.4189453125, 5.30908203125, 6.19921875, 7.08935546875, 7.9794921875, 8.86962890625, 9.759765625, 10.64990234375, 11.5400390625, 12.43017578125, 13.3203125, 14.21044921875, 15.1005859375, 15.99072265625, 16.880859375, 17.77099609375, 18.6611328125, 19.55126953125, 20.44140625, 21.33154296875, 22.2216796875, 23.11181640625, 24.001953125, 24.89208984375, 25.7822265625, 26.67236328125, 27.5625]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 5.0, 0.0, 7.0, 8.0, 9.0, 9.0, 14.0, 6.0, 16.0, 15.0, 20.0, 28.0, 22.0, 32.0, 31.0, 27.0, 33.0, 38.0, 44.0, 32.0, 32.0, 36.0, 36.0, 50.0, 48.0, 51.0, 42.0, 39.0, 29.0, 27.0, 33.0, 30.0, 18.0, 23.0, 22.0, 21.0, 12.0, 21.0, 5.0, 14.0, 6.0, 4.0, 2.0, 4.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-37.78125, -36.61669921875, -35.4521484375, -34.28759765625, -33.123046875, -31.95849609375, -30.7939453125, -29.62939453125, -28.46484375, -27.30029296875, -26.1357421875, -24.97119140625, -23.806640625, -22.64208984375, -21.4775390625, -20.31298828125, -19.1484375, -17.98388671875, -16.8193359375, -15.65478515625, -14.490234375, -13.32568359375, -12.1611328125, -10.99658203125, -9.83203125, -8.66748046875, -7.5029296875, -6.33837890625, -5.173828125, -4.00927734375, -2.8447265625, -1.68017578125, -0.515625, 0.64892578125, 1.8134765625, 2.97802734375, 4.142578125, 5.30712890625, 6.4716796875, 7.63623046875, 8.80078125, 9.96533203125, 11.1298828125, 12.29443359375, 13.458984375, 14.62353515625, 15.7880859375, 16.95263671875, 18.1171875, 19.28173828125, 20.4462890625, 21.61083984375, 22.775390625, 23.93994140625, 25.1044921875, 26.26904296875, 27.43359375, 28.59814453125, 29.7626953125, 30.92724609375, 32.091796875, 33.25634765625, 34.4208984375, 35.58544921875, 36.75]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 1.0, 9.0, 14.0, 10.0, 18.0, 39.0, 52.0, 64.0, 102.0, 188.0, 303.0, 424.0, 694.0, 1244.0, 1825.0, 2957.0, 4546.0, 7730.0, 12747.0, 20636.0, 32242.0, 49245.0, 71419.0, 97198.0, 119435.0, 131385.0, 127359.0, 110122.0, 85317.0, 60948.0, 40747.0, 26239.0, 16710.0, 10165.0, 6314.0, 3840.0, 2295.0, 1414.0, 912.0, 597.0, 364.0, 272.0, 149.0, 103.0, 59.0, 38.0, 22.0, 18.0, 17.0, 9.0, 2.0, 0.0, 4.0, 0.0, 1.0], "bins": [-32.03125, -31.110107421875, -30.18896484375, -29.267822265625, -28.3466796875, -27.425537109375, -26.50439453125, -25.583251953125, -24.662109375, -23.740966796875, -22.81982421875, -21.898681640625, -20.9775390625, -20.056396484375, -19.13525390625, -18.214111328125, -17.29296875, -16.371826171875, -15.45068359375, -14.529541015625, -13.6083984375, -12.687255859375, -11.76611328125, -10.844970703125, -9.923828125, -9.002685546875, -8.08154296875, -7.160400390625, -6.2392578125, -5.318115234375, -4.39697265625, -3.475830078125, -2.5546875, -1.633544921875, -0.71240234375, 0.208740234375, 1.1298828125, 2.051025390625, 2.97216796875, 3.893310546875, 4.814453125, 5.735595703125, 6.65673828125, 7.577880859375, 8.4990234375, 9.420166015625, 10.34130859375, 11.262451171875, 12.18359375, 13.104736328125, 14.02587890625, 14.947021484375, 15.8681640625, 16.789306640625, 17.71044921875, 18.631591796875, 19.552734375, 20.473876953125, 21.39501953125, 22.316162109375, 23.2373046875, 24.158447265625, 25.07958984375, 26.000732421875, 26.921875]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 8.0, 5.0, 10.0, 14.0, 11.0, 16.0, 22.0, 20.0, 28.0, 29.0, 34.0, 30.0, 27.0, 38.0, 35.0, 33.0, 31.0, 42.0, 40.0, 46.0, 50.0, 46.0, 43.0, 37.0, 35.0, 31.0, 23.0, 34.0, 23.0, 32.0, 23.0, 20.0, 17.0, 13.0, 13.0, 14.0, 9.0, 8.0, 6.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-24.828125, -24.0517578125, -23.275390625, -22.4990234375, -21.72265625, -20.9462890625, -20.169921875, -19.3935546875, -18.6171875, -17.8408203125, -17.064453125, -16.2880859375, -15.51171875, -14.7353515625, -13.958984375, -13.1826171875, -12.40625, -11.6298828125, -10.853515625, -10.0771484375, -9.30078125, -8.5244140625, -7.748046875, -6.9716796875, -6.1953125, -5.4189453125, -4.642578125, -3.8662109375, -3.08984375, -2.3134765625, -1.537109375, -0.7607421875, 0.015625, 0.7919921875, 1.568359375, 2.3447265625, 3.12109375, 3.8974609375, 4.673828125, 5.4501953125, 6.2265625, 7.0029296875, 7.779296875, 8.5556640625, 9.33203125, 10.1083984375, 10.884765625, 11.6611328125, 12.4375, 13.2138671875, 13.990234375, 14.7666015625, 15.54296875, 16.3193359375, 17.095703125, 17.8720703125, 18.6484375, 19.4248046875, 20.201171875, 20.9775390625, 21.75390625, 22.5302734375, 23.306640625, 24.0830078125, 24.859375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 7.0, 6.0, 11.0, 15.0, 26.0, 33.0, 56.0, 92.0, 121.0, 177.0, 241.0, 379.0, 636.0, 1022.0, 1598.0, 2825.0, 4897.0, 8592.0, 14942.0, 26196.0, 43952.0, 71406.0, 106309.0, 140034.0, 156708.0, 146936.0, 116497.0, 80894.0, 51558.0, 30404.0, 17571.0, 10044.0, 5883.0, 3293.0, 1985.0, 1189.0, 715.0, 477.0, 262.0, 178.0, 130.0, 82.0, 54.0, 40.0, 33.0, 15.0, 15.0, 13.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.82421875, -7.56890869140625, -7.3135986328125, -7.05828857421875, -6.802978515625, -6.54766845703125, -6.2923583984375, -6.03704833984375, -5.78173828125, -5.52642822265625, -5.2711181640625, -5.01580810546875, -4.760498046875, -4.50518798828125, -4.2498779296875, -3.99456787109375, -3.7392578125, -3.48394775390625, -3.2286376953125, -2.97332763671875, -2.718017578125, -2.46270751953125, -2.2073974609375, -1.95208740234375, -1.69677734375, -1.44146728515625, -1.1861572265625, -0.93084716796875, -0.675537109375, -0.42022705078125, -0.1649169921875, 0.09039306640625, 0.345703125, 0.60101318359375, 0.8563232421875, 1.11163330078125, 1.366943359375, 1.62225341796875, 1.8775634765625, 2.13287353515625, 2.38818359375, 2.64349365234375, 2.8988037109375, 3.15411376953125, 3.409423828125, 3.66473388671875, 3.9200439453125, 4.17535400390625, 4.4306640625, 4.68597412109375, 4.9412841796875, 5.19659423828125, 5.451904296875, 5.70721435546875, 5.9625244140625, 6.21783447265625, 6.47314453125, 6.72845458984375, 6.9837646484375, 7.23907470703125, 7.494384765625, 7.74969482421875, 8.0050048828125, 8.26031494140625, 8.515625]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 3.0, 2.0, 9.0, 16.0, 8.0, 15.0, 16.0, 20.0, 33.0, 26.0, 33.0, 29.0, 34.0, 45.0, 51.0, 55.0, 51.0, 59.0, 53.0, 52.0, 52.0, 52.0, 38.0, 49.0, 34.0, 28.0, 22.0, 25.0, 28.0, 16.0, 16.0, 10.0, 5.0, 5.0, 5.0, 4.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0007271766662597656, -0.0007035285234451294, -0.0006798803806304932, -0.0006562322378158569, -0.0006325840950012207, -0.0006089359521865845, -0.0005852878093719482, -0.000561639666557312, -0.0005379915237426758, -0.0005143433809280396, -0.0004906952381134033, -0.0004670470952987671, -0.00044339895248413086, -0.00041975080966949463, -0.0003961026668548584, -0.00037245452404022217, -0.00034880638122558594, -0.0003251582384109497, -0.0003015100955963135, -0.00027786195278167725, -0.000254213809967041, -0.00023056566715240479, -0.00020691752433776855, -0.00018326938152313232, -0.0001596212387084961, -0.00013597309589385986, -0.00011232495307922363, -8.86768102645874e-05, -6.502866744995117e-05, -4.138052463531494e-05, -1.773238182067871e-05, 5.9157609939575195e-06, 2.956390380859375e-05, 5.321204662322998e-05, 7.686018943786621e-05, 0.00010050833225250244, 0.00012415647506713867, 0.0001478046178817749, 0.00017145276069641113, 0.00019510090351104736, 0.0002187490463256836, 0.00024239718914031982, 0.00026604533195495605, 0.0002896934747695923, 0.0003133416175842285, 0.00033698976039886475, 0.000360637903213501, 0.0003842860460281372, 0.00040793418884277344, 0.00043158233165740967, 0.0004552304744720459, 0.00047887861728668213, 0.0005025267601013184, 0.0005261749029159546, 0.0005498230457305908, 0.000573471188545227, 0.0005971193313598633, 0.0006207674741744995, 0.0006444156169891357, 0.000668063759803772, 0.0006917119026184082, 0.0007153600454330444, 0.0007390081882476807, 0.0007626563310623169, 0.0007863044738769531]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 6.0, 12.0, 11.0, 17.0, 19.0, 32.0, 49.0, 67.0, 113.0, 168.0, 242.0, 356.0, 519.0, 829.0, 1211.0, 1767.0, 2750.0, 4072.0, 6089.0, 9239.0, 13795.0, 20768.0, 30656.0, 45175.0, 63668.0, 86980.0, 108001.0, 121623.0, 121876.0, 109251.0, 88989.0, 66084.0, 47047.0, 32272.0, 21947.0, 14220.0, 9469.0, 6373.0, 4262.0, 2855.0, 1845.0, 1223.0, 908.0, 565.0, 384.0, 250.0, 172.0, 111.0, 76.0, 52.0, 34.0, 23.0, 14.0, 15.0, 6.0, 3.0, 4.0, 6.0], "bins": [-7.484375, -7.26458740234375, -7.0447998046875, -6.82501220703125, -6.605224609375, -6.38543701171875, -6.1656494140625, -5.94586181640625, -5.72607421875, -5.50628662109375, -5.2864990234375, -5.06671142578125, -4.846923828125, -4.62713623046875, -4.4073486328125, -4.18756103515625, -3.9677734375, -3.74798583984375, -3.5281982421875, -3.30841064453125, -3.088623046875, -2.86883544921875, -2.6490478515625, -2.42926025390625, -2.20947265625, -1.98968505859375, -1.7698974609375, -1.55010986328125, -1.330322265625, -1.11053466796875, -0.8907470703125, -0.67095947265625, -0.451171875, -0.23138427734375, -0.0115966796875, 0.20819091796875, 0.427978515625, 0.64776611328125, 0.8675537109375, 1.08734130859375, 1.30712890625, 1.52691650390625, 1.7467041015625, 1.96649169921875, 2.186279296875, 2.40606689453125, 2.6258544921875, 2.84564208984375, 3.0654296875, 3.28521728515625, 3.5050048828125, 3.72479248046875, 3.944580078125, 4.16436767578125, 4.3841552734375, 4.60394287109375, 4.82373046875, 5.04351806640625, 5.2633056640625, 5.48309326171875, 5.702880859375, 5.92266845703125, 6.1424560546875, 6.36224365234375, 6.58203125]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 8.0, 3.0, 9.0, 14.0, 15.0, 22.0, 19.0, 29.0, 34.0, 33.0, 31.0, 43.0, 47.0, 68.0, 54.0, 71.0, 54.0, 33.0, 59.0, 50.0, 49.0, 39.0, 43.0, 37.0, 30.0, 17.0, 15.0, 14.0, 17.0, 11.0, 9.0, 10.0, 5.0, 5.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2265625, -4.08880615234375, -3.9510498046875, -3.81329345703125, -3.675537109375, -3.53778076171875, -3.4000244140625, -3.26226806640625, -3.12451171875, -2.98675537109375, -2.8489990234375, -2.71124267578125, -2.573486328125, -2.43572998046875, -2.2979736328125, -2.16021728515625, -2.0224609375, -1.88470458984375, -1.7469482421875, -1.60919189453125, -1.471435546875, -1.33367919921875, -1.1959228515625, -1.05816650390625, -0.92041015625, -0.78265380859375, -0.6448974609375, -0.50714111328125, -0.369384765625, -0.23162841796875, -0.0938720703125, 0.04388427734375, 0.181640625, 0.31939697265625, 0.4571533203125, 0.59490966796875, 0.732666015625, 0.87042236328125, 1.0081787109375, 1.14593505859375, 1.28369140625, 1.42144775390625, 1.5592041015625, 1.69696044921875, 1.834716796875, 1.97247314453125, 2.1102294921875, 2.24798583984375, 2.3857421875, 2.52349853515625, 2.6612548828125, 2.79901123046875, 2.936767578125, 3.07452392578125, 3.2122802734375, 3.35003662109375, 3.48779296875, 3.62554931640625, 3.7633056640625, 3.90106201171875, 4.038818359375, 4.17657470703125, 4.3143310546875, 4.45208740234375, 4.58984375]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 1.0, 5.0, 0.0, 2.0, 7.0, 7.0, 9.0, 8.0, 5.0, 16.0, 13.0, 17.0, 16.0, 16.0, 22.0, 36.0, 32.0, 38.0, 45.0, 38.0, 44.0, 41.0, 41.0, 46.0, 50.0, 51.0, 37.0, 33.0, 43.0, 31.0, 31.0, 27.0, 31.0, 28.0, 22.0, 25.0, 9.0, 16.0, 18.0, 10.0, 9.0, 8.0, 9.0, 1.0, 2.0, 2.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-25.605348587036133, -24.664093017578125, -23.722837448120117, -22.78158187866211, -21.8403263092041, -20.899070739746094, -19.95781707763672, -19.016559600830078, -18.075305938720703, -17.134050369262695, -16.192794799804688, -15.25153923034668, -14.310283660888672, -13.369028091430664, -12.427773475646973, -11.486517906188965, -10.54526138305664, -9.604005813598633, -8.662750244140625, -7.721495151519775, -6.780239582061768, -5.83898401260376, -4.89772891998291, -3.9564733505249023, -3.0152177810668945, -2.0739622116088867, -1.132706880569458, -0.1914515495300293, 0.7498040199279785, 1.6910595893859863, 2.632314682006836, 3.5735702514648438, 4.514827728271484, 5.456083297729492, 6.3973388671875, 7.33859395980835, 8.279850006103516, 9.221105575561523, 10.162360191345215, 11.103615760803223, 12.04487133026123, 12.986126899719238, 13.927382469177246, 14.868637084960938, 15.809892654418945, 16.751148223876953, 17.69240379333496, 18.63365936279297, 19.574914932250977, 20.516170501708984, 21.457426071166992, 22.398681640625, 23.339937210083008, 24.281192779541016, 25.22244644165039, 26.16370391845703, 27.104957580566406, 28.046213150024414, 28.987468719482422, 29.92872428894043, 30.869979858398438, 31.811235427856445, 32.75249099731445, 33.69374465942383, 34.63500213623047]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 4.0, 5.0, 7.0, 8.0, 12.0, 6.0, 10.0, 15.0, 14.0, 18.0, 19.0, 23.0, 25.0, 20.0, 33.0, 30.0, 43.0, 31.0, 37.0, 39.0, 43.0, 41.0, 48.0, 32.0, 34.0, 32.0, 25.0, 46.0, 39.0, 39.0, 28.0, 29.0, 23.0, 19.0, 20.0, 19.0, 16.0, 13.0, 10.0, 13.0, 3.0, 5.0, 9.0, 4.0, 5.0, 2.0, 3.0, 0.0, 1.0, 6.0], "bins": [-43.02202606201172, -41.84022521972656, -40.658424377441406, -39.47662353515625, -38.294822692871094, -37.11302185058594, -35.93122100830078, -34.749420166015625, -33.56761932373047, -32.38581848144531, -31.204017639160156, -30.022216796875, -28.840415954589844, -27.658615112304688, -26.47681427001953, -25.295013427734375, -24.113210678100586, -22.93140983581543, -21.749608993530273, -20.567808151245117, -19.38600730895996, -18.204206466674805, -17.022403717041016, -15.840603828430176, -14.65880298614502, -13.477002143859863, -12.295201301574707, -11.113399505615234, -9.931598663330078, -8.749797821044922, -7.567996978759766, -6.386196136474609, -5.204395294189453, -4.022594451904297, -2.8407933712005615, -1.6589922904968262, -0.4771914482116699, 0.7046093940734863, 1.8864107131958008, 3.068211555480957, 4.250012397766113, 5.4318132400512695, 6.613614082336426, 7.79541540145874, 8.977216720581055, 10.159017562866211, 11.340818405151367, 12.522619247436523, 13.70442008972168, 14.886220932006836, 16.068021774291992, 17.24982261657715, 18.431623458862305, 19.61342430114746, 20.79522705078125, 21.977027893066406, 23.158828735351562, 24.34062957763672, 25.522430419921875, 26.70423126220703, 27.886032104492188, 29.067832946777344, 30.2496337890625, 31.431434631347656, 32.61323547363281]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 5.0, 6.0, 2.0, 7.0, 19.0, 29.0, 43.0, 67.0, 109.0, 158.0, 229.0, 344.0, 555.0, 801.0, 1237.0, 1938.0, 3047.0, 4612.0, 7110.0, 11265.0, 17588.0, 27609.0, 42573.0, 66648.0, 103041.0, 157762.0, 238135.0, 344655.0, 458148.0, 541256.0, 551777.0, 485090.0, 374101.0, 263125.0, 176709.0, 114842.0, 73389.0, 46921.0, 29336.0, 18628.0, 11583.0, 7273.0, 4663.0, 2953.0, 1812.0, 1145.0, 724.0, 443.0, 310.0, 183.0, 120.0, 67.0, 37.0, 27.0, 23.0, 8.0, 5.0, 3.0, 0.0, 1.0, 2.0], "bins": [-26.390625, -25.593505859375, -24.79638671875, -23.999267578125, -23.2021484375, -22.405029296875, -21.60791015625, -20.810791015625, -20.013671875, -19.216552734375, -18.41943359375, -17.622314453125, -16.8251953125, -16.028076171875, -15.23095703125, -14.433837890625, -13.63671875, -12.839599609375, -12.04248046875, -11.245361328125, -10.4482421875, -9.651123046875, -8.85400390625, -8.056884765625, -7.259765625, -6.462646484375, -5.66552734375, -4.868408203125, -4.0712890625, -3.274169921875, -2.47705078125, -1.679931640625, -0.8828125, -0.085693359375, 0.71142578125, 1.508544921875, 2.3056640625, 3.102783203125, 3.89990234375, 4.697021484375, 5.494140625, 6.291259765625, 7.08837890625, 7.885498046875, 8.6826171875, 9.479736328125, 10.27685546875, 11.073974609375, 11.87109375, 12.668212890625, 13.46533203125, 14.262451171875, 15.0595703125, 15.856689453125, 16.65380859375, 17.450927734375, 18.248046875, 19.045166015625, 19.84228515625, 20.639404296875, 21.4365234375, 22.233642578125, 23.03076171875, 23.827880859375, 24.625]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 3.0, 5.0, 9.0, 7.0, 11.0, 6.0, 14.0, 7.0, 16.0, 19.0, 21.0, 24.0, 21.0, 23.0, 28.0, 33.0, 34.0, 41.0, 34.0, 44.0, 38.0, 39.0, 44.0, 41.0, 30.0, 34.0, 28.0, 40.0, 44.0, 36.0, 29.0, 26.0, 23.0, 22.0, 25.0, 12.0, 17.0, 16.0, 9.0, 11.0, 7.0, 4.0, 8.0, 5.0, 4.0, 3.0, 2.0, 2.0, 2.0, 5.0], "bins": [-33.3125, -32.3974609375, -31.482421875, -30.5673828125, -29.65234375, -28.7373046875, -27.822265625, -26.9072265625, -25.9921875, -25.0771484375, -24.162109375, -23.2470703125, -22.33203125, -21.4169921875, -20.501953125, -19.5869140625, -18.671875, -17.7568359375, -16.841796875, -15.9267578125, -15.01171875, -14.0966796875, -13.181640625, -12.2666015625, -11.3515625, -10.4365234375, -9.521484375, -8.6064453125, -7.69140625, -6.7763671875, -5.861328125, -4.9462890625, -4.03125, -3.1162109375, -2.201171875, -1.2861328125, -0.37109375, 0.5439453125, 1.458984375, 2.3740234375, 3.2890625, 4.2041015625, 5.119140625, 6.0341796875, 6.94921875, 7.8642578125, 8.779296875, 9.6943359375, 10.609375, 11.5244140625, 12.439453125, 13.3544921875, 14.26953125, 15.1845703125, 16.099609375, 17.0146484375, 17.9296875, 18.8447265625, 19.759765625, 20.6748046875, 21.58984375, 22.5048828125, 23.419921875, 24.3349609375, 25.25]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 12.0, 9.0, 16.0, 30.0, 40.0, 77.0, 100.0, 195.0, 285.0, 460.0, 654.0, 1058.0, 1642.0, 2460.0, 3671.0, 5854.0, 8817.0, 13620.0, 20711.0, 31118.0, 46257.0, 67673.0, 96828.0, 134727.0, 184135.0, 240126.0, 299532.0, 352588.0, 390380.0, 402440.0, 390349.0, 351216.0, 297416.0, 237798.0, 182228.0, 133798.0, 95306.0, 66841.0, 45325.0, 30319.0, 20230.0, 13344.0, 8619.0, 5782.0, 3629.0, 2299.0, 1575.0, 947.0, 618.0, 415.0, 267.0, 163.0, 98.0, 72.0, 45.0, 38.0, 21.0, 9.0, 8.0, 5.0, 3.0], "bins": [-19.609375, -19.005615234375, -18.40185546875, -17.798095703125, -17.1943359375, -16.590576171875, -15.98681640625, -15.383056640625, -14.779296875, -14.175537109375, -13.57177734375, -12.968017578125, -12.3642578125, -11.760498046875, -11.15673828125, -10.552978515625, -9.94921875, -9.345458984375, -8.74169921875, -8.137939453125, -7.5341796875, -6.930419921875, -6.32666015625, -5.722900390625, -5.119140625, -4.515380859375, -3.91162109375, -3.307861328125, -2.7041015625, -2.100341796875, -1.49658203125, -0.892822265625, -0.2890625, 0.314697265625, 0.91845703125, 1.522216796875, 2.1259765625, 2.729736328125, 3.33349609375, 3.937255859375, 4.541015625, 5.144775390625, 5.74853515625, 6.352294921875, 6.9560546875, 7.559814453125, 8.16357421875, 8.767333984375, 9.37109375, 9.974853515625, 10.57861328125, 11.182373046875, 11.7861328125, 12.389892578125, 12.99365234375, 13.597412109375, 14.201171875, 14.804931640625, 15.40869140625, 16.012451171875, 16.6162109375, 17.219970703125, 17.82373046875, 18.427490234375, 19.03125]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 3.0, 6.0, 7.0, 11.0, 19.0, 19.0, 21.0, 22.0, 45.0, 43.0, 52.0, 74.0, 82.0, 95.0, 107.0, 126.0, 128.0, 188.0, 200.0, 204.0, 203.0, 226.0, 216.0, 233.0, 217.0, 206.0, 195.0, 185.0, 146.0, 116.0, 135.0, 93.0, 87.0, 79.0, 65.0, 47.0, 43.0, 33.0, 20.0, 27.0, 14.0, 17.0, 6.0, 6.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.203125, -13.7591552734375, -13.315185546875, -12.8712158203125, -12.42724609375, -11.9832763671875, -11.539306640625, -11.0953369140625, -10.6513671875, -10.2073974609375, -9.763427734375, -9.3194580078125, -8.87548828125, -8.4315185546875, -7.987548828125, -7.5435791015625, -7.099609375, -6.6556396484375, -6.211669921875, -5.7677001953125, -5.32373046875, -4.8797607421875, -4.435791015625, -3.9918212890625, -3.5478515625, -3.1038818359375, -2.659912109375, -2.2159423828125, -1.77197265625, -1.3280029296875, -0.884033203125, -0.4400634765625, 0.00390625, 0.4478759765625, 0.891845703125, 1.3358154296875, 1.77978515625, 2.2237548828125, 2.667724609375, 3.1116943359375, 3.5556640625, 3.9996337890625, 4.443603515625, 4.8875732421875, 5.33154296875, 5.7755126953125, 6.219482421875, 6.6634521484375, 7.107421875, 7.5513916015625, 7.995361328125, 8.4393310546875, 8.88330078125, 9.3272705078125, 9.771240234375, 10.2152099609375, 10.6591796875, 11.1031494140625, 11.547119140625, 11.9910888671875, 12.43505859375, 12.8790283203125, 13.322998046875, 13.7669677734375, 14.2109375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 4.0, 5.0, 6.0, 6.0, 10.0, 14.0, 14.0, 13.0, 16.0, 21.0, 28.0, 17.0, 42.0, 34.0, 44.0, 49.0, 48.0, 51.0, 64.0, 50.0, 45.0, 34.0, 56.0, 44.0, 45.0, 31.0, 39.0, 35.0, 22.0, 28.0, 18.0, 20.0, 8.0, 8.0, 9.0, 4.0, 6.0, 6.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.74521827697754, -26.74308204650879, -25.74094581604004, -24.738811492919922, -23.736675262451172, -22.734539031982422, -21.732402801513672, -20.730266571044922, -19.728130340576172, -18.725994110107422, -17.723857879638672, -16.721721649169922, -15.719587326049805, -14.717451095581055, -13.715314865112305, -12.713178634643555, -11.711044311523438, -10.708908081054688, -9.706772804260254, -8.704636573791504, -7.702500820159912, -6.70036506652832, -5.69822883605957, -4.6960930824279785, -3.6939573287963867, -2.691821575164795, -1.689685583114624, -0.6875495910644531, 0.31458616256713867, 1.3167219161987305, 2.3188581466674805, 3.3209939002990723, 4.323131561279297, 5.325267314910889, 6.3274030685424805, 7.3295392990112305, 8.331674575805664, 9.333810806274414, 10.335947036743164, 11.338083267211914, 12.340218544006348, 13.342354774475098, 14.344490051269531, 15.346626281738281, 16.34876251220703, 17.35089874267578, 18.35303497314453, 19.35516929626465, 20.3573055267334, 21.35944175720215, 22.3615779876709, 23.363712310791016, 24.365848541259766, 25.367984771728516, 26.370121002197266, 27.372257232666016, 28.374393463134766, 29.376529693603516, 30.378665924072266, 31.380802154541016, 32.382938385009766, 33.38507080078125, 34.38720703125, 35.38934326171875, 36.3914794921875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 5.0, 10.0, 7.0, 5.0, 10.0, 17.0, 18.0, 25.0, 27.0, 27.0, 29.0, 32.0, 42.0, 44.0, 45.0, 37.0, 57.0, 46.0, 38.0, 49.0, 36.0, 40.0, 43.0, 42.0, 47.0, 34.0, 33.0, 33.0, 25.0, 18.0, 15.0, 12.0, 9.0, 7.0, 9.0, 4.0, 7.0, 5.0, 2.0, 4.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.54336166381836, -40.30707550048828, -39.0707893371582, -37.834503173828125, -36.59821701049805, -35.36193084716797, -34.125640869140625, -32.88935470581055, -31.65306854248047, -30.41678237915039, -29.180496215820312, -27.944210052490234, -26.707921981811523, -25.471635818481445, -24.235349655151367, -22.999061584472656, -21.76277732849121, -20.526491165161133, -19.290205001831055, -18.053916931152344, -16.817630767822266, -15.581344604492188, -14.34505844116211, -13.108771324157715, -11.872485160827637, -10.636198997497559, -9.399911880493164, -8.163625717163086, -6.92733907699585, -5.691052436828613, -4.454766273498535, -3.2184791564941406, -1.9821929931640625, -0.7459064722061157, 0.49038004875183105, 1.7266664505004883, 2.9629530906677246, 4.199239730834961, 5.435525894165039, 6.671813011169434, 7.908099174499512, 9.14438533782959, 10.380672454833984, 11.616958618164062, 12.85324478149414, 14.089531898498535, 15.325818061828613, 16.562105178833008, 17.798391342163086, 19.034677505493164, 20.270963668823242, 21.507251739501953, 22.74353790283203, 23.97982406616211, 25.216110229492188, 26.452396392822266, 27.688682556152344, 28.924968719482422, 30.1612548828125, 31.397541046142578, 32.633827209472656, 33.8701171875, 35.10639953613281, 36.342689514160156, 37.578975677490234]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 6.0, 17.0, 15.0, 15.0, 33.0, 53.0, 88.0, 105.0, 161.0, 252.0, 330.0, 534.0, 814.0, 1256.0, 1934.0, 3013.0, 4427.0, 6908.0, 10351.0, 15451.0, 23667.0, 35002.0, 50060.0, 68988.0, 90305.0, 109928.0, 121306.0, 118495.0, 104262.0, 83683.0, 62245.0, 44249.0, 30490.0, 20615.0, 13562.0, 8792.0, 5830.0, 3898.0, 2514.0, 1665.0, 1027.0, 702.0, 461.0, 344.0, 222.0, 155.0, 112.0, 75.0, 59.0, 36.0, 16.0, 15.0, 8.0, 5.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.78125, -7.5203857421875, -7.259521484375, -6.9986572265625, -6.73779296875, -6.4769287109375, -6.216064453125, -5.9552001953125, -5.6943359375, -5.4334716796875, -5.172607421875, -4.9117431640625, -4.65087890625, -4.3900146484375, -4.129150390625, -3.8682861328125, -3.607421875, -3.3465576171875, -3.085693359375, -2.8248291015625, -2.56396484375, -2.3031005859375, -2.042236328125, -1.7813720703125, -1.5205078125, -1.2596435546875, -0.998779296875, -0.7379150390625, -0.47705078125, -0.2161865234375, 0.044677734375, 0.3055419921875, 0.56640625, 0.8272705078125, 1.088134765625, 1.3489990234375, 1.60986328125, 1.8707275390625, 2.131591796875, 2.3924560546875, 2.6533203125, 2.9141845703125, 3.175048828125, 3.4359130859375, 3.69677734375, 3.9576416015625, 4.218505859375, 4.4793701171875, 4.740234375, 5.0010986328125, 5.261962890625, 5.5228271484375, 5.78369140625, 6.0445556640625, 6.305419921875, 6.5662841796875, 6.8271484375, 7.0880126953125, 7.348876953125, 7.6097412109375, 7.87060546875, 8.1314697265625, 8.392333984375, 8.6531982421875, 8.9140625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 6.0, 5.0, 10.0, 7.0, 5.0, 10.0, 17.0, 18.0, 26.0, 27.0, 25.0, 31.0, 33.0, 41.0, 44.0, 46.0, 35.0, 58.0, 44.0, 38.0, 49.0, 38.0, 41.0, 43.0, 40.0, 50.0, 32.0, 32.0, 33.0, 25.0, 18.0, 15.0, 14.0, 7.0, 8.0, 9.0, 3.0, 7.0, 5.0, 2.0, 4.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.84375, -39.6220703125, -38.400390625, -37.1787109375, -35.95703125, -34.7353515625, -33.513671875, -32.2919921875, -31.0703125, -29.8486328125, -28.626953125, -27.4052734375, -26.18359375, -24.9619140625, -23.740234375, -22.5185546875, -21.296875, -20.0751953125, -18.853515625, -17.6318359375, -16.41015625, -15.1884765625, -13.966796875, -12.7451171875, -11.5234375, -10.3017578125, -9.080078125, -7.8583984375, -6.63671875, -5.4150390625, -4.193359375, -2.9716796875, -1.75, -0.5283203125, 0.693359375, 1.9150390625, 3.13671875, 4.3583984375, 5.580078125, 6.8017578125, 8.0234375, 9.2451171875, 10.466796875, 11.6884765625, 12.91015625, 14.1318359375, 15.353515625, 16.5751953125, 17.796875, 19.0185546875, 20.240234375, 21.4619140625, 22.68359375, 23.9052734375, 25.126953125, 26.3486328125, 27.5703125, 28.7919921875, 30.013671875, 31.2353515625, 32.45703125, 33.6787109375, 34.900390625, 36.1220703125, 37.34375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 0.0, 3.0, 5.0, 4.0, 7.0, 8.0, 20.0, 27.0, 32.0, 52.0, 88.0, 123.0, 183.0, 297.0, 390.0, 619.0, 1007.0, 1459.0, 2175.0, 3229.0, 5209.0, 7830.0, 12255.0, 20792.0, 44014.0, 859425.0, 37977.0, 18880.0, 11285.0, 7248.0, 4761.0, 3058.0, 2065.0, 1324.0, 944.0, 592.0, 394.0, 273.0, 191.0, 105.0, 78.0, 55.0, 23.0, 22.0, 8.0, 13.0, 5.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.953125, -22.22265625, -21.4921875, -20.76171875, -20.03125, -19.30078125, -18.5703125, -17.83984375, -17.109375, -16.37890625, -15.6484375, -14.91796875, -14.1875, -13.45703125, -12.7265625, -11.99609375, -11.265625, -10.53515625, -9.8046875, -9.07421875, -8.34375, -7.61328125, -6.8828125, -6.15234375, -5.421875, -4.69140625, -3.9609375, -3.23046875, -2.5, -1.76953125, -1.0390625, -0.30859375, 0.421875, 1.15234375, 1.8828125, 2.61328125, 3.34375, 4.07421875, 4.8046875, 5.53515625, 6.265625, 6.99609375, 7.7265625, 8.45703125, 9.1875, 9.91796875, 10.6484375, 11.37890625, 12.109375, 12.83984375, 13.5703125, 14.30078125, 15.03125, 15.76171875, 16.4921875, 17.22265625, 17.953125, 18.68359375, 19.4140625, 20.14453125, 20.875, 21.60546875, 22.3359375, 23.06640625, 23.796875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 6.0, 4.0, 9.0, 7.0, 10.0, 18.0, 12.0, 19.0, 27.0, 21.0, 36.0, 24.0, 25.0, 30.0, 25.0, 41.0, 40.0, 46.0, 33.0, 30.0, 44.0, 41.0, 42.0, 39.0, 43.0, 34.0, 26.0, 26.0, 25.0, 25.0, 22.0, 20.0, 21.0, 20.0, 16.0, 23.0, 17.0, 10.0, 9.0, 7.0, 7.0, 4.0, 7.0, 4.0, 0.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-21.828125, -21.138916015625, -20.44970703125, -19.760498046875, -19.0712890625, -18.382080078125, -17.69287109375, -17.003662109375, -16.314453125, -15.625244140625, -14.93603515625, -14.246826171875, -13.5576171875, -12.868408203125, -12.17919921875, -11.489990234375, -10.80078125, -10.111572265625, -9.42236328125, -8.733154296875, -8.0439453125, -7.354736328125, -6.66552734375, -5.976318359375, -5.287109375, -4.597900390625, -3.90869140625, -3.219482421875, -2.5302734375, -1.841064453125, -1.15185546875, -0.462646484375, 0.2265625, 0.915771484375, 1.60498046875, 2.294189453125, 2.9833984375, 3.672607421875, 4.36181640625, 5.051025390625, 5.740234375, 6.429443359375, 7.11865234375, 7.807861328125, 8.4970703125, 9.186279296875, 9.87548828125, 10.564697265625, 11.25390625, 11.943115234375, 12.63232421875, 13.321533203125, 14.0107421875, 14.699951171875, 15.38916015625, 16.078369140625, 16.767578125, 17.456787109375, 18.14599609375, 18.835205078125, 19.5244140625, 20.213623046875, 20.90283203125, 21.592041015625, 22.28125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 2.0, 3.0, 10.0, 5.0, 3.0, 6.0, 12.0, 18.0, 33.0, 37.0, 52.0, 74.0, 94.0, 128.0, 192.0, 294.0, 427.0, 743.0, 1004.0, 1669.0, 2868.0, 5306.0, 10096.0, 22020.0, 62539.0, 880733.0, 30912.0, 13477.0, 6557.0, 3556.0, 1954.0, 1276.0, 788.0, 514.0, 333.0, 260.0, 164.0, 114.0, 87.0, 52.0, 39.0, 26.0, 33.0, 7.0, 10.0, 6.0, 6.0, 5.0, 4.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 4.0], "bins": [-1.2109375, -1.1744537353515625, -1.137969970703125, -1.1014862060546875, -1.06500244140625, -1.0285186767578125, -0.992034912109375, -0.9555511474609375, -0.9190673828125, -0.8825836181640625, -0.846099853515625, -0.8096160888671875, -0.77313232421875, -0.7366485595703125, -0.700164794921875, -0.6636810302734375, -0.627197265625, -0.5907135009765625, -0.554229736328125, -0.5177459716796875, -0.48126220703125, -0.4447784423828125, -0.408294677734375, -0.3718109130859375, -0.3353271484375, -0.2988433837890625, -0.262359619140625, -0.2258758544921875, -0.18939208984375, -0.1529083251953125, -0.116424560546875, -0.0799407958984375, -0.04345703125, -0.0069732666015625, 0.029510498046875, 0.0659942626953125, 0.10247802734375, 0.1389617919921875, 0.175445556640625, 0.2119293212890625, 0.2484130859375, 0.2848968505859375, 0.321380615234375, 0.3578643798828125, 0.39434814453125, 0.4308319091796875, 0.467315673828125, 0.5037994384765625, 0.540283203125, 0.5767669677734375, 0.613250732421875, 0.6497344970703125, 0.68621826171875, 0.7227020263671875, 0.759185791015625, 0.7956695556640625, 0.8321533203125, 0.8686370849609375, 0.905120849609375, 0.9416046142578125, 0.97808837890625, 1.0145721435546875, 1.051055908203125, 1.0875396728515625, 1.1240234375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 9.0, 5.0, 4.0, 6.0, 14.0, 14.0, 19.0, 34.0, 41.0, 56.0, 61.0, 87.0, 74.0, 104.0, 92.0, 86.0, 59.0, 65.0, 52.0, 40.0, 18.0, 21.0, 17.0, 10.0, 1.0, 8.0, 2.0, 6.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.123283386230469e-05, -3.014504909515381e-05, -2.905726432800293e-05, -2.796947956085205e-05, -2.6881694793701172e-05, -2.5793910026550293e-05, -2.4706125259399414e-05, -2.3618340492248535e-05, -2.2530555725097656e-05, -2.1442770957946777e-05, -2.03549861907959e-05, -1.926720142364502e-05, -1.817941665649414e-05, -1.7091631889343262e-05, -1.6003847122192383e-05, -1.4916062355041504e-05, -1.3828277587890625e-05, -1.2740492820739746e-05, -1.1652708053588867e-05, -1.0564923286437988e-05, -9.47713851928711e-06, -8.38935375213623e-06, -7.3015689849853516e-06, -6.213784217834473e-06, -5.125999450683594e-06, -4.038214683532715e-06, -2.950429916381836e-06, -1.862645149230957e-06, -7.748603820800781e-07, 3.129243850708008e-07, 1.4007091522216797e-06, 2.4884939193725586e-06, 3.5762786865234375e-06, 4.664063453674316e-06, 5.751848220825195e-06, 6.839632987976074e-06, 7.927417755126953e-06, 9.015202522277832e-06, 1.0102987289428711e-05, 1.119077205657959e-05, 1.2278556823730469e-05, 1.3366341590881348e-05, 1.4454126358032227e-05, 1.5541911125183105e-05, 1.6629695892333984e-05, 1.7717480659484863e-05, 1.8805265426635742e-05, 1.989305019378662e-05, 2.09808349609375e-05, 2.206861972808838e-05, 2.3156404495239258e-05, 2.4244189262390137e-05, 2.5331974029541016e-05, 2.6419758796691895e-05, 2.7507543563842773e-05, 2.8595328330993652e-05, 2.968311309814453e-05, 3.077089786529541e-05, 3.185868263244629e-05, 3.294646739959717e-05, 3.403425216674805e-05, 3.5122036933898926e-05, 3.6209821701049805e-05, 3.7297606468200684e-05, 3.838539123535156e-05]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 6.0, 1.0, 11.0, 20.0, 30.0, 34.0, 68.0, 103.0, 120.0, 183.0, 297.0, 424.0, 619.0, 945.0, 1465.0, 2099.0, 3215.0, 5062.0, 8016.0, 12626.0, 19508.0, 30771.0, 48505.0, 76640.0, 121850.0, 177221.0, 182937.0, 130229.0, 82011.0, 51640.0, 33197.0, 21089.0, 13397.0, 8486.0, 5449.0, 3443.0, 2295.0, 1506.0, 975.0, 695.0, 458.0, 291.0, 193.0, 151.0, 96.0, 60.0, 47.0, 36.0, 12.0, 9.0, 11.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.4560546875, -0.44036865234375, -0.4246826171875, -0.40899658203125, -0.393310546875, -0.37762451171875, -0.3619384765625, -0.34625244140625, -0.33056640625, -0.31488037109375, -0.2991943359375, -0.28350830078125, -0.267822265625, -0.25213623046875, -0.2364501953125, -0.22076416015625, -0.205078125, -0.18939208984375, -0.1737060546875, -0.15802001953125, -0.142333984375, -0.12664794921875, -0.1109619140625, -0.09527587890625, -0.07958984375, -0.06390380859375, -0.0482177734375, -0.03253173828125, -0.016845703125, -0.00115966796875, 0.0145263671875, 0.03021240234375, 0.0458984375, 0.06158447265625, 0.0772705078125, 0.09295654296875, 0.108642578125, 0.12432861328125, 0.1400146484375, 0.15570068359375, 0.17138671875, 0.18707275390625, 0.2027587890625, 0.21844482421875, 0.234130859375, 0.24981689453125, 0.2655029296875, 0.28118896484375, 0.296875, 0.31256103515625, 0.3282470703125, 0.34393310546875, 0.359619140625, 0.37530517578125, 0.3909912109375, 0.40667724609375, 0.42236328125, 0.43804931640625, 0.4537353515625, 0.46942138671875, 0.485107421875, 0.50079345703125, 0.5164794921875, 0.53216552734375, 0.5478515625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 2.0, 4.0, 1.0, 6.0, 8.0, 8.0, 8.0, 9.0, 9.0, 4.0, 21.0, 6.0, 23.0, 21.0, 30.0, 32.0, 40.0, 51.0, 48.0, 64.0, 61.0, 77.0, 59.0, 49.0, 63.0, 50.0, 46.0, 38.0, 31.0, 30.0, 18.0, 16.0, 17.0, 12.0, 14.0, 9.0, 5.0, 5.0, 2.0, 2.0, 5.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.16455078125, -0.15935897827148438, -0.15416717529296875, -0.14897537231445312, -0.1437835693359375, -0.13859176635742188, -0.13339996337890625, -0.12820816040039062, -0.123016357421875, -0.11782455444335938, -0.11263275146484375, -0.10744094848632812, -0.1022491455078125, -0.09705734252929688, -0.09186553955078125, -0.08667373657226562, -0.08148193359375, -0.07629013061523438, -0.07109832763671875, -0.06590652465820312, -0.0607147216796875, -0.055522918701171875, -0.05033111572265625, -0.045139312744140625, -0.039947509765625, -0.034755706787109375, -0.02956390380859375, -0.024372100830078125, -0.0191802978515625, -0.013988494873046875, -0.00879669189453125, -0.003604888916015625, 0.0015869140625, 0.006778717041015625, 0.01197052001953125, 0.017162322998046875, 0.0223541259765625, 0.027545928955078125, 0.03273773193359375, 0.037929534912109375, 0.043121337890625, 0.048313140869140625, 0.05350494384765625, 0.058696746826171875, 0.0638885498046875, 0.06908035278320312, 0.07427215576171875, 0.07946395874023438, 0.08465576171875, 0.08984756469726562, 0.09503936767578125, 0.10023117065429688, 0.1054229736328125, 0.11061477661132812, 0.11580657958984375, 0.12099838256835938, 0.126190185546875, 0.13138198852539062, 0.13657379150390625, 0.14176559448242188, 0.1469573974609375, 0.15214920043945312, 0.15734100341796875, 0.16253280639648438, 0.167724609375]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 6.0, 4.0, 12.0, 11.0, 13.0, 14.0, 16.0, 18.0, 14.0, 23.0, 35.0, 40.0, 40.0, 43.0, 46.0, 62.0, 56.0, 46.0, 49.0, 38.0, 41.0, 47.0, 50.0, 45.0, 30.0, 36.0, 32.0, 26.0, 20.0, 22.0, 13.0, 10.0, 8.0, 5.0, 7.0, 5.0, 7.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.52516746520996, -26.548152923583984, -25.571136474609375, -24.5941219329834, -23.617107391357422, -22.640090942382812, -21.663076400756836, -20.68606185913086, -19.70904541015625, -18.732030868530273, -17.755014419555664, -16.777999877929688, -15.800985336303711, -14.823969841003418, -13.846954345703125, -12.869939804077148, -11.892925262451172, -10.915909767150879, -9.938895225524902, -8.96187973022461, -7.984864711761475, -7.00784969329834, -6.030834197998047, -5.053819179534912, -4.076804161071777, -3.0997891426086426, -2.1227738857269287, -1.1457586288452148, -0.16874361038208008, 0.8082714080810547, 1.7852869033813477, 2.7623019218444824, 3.73931884765625, 4.716333866119385, 5.6933488845825195, 6.6703643798828125, 7.647379398345947, 8.624394416809082, 9.601409912109375, 10.578424453735352, 11.555439949035645, 12.532455444335938, 13.509469985961914, 14.486485481262207, 15.4635009765625, 16.440515518188477, 17.417530059814453, 18.394546508789062, 19.37156105041504, 20.348575592041016, 21.325592041015625, 22.3026065826416, 23.279621124267578, 24.256637573242188, 25.233652114868164, 26.21066665649414, 27.18768310546875, 28.164697647094727, 29.141714096069336, 30.118728637695312, 31.09574317932129, 32.072757720947266, 33.049774169921875, 34.026790618896484, 35.00380325317383]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 6.0, 5.0, 9.0, 8.0, 5.0, 10.0, 17.0, 18.0, 25.0, 29.0, 24.0, 31.0, 31.0, 44.0, 41.0, 44.0, 39.0, 58.0, 44.0, 38.0, 51.0, 34.0, 43.0, 41.0, 42.0, 49.0, 32.0, 33.0, 33.0, 25.0, 18.0, 15.0, 14.0, 7.0, 7.0, 10.0, 3.0, 7.0, 5.0, 2.0, 4.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.8514289855957, -39.62977981567383, -38.40813064575195, -37.18648147583008, -35.96482849121094, -34.74317932128906, -33.52153015136719, -32.29988098144531, -31.078231811523438, -29.856582641601562, -28.634933471679688, -27.41328239440918, -26.191633224487305, -24.96998405456543, -23.748332977294922, -22.526683807373047, -21.305034637451172, -20.083385467529297, -18.861736297607422, -17.640085220336914, -16.41843605041504, -15.196786880493164, -13.975136756896973, -12.753486633300781, -11.531837463378906, -10.310188293457031, -9.08853816986084, -7.866888523101807, -6.645238876342773, -5.42358922958374, -4.201939582824707, -2.9802894592285156, -1.7586441040039062, -0.536994457244873, 0.6846551895141602, 1.9063048362731934, 3.1279544830322266, 4.34960412979126, 5.571253776550293, 6.792903900146484, 8.01455307006836, 9.236202239990234, 10.457852363586426, 11.679502487182617, 12.901151657104492, 14.122800827026367, 15.344450950622559, 16.56610107421875, 17.787750244140625, 19.0093994140625, 20.231048583984375, 21.452699661254883, 22.674348831176758, 23.895998001098633, 25.11764907836914, 26.339298248291016, 27.56094741821289, 28.782596588134766, 30.00424575805664, 31.22589683532715, 32.447547912597656, 33.66919708251953, 34.890846252441406, 36.11249542236328, 37.334144592285156]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 5.0, 7.0, 6.0, 6.0, 15.0, 31.0, 35.0, 79.0, 101.0, 152.0, 225.0, 345.0, 530.0, 885.0, 1318.0, 2116.0, 3342.0, 5372.0, 8622.0, 13402.0, 20844.0, 31917.0, 47395.0, 66589.0, 86565.0, 105437.0, 117039.0, 118238.0, 108419.0, 91295.0, 70115.0, 50872.0, 34749.0, 22670.0, 14634.0, 9201.0, 5882.0, 3688.0, 2305.0, 1442.0, 927.0, 614.0, 421.0, 248.0, 170.0, 93.0, 71.0, 56.0, 29.0, 13.0, 14.0, 11.0, 6.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-22.984375, -22.268310546875, -21.55224609375, -20.836181640625, -20.1201171875, -19.404052734375, -18.68798828125, -17.971923828125, -17.255859375, -16.539794921875, -15.82373046875, -15.107666015625, -14.3916015625, -13.675537109375, -12.95947265625, -12.243408203125, -11.52734375, -10.811279296875, -10.09521484375, -9.379150390625, -8.6630859375, -7.947021484375, -7.23095703125, -6.514892578125, -5.798828125, -5.082763671875, -4.36669921875, -3.650634765625, -2.9345703125, -2.218505859375, -1.50244140625, -0.786376953125, -0.0703125, 0.645751953125, 1.36181640625, 2.077880859375, 2.7939453125, 3.510009765625, 4.22607421875, 4.942138671875, 5.658203125, 6.374267578125, 7.09033203125, 7.806396484375, 8.5224609375, 9.238525390625, 9.95458984375, 10.670654296875, 11.38671875, 12.102783203125, 12.81884765625, 13.534912109375, 14.2509765625, 14.967041015625, 15.68310546875, 16.399169921875, 17.115234375, 17.831298828125, 18.54736328125, 19.263427734375, 19.9794921875, 20.695556640625, 21.41162109375, 22.127685546875, 22.84375]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 5.0, 4.0, 9.0, 8.0, 4.0, 12.0, 19.0, 18.0, 24.0, 29.0, 28.0, 28.0, 38.0, 46.0, 38.0, 41.0, 36.0, 61.0, 43.0, 43.0, 44.0, 37.0, 46.0, 37.0, 47.0, 47.0, 26.0, 42.0, 26.0, 25.0, 16.0, 13.0, 13.0, 8.0, 9.0, 7.0, 4.0, 5.0, 6.0, 2.0, 4.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.28125, -38.1005859375, -36.919921875, -35.7392578125, -34.55859375, -33.3779296875, -32.197265625, -31.0166015625, -29.8359375, -28.6552734375, -27.474609375, -26.2939453125, -25.11328125, -23.9326171875, -22.751953125, -21.5712890625, -20.390625, -19.2099609375, -18.029296875, -16.8486328125, -15.66796875, -14.4873046875, -13.306640625, -12.1259765625, -10.9453125, -9.7646484375, -8.583984375, -7.4033203125, -6.22265625, -5.0419921875, -3.861328125, -2.6806640625, -1.5, -0.3193359375, 0.861328125, 2.0419921875, 3.22265625, 4.4033203125, 5.583984375, 6.7646484375, 7.9453125, 9.1259765625, 10.306640625, 11.4873046875, 12.66796875, 13.8486328125, 15.029296875, 16.2099609375, 17.390625, 18.5712890625, 19.751953125, 20.9326171875, 22.11328125, 23.2939453125, 24.474609375, 25.6552734375, 26.8359375, 28.0166015625, 29.197265625, 30.3779296875, 31.55859375, 32.7392578125, 33.919921875, 35.1005859375, 36.28125]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 2.0, 8.0, 8.0, 12.0, 20.0, 33.0, 45.0, 55.0, 78.0, 109.0, 167.0, 276.0, 376.0, 571.0, 873.0, 1377.0, 2067.0, 3200.0, 4945.0, 8098.0, 12411.0, 19497.0, 28877.0, 43002.0, 60748.0, 81665.0, 102831.0, 117287.0, 120298.0, 112002.0, 94617.0, 73174.0, 53621.0, 36893.0, 24669.0, 16049.0, 10134.0, 6588.0, 4166.0, 2678.0, 1681.0, 1155.0, 747.0, 517.0, 309.0, 231.0, 149.0, 89.0, 48.0, 41.0, 23.0, 19.0, 13.0, 9.0, 5.0, 0.0, 4.0, 1.0, 0.0, 1.0], "bins": [-23.140625, -22.424072265625, -21.70751953125, -20.990966796875, -20.2744140625, -19.557861328125, -18.84130859375, -18.124755859375, -17.408203125, -16.691650390625, -15.97509765625, -15.258544921875, -14.5419921875, -13.825439453125, -13.10888671875, -12.392333984375, -11.67578125, -10.959228515625, -10.24267578125, -9.526123046875, -8.8095703125, -8.093017578125, -7.37646484375, -6.659912109375, -5.943359375, -5.226806640625, -4.51025390625, -3.793701171875, -3.0771484375, -2.360595703125, -1.64404296875, -0.927490234375, -0.2109375, 0.505615234375, 1.22216796875, 1.938720703125, 2.6552734375, 3.371826171875, 4.08837890625, 4.804931640625, 5.521484375, 6.238037109375, 6.95458984375, 7.671142578125, 8.3876953125, 9.104248046875, 9.82080078125, 10.537353515625, 11.25390625, 11.970458984375, 12.68701171875, 13.403564453125, 14.1201171875, 14.836669921875, 15.55322265625, 16.269775390625, 16.986328125, 17.702880859375, 18.41943359375, 19.135986328125, 19.8525390625, 20.569091796875, 21.28564453125, 22.002197265625, 22.71875]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 5.0, 5.0, 12.0, 8.0, 10.0, 14.0, 16.0, 24.0, 17.0, 21.0, 25.0, 18.0, 32.0, 37.0, 45.0, 35.0, 30.0, 37.0, 35.0, 45.0, 41.0, 47.0, 39.0, 47.0, 39.0, 25.0, 32.0, 37.0, 24.0, 35.0, 23.0, 31.0, 20.0, 23.0, 7.0, 10.0, 12.0, 6.0, 7.0, 10.0, 5.0, 2.0, 4.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-23.515625, -22.840087890625, -22.16455078125, -21.489013671875, -20.8134765625, -20.137939453125, -19.46240234375, -18.786865234375, -18.111328125, -17.435791015625, -16.76025390625, -16.084716796875, -15.4091796875, -14.733642578125, -14.05810546875, -13.382568359375, -12.70703125, -12.031494140625, -11.35595703125, -10.680419921875, -10.0048828125, -9.329345703125, -8.65380859375, -7.978271484375, -7.302734375, -6.627197265625, -5.95166015625, -5.276123046875, -4.6005859375, -3.925048828125, -3.24951171875, -2.573974609375, -1.8984375, -1.222900390625, -0.54736328125, 0.128173828125, 0.8037109375, 1.479248046875, 2.15478515625, 2.830322265625, 3.505859375, 4.181396484375, 4.85693359375, 5.532470703125, 6.2080078125, 6.883544921875, 7.55908203125, 8.234619140625, 8.91015625, 9.585693359375, 10.26123046875, 10.936767578125, 11.6123046875, 12.287841796875, 12.96337890625, 13.638916015625, 14.314453125, 14.989990234375, 15.66552734375, 16.341064453125, 17.0166015625, 17.692138671875, 18.36767578125, 19.043212890625, 19.71875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 5.0, 8.0, 6.0, 9.0, 16.0, 33.0, 42.0, 47.0, 87.0, 145.0, 196.0, 317.0, 444.0, 753.0, 1233.0, 1877.0, 2979.0, 4805.0, 7768.0, 12685.0, 21085.0, 34114.0, 53716.0, 79876.0, 110404.0, 134427.0, 142555.0, 131182.0, 104049.0, 74378.0, 48937.0, 30899.0, 19106.0, 11653.0, 7028.0, 4303.0, 2766.0, 1677.0, 1032.0, 687.0, 416.0, 285.0, 171.0, 121.0, 86.0, 58.0, 44.0, 25.0, 10.0, 5.0, 9.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.33203125, -6.11663818359375, -5.9012451171875, -5.68585205078125, -5.470458984375, -5.25506591796875, -5.0396728515625, -4.82427978515625, -4.60888671875, -4.39349365234375, -4.1781005859375, -3.96270751953125, -3.747314453125, -3.53192138671875, -3.3165283203125, -3.10113525390625, -2.8857421875, -2.67034912109375, -2.4549560546875, -2.23956298828125, -2.024169921875, -1.80877685546875, -1.5933837890625, -1.37799072265625, -1.16259765625, -0.94720458984375, -0.7318115234375, -0.51641845703125, -0.301025390625, -0.08563232421875, 0.1297607421875, 0.34515380859375, 0.560546875, 0.77593994140625, 0.9913330078125, 1.20672607421875, 1.422119140625, 1.63751220703125, 1.8529052734375, 2.06829833984375, 2.28369140625, 2.49908447265625, 2.7144775390625, 2.92987060546875, 3.145263671875, 3.36065673828125, 3.5760498046875, 3.79144287109375, 4.0068359375, 4.22222900390625, 4.4376220703125, 4.65301513671875, 4.868408203125, 5.08380126953125, 5.2991943359375, 5.51458740234375, 5.72998046875, 5.94537353515625, 6.1607666015625, 6.37615966796875, 6.591552734375, 6.80694580078125, 7.0223388671875, 7.23773193359375, 7.453125]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 6.0, 2.0, 5.0, 7.0, 10.0, 7.0, 10.0, 15.0, 15.0, 13.0, 12.0, 21.0, 31.0, 30.0, 28.0, 43.0, 59.0, 51.0, 49.0, 42.0, 48.0, 60.0, 45.0, 46.0, 45.0, 38.0, 37.0, 36.0, 30.0, 25.0, 24.0, 25.0, 16.0, 14.0, 15.0, 10.0, 8.0, 7.0, 4.0, 2.0, 6.0, 4.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0006818771362304688, -0.0006618723273277283, -0.0006418675184249878, -0.0006218627095222473, -0.0006018579006195068, -0.0005818530917167664, -0.0005618482828140259, -0.0005418434739112854, -0.0005218386650085449, -0.0005018338561058044, -0.00048182904720306396, -0.0004618242383003235, -0.000441819429397583, -0.00042181462049484253, -0.00040180981159210205, -0.00038180500268936157, -0.0003618001937866211, -0.0003417953848838806, -0.00032179057598114014, -0.00030178576707839966, -0.0002817809581756592, -0.0002617761492729187, -0.00024177134037017822, -0.00022176653146743774, -0.00020176172256469727, -0.0001817569136619568, -0.0001617521047592163, -0.00014174729585647583, -0.00012174248695373535, -0.00010173767805099487, -8.17328691482544e-05, -6.172806024551392e-05, -4.172325134277344e-05, -2.171844244003296e-05, -1.7136335372924805e-06, 1.8291175365447998e-05, 3.8295984268188477e-05, 5.8300793170928955e-05, 7.830560207366943e-05, 9.831041097640991e-05, 0.00011831521987915039, 0.00013832002878189087, 0.00015832483768463135, 0.00017832964658737183, 0.0001983344554901123, 0.00021833926439285278, 0.00023834407329559326, 0.00025834888219833374, 0.0002783536911010742, 0.0002983585000038147, 0.0003183633089065552, 0.00033836811780929565, 0.00035837292671203613, 0.0003783777356147766, 0.0003983825445175171, 0.00041838735342025757, 0.00043839216232299805, 0.0004583969712257385, 0.000478401780128479, 0.0004984065890312195, 0.00051841139793396, 0.0005384162068367004, 0.0005584210157394409, 0.0005784258246421814, 0.0005984306335449219]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 11.0, 21.0, 21.0, 23.0, 42.0, 81.0, 107.0, 165.0, 227.0, 420.0, 657.0, 983.0, 1511.0, 2457.0, 4196.0, 6867.0, 11223.0, 18605.0, 30611.0, 49102.0, 76702.0, 109667.0, 139074.0, 150265.0, 138172.0, 107988.0, 75143.0, 48229.0, 29732.0, 18067.0, 10942.0, 6584.0, 3999.0, 2436.0, 1563.0, 991.0, 566.0, 394.0, 237.0, 158.0, 91.0, 76.0, 44.0, 52.0, 11.0, 13.0, 11.0, 10.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.52734375, -7.28033447265625, -7.0333251953125, -6.78631591796875, -6.539306640625, -6.29229736328125, -6.0452880859375, -5.79827880859375, -5.55126953125, -5.30426025390625, -5.0572509765625, -4.81024169921875, -4.563232421875, -4.31622314453125, -4.0692138671875, -3.82220458984375, -3.5751953125, -3.32818603515625, -3.0811767578125, -2.83416748046875, -2.587158203125, -2.34014892578125, -2.0931396484375, -1.84613037109375, -1.59912109375, -1.35211181640625, -1.1051025390625, -0.85809326171875, -0.611083984375, -0.36407470703125, -0.1170654296875, 0.12994384765625, 0.376953125, 0.62396240234375, 0.8709716796875, 1.11798095703125, 1.364990234375, 1.61199951171875, 1.8590087890625, 2.10601806640625, 2.35302734375, 2.60003662109375, 2.8470458984375, 3.09405517578125, 3.341064453125, 3.58807373046875, 3.8350830078125, 4.08209228515625, 4.3291015625, 4.57611083984375, 4.8231201171875, 5.07012939453125, 5.317138671875, 5.56414794921875, 5.8111572265625, 6.05816650390625, 6.30517578125, 6.55218505859375, 6.7991943359375, 7.04620361328125, 7.293212890625, 7.54022216796875, 7.7872314453125, 8.03424072265625, 8.28125]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 5.0, 4.0, 2.0, 5.0, 11.0, 16.0, 8.0, 16.0, 17.0, 21.0, 29.0, 22.0, 31.0, 29.0, 38.0, 44.0, 47.0, 48.0, 54.0, 57.0, 52.0, 51.0, 49.0, 52.0, 35.0, 35.0, 42.0, 39.0, 23.0, 26.0, 15.0, 15.0, 15.0, 10.0, 6.0, 8.0, 3.0, 2.0, 5.0, 2.0, 3.0, 6.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.0703125, -3.946197509765625, -3.82208251953125, -3.697967529296875, -3.5738525390625, -3.449737548828125, -3.32562255859375, -3.201507568359375, -3.077392578125, -2.953277587890625, -2.82916259765625, -2.705047607421875, -2.5809326171875, -2.456817626953125, -2.33270263671875, -2.208587646484375, -2.08447265625, -1.960357666015625, -1.83624267578125, -1.712127685546875, -1.5880126953125, -1.463897705078125, -1.33978271484375, -1.215667724609375, -1.091552734375, -0.967437744140625, -0.84332275390625, -0.719207763671875, -0.5950927734375, -0.470977783203125, -0.34686279296875, -0.222747802734375, -0.0986328125, 0.025482177734375, 0.14959716796875, 0.273712158203125, 0.3978271484375, 0.521942138671875, 0.64605712890625, 0.770172119140625, 0.894287109375, 1.018402099609375, 1.14251708984375, 1.266632080078125, 1.3907470703125, 1.514862060546875, 1.63897705078125, 1.763092041015625, 1.88720703125, 2.011322021484375, 2.13543701171875, 2.259552001953125, 2.3836669921875, 2.507781982421875, 2.63189697265625, 2.756011962890625, 2.880126953125, 3.004241943359375, 3.12835693359375, 3.252471923828125, 3.3765869140625, 3.500701904296875, 3.62481689453125, 3.748931884765625, 3.873046875]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 5.0, 2.0, 9.0, 12.0, 15.0, 17.0, 14.0, 25.0, 30.0, 26.0, 28.0, 28.0, 32.0, 49.0, 56.0, 43.0, 39.0, 50.0, 49.0, 54.0, 51.0, 57.0, 48.0, 35.0, 34.0, 33.0, 31.0, 26.0, 14.0, 20.0, 16.0, 15.0, 8.0, 6.0, 7.0, 2.0, 4.0, 4.0, 1.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.358348846435547, -27.382587432861328, -26.40682601928711, -25.431066513061523, -24.455305099487305, -23.479543685913086, -22.5037841796875, -21.52802276611328, -20.552261352539062, -19.576499938964844, -18.600738525390625, -17.62497901916504, -16.64921760559082, -15.673456192016602, -14.6976957321167, -13.721935272216797, -12.746173858642578, -11.77041244506836, -10.794651985168457, -9.818891525268555, -8.843130111694336, -7.867369174957275, -6.891608238220215, -5.915847301483154, -4.940086364746094, -3.964325428009033, -2.9885644912719727, -2.012803554534912, -1.0370426177978516, -0.061281681060791016, 0.9144792556762695, 1.89024019241333, 2.8660011291503906, 3.841762065887451, 4.817523002624512, 5.793283939361572, 6.769044876098633, 7.744805812835693, 8.720566749572754, 9.696327209472656, 10.672088623046875, 11.647850036621094, 12.623610496520996, 13.599370956420898, 14.575132369995117, 15.550893783569336, 16.526653289794922, 17.50241470336914, 18.47817611694336, 19.453937530517578, 20.429698944091797, 21.405458450317383, 22.3812198638916, 23.35698127746582, 24.332740783691406, 25.308502197265625, 26.284263610839844, 27.260025024414062, 28.23578643798828, 29.211545944213867, 30.187307357788086, 31.163068771362305, 32.13882827758789, 33.11458969116211, 34.09035110473633]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 8.0, 6.0, 14.0, 1.0, 9.0, 15.0, 16.0, 15.0, 18.0, 30.0, 34.0, 32.0, 39.0, 25.0, 41.0, 31.0, 49.0, 51.0, 47.0, 36.0, 51.0, 42.0, 43.0, 34.0, 41.0, 39.0, 26.0, 32.0, 28.0, 26.0, 25.0, 20.0, 11.0, 17.0, 10.0, 7.0, 4.0, 5.0, 8.0, 4.0, 7.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.672821044921875, -35.462120056152344, -34.25141525268555, -33.04071044921875, -31.83000946044922, -30.619306564331055, -29.40860366821289, -28.197900772094727, -26.987197875976562, -25.7764949798584, -24.565792083740234, -23.35508918762207, -22.144386291503906, -20.933683395385742, -19.722980499267578, -18.512277603149414, -17.30157470703125, -16.090871810913086, -14.880168914794922, -13.669466018676758, -12.458763122558594, -11.24806022644043, -10.037357330322266, -8.826654434204102, -7.6159515380859375, -6.405248641967773, -5.194545745849609, -3.9838428497314453, -2.7731399536132812, -1.5624370574951172, -0.3517341613769531, 0.8589687347412109, 2.0696678161621094, 3.2803707122802734, 4.4910736083984375, 5.701776504516602, 6.912479400634766, 8.12318229675293, 9.333885192871094, 10.544588088989258, 11.755290985107422, 12.965993881225586, 14.17669677734375, 15.387399673461914, 16.598102569580078, 17.808805465698242, 19.019508361816406, 20.23021125793457, 21.440914154052734, 22.6516170501709, 23.862319946289062, 25.073022842407227, 26.28372573852539, 27.494428634643555, 28.70513153076172, 29.915834426879883, 31.126537322998047, 32.337242126464844, 33.547943115234375, 34.758644104003906, 35.9693489074707, 37.1800537109375, 38.39075469970703, 39.60145568847656, 40.81216049194336]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [5.0, 2.0, 4.0, 8.0, 6.0, 19.0, 32.0, 53.0, 62.0, 125.0, 194.0, 285.0, 395.0, 669.0, 989.0, 1668.0, 2538.0, 3965.0, 6092.0, 9464.0, 14983.0, 23196.0, 35823.0, 55382.0, 84351.0, 126836.0, 186012.0, 265080.0, 355931.0, 442706.0, 496105.0, 495044.0, 438163.0, 351218.0, 259748.0, 181084.0, 123019.0, 82245.0, 53770.0, 34788.0, 22167.0, 14511.0, 9271.0, 5991.0, 3798.0, 2333.0, 1555.0, 968.0, 608.0, 383.0, 242.0, 151.0, 93.0, 61.0, 46.0, 27.0, 12.0, 10.0, 3.0, 4.0, 3.0, 3.0, 4.0, 1.0], "bins": [-20.8125, -20.140380859375, -19.46826171875, -18.796142578125, -18.1240234375, -17.451904296875, -16.77978515625, -16.107666015625, -15.435546875, -14.763427734375, -14.09130859375, -13.419189453125, -12.7470703125, -12.074951171875, -11.40283203125, -10.730712890625, -10.05859375, -9.386474609375, -8.71435546875, -8.042236328125, -7.3701171875, -6.697998046875, -6.02587890625, -5.353759765625, -4.681640625, -4.009521484375, -3.33740234375, -2.665283203125, -1.9931640625, -1.321044921875, -0.64892578125, 0.023193359375, 0.6953125, 1.367431640625, 2.03955078125, 2.711669921875, 3.3837890625, 4.055908203125, 4.72802734375, 5.400146484375, 6.072265625, 6.744384765625, 7.41650390625, 8.088623046875, 8.7607421875, 9.432861328125, 10.10498046875, 10.777099609375, 11.44921875, 12.121337890625, 12.79345703125, 13.465576171875, 14.1376953125, 14.809814453125, 15.48193359375, 16.154052734375, 16.826171875, 17.498291015625, 18.17041015625, 18.842529296875, 19.5146484375, 20.186767578125, 20.85888671875, 21.531005859375, 22.203125]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 7.0, 7.0, 12.0, 3.0, 8.0, 16.0, 17.0, 18.0, 12.0, 32.0, 35.0, 33.0, 34.0, 32.0, 42.0, 38.0, 39.0, 56.0, 44.0, 38.0, 49.0, 39.0, 44.0, 32.0, 45.0, 38.0, 27.0, 32.0, 26.0, 33.0, 20.0, 21.0, 12.0, 15.0, 9.0, 5.0, 3.0, 6.0, 9.0, 2.0, 7.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.09375, -28.1357421875, -27.177734375, -26.2197265625, -25.26171875, -24.3037109375, -23.345703125, -22.3876953125, -21.4296875, -20.4716796875, -19.513671875, -18.5556640625, -17.59765625, -16.6396484375, -15.681640625, -14.7236328125, -13.765625, -12.8076171875, -11.849609375, -10.8916015625, -9.93359375, -8.9755859375, -8.017578125, -7.0595703125, -6.1015625, -5.1435546875, -4.185546875, -3.2275390625, -2.26953125, -1.3115234375, -0.353515625, 0.6044921875, 1.5625, 2.5205078125, 3.478515625, 4.4365234375, 5.39453125, 6.3525390625, 7.310546875, 8.2685546875, 9.2265625, 10.1845703125, 11.142578125, 12.1005859375, 13.05859375, 14.0166015625, 14.974609375, 15.9326171875, 16.890625, 17.8486328125, 18.806640625, 19.7646484375, 20.72265625, 21.6806640625, 22.638671875, 23.5966796875, 24.5546875, 25.5126953125, 26.470703125, 27.4287109375, 28.38671875, 29.3447265625, 30.302734375, 31.2607421875, 32.21875]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 6.0, 5.0, 11.0, 14.0, 18.0, 46.0, 69.0, 138.0, 200.0, 350.0, 667.0, 1070.0, 1957.0, 3298.0, 5666.0, 9646.0, 16665.0, 28110.0, 45618.0, 73746.0, 114780.0, 172902.0, 247709.0, 330724.0, 412590.0, 467708.0, 484720.0, 453971.0, 387089.0, 302474.0, 222125.0, 151188.0, 99816.0, 63837.0, 38747.0, 23280.0, 13836.0, 8108.0, 4757.0, 2790.0, 1537.0, 970.0, 590.0, 313.0, 185.0, 107.0, 62.0, 34.0, 22.0, 10.0, 8.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.640625, -19.960205078125, -19.27978515625, -18.599365234375, -17.9189453125, -17.238525390625, -16.55810546875, -15.877685546875, -15.197265625, -14.516845703125, -13.83642578125, -13.156005859375, -12.4755859375, -11.795166015625, -11.11474609375, -10.434326171875, -9.75390625, -9.073486328125, -8.39306640625, -7.712646484375, -7.0322265625, -6.351806640625, -5.67138671875, -4.990966796875, -4.310546875, -3.630126953125, -2.94970703125, -2.269287109375, -1.5888671875, -0.908447265625, -0.22802734375, 0.452392578125, 1.1328125, 1.813232421875, 2.49365234375, 3.174072265625, 3.8544921875, 4.534912109375, 5.21533203125, 5.895751953125, 6.576171875, 7.256591796875, 7.93701171875, 8.617431640625, 9.2978515625, 9.978271484375, 10.65869140625, 11.339111328125, 12.01953125, 12.699951171875, 13.38037109375, 14.060791015625, 14.7412109375, 15.421630859375, 16.10205078125, 16.782470703125, 17.462890625, 18.143310546875, 18.82373046875, 19.504150390625, 20.1845703125, 20.864990234375, 21.54541015625, 22.225830078125, 22.90625]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 7.0, 13.0, 6.0, 7.0, 11.0, 10.0, 26.0, 46.0, 29.0, 42.0, 57.0, 63.0, 69.0, 87.0, 98.0, 127.0, 161.0, 174.0, 204.0, 196.0, 230.0, 206.0, 239.0, 187.0, 195.0, 239.0, 173.0, 206.0, 155.0, 132.0, 131.0, 105.0, 88.0, 71.0, 65.0, 64.0, 31.0, 31.0, 21.0, 19.0, 16.0, 10.0, 7.0, 5.0, 6.0, 5.0, 4.0, 2.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.609375, -12.1998291015625, -11.790283203125, -11.3807373046875, -10.97119140625, -10.5616455078125, -10.152099609375, -9.7425537109375, -9.3330078125, -8.9234619140625, -8.513916015625, -8.1043701171875, -7.69482421875, -7.2852783203125, -6.875732421875, -6.4661865234375, -6.056640625, -5.6470947265625, -5.237548828125, -4.8280029296875, -4.41845703125, -4.0089111328125, -3.599365234375, -3.1898193359375, -2.7802734375, -2.3707275390625, -1.961181640625, -1.5516357421875, -1.14208984375, -0.7325439453125, -0.322998046875, 0.0865478515625, 0.49609375, 0.9056396484375, 1.315185546875, 1.7247314453125, 2.13427734375, 2.5438232421875, 2.953369140625, 3.3629150390625, 3.7724609375, 4.1820068359375, 4.591552734375, 5.0010986328125, 5.41064453125, 5.8201904296875, 6.229736328125, 6.6392822265625, 7.048828125, 7.4583740234375, 7.867919921875, 8.2774658203125, 8.68701171875, 9.0965576171875, 9.506103515625, 9.9156494140625, 10.3251953125, 10.7347412109375, 11.144287109375, 11.5538330078125, 11.96337890625, 12.3729248046875, 12.782470703125, 13.1920166015625, 13.6015625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 3.0, 6.0, 10.0, 4.0, 15.0, 12.0, 14.0, 15.0, 29.0, 31.0, 46.0, 38.0, 38.0, 51.0, 57.0, 58.0, 41.0, 45.0, 60.0, 51.0, 55.0, 39.0, 35.0, 43.0, 42.0, 35.0, 27.0, 23.0, 20.0, 5.0, 13.0, 6.0, 12.0, 5.0, 8.0, 3.0, 3.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0], "bins": [-36.20433807373047, -35.191795349121094, -34.179256439208984, -33.16671371459961, -32.1541748046875, -31.141632080078125, -30.129091262817383, -29.11655044555664, -28.104007720947266, -27.091466903686523, -26.07892608642578, -25.066383361816406, -24.053842544555664, -23.041301727294922, -22.02876091003418, -21.016220092773438, -20.003679275512695, -18.991138458251953, -17.97859764099121, -16.96605682373047, -15.953514099121094, -14.940973281860352, -13.92843246459961, -12.915891647338867, -11.903349876403809, -10.890809059143066, -9.878267288208008, -8.865726470947266, -7.853185176849365, -6.840643882751465, -5.828103065490723, -4.815561771392822, -3.803020477294922, -2.7904791831970215, -1.7779381275177002, -0.7653970718383789, 0.24714422225952148, 1.2596855163574219, 2.272226333618164, 3.2847676277160645, 4.297308921813965, 5.309850215911865, 6.322391510009766, 7.334932327270508, 8.34747314453125, 9.360014915466309, 10.37255573272705, 11.38509750366211, 12.397638320922852, 13.410179138183594, 14.422720909118652, 15.435261726379395, 16.447803497314453, 17.460344314575195, 18.472885131835938, 19.48542594909668, 20.497966766357422, 21.510507583618164, 22.523048400878906, 23.53559112548828, 24.548131942749023, 25.560672760009766, 26.573213577270508, 27.58575439453125, 28.598297119140625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 9.0, 8.0, 5.0, 7.0, 9.0, 14.0, 8.0, 17.0, 16.0, 16.0, 24.0, 27.0, 22.0, 29.0, 30.0, 43.0, 39.0, 47.0, 42.0, 41.0, 31.0, 33.0, 35.0, 43.0, 38.0, 24.0, 42.0, 45.0, 28.0, 26.0, 34.0, 22.0, 23.0, 25.0, 18.0, 17.0, 16.0, 11.0, 8.0, 4.0, 7.0, 9.0, 6.0, 2.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-32.76988983154297, -31.77004623413086, -30.770204544067383, -29.770362854003906, -28.770519256591797, -27.770675659179688, -26.77083396911621, -25.770992279052734, -24.771148681640625, -23.771305084228516, -22.77146339416504, -21.771621704101562, -20.771778106689453, -19.771934509277344, -18.772092819213867, -17.77225112915039, -16.77240753173828, -15.772564888000488, -14.772722244262695, -13.772879600524902, -12.77303695678711, -11.773194313049316, -10.773351669311523, -9.77350902557373, -8.773666381835938, -7.7738237380981445, -6.773981094360352, -5.774138450622559, -4.774295806884766, -3.7744531631469727, -2.7746105194091797, -1.7747678756713867, -0.7749233245849609, 0.22491931915283203, 1.224761962890625, 2.224604606628418, 3.224447250366211, 4.224289894104004, 5.224132537841797, 6.22397518157959, 7.223817825317383, 8.223660469055176, 9.223503112792969, 10.223345756530762, 11.223188400268555, 12.223031044006348, 13.22287368774414, 14.222716331481934, 15.222558975219727, 16.222400665283203, 17.222244262695312, 18.222087860107422, 19.2219295501709, 20.221771240234375, 21.221614837646484, 22.221458435058594, 23.22130012512207, 24.221141815185547, 25.220985412597656, 26.220829010009766, 27.220670700073242, 28.22051239013672, 29.220355987548828, 30.220199584960938, 31.220041275024414]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 9.0, 23.0, 26.0, 43.0, 75.0, 103.0, 149.0, 230.0, 367.0, 558.0, 840.0, 1250.0, 1859.0, 2859.0, 4175.0, 6011.0, 9084.0, 13479.0, 19553.0, 27831.0, 38751.0, 52897.0, 69026.0, 86825.0, 102570.0, 111221.0, 108477.0, 95973.0, 79061.0, 61392.0, 45886.0, 33440.0, 23613.0, 16582.0, 11101.0, 7782.0, 5064.0, 3542.0, 2273.0, 1494.0, 1052.0, 720.0, 445.0, 301.0, 188.0, 115.0, 90.0, 59.0, 26.0, 29.0, 13.0, 12.0, 8.0, 5.0, 1.0, 1.0, 1.0], "bins": [-7.3125, -7.08935546875, -6.8662109375, -6.64306640625, -6.419921875, -6.19677734375, -5.9736328125, -5.75048828125, -5.52734375, -5.30419921875, -5.0810546875, -4.85791015625, -4.634765625, -4.41162109375, -4.1884765625, -3.96533203125, -3.7421875, -3.51904296875, -3.2958984375, -3.07275390625, -2.849609375, -2.62646484375, -2.4033203125, -2.18017578125, -1.95703125, -1.73388671875, -1.5107421875, -1.28759765625, -1.064453125, -0.84130859375, -0.6181640625, -0.39501953125, -0.171875, 0.05126953125, 0.2744140625, 0.49755859375, 0.720703125, 0.94384765625, 1.1669921875, 1.39013671875, 1.61328125, 1.83642578125, 2.0595703125, 2.28271484375, 2.505859375, 2.72900390625, 2.9521484375, 3.17529296875, 3.3984375, 3.62158203125, 3.8447265625, 4.06787109375, 4.291015625, 4.51416015625, 4.7373046875, 4.96044921875, 5.18359375, 5.40673828125, 5.6298828125, 5.85302734375, 6.076171875, 6.29931640625, 6.5224609375, 6.74560546875, 6.96875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 9.0, 8.0, 5.0, 6.0, 10.0, 15.0, 8.0, 17.0, 13.0, 20.0, 23.0, 27.0, 22.0, 30.0, 29.0, 45.0, 36.0, 47.0, 42.0, 41.0, 32.0, 32.0, 36.0, 42.0, 38.0, 24.0, 41.0, 45.0, 28.0, 28.0, 33.0, 22.0, 23.0, 26.0, 18.0, 16.0, 16.0, 12.0, 7.0, 4.0, 6.0, 9.0, 7.0, 2.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-32.15625, -31.16796875, -30.1796875, -29.19140625, -28.203125, -27.21484375, -26.2265625, -25.23828125, -24.25, -23.26171875, -22.2734375, -21.28515625, -20.296875, -19.30859375, -18.3203125, -17.33203125, -16.34375, -15.35546875, -14.3671875, -13.37890625, -12.390625, -11.40234375, -10.4140625, -9.42578125, -8.4375, -7.44921875, -6.4609375, -5.47265625, -4.484375, -3.49609375, -2.5078125, -1.51953125, -0.53125, 0.45703125, 1.4453125, 2.43359375, 3.421875, 4.41015625, 5.3984375, 6.38671875, 7.375, 8.36328125, 9.3515625, 10.33984375, 11.328125, 12.31640625, 13.3046875, 14.29296875, 15.28125, 16.26953125, 17.2578125, 18.24609375, 19.234375, 20.22265625, 21.2109375, 22.19921875, 23.1875, 24.17578125, 25.1640625, 26.15234375, 27.140625, 28.12890625, 29.1171875, 30.10546875, 31.09375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 2.0, 1.0, 4.0, 10.0, 8.0, 14.0, 21.0, 26.0, 40.0, 61.0, 71.0, 119.0, 152.0, 228.0, 367.0, 533.0, 791.0, 1196.0, 1844.0, 2854.0, 4325.0, 6616.0, 10056.0, 15790.0, 29803.0, 842857.0, 64718.0, 25225.0, 14116.0, 9110.0, 6054.0, 3876.0, 2625.0, 1655.0, 1118.0, 774.0, 462.0, 381.0, 198.0, 159.0, 91.0, 73.0, 40.0, 21.0, 26.0, 17.0, 8.0, 5.0, 6.0, 5.0, 6.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-19.296875, -18.62890625, -17.9609375, -17.29296875, -16.625, -15.95703125, -15.2890625, -14.62109375, -13.953125, -13.28515625, -12.6171875, -11.94921875, -11.28125, -10.61328125, -9.9453125, -9.27734375, -8.609375, -7.94140625, -7.2734375, -6.60546875, -5.9375, -5.26953125, -4.6015625, -3.93359375, -3.265625, -2.59765625, -1.9296875, -1.26171875, -0.59375, 0.07421875, 0.7421875, 1.41015625, 2.078125, 2.74609375, 3.4140625, 4.08203125, 4.75, 5.41796875, 6.0859375, 6.75390625, 7.421875, 8.08984375, 8.7578125, 9.42578125, 10.09375, 10.76171875, 11.4296875, 12.09765625, 12.765625, 13.43359375, 14.1015625, 14.76953125, 15.4375, 16.10546875, 16.7734375, 17.44140625, 18.109375, 18.77734375, 19.4453125, 20.11328125, 20.78125, 21.44921875, 22.1171875, 22.78515625, 23.453125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 8.0, 10.0, 9.0, 9.0, 7.0, 14.0, 13.0, 13.0, 25.0, 23.0, 31.0, 28.0, 35.0, 40.0, 37.0, 34.0, 45.0, 36.0, 50.0, 40.0, 45.0, 35.0, 43.0, 46.0, 39.0, 46.0, 31.0, 30.0, 20.0, 28.0, 19.0, 17.0, 22.0, 7.0, 14.0, 10.0, 8.0, 11.0, 7.0, 3.0, 2.0, 7.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.265625, -21.55859375, -20.8515625, -20.14453125, -19.4375, -18.73046875, -18.0234375, -17.31640625, -16.609375, -15.90234375, -15.1953125, -14.48828125, -13.78125, -13.07421875, -12.3671875, -11.66015625, -10.953125, -10.24609375, -9.5390625, -8.83203125, -8.125, -7.41796875, -6.7109375, -6.00390625, -5.296875, -4.58984375, -3.8828125, -3.17578125, -2.46875, -1.76171875, -1.0546875, -0.34765625, 0.359375, 1.06640625, 1.7734375, 2.48046875, 3.1875, 3.89453125, 4.6015625, 5.30859375, 6.015625, 6.72265625, 7.4296875, 8.13671875, 8.84375, 9.55078125, 10.2578125, 10.96484375, 11.671875, 12.37890625, 13.0859375, 13.79296875, 14.5, 15.20703125, 15.9140625, 16.62109375, 17.328125, 18.03515625, 18.7421875, 19.44921875, 20.15625, 20.86328125, 21.5703125, 22.27734375, 22.984375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 7.0, 7.0, 6.0, 8.0, 5.0, 16.0, 16.0, 22.0, 29.0, 39.0, 51.0, 55.0, 91.0, 123.0, 173.0, 236.0, 329.0, 497.0, 717.0, 1201.0, 1887.0, 3401.0, 6192.0, 12421.0, 28621.0, 871540.0, 72587.0, 24053.0, 10866.0, 5427.0, 2943.0, 1682.0, 1022.0, 702.0, 457.0, 310.0, 202.0, 165.0, 122.0, 82.0, 66.0, 44.0, 41.0, 30.0, 18.0, 16.0, 10.0, 10.0, 3.0, 7.0, 3.0, 5.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0], "bins": [-1.078125, -1.0443267822265625, -1.010528564453125, -0.9767303466796875, -0.94293212890625, -0.9091339111328125, -0.875335693359375, -0.8415374755859375, -0.8077392578125, -0.7739410400390625, -0.740142822265625, -0.7063446044921875, -0.67254638671875, -0.6387481689453125, -0.604949951171875, -0.5711517333984375, -0.537353515625, -0.5035552978515625, -0.469757080078125, -0.4359588623046875, -0.40216064453125, -0.3683624267578125, -0.334564208984375, -0.3007659912109375, -0.2669677734375, -0.2331695556640625, -0.199371337890625, -0.1655731201171875, -0.13177490234375, -0.0979766845703125, -0.064178466796875, -0.0303802490234375, 0.00341796875, 0.0372161865234375, 0.071014404296875, 0.1048126220703125, 0.13861083984375, 0.1724090576171875, 0.206207275390625, 0.2400054931640625, 0.2738037109375, 0.3076019287109375, 0.341400146484375, 0.3751983642578125, 0.40899658203125, 0.4427947998046875, 0.476593017578125, 0.5103912353515625, 0.544189453125, 0.5779876708984375, 0.611785888671875, 0.6455841064453125, 0.67938232421875, 0.7131805419921875, 0.746978759765625, 0.7807769775390625, 0.8145751953125, 0.8483734130859375, 0.882171630859375, 0.9159698486328125, 0.94976806640625, 0.9835662841796875, 1.017364501953125, 1.0511627197265625, 1.0849609375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 6.0, 8.0, 10.0, 18.0, 17.0, 24.0, 34.0, 39.0, 41.0, 55.0, 53.0, 69.0, 74.0, 81.0, 74.0, 56.0, 70.0, 69.0, 47.0, 36.0, 34.0, 23.0, 16.0, 17.0, 9.0, 6.0, 7.0, 3.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1398067474365234e-05, -2.0629726350307465e-05, -1.9861385226249695e-05, -1.9093044102191925e-05, -1.8324702978134155e-05, -1.7556361854076385e-05, -1.6788020730018616e-05, -1.6019679605960846e-05, -1.5251338481903076e-05, -1.4482997357845306e-05, -1.3714656233787537e-05, -1.2946315109729767e-05, -1.2177973985671997e-05, -1.1409632861614227e-05, -1.0641291737556458e-05, -9.872950613498688e-06, -9.104609489440918e-06, -8.336268365383148e-06, -7.567927241325378e-06, -6.799586117267609e-06, -6.031244993209839e-06, -5.262903869152069e-06, -4.494562745094299e-06, -3.7262216210365295e-06, -2.9578804969787598e-06, -2.18953937292099e-06, -1.4211982488632202e-06, -6.528571248054504e-07, 1.1548399925231934e-07, 8.838251233100891e-07, 1.6521662473678589e-06, 2.4205073714256287e-06, 3.1888484954833984e-06, 3.957189619541168e-06, 4.725530743598938e-06, 5.493871867656708e-06, 6.2622129917144775e-06, 7.030554115772247e-06, 7.798895239830017e-06, 8.567236363887787e-06, 9.335577487945557e-06, 1.0103918612003326e-05, 1.0872259736061096e-05, 1.1640600860118866e-05, 1.2408941984176636e-05, 1.3177283108234406e-05, 1.3945624232292175e-05, 1.4713965356349945e-05, 1.5482306480407715e-05, 1.6250647604465485e-05, 1.7018988728523254e-05, 1.7787329852581024e-05, 1.8555670976638794e-05, 1.9324012100696564e-05, 2.0092353224754333e-05, 2.0860694348812103e-05, 2.1629035472869873e-05, 2.2397376596927643e-05, 2.3165717720985413e-05, 2.3934058845043182e-05, 2.4702399969100952e-05, 2.5470741093158722e-05, 2.6239082217216492e-05, 2.700742334127426e-05, 2.777576446533203e-05]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 8.0, 8.0, 10.0, 14.0, 23.0, 48.0, 55.0, 91.0, 121.0, 172.0, 245.0, 368.0, 543.0, 791.0, 1175.0, 1685.0, 2481.0, 3506.0, 5254.0, 7677.0, 11548.0, 16838.0, 24914.0, 37648.0, 58651.0, 93542.0, 144992.0, 184124.0, 157903.0, 103368.0, 64767.0, 41451.0, 27215.0, 18243.0, 12506.0, 8329.0, 5765.0, 3911.0, 2736.0, 1821.0, 1286.0, 871.0, 597.0, 413.0, 254.0, 205.0, 125.0, 75.0, 68.0, 35.0, 25.0, 22.0, 18.0, 7.0, 6.0, 2.0, 5.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.422119140625, -0.4083290100097656, -0.39453887939453125, -0.3807487487792969, -0.3669586181640625, -0.3531684875488281, -0.33937835693359375, -0.3255882263183594, -0.311798095703125, -0.2980079650878906, -0.28421783447265625, -0.2704277038574219, -0.2566375732421875, -0.24284744262695312, -0.22905731201171875, -0.21526718139648438, -0.20147705078125, -0.18768692016601562, -0.17389678955078125, -0.16010665893554688, -0.1463165283203125, -0.13252639770507812, -0.11873626708984375, -0.10494613647460938, -0.091156005859375, -0.07736587524414062, -0.06357574462890625, -0.049785614013671875, -0.0359954833984375, -0.022205352783203125, -0.00841522216796875, 0.005374908447265625, 0.0191650390625, 0.032955169677734375, 0.04674530029296875, 0.060535430908203125, 0.0743255615234375, 0.08811569213867188, 0.10190582275390625, 0.11569595336914062, 0.129486083984375, 0.14327621459960938, 0.15706634521484375, 0.17085647583007812, 0.1846466064453125, 0.19843673706054688, 0.21222686767578125, 0.22601699829101562, 0.23980712890625, 0.2535972595214844, 0.26738739013671875, 0.2811775207519531, 0.2949676513671875, 0.3087577819824219, 0.32254791259765625, 0.3363380432128906, 0.350128173828125, 0.3639183044433594, 0.37770843505859375, 0.3914985656738281, 0.4052886962890625, 0.4190788269042969, 0.43286895751953125, 0.4466590881347656, 0.46044921875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 5.0, 0.0, 0.0, 1.0, 1.0, 6.0, 4.0, 3.0, 6.0, 5.0, 7.0, 11.0, 7.0, 9.0, 7.0, 12.0, 18.0, 19.0, 26.0, 33.0, 41.0, 45.0, 63.0, 65.0, 70.0, 84.0, 56.0, 71.0, 67.0, 43.0, 39.0, 45.0, 18.0, 25.0, 14.0, 15.0, 14.0, 5.0, 9.0, 9.0, 2.0, 4.0, 3.0, 5.0, 3.0, 8.0, 2.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.2138671875, -0.2068614959716797, -0.19985580444335938, -0.19285011291503906, -0.18584442138671875, -0.17883872985839844, -0.17183303833007812, -0.1648273468017578, -0.1578216552734375, -0.1508159637451172, -0.14381027221679688, -0.13680458068847656, -0.12979888916015625, -0.12279319763183594, -0.11578750610351562, -0.10878181457519531, -0.101776123046875, -0.09477043151855469, -0.08776473999023438, -0.08075904846191406, -0.07375335693359375, -0.06674766540527344, -0.059741973876953125, -0.05273628234863281, -0.0457305908203125, -0.03872489929199219, -0.031719207763671875, -0.024713516235351562, -0.01770782470703125, -0.010702133178710938, -0.003696441650390625, 0.0033092498779296875, 0.01031494140625, 0.017320632934570312, 0.024326324462890625, 0.03133201599121094, 0.03833770751953125, 0.04534339904785156, 0.052349090576171875, 0.05935478210449219, 0.0663604736328125, 0.07336616516113281, 0.08037185668945312, 0.08737754821777344, 0.09438323974609375, 0.10138893127441406, 0.10839462280273438, 0.11540031433105469, 0.122406005859375, 0.1294116973876953, 0.13641738891601562, 0.14342308044433594, 0.15042877197265625, 0.15743446350097656, 0.16444015502929688, 0.1714458465576172, 0.1784515380859375, 0.1854572296142578, 0.19246292114257812, 0.19946861267089844, 0.20647430419921875, 0.21347999572753906, 0.22048568725585938, 0.2274913787841797, 0.2344970703125]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 5.0, 7.0, 7.0, 12.0, 10.0, 14.0, 16.0, 29.0, 23.0, 40.0, 42.0, 43.0, 48.0, 55.0, 60.0, 45.0, 48.0, 56.0, 59.0, 55.0, 47.0, 35.0, 40.0, 37.0, 38.0, 29.0, 26.0, 16.0, 11.0, 10.0, 13.0, 4.0, 6.0, 5.0, 2.0, 3.0, 3.0, 5.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-36.0214729309082, -34.99333572387695, -33.9651985168457, -32.93705749511719, -31.908920288085938, -30.880783081054688, -29.852645874023438, -28.824508666992188, -27.796369552612305, -26.768232345581055, -25.740093231201172, -24.711956024169922, -23.683818817138672, -22.65567970275879, -21.62754249572754, -20.599403381347656, -19.571266174316406, -18.543128967285156, -17.514989852905273, -16.486852645874023, -15.458714485168457, -14.43057632446289, -13.40243911743164, -12.374300956726074, -11.346162796020508, -10.318024635314941, -9.289886474609375, -8.261749267578125, -7.233611106872559, -6.205472946166992, -5.177335262298584, -4.149197578430176, -3.1210594177246094, -2.092921495437622, -1.0647835731506348, -0.03664565086364746, 0.9914922714233398, 2.0196304321289062, 3.0477681159973145, 4.075905799865723, 5.104043960571289, 6.1321821212768555, 7.160319805145264, 8.188457489013672, 9.216595649719238, 10.244733810424805, 11.272871017456055, 12.301009178161621, 13.329147338867188, 14.357285499572754, 15.38542366027832, 16.41356086730957, 17.441699981689453, 18.469837188720703, 19.497974395751953, 20.526111602783203, 21.554250717163086, 22.582387924194336, 23.61052703857422, 24.63866424560547, 25.66680145263672, 26.6949405670166, 27.72307777404785, 28.751216888427734, 29.779354095458984]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 8.0, 9.0, 6.0, 7.0, 8.0, 15.0, 8.0, 17.0, 13.0, 20.0, 23.0, 27.0, 22.0, 30.0, 30.0, 44.0, 37.0, 47.0, 42.0, 40.0, 33.0, 33.0, 35.0, 41.0, 40.0, 24.0, 38.0, 46.0, 29.0, 28.0, 31.0, 24.0, 22.0, 26.0, 17.0, 18.0, 15.0, 10.0, 9.0, 4.0, 6.0, 10.0, 6.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-32.09929275512695, -31.1121826171875, -30.125072479248047, -29.137962341308594, -28.15085220336914, -27.163742065429688, -26.176633834838867, -25.189523696899414, -24.20241355895996, -23.215303421020508, -22.228193283081055, -21.2410831451416, -20.25397491455078, -19.266864776611328, -18.279754638671875, -17.292644500732422, -16.30553436279297, -15.318424224853516, -14.331314086914062, -13.344204902648926, -12.357094764709473, -11.36998462677002, -10.382875442504883, -9.39576530456543, -8.408655166625977, -7.421545028686523, -6.4344353675842285, -5.447325706481934, -4.4602155685424805, -3.4731054306030273, -2.4859957695007324, -1.4988861083984375, -0.5117759704589844, 0.47533392906188965, 1.4624438285827637, 2.4495537281036377, 3.4366636276245117, 4.423773765563965, 5.41088342666626, 6.397993087768555, 7.385103225708008, 8.372213363647461, 9.359323501586914, 10.34643268585205, 11.333542823791504, 12.320652961730957, 13.307762145996094, 14.294872283935547, 15.281982421875, 16.269092559814453, 17.256202697753906, 18.24331283569336, 19.230422973632812, 20.217533111572266, 21.204641342163086, 22.19175148010254, 23.178861618041992, 24.165971755981445, 25.1530818939209, 26.14019203186035, 27.127300262451172, 28.114410400390625, 29.101520538330078, 30.08863067626953, 31.075740814208984]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 2.0, 7.0, 16.0, 26.0, 29.0, 68.0, 103.0, 129.0, 176.0, 311.0, 464.0, 795.0, 1099.0, 1678.0, 2584.0, 3948.0, 5829.0, 8954.0, 13442.0, 19721.0, 28297.0, 39481.0, 52866.0, 67141.0, 82115.0, 93969.0, 101535.0, 100924.0, 94299.0, 82408.0, 67606.0, 52377.0, 39055.0, 27711.0, 19534.0, 13416.0, 8971.0, 5857.0, 4041.0, 2519.0, 1729.0, 1201.0, 736.0, 475.0, 320.0, 176.0, 164.0, 68.0, 72.0, 45.0, 34.0, 16.0, 6.0, 5.0, 1.0, 3.0, 3.0, 3.0], "bins": [-18.65625, -18.0908203125, -17.525390625, -16.9599609375, -16.39453125, -15.8291015625, -15.263671875, -14.6982421875, -14.1328125, -13.5673828125, -13.001953125, -12.4365234375, -11.87109375, -11.3056640625, -10.740234375, -10.1748046875, -9.609375, -9.0439453125, -8.478515625, -7.9130859375, -7.34765625, -6.7822265625, -6.216796875, -5.6513671875, -5.0859375, -4.5205078125, -3.955078125, -3.3896484375, -2.82421875, -2.2587890625, -1.693359375, -1.1279296875, -0.5625, 0.0029296875, 0.568359375, 1.1337890625, 1.69921875, 2.2646484375, 2.830078125, 3.3955078125, 3.9609375, 4.5263671875, 5.091796875, 5.6572265625, 6.22265625, 6.7880859375, 7.353515625, 7.9189453125, 8.484375, 9.0498046875, 9.615234375, 10.1806640625, 10.74609375, 11.3115234375, 11.876953125, 12.4423828125, 13.0078125, 13.5732421875, 14.138671875, 14.7041015625, 15.26953125, 15.8349609375, 16.400390625, 16.9658203125, 17.53125]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 5.0, 7.0, 8.0, 4.0, 8.0, 11.0, 12.0, 8.0, 18.0, 17.0, 13.0, 26.0, 30.0, 19.0, 30.0, 35.0, 40.0, 37.0, 51.0, 40.0, 40.0, 31.0, 30.0, 39.0, 41.0, 37.0, 23.0, 44.0, 41.0, 32.0, 25.0, 38.0, 18.0, 23.0, 26.0, 18.0, 16.0, 13.0, 15.0, 4.0, 4.0, 8.0, 7.0, 7.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.015625, -30.058349609375, -29.10107421875, -28.143798828125, -27.1865234375, -26.229248046875, -25.27197265625, -24.314697265625, -23.357421875, -22.400146484375, -21.44287109375, -20.485595703125, -19.5283203125, -18.571044921875, -17.61376953125, -16.656494140625, -15.69921875, -14.741943359375, -13.78466796875, -12.827392578125, -11.8701171875, -10.912841796875, -9.95556640625, -8.998291015625, -8.041015625, -7.083740234375, -6.12646484375, -5.169189453125, -4.2119140625, -3.254638671875, -2.29736328125, -1.340087890625, -0.3828125, 0.574462890625, 1.53173828125, 2.489013671875, 3.4462890625, 4.403564453125, 5.36083984375, 6.318115234375, 7.275390625, 8.232666015625, 9.18994140625, 10.147216796875, 11.1044921875, 12.061767578125, 13.01904296875, 13.976318359375, 14.93359375, 15.890869140625, 16.84814453125, 17.805419921875, 18.7626953125, 19.719970703125, 20.67724609375, 21.634521484375, 22.591796875, 23.549072265625, 24.50634765625, 25.463623046875, 26.4208984375, 27.378173828125, 28.33544921875, 29.292724609375, 30.25]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 12.0, 11.0, 27.0, 39.0, 57.0, 79.0, 137.0, 204.0, 293.0, 432.0, 624.0, 868.0, 1415.0, 2065.0, 3108.0, 4548.0, 6791.0, 10259.0, 15556.0, 22828.0, 32828.0, 45340.0, 61409.0, 77269.0, 92690.0, 103129.0, 106054.0, 101519.0, 89952.0, 73829.0, 57918.0, 42961.0, 30124.0, 20954.0, 14411.0, 9681.0, 6335.0, 4177.0, 2903.0, 1873.0, 1205.0, 867.0, 571.0, 416.0, 253.0, 169.0, 123.0, 88.0, 58.0, 24.0, 29.0, 14.0, 19.0, 5.0, 4.0, 2.0, 3.0, 2.0], "bins": [-19.0625, -18.47412109375, -17.8857421875, -17.29736328125, -16.708984375, -16.12060546875, -15.5322265625, -14.94384765625, -14.35546875, -13.76708984375, -13.1787109375, -12.59033203125, -12.001953125, -11.41357421875, -10.8251953125, -10.23681640625, -9.6484375, -9.06005859375, -8.4716796875, -7.88330078125, -7.294921875, -6.70654296875, -6.1181640625, -5.52978515625, -4.94140625, -4.35302734375, -3.7646484375, -3.17626953125, -2.587890625, -1.99951171875, -1.4111328125, -0.82275390625, -0.234375, 0.35400390625, 0.9423828125, 1.53076171875, 2.119140625, 2.70751953125, 3.2958984375, 3.88427734375, 4.47265625, 5.06103515625, 5.6494140625, 6.23779296875, 6.826171875, 7.41455078125, 8.0029296875, 8.59130859375, 9.1796875, 9.76806640625, 10.3564453125, 10.94482421875, 11.533203125, 12.12158203125, 12.7099609375, 13.29833984375, 13.88671875, 14.47509765625, 15.0634765625, 15.65185546875, 16.240234375, 16.82861328125, 17.4169921875, 18.00537109375, 18.59375]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 9.0, 7.0, 7.0, 7.0, 7.0, 8.0, 7.0, 15.0, 15.0, 13.0, 18.0, 25.0, 31.0, 23.0, 34.0, 35.0, 41.0, 31.0, 54.0, 46.0, 45.0, 34.0, 38.0, 44.0, 41.0, 35.0, 35.0, 42.0, 44.0, 25.0, 25.0, 23.0, 18.0, 19.0, 18.0, 15.0, 10.0, 11.0, 8.0, 8.0, 8.0, 8.0, 5.0, 3.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.453125, -17.827880859375, -17.20263671875, -16.577392578125, -15.9521484375, -15.326904296875, -14.70166015625, -14.076416015625, -13.451171875, -12.825927734375, -12.20068359375, -11.575439453125, -10.9501953125, -10.324951171875, -9.69970703125, -9.074462890625, -8.44921875, -7.823974609375, -7.19873046875, -6.573486328125, -5.9482421875, -5.322998046875, -4.69775390625, -4.072509765625, -3.447265625, -2.822021484375, -2.19677734375, -1.571533203125, -0.9462890625, -0.321044921875, 0.30419921875, 0.929443359375, 1.5546875, 2.179931640625, 2.80517578125, 3.430419921875, 4.0556640625, 4.680908203125, 5.30615234375, 5.931396484375, 6.556640625, 7.181884765625, 7.80712890625, 8.432373046875, 9.0576171875, 9.682861328125, 10.30810546875, 10.933349609375, 11.55859375, 12.183837890625, 12.80908203125, 13.434326171875, 14.0595703125, 14.684814453125, 15.31005859375, 15.935302734375, 16.560546875, 17.185791015625, 17.81103515625, 18.436279296875, 19.0615234375, 19.686767578125, 20.31201171875, 20.937255859375, 21.5625]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 9.0, 10.0, 19.0, 20.0, 41.0, 51.0, 70.0, 124.0, 203.0, 341.0, 592.0, 834.0, 1567.0, 2485.0, 4121.0, 6993.0, 11618.0, 19501.0, 30713.0, 48531.0, 70613.0, 96674.0, 119128.0, 132618.0, 129104.0, 112289.0, 88194.0, 62611.0, 41593.0, 26745.0, 16457.0, 9897.0, 5886.0, 3516.0, 2118.0, 1277.0, 780.0, 457.0, 297.0, 173.0, 106.0, 69.0, 40.0, 30.0, 14.0, 15.0, 15.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.578125, -6.3892822265625, -6.200439453125, -6.0115966796875, -5.82275390625, -5.6339111328125, -5.445068359375, -5.2562255859375, -5.0673828125, -4.8785400390625, -4.689697265625, -4.5008544921875, -4.31201171875, -4.1231689453125, -3.934326171875, -3.7454833984375, -3.556640625, -3.3677978515625, -3.178955078125, -2.9901123046875, -2.80126953125, -2.6124267578125, -2.423583984375, -2.2347412109375, -2.0458984375, -1.8570556640625, -1.668212890625, -1.4793701171875, -1.29052734375, -1.1016845703125, -0.912841796875, -0.7239990234375, -0.53515625, -0.3463134765625, -0.157470703125, 0.0313720703125, 0.22021484375, 0.4090576171875, 0.597900390625, 0.7867431640625, 0.9755859375, 1.1644287109375, 1.353271484375, 1.5421142578125, 1.73095703125, 1.9197998046875, 2.108642578125, 2.2974853515625, 2.486328125, 2.6751708984375, 2.864013671875, 3.0528564453125, 3.24169921875, 3.4305419921875, 3.619384765625, 3.8082275390625, 3.9970703125, 4.1859130859375, 4.374755859375, 4.5635986328125, 4.75244140625, 4.9412841796875, 5.130126953125, 5.3189697265625, 5.5078125]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 2.0, 6.0, 8.0, 7.0, 6.0, 7.0, 7.0, 11.0, 8.0, 24.0, 22.0, 21.0, 32.0, 23.0, 33.0, 46.0, 41.0, 46.0, 61.0, 53.0, 53.0, 46.0, 63.0, 44.0, 34.0, 48.0, 37.0, 30.0, 28.0, 22.0, 33.0, 17.0, 19.0, 14.0, 13.0, 7.0, 5.0, 6.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0005764961242675781, -0.0005569532513618469, -0.0005374103784561157, -0.0005178675055503845, -0.0004983246326446533, -0.0004787817597389221, -0.0004592388868331909, -0.0004396960139274597, -0.0004201531410217285, -0.0004006102681159973, -0.0003810673952102661, -0.0003615245223045349, -0.0003419816493988037, -0.0003224387764930725, -0.0003028959035873413, -0.0002833530306816101, -0.0002638101577758789, -0.0002442672848701477, -0.0002247244119644165, -0.0002051815390586853, -0.0001856386661529541, -0.0001660957932472229, -0.0001465529203414917, -0.0001270100474357605, -0.0001074671745300293, -8.79243016242981e-05, -6.83814287185669e-05, -4.883855581283569e-05, -2.9295682907104492e-05, -9.752810001373291e-06, 9.79006290435791e-06, 2.933293581008911e-05, 4.887580871582031e-05, 6.841868162155151e-05, 8.796155452728271e-05, 0.00010750442743301392, 0.00012704730033874512, 0.00014659017324447632, 0.00016613304615020752, 0.00018567591905593872, 0.00020521879196166992, 0.00022476166486740112, 0.0002443045377731323, 0.0002638474106788635, 0.0002833902835845947, 0.00030293315649032593, 0.00032247602939605713, 0.00034201890230178833, 0.00036156177520751953, 0.00038110464811325073, 0.00040064752101898193, 0.00042019039392471313, 0.00043973326683044434, 0.00045927613973617554, 0.00047881901264190674, 0.0004983618855476379, 0.0005179047584533691, 0.0005374476313591003, 0.0005569905042648315, 0.0005765333771705627, 0.0005960762500762939, 0.0006156191229820251, 0.0006351619958877563, 0.0006547048687934875, 0.0006742477416992188]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 10.0, 12.0, 15.0, 24.0, 33.0, 44.0, 61.0, 105.0, 185.0, 237.0, 435.0, 663.0, 1203.0, 1899.0, 3315.0, 5689.0, 9603.0, 16802.0, 27938.0, 45612.0, 70733.0, 101412.0, 129610.0, 145537.0, 139318.0, 116724.0, 85859.0, 57165.0, 35637.0, 21790.0, 12749.0, 7478.0, 4349.0, 2558.0, 1453.0, 862.0, 519.0, 340.0, 210.0, 118.0, 96.0, 56.0, 43.0, 14.0, 14.0, 14.0, 13.0, 1.0, 5.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.80078125, -7.5762939453125, -7.351806640625, -7.1273193359375, -6.90283203125, -6.6783447265625, -6.453857421875, -6.2293701171875, -6.0048828125, -5.7803955078125, -5.555908203125, -5.3314208984375, -5.10693359375, -4.8824462890625, -4.657958984375, -4.4334716796875, -4.208984375, -3.9844970703125, -3.760009765625, -3.5355224609375, -3.31103515625, -3.0865478515625, -2.862060546875, -2.6375732421875, -2.4130859375, -2.1885986328125, -1.964111328125, -1.7396240234375, -1.51513671875, -1.2906494140625, -1.066162109375, -0.8416748046875, -0.6171875, -0.3927001953125, -0.168212890625, 0.0562744140625, 0.28076171875, 0.5052490234375, 0.729736328125, 0.9542236328125, 1.1787109375, 1.4031982421875, 1.627685546875, 1.8521728515625, 2.07666015625, 2.3011474609375, 2.525634765625, 2.7501220703125, 2.974609375, 3.1990966796875, 3.423583984375, 3.6480712890625, 3.87255859375, 4.0970458984375, 4.321533203125, 4.5460205078125, 4.7705078125, 4.9949951171875, 5.219482421875, 5.4439697265625, 5.66845703125, 5.8929443359375, 6.117431640625, 6.3419189453125, 6.56640625]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 4.0, 8.0, 7.0, 7.0, 12.0, 14.0, 16.0, 23.0, 25.0, 30.0, 30.0, 23.0, 44.0, 63.0, 55.0, 62.0, 69.0, 81.0, 51.0, 69.0, 51.0, 49.0, 49.0, 27.0, 34.0, 22.0, 18.0, 18.0, 11.0, 4.0, 10.0, 7.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.29296875, -4.173553466796875, -4.05413818359375, -3.934722900390625, -3.8153076171875, -3.695892333984375, -3.57647705078125, -3.457061767578125, -3.337646484375, -3.218231201171875, -3.09881591796875, -2.979400634765625, -2.8599853515625, -2.740570068359375, -2.62115478515625, -2.501739501953125, -2.38232421875, -2.262908935546875, -2.14349365234375, -2.024078369140625, -1.9046630859375, -1.785247802734375, -1.66583251953125, -1.546417236328125, -1.427001953125, -1.307586669921875, -1.18817138671875, -1.068756103515625, -0.9493408203125, -0.829925537109375, -0.71051025390625, -0.591094970703125, -0.4716796875, -0.352264404296875, -0.23284912109375, -0.113433837890625, 0.0059814453125, 0.125396728515625, 0.24481201171875, 0.364227294921875, 0.483642578125, 0.603057861328125, 0.72247314453125, 0.841888427734375, 0.9613037109375, 1.080718994140625, 1.20013427734375, 1.319549560546875, 1.43896484375, 1.558380126953125, 1.67779541015625, 1.797210693359375, 1.9166259765625, 2.036041259765625, 2.15545654296875, 2.274871826171875, 2.394287109375, 2.513702392578125, 2.63311767578125, 2.752532958984375, 2.8719482421875, 2.991363525390625, 3.11077880859375, 3.230194091796875, 3.349609375]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 3.0, 4.0, 10.0, 8.0, 9.0, 17.0, 12.0, 19.0, 27.0, 26.0, 31.0, 39.0, 42.0, 38.0, 65.0, 47.0, 61.0, 53.0, 41.0, 45.0, 44.0, 56.0, 39.0, 42.0, 44.0, 26.0, 27.0, 26.0, 20.0, 16.0, 19.0, 7.0, 7.0, 8.0, 7.0, 3.0, 6.0, 0.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-34.54418182373047, -33.58768081665039, -32.63117599487305, -31.67467498779297, -30.718172073364258, -29.761669158935547, -28.80516815185547, -27.848665237426758, -26.892162322998047, -25.935659408569336, -24.979156494140625, -24.022655487060547, -23.066152572631836, -22.109649658203125, -21.153148651123047, -20.196645736694336, -19.240142822265625, -18.283639907836914, -17.327136993408203, -16.370635986328125, -15.414133071899414, -14.457630157470703, -13.501128196716309, -12.544626235961914, -11.588123321533203, -10.631620407104492, -9.675118446350098, -8.718616485595703, -7.762113571166992, -6.8056111335754395, -5.849108695983887, -4.892606258392334, -3.9361019134521484, -2.9795994758605957, -2.023097038269043, -1.0665946006774902, -0.1100921630859375, 0.8464102745056152, 1.802912712097168, 2.7594151496887207, 3.7159175872802734, 4.672420024871826, 5.628922462463379, 6.585424900054932, 7.541927337646484, 8.498430252075195, 9.45493221282959, 10.411434173583984, 11.367937088012695, 12.324440002441406, 13.2809419631958, 14.237443923950195, 15.193946838378906, 16.150449752807617, 17.106952667236328, 18.063453674316406, 19.019956588745117, 19.976459503173828, 20.932960510253906, 21.889463424682617, 22.845966339111328, 23.80246925354004, 24.75897216796875, 25.715473175048828, 26.67197608947754]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 0.0, 4.0, 3.0, 4.0, 4.0, 11.0, 8.0, 7.0, 14.0, 14.0, 11.0, 20.0, 14.0, 24.0, 37.0, 24.0, 41.0, 35.0, 28.0, 36.0, 38.0, 41.0, 41.0, 39.0, 45.0, 36.0, 30.0, 42.0, 34.0, 45.0, 30.0, 20.0, 39.0, 23.0, 30.0, 25.0, 24.0, 16.0, 19.0, 11.0, 10.0, 5.0, 8.0, 8.0, 4.0, 2.0, 5.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-35.29576873779297, -34.22861862182617, -33.161468505859375, -32.094322204589844, -31.027172088623047, -29.96002197265625, -28.892871856689453, -27.825721740722656, -26.758573532104492, -25.691423416137695, -24.62427520751953, -23.557125091552734, -22.489974975585938, -21.422826766967773, -20.355676651000977, -19.288528442382812, -18.221378326416016, -17.15422821044922, -16.087080001831055, -15.019929885864258, -13.952780723571777, -12.885631561279297, -11.8184814453125, -10.75133228302002, -9.684183120727539, -8.617033958435059, -7.54988431930542, -6.482734680175781, -5.415585517883301, -4.34843635559082, -3.2812867164611816, -2.214137077331543, -1.1469879150390625, -0.07983851432800293, 0.9873108863830566, 2.054460287094116, 3.121609687805176, 4.188758850097656, 5.255908489227295, 6.323058128356934, 7.390207290649414, 8.457356452941895, 9.524505615234375, 10.591655731201172, 11.658804893493652, 12.725954055786133, 13.79310417175293, 14.86025333404541, 15.92740249633789, 16.994552612304688, 18.06170082092285, 19.12885093688965, 20.195999145507812, 21.26314926147461, 22.330299377441406, 23.397449493408203, 24.464597702026367, 25.531747817993164, 26.598896026611328, 27.666046142578125, 28.733196258544922, 29.800344467163086, 30.867494583129883, 31.934642791748047, 33.001792907714844]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 4.0, 16.0, 17.0, 30.0, 37.0, 63.0, 101.0, 167.0, 251.0, 316.0, 603.0, 896.0, 1436.0, 2267.0, 3628.0, 5680.0, 9144.0, 14538.0, 23215.0, 36405.0, 57451.0, 87904.0, 133528.0, 196035.0, 276391.0, 365075.0, 444773.0, 490942.0, 486201.0, 430863.0, 346557.0, 257561.0, 180679.0, 122687.0, 79444.0, 51921.0, 32850.0, 20381.0, 13095.0, 7987.0, 5029.0, 3073.0, 1962.0, 1192.0, 712.0, 445.0, 289.0, 185.0, 106.0, 71.0, 44.0, 20.0, 9.0, 5.0, 5.0, 4.0, 1.0], "bins": [-22.578125, -21.930908203125, -21.28369140625, -20.636474609375, -19.9892578125, -19.342041015625, -18.69482421875, -18.047607421875, -17.400390625, -16.753173828125, -16.10595703125, -15.458740234375, -14.8115234375, -14.164306640625, -13.51708984375, -12.869873046875, -12.22265625, -11.575439453125, -10.92822265625, -10.281005859375, -9.6337890625, -8.986572265625, -8.33935546875, -7.692138671875, -7.044921875, -6.397705078125, -5.75048828125, -5.103271484375, -4.4560546875, -3.808837890625, -3.16162109375, -2.514404296875, -1.8671875, -1.219970703125, -0.57275390625, 0.074462890625, 0.7216796875, 1.368896484375, 2.01611328125, 2.663330078125, 3.310546875, 3.957763671875, 4.60498046875, 5.252197265625, 5.8994140625, 6.546630859375, 7.19384765625, 7.841064453125, 8.48828125, 9.135498046875, 9.78271484375, 10.429931640625, 11.0771484375, 11.724365234375, 12.37158203125, 13.018798828125, 13.666015625, 14.313232421875, 14.96044921875, 15.607666015625, 16.2548828125, 16.902099609375, 17.54931640625, 18.196533203125, 18.84375]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 3.0, 3.0, 2.0, 3.0, 7.0, 11.0, 8.0, 10.0, 12.0, 11.0, 15.0, 16.0, 17.0, 28.0, 38.0, 23.0, 39.0, 35.0, 28.0, 35.0, 40.0, 37.0, 42.0, 44.0, 37.0, 45.0, 32.0, 29.0, 39.0, 42.0, 31.0, 22.0, 30.0, 31.0, 29.0, 27.0, 18.0, 19.0, 17.0, 12.0, 10.0, 6.0, 6.0, 7.0, 5.0, 3.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-27.71875, -26.878662109375, -26.03857421875, -25.198486328125, -24.3583984375, -23.518310546875, -22.67822265625, -21.838134765625, -20.998046875, -20.157958984375, -19.31787109375, -18.477783203125, -17.6376953125, -16.797607421875, -15.95751953125, -15.117431640625, -14.27734375, -13.437255859375, -12.59716796875, -11.757080078125, -10.9169921875, -10.076904296875, -9.23681640625, -8.396728515625, -7.556640625, -6.716552734375, -5.87646484375, -5.036376953125, -4.1962890625, -3.356201171875, -2.51611328125, -1.676025390625, -0.8359375, 0.004150390625, 0.84423828125, 1.684326171875, 2.5244140625, 3.364501953125, 4.20458984375, 5.044677734375, 5.884765625, 6.724853515625, 7.56494140625, 8.405029296875, 9.2451171875, 10.085205078125, 10.92529296875, 11.765380859375, 12.60546875, 13.445556640625, 14.28564453125, 15.125732421875, 15.9658203125, 16.805908203125, 17.64599609375, 18.486083984375, 19.326171875, 20.166259765625, 21.00634765625, 21.846435546875, 22.6865234375, 23.526611328125, 24.36669921875, 25.206787109375, 26.046875]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 11.0, 13.0, 24.0, 43.0, 56.0, 89.0, 152.0, 262.0, 434.0, 770.0, 1373.0, 2182.0, 3923.0, 6563.0, 10742.0, 17265.0, 28187.0, 44178.0, 68226.0, 101048.0, 144687.0, 200087.0, 262688.0, 326897.0, 380339.0, 413479.0, 420326.0, 396398.0, 349035.0, 287393.0, 224389.0, 166250.0, 117024.0, 79218.0, 53001.0, 34220.0, 21121.0, 12920.0, 7857.0, 4570.0, 2835.0, 1631.0, 958.0, 610.0, 353.0, 173.0, 120.0, 73.0, 41.0, 18.0, 14.0, 9.0, 6.0, 8.0, 2.0, 1.0], "bins": [-19.703125, -19.126953125, -18.55078125, -17.974609375, -17.3984375, -16.822265625, -16.24609375, -15.669921875, -15.09375, -14.517578125, -13.94140625, -13.365234375, -12.7890625, -12.212890625, -11.63671875, -11.060546875, -10.484375, -9.908203125, -9.33203125, -8.755859375, -8.1796875, -7.603515625, -7.02734375, -6.451171875, -5.875, -5.298828125, -4.72265625, -4.146484375, -3.5703125, -2.994140625, -2.41796875, -1.841796875, -1.265625, -0.689453125, -0.11328125, 0.462890625, 1.0390625, 1.615234375, 2.19140625, 2.767578125, 3.34375, 3.919921875, 4.49609375, 5.072265625, 5.6484375, 6.224609375, 6.80078125, 7.376953125, 7.953125, 8.529296875, 9.10546875, 9.681640625, 10.2578125, 10.833984375, 11.41015625, 11.986328125, 12.5625, 13.138671875, 13.71484375, 14.291015625, 14.8671875, 15.443359375, 16.01953125, 16.595703125, 17.171875]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 7.0, 7.0, 9.0, 15.0, 19.0, 37.0, 42.0, 47.0, 61.0, 94.0, 91.0, 117.0, 131.0, 155.0, 197.0, 194.0, 226.0, 226.0, 230.0, 224.0, 251.0, 191.0, 238.0, 176.0, 172.0, 174.0, 129.0, 117.0, 115.0, 77.0, 68.0, 54.0, 38.0, 38.0, 28.0, 19.0, 18.0, 14.0, 10.0, 4.0, 6.0, 5.0, 5.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.578125, -13.162109375, -12.74609375, -12.330078125, -11.9140625, -11.498046875, -11.08203125, -10.666015625, -10.25, -9.833984375, -9.41796875, -9.001953125, -8.5859375, -8.169921875, -7.75390625, -7.337890625, -6.921875, -6.505859375, -6.08984375, -5.673828125, -5.2578125, -4.841796875, -4.42578125, -4.009765625, -3.59375, -3.177734375, -2.76171875, -2.345703125, -1.9296875, -1.513671875, -1.09765625, -0.681640625, -0.265625, 0.150390625, 0.56640625, 0.982421875, 1.3984375, 1.814453125, 2.23046875, 2.646484375, 3.0625, 3.478515625, 3.89453125, 4.310546875, 4.7265625, 5.142578125, 5.55859375, 5.974609375, 6.390625, 6.806640625, 7.22265625, 7.638671875, 8.0546875, 8.470703125, 8.88671875, 9.302734375, 9.71875, 10.134765625, 10.55078125, 10.966796875, 11.3828125, 11.798828125, 12.21484375, 12.630859375, 13.046875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 5.0, 5.0, 1.0, 3.0, 8.0, 7.0, 8.0, 17.0, 11.0, 28.0, 28.0, 29.0, 29.0, 41.0, 41.0, 55.0, 43.0, 48.0, 67.0, 58.0, 55.0, 43.0, 44.0, 48.0, 37.0, 41.0, 35.0, 31.0, 22.0, 25.0, 25.0, 12.0, 19.0, 9.0, 9.0, 5.0, 5.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.02227210998535, -28.052122116088867, -27.081972122192383, -26.1118221282959, -25.141672134399414, -24.17152214050293, -23.201370239257812, -22.231220245361328, -21.261070251464844, -20.29092025756836, -19.320770263671875, -18.35062026977539, -17.380470275878906, -16.410320281982422, -15.440169334411621, -14.470019340515137, -13.499870300292969, -12.529720306396484, -11.5595703125, -10.589420318603516, -9.619270324707031, -8.649120330810547, -7.678969383239746, -6.708819389343262, -5.738669395446777, -4.768519401550293, -3.7983691692352295, -2.828218936920166, -1.8580689430236816, -0.8879189491271973, 0.08223152160644531, 1.0523815155029297, 2.022533416748047, 2.9926834106445312, 3.9628336429595947, 4.932983875274658, 5.903133869171143, 6.873283863067627, 7.8434343338012695, 8.813584327697754, 9.783734321594238, 10.753884315490723, 11.724034309387207, 12.694185256958008, 13.664335250854492, 14.634485244750977, 15.604635238647461, 16.574785232543945, 17.54493522644043, 18.515085220336914, 19.4852352142334, 20.455385208129883, 21.425535202026367, 22.39568519592285, 23.36583709716797, 24.335987091064453, 25.306137084960938, 26.276287078857422, 27.246437072753906, 28.21658706665039, 29.186737060546875, 30.15688705444336, 31.127037048339844, 32.09718704223633, 33.06733703613281]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 5.0, 3.0, 9.0, 15.0, 8.0, 15.0, 13.0, 16.0, 27.0, 22.0, 38.0, 28.0, 37.0, 43.0, 47.0, 29.0, 39.0, 42.0, 38.0, 41.0, 38.0, 54.0, 45.0, 43.0, 30.0, 35.0, 34.0, 32.0, 25.0, 28.0, 24.0, 19.0, 12.0, 16.0, 10.0, 10.0, 8.0, 4.0, 5.0, 4.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-36.966793060302734, -35.91755294799805, -34.86831283569336, -33.81907272338867, -32.769832611083984, -31.720592498779297, -30.671354293823242, -29.622114181518555, -28.572874069213867, -27.52363395690918, -26.474393844604492, -25.425153732299805, -24.37591552734375, -23.326675415039062, -22.277435302734375, -21.228195190429688, -20.178955078125, -19.129714965820312, -18.080474853515625, -17.031234741210938, -15.981995582580566, -14.932755470275879, -13.883516311645508, -12.83427619934082, -11.785036087036133, -10.735795974731445, -9.686555862426758, -8.637316703796387, -7.588076591491699, -6.538836479187012, -5.489596843719482, -4.440357208251953, -3.391115188598633, -2.3418753147125244, -1.292635440826416, -0.24339556694030762, 0.8058443069458008, 1.8550844192504883, 2.9043240547180176, 3.953563690185547, 5.002803802490234, 6.052043914794922, 7.101283550262451, 8.15052318572998, 9.199763298034668, 10.249003410339355, 11.298242568969727, 12.347482681274414, 13.396722793579102, 14.445962905883789, 15.495203018188477, 16.544443130493164, 17.59368133544922, 18.642921447753906, 19.692161560058594, 20.74140167236328, 21.79064178466797, 22.839881896972656, 23.889122009277344, 24.93836212158203, 25.98760223388672, 27.036842346191406, 28.08608055114746, 29.13532066345215, 30.184560775756836]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 6.0, 10.0, 15.0, 24.0, 48.0, 65.0, 101.0, 173.0, 291.0, 411.0, 689.0, 1028.0, 1617.0, 2588.0, 4051.0, 6547.0, 10267.0, 15960.0, 24330.0, 37525.0, 54935.0, 77662.0, 102896.0, 123993.0, 132139.0, 122175.0, 100040.0, 74686.0, 53028.0, 35925.0, 23688.0, 15106.0, 9742.0, 6096.0, 3956.0, 2442.0, 1570.0, 978.0, 662.0, 419.0, 247.0, 172.0, 94.0, 62.0, 50.0, 23.0, 10.0, 7.0, 6.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.62109375, -7.37078857421875, -7.1204833984375, -6.87017822265625, -6.619873046875, -6.36956787109375, -6.1192626953125, -5.86895751953125, -5.61865234375, -5.36834716796875, -5.1180419921875, -4.86773681640625, -4.617431640625, -4.36712646484375, -4.1168212890625, -3.86651611328125, -3.6162109375, -3.36590576171875, -3.1156005859375, -2.86529541015625, -2.614990234375, -2.36468505859375, -2.1143798828125, -1.86407470703125, -1.61376953125, -1.36346435546875, -1.1131591796875, -0.86285400390625, -0.612548828125, -0.36224365234375, -0.1119384765625, 0.13836669921875, 0.388671875, 0.63897705078125, 0.8892822265625, 1.13958740234375, 1.389892578125, 1.64019775390625, 1.8905029296875, 2.14080810546875, 2.39111328125, 2.64141845703125, 2.8917236328125, 3.14202880859375, 3.392333984375, 3.64263916015625, 3.8929443359375, 4.14324951171875, 4.3935546875, 4.64385986328125, 4.8941650390625, 5.14447021484375, 5.394775390625, 5.64508056640625, 5.8953857421875, 6.14569091796875, 6.39599609375, 6.64630126953125, 6.8966064453125, 7.14691162109375, 7.397216796875, 7.64752197265625, 7.8978271484375, 8.14813232421875, 8.3984375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 5.0, 4.0, 7.0, 16.0, 9.0, 14.0, 14.0, 17.0, 24.0, 22.0, 38.0, 30.0, 36.0, 44.0, 46.0, 29.0, 39.0, 42.0, 38.0, 43.0, 37.0, 52.0, 46.0, 43.0, 29.0, 34.0, 36.0, 32.0, 26.0, 26.0, 24.0, 20.0, 13.0, 15.0, 12.0, 8.0, 8.0, 4.0, 5.0, 4.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-36.6875, -35.648193359375, -34.60888671875, -33.569580078125, -32.5302734375, -31.490966796875, -30.45166015625, -29.412353515625, -28.373046875, -27.333740234375, -26.29443359375, -25.255126953125, -24.2158203125, -23.176513671875, -22.13720703125, -21.097900390625, -20.05859375, -19.019287109375, -17.97998046875, -16.940673828125, -15.9013671875, -14.862060546875, -13.82275390625, -12.783447265625, -11.744140625, -10.704833984375, -9.66552734375, -8.626220703125, -7.5869140625, -6.547607421875, -5.50830078125, -4.468994140625, -3.4296875, -2.390380859375, -1.35107421875, -0.311767578125, 0.7275390625, 1.766845703125, 2.80615234375, 3.845458984375, 4.884765625, 5.924072265625, 6.96337890625, 8.002685546875, 9.0419921875, 10.081298828125, 11.12060546875, 12.159912109375, 13.19921875, 14.238525390625, 15.27783203125, 16.317138671875, 17.3564453125, 18.395751953125, 19.43505859375, 20.474365234375, 21.513671875, 22.552978515625, 23.59228515625, 24.631591796875, 25.6708984375, 26.710205078125, 27.74951171875, 28.788818359375, 29.828125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 6.0, 10.0, 13.0, 27.0, 38.0, 61.0, 107.0, 133.0, 218.0, 387.0, 613.0, 998.0, 1639.0, 2613.0, 4228.0, 7019.0, 11077.0, 19112.0, 40290.0, 866820.0, 43114.0, 20000.0, 11491.0, 7080.0, 4379.0, 2705.0, 1697.0, 1015.0, 611.0, 408.0, 248.0, 154.0, 86.0, 61.0, 38.0, 20.0, 12.0, 9.0, 6.0, 3.0, 7.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-27.46875, -26.716796875, -25.96484375, -25.212890625, -24.4609375, -23.708984375, -22.95703125, -22.205078125, -21.453125, -20.701171875, -19.94921875, -19.197265625, -18.4453125, -17.693359375, -16.94140625, -16.189453125, -15.4375, -14.685546875, -13.93359375, -13.181640625, -12.4296875, -11.677734375, -10.92578125, -10.173828125, -9.421875, -8.669921875, -7.91796875, -7.166015625, -6.4140625, -5.662109375, -4.91015625, -4.158203125, -3.40625, -2.654296875, -1.90234375, -1.150390625, -0.3984375, 0.353515625, 1.10546875, 1.857421875, 2.609375, 3.361328125, 4.11328125, 4.865234375, 5.6171875, 6.369140625, 7.12109375, 7.873046875, 8.625, 9.376953125, 10.12890625, 10.880859375, 11.6328125, 12.384765625, 13.13671875, 13.888671875, 14.640625, 15.392578125, 16.14453125, 16.896484375, 17.6484375, 18.400390625, 19.15234375, 19.904296875, 20.65625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 3.0, 10.0, 10.0, 8.0, 14.0, 15.0, 14.0, 21.0, 24.0, 20.0, 31.0, 34.0, 44.0, 48.0, 29.0, 41.0, 49.0, 34.0, 42.0, 51.0, 51.0, 34.0, 40.0, 34.0, 30.0, 31.0, 35.0, 28.0, 20.0, 35.0, 29.0, 15.0, 10.0, 22.0, 16.0, 9.0, 7.0, 8.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.59375, -18.8798828125, -18.166015625, -17.4521484375, -16.73828125, -16.0244140625, -15.310546875, -14.5966796875, -13.8828125, -13.1689453125, -12.455078125, -11.7412109375, -11.02734375, -10.3134765625, -9.599609375, -8.8857421875, -8.171875, -7.4580078125, -6.744140625, -6.0302734375, -5.31640625, -4.6025390625, -3.888671875, -3.1748046875, -2.4609375, -1.7470703125, -1.033203125, -0.3193359375, 0.39453125, 1.1083984375, 1.822265625, 2.5361328125, 3.25, 3.9638671875, 4.677734375, 5.3916015625, 6.10546875, 6.8193359375, 7.533203125, 8.2470703125, 8.9609375, 9.6748046875, 10.388671875, 11.1025390625, 11.81640625, 12.5302734375, 13.244140625, 13.9580078125, 14.671875, 15.3857421875, 16.099609375, 16.8134765625, 17.52734375, 18.2412109375, 18.955078125, 19.6689453125, 20.3828125, 21.0966796875, 21.810546875, 22.5244140625, 23.23828125, 23.9521484375, 24.666015625, 25.3798828125, 26.09375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 4.0, 8.0, 7.0, 15.0, 13.0, 17.0, 25.0, 36.0, 40.0, 64.0, 91.0, 133.0, 188.0, 263.0, 422.0, 598.0, 968.0, 1575.0, 2697.0, 5023.0, 9798.0, 21114.0, 57161.0, 884252.0, 33265.0, 14443.0, 6957.0, 3691.0, 2064.0, 1229.0, 782.0, 516.0, 309.0, 210.0, 186.0, 106.0, 83.0, 71.0, 40.0, 22.0, 22.0, 23.0, 6.0, 10.0, 7.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.83544921875, -0.8078384399414062, -0.7802276611328125, -0.7526168823242188, -0.725006103515625, -0.6973953247070312, -0.6697845458984375, -0.6421737670898438, -0.61456298828125, -0.5869522094726562, -0.5593414306640625, -0.5317306518554688, -0.504119873046875, -0.47650909423828125, -0.4488983154296875, -0.42128753662109375, -0.3936767578125, -0.36606597900390625, -0.3384552001953125, -0.31084442138671875, -0.283233642578125, -0.25562286376953125, -0.2280120849609375, -0.20040130615234375, -0.17279052734375, -0.14517974853515625, -0.1175689697265625, -0.08995819091796875, -0.062347412109375, -0.03473663330078125, -0.0071258544921875, 0.02048492431640625, 0.048095703125, 0.07570648193359375, 0.1033172607421875, 0.13092803955078125, 0.158538818359375, 0.18614959716796875, 0.2137603759765625, 0.24137115478515625, 0.26898193359375, 0.29659271240234375, 0.3242034912109375, 0.35181427001953125, 0.379425048828125, 0.40703582763671875, 0.4346466064453125, 0.46225738525390625, 0.4898681640625, 0.5174789428710938, 0.5450897216796875, 0.5727005004882812, 0.600311279296875, 0.6279220581054688, 0.6555328369140625, 0.6831436157226562, 0.71075439453125, 0.7383651733398438, 0.7659759521484375, 0.7935867309570312, 0.821197509765625, 0.8488082885742188, 0.8764190673828125, 0.9040298461914062, 0.931640625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 9.0, 5.0, 9.0, 14.0, 19.0, 11.0, 33.0, 22.0, 32.0, 28.0, 35.0, 46.0, 61.0, 44.0, 53.0, 49.0, 52.0, 52.0, 42.0, 66.0, 51.0, 45.0, 39.0, 36.0, 36.0, 26.0, 11.0, 14.0, 13.0, 12.0, 6.0, 6.0, 8.0, 2.0, 2.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.800060272216797e-05, -1.7493031919002533e-05, -1.6985461115837097e-05, -1.647789031267166e-05, -1.5970319509506226e-05, -1.546274870634079e-05, -1.4955177903175354e-05, -1.4447607100009918e-05, -1.3940036296844482e-05, -1.3432465493679047e-05, -1.292489469051361e-05, -1.2417323887348175e-05, -1.190975308418274e-05, -1.1402182281017303e-05, -1.0894611477851868e-05, -1.0387040674686432e-05, -9.879469871520996e-06, -9.37189906835556e-06, -8.864328265190125e-06, -8.356757462024689e-06, -7.849186658859253e-06, -7.341615855693817e-06, -6.834045052528381e-06, -6.3264742493629456e-06, -5.81890344619751e-06, -5.311332643032074e-06, -4.803761839866638e-06, -4.296191036701202e-06, -3.7886202335357666e-06, -3.281049430370331e-06, -2.773478627204895e-06, -2.2659078240394592e-06, -1.7583370208740234e-06, -1.2507662177085876e-06, -7.431954145431519e-07, -2.3562461137771606e-07, 2.7194619178771973e-07, 7.795169949531555e-07, 1.2870877981185913e-06, 1.794658601284027e-06, 2.302229404449463e-06, 2.8098002076148987e-06, 3.3173710107803345e-06, 3.82494181394577e-06, 4.332512617111206e-06, 4.840083420276642e-06, 5.347654223442078e-06, 5.8552250266075134e-06, 6.362795829772949e-06, 6.870366632938385e-06, 7.377937436103821e-06, 7.885508239269257e-06, 8.393079042434692e-06, 8.900649845600128e-06, 9.408220648765564e-06, 9.915791451931e-06, 1.0423362255096436e-05, 1.0930933058261871e-05, 1.1438503861427307e-05, 1.1946074664592743e-05, 1.2453645467758179e-05, 1.2961216270923615e-05, 1.346878707408905e-05, 1.3976357877254486e-05, 1.4483928680419922e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 5.0, 4.0, 9.0, 15.0, 28.0, 33.0, 52.0, 87.0, 142.0, 235.0, 326.0, 443.0, 749.0, 1010.0, 1507.0, 2260.0, 3289.0, 4904.0, 7444.0, 10938.0, 16509.0, 25761.0, 40253.0, 65372.0, 104846.0, 159114.0, 186275.0, 150494.0, 97231.0, 60555.0, 37640.0, 24127.0, 15487.0, 10333.0, 6957.0, 4543.0, 3198.0, 2113.0, 1388.0, 950.0, 680.0, 448.0, 274.0, 182.0, 122.0, 81.0, 57.0, 37.0, 22.0, 10.0, 13.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.364501953125, -0.3525199890136719, -0.34053802490234375, -0.3285560607910156, -0.3165740966796875, -0.3045921325683594, -0.29261016845703125, -0.2806282043457031, -0.268646240234375, -0.2566642761230469, -0.24468231201171875, -0.23270034790039062, -0.2207183837890625, -0.20873641967773438, -0.19675445556640625, -0.18477249145507812, -0.17279052734375, -0.16080856323242188, -0.14882659912109375, -0.13684463500976562, -0.1248626708984375, -0.11288070678710938, -0.10089874267578125, -0.08891677856445312, -0.076934814453125, -0.06495285034179688, -0.05297088623046875, -0.040988922119140625, -0.0290069580078125, -0.017024993896484375, -0.00504302978515625, 0.006938934326171875, 0.0189208984375, 0.030902862548828125, 0.04288482666015625, 0.054866790771484375, 0.0668487548828125, 0.07883071899414062, 0.09081268310546875, 0.10279464721679688, 0.114776611328125, 0.12675857543945312, 0.13874053955078125, 0.15072250366210938, 0.1627044677734375, 0.17468643188476562, 0.18666839599609375, 0.19865036010742188, 0.21063232421875, 0.22261428833007812, 0.23459625244140625, 0.24657821655273438, 0.2585601806640625, 0.2705421447753906, 0.28252410888671875, 0.2945060729980469, 0.306488037109375, 0.3184700012207031, 0.33045196533203125, 0.3424339294433594, 0.3544158935546875, 0.3663978576660156, 0.37837982177734375, 0.3903617858886719, 0.40234375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 4.0, 7.0, 3.0, 8.0, 9.0, 15.0, 6.0, 16.0, 13.0, 27.0, 24.0, 25.0, 34.0, 41.0, 62.0, 60.0, 70.0, 84.0, 80.0, 72.0, 52.0, 38.0, 37.0, 34.0, 25.0, 20.0, 32.0, 15.0, 6.0, 11.0, 12.0, 7.0, 14.0, 6.0, 4.0, 5.0, 7.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.1671142578125, -0.16152000427246094, -0.15592575073242188, -0.1503314971923828, -0.14473724365234375, -0.1391429901123047, -0.13354873657226562, -0.12795448303222656, -0.1223602294921875, -0.11676597595214844, -0.11117172241210938, -0.10557746887207031, -0.09998321533203125, -0.09438896179199219, -0.08879470825195312, -0.08320045471191406, -0.077606201171875, -0.07201194763183594, -0.06641769409179688, -0.06082344055175781, -0.05522918701171875, -0.04963493347167969, -0.044040679931640625, -0.03844642639160156, -0.0328521728515625, -0.027257919311523438, -0.021663665771484375, -0.016069412231445312, -0.01047515869140625, -0.0048809051513671875, 0.000713348388671875, 0.0063076019287109375, 0.01190185546875, 0.017496109008789062, 0.023090362548828125, 0.028684616088867188, 0.03427886962890625, 0.03987312316894531, 0.045467376708984375, 0.05106163024902344, 0.0566558837890625, 0.06225013732910156, 0.06784439086914062, 0.07343864440917969, 0.07903289794921875, 0.08462715148925781, 0.09022140502929688, 0.09581565856933594, 0.101409912109375, 0.10700416564941406, 0.11259841918945312, 0.11819267272949219, 0.12378692626953125, 0.1293811798095703, 0.13497543334960938, 0.14056968688964844, 0.1461639404296875, 0.15175819396972656, 0.15735244750976562, 0.1629467010498047, 0.16854095458984375, 0.1741352081298828, 0.17972946166992188, 0.18532371520996094, 0.19091796875]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 1.0, 5.0, 2.0, 5.0, 7.0, 7.0, 10.0, 16.0, 20.0, 26.0, 32.0, 33.0, 31.0, 43.0, 44.0, 49.0, 42.0, 58.0, 51.0, 61.0, 45.0, 39.0, 51.0, 41.0, 44.0, 35.0, 38.0, 19.0, 24.0, 27.0, 25.0, 19.0, 11.0, 8.0, 7.0, 6.0, 7.0, 3.0, 2.0, 2.0, 1.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.43564224243164, -26.508100509643555, -25.5805606842041, -24.653018951416016, -23.72547721862793, -22.797935485839844, -21.87039566040039, -20.942853927612305, -20.01531219482422, -19.087770462036133, -18.16023063659668, -17.232688903808594, -16.305147171020508, -15.377606391906738, -14.450065612792969, -13.522523880004883, -12.59498405456543, -11.66744327545166, -10.739901542663574, -9.812360763549805, -8.884819030761719, -7.957278251647949, -7.02973747253418, -6.102196216583252, -5.174654960632324, -4.2471137046813965, -3.319572687149048, -2.392031669616699, -1.4644904136657715, -0.5369491577148438, 0.3905916213989258, 1.3181328773498535, 2.2456722259521484, 3.173213481903076, 4.100754737854004, 5.028295516967773, 5.955836772918701, 6.883378028869629, 7.810918807983398, 8.738460540771484, 9.666001319885254, 10.593542098999023, 11.52108383178711, 12.448624610900879, 13.376165390014648, 14.303707122802734, 15.231247901916504, 16.158788681030273, 17.08633041381836, 18.013872146606445, 18.9414119720459, 19.868953704833984, 20.79649543762207, 21.724037170410156, 22.65157699584961, 23.579118728637695, 24.50666046142578, 25.434202194213867, 26.36174201965332, 27.289283752441406, 28.216825485229492, 29.144367218017578, 30.07190704345703, 30.999448776245117, 31.92698860168457]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 5.0, 4.0, 9.0, 16.0, 7.0, 15.0, 13.0, 18.0, 24.0, 23.0, 37.0, 29.0, 36.0, 47.0, 46.0, 26.0, 43.0, 39.0, 38.0, 43.0, 39.0, 53.0, 43.0, 42.0, 30.0, 36.0, 34.0, 33.0, 24.0, 29.0, 21.0, 21.0, 12.0, 15.0, 12.0, 8.0, 8.0, 4.0, 5.0, 4.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-36.604740142822266, -35.56626892089844, -34.527793884277344, -33.489322662353516, -32.45085144042969, -31.412378311157227, -30.373905181884766, -29.335433959960938, -28.296960830688477, -27.258487701416016, -26.220016479492188, -25.181543350219727, -24.143070220947266, -23.104598999023438, -22.066125869750977, -21.027652740478516, -19.989181518554688, -18.950708389282227, -17.9122371673584, -16.873764038085938, -15.835291862487793, -14.796819686889648, -13.758346557617188, -12.719874382019043, -11.681402206420898, -10.642930030822754, -9.60445785522461, -8.565984725952148, -7.527512550354004, -6.489040374755859, -5.450567722320557, -4.412095069885254, -3.3736228942871094, -2.3351504802703857, -1.296678066253662, -0.2582056522369385, 0.7802667617797852, 1.8187389373779297, 2.8572115898132324, 3.895684242248535, 4.93415641784668, 5.972628593444824, 7.011101245880127, 8.04957389831543, 9.088046073913574, 10.126518249511719, 11.16499137878418, 12.203463554382324, 13.241935729980469, 14.280407905578613, 15.318880081176758, 16.35735321044922, 17.395824432373047, 18.434297561645508, 19.47277069091797, 20.511241912841797, 21.549715042114258, 22.58818817138672, 23.626659393310547, 24.665132522583008, 25.70360565185547, 26.742076873779297, 27.780550003051758, 28.81902313232422, 29.857494354248047]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 7.0, 17.0, 20.0, 29.0, 48.0, 76.0, 120.0, 212.0, 342.0, 559.0, 932.0, 1537.0, 2530.0, 4211.0, 6923.0, 11350.0, 18294.0, 28623.0, 42694.0, 61462.0, 82165.0, 102570.0, 116709.0, 120687.0, 113559.0, 96513.0, 75781.0, 55655.0, 38212.0, 25264.0, 16037.0, 10069.0, 6040.0, 3676.0, 2266.0, 1318.0, 836.0, 494.0, 292.0, 171.0, 102.0, 55.0, 45.0, 30.0, 12.0, 11.0, 2.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-20.546875, -19.930908203125, -19.31494140625, -18.698974609375, -18.0830078125, -17.467041015625, -16.85107421875, -16.235107421875, -15.619140625, -15.003173828125, -14.38720703125, -13.771240234375, -13.1552734375, -12.539306640625, -11.92333984375, -11.307373046875, -10.69140625, -10.075439453125, -9.45947265625, -8.843505859375, -8.2275390625, -7.611572265625, -6.99560546875, -6.379638671875, -5.763671875, -5.147705078125, -4.53173828125, -3.915771484375, -3.2998046875, -2.683837890625, -2.06787109375, -1.451904296875, -0.8359375, -0.219970703125, 0.39599609375, 1.011962890625, 1.6279296875, 2.243896484375, 2.85986328125, 3.475830078125, 4.091796875, 4.707763671875, 5.32373046875, 5.939697265625, 6.5556640625, 7.171630859375, 7.78759765625, 8.403564453125, 9.01953125, 9.635498046875, 10.25146484375, 10.867431640625, 11.4833984375, 12.099365234375, 12.71533203125, 13.331298828125, 13.947265625, 14.563232421875, 15.17919921875, 15.795166015625, 16.4111328125, 17.027099609375, 17.64306640625, 18.259033203125, 18.875]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 6.0, 7.0, 2.0, 5.0, 12.0, 14.0, 7.0, 16.0, 15.0, 18.0, 26.0, 27.0, 35.0, 31.0, 37.0, 52.0, 38.0, 31.0, 36.0, 42.0, 46.0, 37.0, 42.0, 45.0, 47.0, 38.0, 29.0, 39.0, 37.0, 27.0, 23.0, 29.0, 20.0, 19.0, 13.0, 15.0, 11.0, 7.0, 8.0, 4.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-35.25, -34.24267578125, -33.2353515625, -32.22802734375, -31.220703125, -30.21337890625, -29.2060546875, -28.19873046875, -27.19140625, -26.18408203125, -25.1767578125, -24.16943359375, -23.162109375, -22.15478515625, -21.1474609375, -20.14013671875, -19.1328125, -18.12548828125, -17.1181640625, -16.11083984375, -15.103515625, -14.09619140625, -13.0888671875, -12.08154296875, -11.07421875, -10.06689453125, -9.0595703125, -8.05224609375, -7.044921875, -6.03759765625, -5.0302734375, -4.02294921875, -3.015625, -2.00830078125, -1.0009765625, 0.00634765625, 1.013671875, 2.02099609375, 3.0283203125, 4.03564453125, 5.04296875, 6.05029296875, 7.0576171875, 8.06494140625, 9.072265625, 10.07958984375, 11.0869140625, 12.09423828125, 13.1015625, 14.10888671875, 15.1162109375, 16.12353515625, 17.130859375, 18.13818359375, 19.1455078125, 20.15283203125, 21.16015625, 22.16748046875, 23.1748046875, 24.18212890625, 25.189453125, 26.19677734375, 27.2041015625, 28.21142578125, 29.21875]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 6.0, 5.0, 17.0, 21.0, 29.0, 59.0, 70.0, 118.0, 211.0, 289.0, 474.0, 776.0, 1200.0, 1805.0, 2813.0, 4232.0, 6563.0, 10076.0, 15402.0, 22601.0, 33165.0, 47306.0, 63775.0, 82123.0, 97839.0, 108688.0, 110310.0, 103356.0, 89652.0, 71684.0, 54390.0, 39240.0, 27145.0, 18360.0, 12193.0, 7988.0, 5110.0, 3337.0, 2209.0, 1362.0, 909.0, 596.0, 370.0, 244.0, 157.0, 94.0, 64.0, 48.0, 21.0, 17.0, 11.0, 17.0, 9.0, 5.0, 1.0, 1.0, 3.0], "bins": [-19.09375, -18.51904296875, -17.9443359375, -17.36962890625, -16.794921875, -16.22021484375, -15.6455078125, -15.07080078125, -14.49609375, -13.92138671875, -13.3466796875, -12.77197265625, -12.197265625, -11.62255859375, -11.0478515625, -10.47314453125, -9.8984375, -9.32373046875, -8.7490234375, -8.17431640625, -7.599609375, -7.02490234375, -6.4501953125, -5.87548828125, -5.30078125, -4.72607421875, -4.1513671875, -3.57666015625, -3.001953125, -2.42724609375, -1.8525390625, -1.27783203125, -0.703125, -0.12841796875, 0.4462890625, 1.02099609375, 1.595703125, 2.17041015625, 2.7451171875, 3.31982421875, 3.89453125, 4.46923828125, 5.0439453125, 5.61865234375, 6.193359375, 6.76806640625, 7.3427734375, 7.91748046875, 8.4921875, 9.06689453125, 9.6416015625, 10.21630859375, 10.791015625, 11.36572265625, 11.9404296875, 12.51513671875, 13.08984375, 13.66455078125, 14.2392578125, 14.81396484375, 15.388671875, 15.96337890625, 16.5380859375, 17.11279296875, 17.6875]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 7.0, 2.0, 1.0, 8.0, 7.0, 10.0, 16.0, 23.0, 15.0, 15.0, 22.0, 25.0, 19.0, 35.0, 40.0, 50.0, 42.0, 38.0, 44.0, 42.0, 47.0, 37.0, 40.0, 38.0, 41.0, 30.0, 40.0, 48.0, 28.0, 27.0, 24.0, 21.0, 25.0, 14.0, 11.0, 18.0, 12.0, 12.0, 9.0, 6.0, 5.0, 4.0, 5.0, 1.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.625, -20.950439453125, -20.27587890625, -19.601318359375, -18.9267578125, -18.252197265625, -17.57763671875, -16.903076171875, -16.228515625, -15.553955078125, -14.87939453125, -14.204833984375, -13.5302734375, -12.855712890625, -12.18115234375, -11.506591796875, -10.83203125, -10.157470703125, -9.48291015625, -8.808349609375, -8.1337890625, -7.459228515625, -6.78466796875, -6.110107421875, -5.435546875, -4.760986328125, -4.08642578125, -3.411865234375, -2.7373046875, -2.062744140625, -1.38818359375, -0.713623046875, -0.0390625, 0.635498046875, 1.31005859375, 1.984619140625, 2.6591796875, 3.333740234375, 4.00830078125, 4.682861328125, 5.357421875, 6.031982421875, 6.70654296875, 7.381103515625, 8.0556640625, 8.730224609375, 9.40478515625, 10.079345703125, 10.75390625, 11.428466796875, 12.10302734375, 12.777587890625, 13.4521484375, 14.126708984375, 14.80126953125, 15.475830078125, 16.150390625, 16.824951171875, 17.49951171875, 18.174072265625, 18.8486328125, 19.523193359375, 20.19775390625, 20.872314453125, 21.546875]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 11.0, 16.0, 17.0, 17.0, 26.0, 51.0, 74.0, 109.0, 189.0, 279.0, 510.0, 817.0, 1293.0, 2301.0, 3863.0, 6650.0, 11259.0, 18541.0, 30526.0, 48836.0, 72589.0, 100901.0, 125804.0, 137525.0, 132739.0, 113472.0, 85668.0, 58798.0, 38289.0, 23359.0, 13813.0, 8248.0, 4835.0, 2929.0, 1657.0, 993.0, 610.0, 319.0, 213.0, 137.0, 85.0, 64.0, 37.0, 28.0, 23.0, 18.0, 8.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0], "bins": [-6.3671875, -6.172607421875, -5.97802734375, -5.783447265625, -5.5888671875, -5.394287109375, -5.19970703125, -5.005126953125, -4.810546875, -4.615966796875, -4.42138671875, -4.226806640625, -4.0322265625, -3.837646484375, -3.64306640625, -3.448486328125, -3.25390625, -3.059326171875, -2.86474609375, -2.670166015625, -2.4755859375, -2.281005859375, -2.08642578125, -1.891845703125, -1.697265625, -1.502685546875, -1.30810546875, -1.113525390625, -0.9189453125, -0.724365234375, -0.52978515625, -0.335205078125, -0.140625, 0.053955078125, 0.24853515625, 0.443115234375, 0.6376953125, 0.832275390625, 1.02685546875, 1.221435546875, 1.416015625, 1.610595703125, 1.80517578125, 1.999755859375, 2.1943359375, 2.388916015625, 2.58349609375, 2.778076171875, 2.97265625, 3.167236328125, 3.36181640625, 3.556396484375, 3.7509765625, 3.945556640625, 4.14013671875, 4.334716796875, 4.529296875, 4.723876953125, 4.91845703125, 5.113037109375, 5.3076171875, 5.502197265625, 5.69677734375, 5.891357421875, 6.0859375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 3.0, 8.0, 8.0, 11.0, 7.0, 10.0, 7.0, 16.0, 23.0, 22.0, 21.0, 34.0, 26.0, 34.0, 42.0, 44.0, 52.0, 55.0, 36.0, 58.0, 59.0, 42.0, 51.0, 40.0, 38.0, 43.0, 40.0, 33.0, 31.0, 19.0, 22.0, 11.0, 16.0, 8.0, 9.0, 7.0, 2.0, 6.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0006594657897949219, -0.0006397292017936707, -0.0006199926137924194, -0.0006002560257911682, -0.000580519437789917, -0.0005607828497886658, -0.0005410462617874146, -0.0005213096737861633, -0.0005015730857849121, -0.0004818364977836609, -0.00046209990978240967, -0.00044236332178115845, -0.0004226267337799072, -0.000402890145778656, -0.0003831535577774048, -0.00036341696977615356, -0.00034368038177490234, -0.0003239437937736511, -0.0003042072057723999, -0.0002844706177711487, -0.00026473402976989746, -0.00024499744176864624, -0.00022526085376739502, -0.0002055242657661438, -0.00018578767776489258, -0.00016605108976364136, -0.00014631450176239014, -0.00012657791376113892, -0.0001068413257598877, -8.710473775863647e-05, -6.736814975738525e-05, -4.763156175613403e-05, -2.7894973754882812e-05, -8.158385753631592e-06, 1.1578202247619629e-05, 3.131479024887085e-05, 5.105137825012207e-05, 7.078796625137329e-05, 9.052455425262451e-05, 0.00011026114225387573, 0.00012999773025512695, 0.00014973431825637817, 0.0001694709062576294, 0.00018920749425888062, 0.00020894408226013184, 0.00022868067026138306, 0.0002484172582626343, 0.0002681538462638855, 0.0002878904342651367, 0.00030762702226638794, 0.00032736361026763916, 0.0003471001982688904, 0.0003668367862701416, 0.0003865733742713928, 0.00040630996227264404, 0.00042604655027389526, 0.0004457831382751465, 0.0004655197262763977, 0.0004852563142776489, 0.0005049929022789001, 0.0005247294902801514, 0.0005444660782814026, 0.0005642026662826538, 0.000583939254283905, 0.0006036758422851562]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 4.0, 10.0, 12.0, 13.0, 12.0, 23.0, 45.0, 63.0, 85.0, 124.0, 192.0, 296.0, 434.0, 732.0, 1206.0, 1925.0, 3137.0, 5243.0, 8670.0, 14488.0, 23477.0, 38195.0, 58665.0, 85389.0, 113147.0, 133639.0, 138526.0, 125137.0, 98934.0, 71656.0, 47993.0, 30345.0, 18398.0, 11186.0, 6620.0, 4019.0, 2487.0, 1455.0, 916.0, 557.0, 393.0, 239.0, 163.0, 100.0, 65.0, 52.0, 33.0, 22.0, 16.0, 13.0, 1.0, 3.0, 6.0, 2.0, 0.0, 0.0, 2.0], "bins": [-6.96484375, -6.75537109375, -6.5458984375, -6.33642578125, -6.126953125, -5.91748046875, -5.7080078125, -5.49853515625, -5.2890625, -5.07958984375, -4.8701171875, -4.66064453125, -4.451171875, -4.24169921875, -4.0322265625, -3.82275390625, -3.61328125, -3.40380859375, -3.1943359375, -2.98486328125, -2.775390625, -2.56591796875, -2.3564453125, -2.14697265625, -1.9375, -1.72802734375, -1.5185546875, -1.30908203125, -1.099609375, -0.89013671875, -0.6806640625, -0.47119140625, -0.26171875, -0.05224609375, 0.1572265625, 0.36669921875, 0.576171875, 0.78564453125, 0.9951171875, 1.20458984375, 1.4140625, 1.62353515625, 1.8330078125, 2.04248046875, 2.251953125, 2.46142578125, 2.6708984375, 2.88037109375, 3.08984375, 3.29931640625, 3.5087890625, 3.71826171875, 3.927734375, 4.13720703125, 4.3466796875, 4.55615234375, 4.765625, 4.97509765625, 5.1845703125, 5.39404296875, 5.603515625, 5.81298828125, 6.0224609375, 6.23193359375, 6.44140625]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 5.0, 0.0, 3.0, 3.0, 6.0, 3.0, 4.0, 14.0, 8.0, 19.0, 24.0, 26.0, 25.0, 51.0, 44.0, 54.0, 57.0, 54.0, 75.0, 55.0, 61.0, 50.0, 63.0, 46.0, 43.0, 39.0, 37.0, 27.0, 26.0, 29.0, 13.0, 8.0, 7.0, 7.0, 3.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0], "bins": [-4.7265625, -4.599761962890625, -4.47296142578125, -4.346160888671875, -4.2193603515625, -4.092559814453125, -3.96575927734375, -3.838958740234375, -3.712158203125, -3.585357666015625, -3.45855712890625, -3.331756591796875, -3.2049560546875, -3.078155517578125, -2.95135498046875, -2.824554443359375, -2.69775390625, -2.570953369140625, -2.44415283203125, -2.317352294921875, -2.1905517578125, -2.063751220703125, -1.93695068359375, -1.810150146484375, -1.683349609375, -1.556549072265625, -1.42974853515625, -1.302947998046875, -1.1761474609375, -1.049346923828125, -0.92254638671875, -0.795745849609375, -0.6689453125, -0.542144775390625, -0.41534423828125, -0.288543701171875, -0.1617431640625, -0.034942626953125, 0.09185791015625, 0.218658447265625, 0.345458984375, 0.472259521484375, 0.59906005859375, 0.725860595703125, 0.8526611328125, 0.979461669921875, 1.10626220703125, 1.233062744140625, 1.35986328125, 1.486663818359375, 1.61346435546875, 1.740264892578125, 1.8670654296875, 1.993865966796875, 2.12066650390625, 2.247467041015625, 2.374267578125, 2.501068115234375, 2.62786865234375, 2.754669189453125, 2.8814697265625, 3.008270263671875, 3.13507080078125, 3.261871337890625, 3.388671875]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 5.0, 5.0, 6.0, 6.0, 7.0, 13.0, 15.0, 15.0, 30.0, 29.0, 28.0, 40.0, 40.0, 47.0, 44.0, 53.0, 47.0, 40.0, 49.0, 52.0, 43.0, 49.0, 42.0, 48.0, 44.0, 28.0, 26.0, 23.0, 27.0, 15.0, 25.0, 15.0, 11.0, 11.0, 5.0, 3.0, 5.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-30.218372344970703, -29.295364379882812, -28.37235450744629, -27.4493465423584, -26.526336669921875, -25.603328704833984, -24.680320739746094, -23.75731086730957, -22.834300994873047, -21.911293029785156, -20.988283157348633, -20.065275192260742, -19.14226531982422, -18.219257354736328, -17.296249389648438, -16.373239517211914, -15.450231552124023, -14.527222633361816, -13.60421371459961, -12.681205749511719, -11.758195877075195, -10.835187911987305, -9.912178993225098, -8.98917007446289, -8.066161155700684, -7.143152236938477, -6.2201433181762695, -5.297134876251221, -4.374125957489014, -3.4511170387268066, -2.528108596801758, -1.6050996780395508, -0.6820926666259766, 0.24091613292694092, 1.1639249324798584, 2.0869336128234863, 3.0099425315856934, 3.9329514503479004, 4.855959892272949, 5.778968811035156, 6.701977729797363, 7.62498664855957, 8.547995567321777, 9.471004486083984, 10.394012451171875, 11.317022323608398, 12.240030288696289, 13.163039207458496, 14.086048126220703, 15.00905704498291, 15.932065963745117, 16.855073928833008, 17.77808380126953, 18.701091766357422, 19.624099731445312, 20.547109603881836, 21.47011947631836, 22.39312744140625, 23.316137313842773, 24.239145278930664, 25.162155151367188, 26.085163116455078, 27.00817108154297, 27.931180953979492, 28.854188919067383]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 5.0, 3.0, 6.0, 5.0, 11.0, 13.0, 15.0, 13.0, 25.0, 14.0, 18.0, 26.0, 24.0, 27.0, 36.0, 37.0, 30.0, 43.0, 40.0, 47.0, 42.0, 37.0, 42.0, 39.0, 37.0, 40.0, 34.0, 45.0, 34.0, 31.0, 28.0, 21.0, 15.0, 18.0, 14.0, 10.0, 15.0, 14.0, 9.0, 9.0, 9.0, 6.0, 6.0, 2.0, 5.0, 4.0, 2.0, 2.0], "bins": [-38.59059143066406, -37.560340881347656, -36.53009033203125, -35.499839782714844, -34.46958923339844, -33.4393424987793, -32.40909194946289, -31.378841400146484, -30.348590850830078, -29.318340301513672, -28.288089752197266, -27.257841110229492, -26.227590560913086, -25.19734001159668, -24.167091369628906, -23.1368408203125, -22.106590270996094, -21.076339721679688, -20.04608917236328, -19.015840530395508, -17.9855899810791, -16.955339431762695, -15.925089836120605, -14.894840240478516, -13.86458969116211, -12.834339141845703, -11.804089546203613, -10.773839950561523, -9.743589401245117, -8.713338851928711, -7.683089256286621, -6.652839183807373, -5.622591018676758, -4.59234094619751, -3.5620908737182617, -2.5318408012390137, -1.5015907287597656, -0.4713406562805176, 0.5589094161987305, 1.5891594886779785, 2.6194095611572266, 3.6496596336364746, 4.679909706115723, 5.710159778594971, 6.740409851074219, 7.770659923553467, 8.800909996032715, 9.831159591674805, 10.861410140991211, 11.891660690307617, 12.921910285949707, 13.952159881591797, 14.982410430908203, 16.01266098022461, 17.042911529541016, 18.07316017150879, 19.103410720825195, 20.1336612701416, 21.163909912109375, 22.19416046142578, 23.224411010742188, 24.254661560058594, 25.284912109375, 26.315160751342773, 27.34541130065918]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 5.0, 5.0, 12.0, 19.0, 38.0, 47.0, 71.0, 129.0, 207.0, 316.0, 534.0, 828.0, 1308.0, 2019.0, 3227.0, 5065.0, 7608.0, 12053.0, 18841.0, 28784.0, 43320.0, 65532.0, 96024.0, 138130.0, 190623.0, 255226.0, 321106.0, 380514.0, 419803.0, 427871.0, 401699.0, 352219.0, 286382.0, 221202.0, 162847.0, 115968.0, 79076.0, 54303.0, 35796.0, 23536.0, 15175.0, 9722.0, 6309.0, 3995.0, 2521.0, 1621.0, 1050.0, 598.0, 355.0, 262.0, 162.0, 98.0, 49.0, 35.0, 20.0, 14.0, 9.0, 6.0, 1.0, 3.0, 1.0], "bins": [-18.1875, -17.62353515625, -17.0595703125, -16.49560546875, -15.931640625, -15.36767578125, -14.8037109375, -14.23974609375, -13.67578125, -13.11181640625, -12.5478515625, -11.98388671875, -11.419921875, -10.85595703125, -10.2919921875, -9.72802734375, -9.1640625, -8.60009765625, -8.0361328125, -7.47216796875, -6.908203125, -6.34423828125, -5.7802734375, -5.21630859375, -4.65234375, -4.08837890625, -3.5244140625, -2.96044921875, -2.396484375, -1.83251953125, -1.2685546875, -0.70458984375, -0.140625, 0.42333984375, 0.9873046875, 1.55126953125, 2.115234375, 2.67919921875, 3.2431640625, 3.80712890625, 4.37109375, 4.93505859375, 5.4990234375, 6.06298828125, 6.626953125, 7.19091796875, 7.7548828125, 8.31884765625, 8.8828125, 9.44677734375, 10.0107421875, 10.57470703125, 11.138671875, 11.70263671875, 12.2666015625, 12.83056640625, 13.39453125, 13.95849609375, 14.5224609375, 15.08642578125, 15.650390625, 16.21435546875, 16.7783203125, 17.34228515625, 17.90625]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 5.0, 3.0, 4.0, 10.0, 13.0, 11.0, 17.0, 16.0, 23.0, 14.0, 19.0, 26.0, 29.0, 25.0, 38.0, 34.0, 37.0, 43.0, 44.0, 48.0, 36.0, 38.0, 36.0, 46.0, 35.0, 39.0, 36.0, 45.0, 27.0, 28.0, 29.0, 15.0, 19.0, 15.0, 13.0, 9.0, 18.0, 11.0, 11.0, 5.0, 8.0, 8.0, 4.0, 3.0, 6.0, 2.0, 2.0, 1.0], "bins": [-30.59375, -29.766845703125, -28.93994140625, -28.113037109375, -27.2861328125, -26.459228515625, -25.63232421875, -24.805419921875, -23.978515625, -23.151611328125, -22.32470703125, -21.497802734375, -20.6708984375, -19.843994140625, -19.01708984375, -18.190185546875, -17.36328125, -16.536376953125, -15.70947265625, -14.882568359375, -14.0556640625, -13.228759765625, -12.40185546875, -11.574951171875, -10.748046875, -9.921142578125, -9.09423828125, -8.267333984375, -7.4404296875, -6.613525390625, -5.78662109375, -4.959716796875, -4.1328125, -3.305908203125, -2.47900390625, -1.652099609375, -0.8251953125, 0.001708984375, 0.82861328125, 1.655517578125, 2.482421875, 3.309326171875, 4.13623046875, 4.963134765625, 5.7900390625, 6.616943359375, 7.44384765625, 8.270751953125, 9.09765625, 9.924560546875, 10.75146484375, 11.578369140625, 12.4052734375, 13.232177734375, 14.05908203125, 14.885986328125, 15.712890625, 16.539794921875, 17.36669921875, 18.193603515625, 19.0205078125, 19.847412109375, 20.67431640625, 21.501220703125, 22.328125]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 9.0, 24.0, 48.0, 68.0, 138.0, 264.0, 420.0, 748.0, 1313.0, 2201.0, 3853.0, 6531.0, 10690.0, 17561.0, 27799.0, 43576.0, 66471.0, 98473.0, 139897.0, 191682.0, 250314.0, 308866.0, 360325.0, 395645.0, 405747.0, 390819.0, 353599.0, 298991.0, 240275.0, 182361.0, 133345.0, 92932.0, 62453.0, 40672.0, 25516.0, 16254.0, 9812.0, 6036.0, 3610.0, 2064.0, 1239.0, 718.0, 403.0, 221.0, 120.0, 83.0, 44.0, 24.0, 14.0, 10.0, 2.0, 4.0, 4.0, 0.0, 0.0, 1.0], "bins": [-18.109375, -17.55078125, -16.9921875, -16.43359375, -15.875, -15.31640625, -14.7578125, -14.19921875, -13.640625, -13.08203125, -12.5234375, -11.96484375, -11.40625, -10.84765625, -10.2890625, -9.73046875, -9.171875, -8.61328125, -8.0546875, -7.49609375, -6.9375, -6.37890625, -5.8203125, -5.26171875, -4.703125, -4.14453125, -3.5859375, -3.02734375, -2.46875, -1.91015625, -1.3515625, -0.79296875, -0.234375, 0.32421875, 0.8828125, 1.44140625, 2.0, 2.55859375, 3.1171875, 3.67578125, 4.234375, 4.79296875, 5.3515625, 5.91015625, 6.46875, 7.02734375, 7.5859375, 8.14453125, 8.703125, 9.26171875, 9.8203125, 10.37890625, 10.9375, 11.49609375, 12.0546875, 12.61328125, 13.171875, 13.73046875, 14.2890625, 14.84765625, 15.40625, 15.96484375, 16.5234375, 17.08203125, 17.640625]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 7.0, 12.0, 7.0, 18.0, 16.0, 24.0, 29.0, 43.0, 60.0, 51.0, 78.0, 89.0, 65.0, 115.0, 131.0, 119.0, 151.0, 176.0, 159.0, 205.0, 183.0, 215.0, 213.0, 194.0, 183.0, 195.0, 141.0, 160.0, 154.0, 133.0, 130.0, 111.0, 82.0, 71.0, 72.0, 49.0, 55.0, 31.0, 44.0, 18.0, 21.0, 15.0, 10.0, 12.0, 10.0, 10.0, 5.0, 1.0, 5.0, 3.0, 0.0, 0.0, 1.0], "bins": [-12.2421875, -11.8758544921875, -11.509521484375, -11.1431884765625, -10.77685546875, -10.4105224609375, -10.044189453125, -9.6778564453125, -9.3115234375, -8.9451904296875, -8.578857421875, -8.2125244140625, -7.84619140625, -7.4798583984375, -7.113525390625, -6.7471923828125, -6.380859375, -6.0145263671875, -5.648193359375, -5.2818603515625, -4.91552734375, -4.5491943359375, -4.182861328125, -3.8165283203125, -3.4501953125, -3.0838623046875, -2.717529296875, -2.3511962890625, -1.98486328125, -1.6185302734375, -1.252197265625, -0.8858642578125, -0.51953125, -0.1531982421875, 0.213134765625, 0.5794677734375, 0.94580078125, 1.3121337890625, 1.678466796875, 2.0447998046875, 2.4111328125, 2.7774658203125, 3.143798828125, 3.5101318359375, 3.87646484375, 4.2427978515625, 4.609130859375, 4.9754638671875, 5.341796875, 5.7081298828125, 6.074462890625, 6.4407958984375, 6.80712890625, 7.1734619140625, 7.539794921875, 7.9061279296875, 8.2724609375, 8.6387939453125, 9.005126953125, 9.3714599609375, 9.73779296875, 10.1041259765625, 10.470458984375, 10.8367919921875, 11.203125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 7.0, 6.0, 11.0, 7.0, 8.0, 17.0, 23.0, 25.0, 15.0, 23.0, 27.0, 30.0, 28.0, 40.0, 32.0, 30.0, 47.0, 48.0, 38.0, 58.0, 40.0, 36.0, 39.0, 36.0, 34.0, 38.0, 19.0, 26.0, 25.0, 26.0, 25.0, 15.0, 28.0, 11.0, 14.0, 14.0, 5.0, 11.0, 6.0, 5.0, 7.0, 2.0, 4.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-25.808765411376953, -25.046022415161133, -24.283279418945312, -23.520536422729492, -22.757793426513672, -21.995052337646484, -21.232309341430664, -20.469566345214844, -19.706823348999023, -18.944080352783203, -18.181337356567383, -17.418594360351562, -16.655853271484375, -15.893109321594238, -15.130367279052734, -14.367624282836914, -13.604881286621094, -12.842138290405273, -12.079395294189453, -11.31665325164795, -10.553910255432129, -9.791167259216309, -9.028425216674805, -8.265682220458984, -7.502939224243164, -6.740196228027344, -5.977453708648682, -5.2147111892700195, -4.451968193054199, -3.689225435256958, -2.926482677459717, -2.1637401580810547, -1.4009952545166016, -0.6382524967193604, 0.12449026107788086, 0.8872330188751221, 1.6499757766723633, 2.4127185344696045, 3.1754612922668457, 3.938203811645508, 4.700946807861328, 5.463689804077148, 6.2264323234558105, 6.989174842834473, 7.751917839050293, 8.514660835266113, 9.277402877807617, 10.040145874023438, 10.802888870239258, 11.565631866455078, 12.328374862670898, 13.091116905212402, 13.853859901428223, 14.616602897644043, 15.379344940185547, 16.142087936401367, 16.904830932617188, 17.667573928833008, 18.430316925048828, 19.19305992126465, 19.95580291748047, 20.718544006347656, 21.481287002563477, 22.244029998779297, 23.006772994995117]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 2.0, 7.0, 3.0, 12.0, 12.0, 3.0, 13.0, 13.0, 7.0, 8.0, 19.0, 18.0, 13.0, 25.0, 28.0, 36.0, 34.0, 23.0, 40.0, 35.0, 26.0, 34.0, 37.0, 50.0, 38.0, 42.0, 40.0, 31.0, 35.0, 35.0, 31.0, 26.0, 35.0, 27.0, 20.0, 27.0, 19.0, 16.0, 14.0, 13.0, 7.0, 10.0, 10.0, 9.0, 3.0, 3.0, 5.0, 4.0, 5.0, 3.0, 0.0, 1.0, 1.0], "bins": [-32.15996551513672, -31.237821578979492, -30.315677642822266, -29.393535614013672, -28.471391677856445, -27.54924774169922, -26.627103805541992, -25.704959869384766, -24.782817840576172, -23.860673904418945, -22.93852996826172, -22.016387939453125, -21.0942440032959, -20.172100067138672, -19.249956130981445, -18.32781219482422, -17.405668258666992, -16.483524322509766, -15.561381340026855, -14.639237403869629, -13.717094421386719, -12.794950485229492, -11.872806549072266, -10.950662612915039, -10.028519630432129, -9.106375694274902, -8.184232711791992, -7.262088775634766, -6.339945316314697, -5.417801856994629, -4.495657920837402, -3.573514461517334, -2.6513729095458984, -1.7292293310165405, -0.8070857524871826, 0.11505794525146484, 1.0372014045715332, 1.9593448638916016, 2.881488800048828, 3.8036322593688965, 4.725775718688965, 5.647919178009033, 6.570062637329102, 7.492206573486328, 8.414350509643555, 9.336493492126465, 10.258637428283691, 11.180780410766602, 12.102924346923828, 13.025068283081055, 13.947211265563965, 14.869355201721191, 15.791498184204102, 16.713642120361328, 17.635786056518555, 18.55792999267578, 19.480072021484375, 20.4022159576416, 21.324359893798828, 22.246501922607422, 23.16864585876465, 24.090789794921875, 25.0129337310791, 25.935077667236328, 26.857221603393555]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 6.0, 14.0, 18.0, 34.0, 39.0, 86.0, 120.0, 180.0, 263.0, 432.0, 730.0, 1173.0, 1904.0, 3060.0, 5002.0, 8402.0, 13395.0, 21495.0, 34012.0, 50765.0, 74630.0, 100642.0, 126193.0, 137823.0, 129644.0, 105681.0, 79137.0, 55276.0, 36408.0, 23900.0, 14485.0, 8996.0, 5644.0, 3404.0, 2141.0, 1316.0, 786.0, 508.0, 310.0, 193.0, 117.0, 74.0, 46.0, 27.0, 24.0, 8.0, 7.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.87109375, -7.61383056640625, -7.3565673828125, -7.09930419921875, -6.842041015625, -6.58477783203125, -6.3275146484375, -6.07025146484375, -5.81298828125, -5.55572509765625, -5.2984619140625, -5.04119873046875, -4.783935546875, -4.52667236328125, -4.2694091796875, -4.01214599609375, -3.7548828125, -3.49761962890625, -3.2403564453125, -2.98309326171875, -2.725830078125, -2.46856689453125, -2.2113037109375, -1.95404052734375, -1.69677734375, -1.43951416015625, -1.1822509765625, -0.92498779296875, -0.667724609375, -0.41046142578125, -0.1531982421875, 0.10406494140625, 0.361328125, 0.61859130859375, 0.8758544921875, 1.13311767578125, 1.390380859375, 1.64764404296875, 1.9049072265625, 2.16217041015625, 2.41943359375, 2.67669677734375, 2.9339599609375, 3.19122314453125, 3.448486328125, 3.70574951171875, 3.9630126953125, 4.22027587890625, 4.4775390625, 4.73480224609375, 4.9920654296875, 5.24932861328125, 5.506591796875, 5.76385498046875, 6.0211181640625, 6.27838134765625, 6.53564453125, 6.79290771484375, 7.0501708984375, 7.30743408203125, 7.564697265625, 7.82196044921875, 8.0792236328125, 8.33648681640625, 8.59375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 7.0, 3.0, 11.0, 13.0, 2.0, 13.0, 14.0, 4.0, 10.0, 19.0, 17.0, 14.0, 21.0, 33.0, 34.0, 35.0, 22.0, 41.0, 32.0, 27.0, 33.0, 40.0, 49.0, 38.0, 40.0, 43.0, 32.0, 35.0, 33.0, 33.0, 24.0, 37.0, 27.0, 19.0, 27.0, 19.0, 17.0, 14.0, 13.0, 6.0, 11.0, 10.0, 9.0, 3.0, 3.0, 5.0, 4.0, 5.0, 3.0, 0.0, 1.0, 1.0], "bins": [-31.953125, -31.03564453125, -30.1181640625, -29.20068359375, -28.283203125, -27.36572265625, -26.4482421875, -25.53076171875, -24.61328125, -23.69580078125, -22.7783203125, -21.86083984375, -20.943359375, -20.02587890625, -19.1083984375, -18.19091796875, -17.2734375, -16.35595703125, -15.4384765625, -14.52099609375, -13.603515625, -12.68603515625, -11.7685546875, -10.85107421875, -9.93359375, -9.01611328125, -8.0986328125, -7.18115234375, -6.263671875, -5.34619140625, -4.4287109375, -3.51123046875, -2.59375, -1.67626953125, -0.7587890625, 0.15869140625, 1.076171875, 1.99365234375, 2.9111328125, 3.82861328125, 4.74609375, 5.66357421875, 6.5810546875, 7.49853515625, 8.416015625, 9.33349609375, 10.2509765625, 11.16845703125, 12.0859375, 13.00341796875, 13.9208984375, 14.83837890625, 15.755859375, 16.67333984375, 17.5908203125, 18.50830078125, 19.42578125, 20.34326171875, 21.2607421875, 22.17822265625, 23.095703125, 24.01318359375, 24.9306640625, 25.84814453125, 26.765625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 5.0, 14.0, 10.0, 23.0, 51.0, 31.0, 72.0, 100.0, 179.0, 254.0, 384.0, 613.0, 908.0, 1406.0, 2141.0, 3378.0, 5284.0, 7923.0, 12681.0, 21510.0, 47577.0, 859337.0, 35910.0, 18009.0, 10913.0, 6990.0, 4479.0, 2965.0, 1858.0, 1216.0, 805.0, 586.0, 314.0, 213.0, 129.0, 106.0, 61.0, 40.0, 25.0, 19.0, 17.0, 5.0, 4.0, 4.0, 2.0, 6.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-22.53125, -21.875244140625, -21.21923828125, -20.563232421875, -19.9072265625, -19.251220703125, -18.59521484375, -17.939208984375, -17.283203125, -16.627197265625, -15.97119140625, -15.315185546875, -14.6591796875, -14.003173828125, -13.34716796875, -12.691162109375, -12.03515625, -11.379150390625, -10.72314453125, -10.067138671875, -9.4111328125, -8.755126953125, -8.09912109375, -7.443115234375, -6.787109375, -6.131103515625, -5.47509765625, -4.819091796875, -4.1630859375, -3.507080078125, -2.85107421875, -2.195068359375, -1.5390625, -0.883056640625, -0.22705078125, 0.428955078125, 1.0849609375, 1.740966796875, 2.39697265625, 3.052978515625, 3.708984375, 4.364990234375, 5.02099609375, 5.677001953125, 6.3330078125, 6.989013671875, 7.64501953125, 8.301025390625, 8.95703125, 9.613037109375, 10.26904296875, 10.925048828125, 11.5810546875, 12.237060546875, 12.89306640625, 13.549072265625, 14.205078125, 14.861083984375, 15.51708984375, 16.173095703125, 16.8291015625, 17.485107421875, 18.14111328125, 18.797119140625, 19.453125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 5.0, 1.0, 4.0, 2.0, 12.0, 15.0, 12.0, 7.0, 15.0, 19.0, 22.0, 24.0, 29.0, 22.0, 23.0, 26.0, 30.0, 42.0, 23.0, 37.0, 39.0, 44.0, 41.0, 51.0, 34.0, 43.0, 30.0, 31.0, 29.0, 33.0, 27.0, 30.0, 22.0, 24.0, 19.0, 18.0, 29.0, 13.0, 7.0, 16.0, 9.0, 11.0, 7.0, 6.0, 5.0, 5.0, 4.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-18.84375, -18.21875, -17.59375, -16.96875, -16.34375, -15.71875, -15.09375, -14.46875, -13.84375, -13.21875, -12.59375, -11.96875, -11.34375, -10.71875, -10.09375, -9.46875, -8.84375, -8.21875, -7.59375, -6.96875, -6.34375, -5.71875, -5.09375, -4.46875, -3.84375, -3.21875, -2.59375, -1.96875, -1.34375, -0.71875, -0.09375, 0.53125, 1.15625, 1.78125, 2.40625, 3.03125, 3.65625, 4.28125, 4.90625, 5.53125, 6.15625, 6.78125, 7.40625, 8.03125, 8.65625, 9.28125, 9.90625, 10.53125, 11.15625, 11.78125, 12.40625, 13.03125, 13.65625, 14.28125, 14.90625, 15.53125, 16.15625, 16.78125, 17.40625, 18.03125, 18.65625, 19.28125, 19.90625, 20.53125, 21.15625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 0.0, 8.0, 3.0, 9.0, 17.0, 14.0, 21.0, 26.0, 33.0, 42.0, 72.0, 105.0, 122.0, 207.0, 307.0, 435.0, 641.0, 996.0, 1638.0, 2821.0, 5007.0, 9905.0, 20651.0, 53178.0, 883834.0, 35480.0, 15323.0, 7403.0, 4012.0, 2265.0, 1331.0, 861.0, 524.0, 388.0, 266.0, 162.0, 115.0, 92.0, 77.0, 40.0, 39.0, 24.0, 19.0, 13.0, 11.0, 3.0, 6.0, 8.0, 1.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.84033203125, -0.8151016235351562, -0.7898712158203125, -0.7646408081054688, -0.739410400390625, -0.7141799926757812, -0.6889495849609375, -0.6637191772460938, -0.63848876953125, -0.6132583618164062, -0.5880279541015625, -0.5627975463867188, -0.537567138671875, -0.5123367309570312, -0.4871063232421875, -0.46187591552734375, -0.4366455078125, -0.41141510009765625, -0.3861846923828125, -0.36095428466796875, -0.335723876953125, -0.31049346923828125, -0.2852630615234375, -0.26003265380859375, -0.23480224609375, -0.20957183837890625, -0.1843414306640625, -0.15911102294921875, -0.133880615234375, -0.10865020751953125, -0.0834197998046875, -0.05818939208984375, -0.032958984375, -0.00772857666015625, 0.0175018310546875, 0.04273223876953125, 0.067962646484375, 0.09319305419921875, 0.1184234619140625, 0.14365386962890625, 0.16888427734375, 0.19411468505859375, 0.2193450927734375, 0.24457550048828125, 0.269805908203125, 0.29503631591796875, 0.3202667236328125, 0.34549713134765625, 0.3707275390625, 0.39595794677734375, 0.4211883544921875, 0.44641876220703125, 0.471649169921875, 0.49687957763671875, 0.5221099853515625, 0.5473403930664062, 0.57257080078125, 0.5978012084960938, 0.6230316162109375, 0.6482620239257812, 0.673492431640625, 0.6987228393554688, 0.7239532470703125, 0.7491836547851562, 0.7744140625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 7.0, 8.0, 8.0, 13.0, 7.0, 24.0, 15.0, 23.0, 22.0, 35.0, 31.0, 45.0, 40.0, 38.0, 45.0, 37.0, 53.0, 60.0, 56.0, 58.0, 44.0, 35.0, 41.0, 32.0, 39.0, 33.0, 30.0, 24.0, 19.0, 16.0, 9.0, 11.0, 8.0, 8.0, 6.0, 5.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.3649463653564453e-05, -1.3230368494987488e-05, -1.2811273336410522e-05, -1.2392178177833557e-05, -1.1973083019256592e-05, -1.1553987860679626e-05, -1.1134892702102661e-05, -1.0715797543525696e-05, -1.029670238494873e-05, -9.877607226371765e-06, -9.4585120677948e-06, -9.039416909217834e-06, -8.620321750640869e-06, -8.201226592063904e-06, -7.782131433486938e-06, -7.363036274909973e-06, -6.943941116333008e-06, -6.5248459577560425e-06, -6.105750799179077e-06, -5.686655640602112e-06, -5.2675604820251465e-06, -4.848465323448181e-06, -4.429370164871216e-06, -4.0102750062942505e-06, -3.591179847717285e-06, -3.17208468914032e-06, -2.7529895305633545e-06, -2.333894371986389e-06, -1.914799213409424e-06, -1.4957040548324585e-06, -1.0766088962554932e-06, -6.575137376785278e-07, -2.384185791015625e-07, 1.8067657947540283e-07, 5.997717380523682e-07, 1.0188668966293335e-06, 1.4379620552062988e-06, 1.8570572137832642e-06, 2.2761523723602295e-06, 2.695247530937195e-06, 3.11434268951416e-06, 3.5334378480911255e-06, 3.952533006668091e-06, 4.371628165245056e-06, 4.7907233238220215e-06, 5.209818482398987e-06, 5.628913640975952e-06, 6.0480087995529175e-06, 6.467103958129883e-06, 6.886199116706848e-06, 7.3052942752838135e-06, 7.724389433860779e-06, 8.143484592437744e-06, 8.56257975101471e-06, 8.981674909591675e-06, 9.40077006816864e-06, 9.819865226745605e-06, 1.023896038532257e-05, 1.0658055543899536e-05, 1.1077150702476501e-05, 1.1496245861053467e-05, 1.1915341019630432e-05, 1.2334436178207397e-05, 1.2753531336784363e-05, 1.3172626495361328e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 7.0, 5.0, 8.0, 11.0, 15.0, 17.0, 35.0, 58.0, 76.0, 102.0, 149.0, 249.0, 396.0, 514.0, 759.0, 1062.0, 1683.0, 2375.0, 3528.0, 5347.0, 8319.0, 12763.0, 19943.0, 32010.0, 53378.0, 89544.0, 144333.0, 191877.0, 175659.0, 118078.0, 70966.0, 42120.0, 25657.0, 15998.0, 10438.0, 6846.0, 4637.0, 3055.0, 2093.0, 1471.0, 921.0, 672.0, 469.0, 261.0, 237.0, 146.0, 83.0, 67.0, 42.0, 33.0, 20.0, 15.0, 10.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.366943359375, -0.3553962707519531, -0.34384918212890625, -0.3323020935058594, -0.3207550048828125, -0.3092079162597656, -0.29766082763671875, -0.2861137390136719, -0.274566650390625, -0.2630195617675781, -0.25147247314453125, -0.23992538452148438, -0.2283782958984375, -0.21683120727539062, -0.20528411865234375, -0.19373703002929688, -0.18218994140625, -0.17064285278320312, -0.15909576416015625, -0.14754867553710938, -0.1360015869140625, -0.12445449829101562, -0.11290740966796875, -0.10136032104492188, -0.089813232421875, -0.07826614379882812, -0.06671905517578125, -0.055171966552734375, -0.0436248779296875, -0.032077789306640625, -0.02053070068359375, -0.008983612060546875, 0.0025634765625, 0.014110565185546875, 0.02565765380859375, 0.037204742431640625, 0.0487518310546875, 0.060298919677734375, 0.07184600830078125, 0.08339309692382812, 0.094940185546875, 0.10648727416992188, 0.11803436279296875, 0.12958145141601562, 0.1411285400390625, 0.15267562866210938, 0.16422271728515625, 0.17576980590820312, 0.18731689453125, 0.19886398315429688, 0.21041107177734375, 0.22195816040039062, 0.2335052490234375, 0.24505233764648438, 0.25659942626953125, 0.2681465148925781, 0.279693603515625, 0.2912406921386719, 0.30278778076171875, 0.3143348693847656, 0.3258819580078125, 0.3374290466308594, 0.34897613525390625, 0.3605232238769531, 0.3720703125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 5.0, 6.0, 11.0, 13.0, 28.0, 45.0, 76.0, 110.0, 112.0, 140.0, 120.0, 103.0, 65.0, 49.0, 44.0, 13.0, 14.0, 10.0, 3.0, 4.0, 2.0, 0.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.240234375, -0.23180007934570312, -0.22336578369140625, -0.21493148803710938, -0.2064971923828125, -0.19806289672851562, -0.18962860107421875, -0.18119430541992188, -0.172760009765625, -0.16432571411132812, -0.15589141845703125, -0.14745712280273438, -0.1390228271484375, -0.13058853149414062, -0.12215423583984375, -0.11371994018554688, -0.10528564453125, -0.09685134887695312, -0.08841705322265625, -0.07998275756835938, -0.0715484619140625, -0.06311416625976562, -0.05467987060546875, -0.046245574951171875, -0.037811279296875, -0.029376983642578125, -0.02094268798828125, -0.012508392333984375, -0.0040740966796875, 0.004360198974609375, 0.01279449462890625, 0.021228790283203125, 0.0296630859375, 0.038097381591796875, 0.04653167724609375, 0.054965972900390625, 0.0634002685546875, 0.07183456420898438, 0.08026885986328125, 0.08870315551757812, 0.097137451171875, 0.10557174682617188, 0.11400604248046875, 0.12244033813476562, 0.1308746337890625, 0.13930892944335938, 0.14774322509765625, 0.15617752075195312, 0.16461181640625, 0.17304611206054688, 0.18148040771484375, 0.18991470336914062, 0.1983489990234375, 0.20678329467773438, 0.21521759033203125, 0.22365188598632812, 0.232086181640625, 0.24052047729492188, 0.24895477294921875, 0.2573890686035156, 0.2658233642578125, 0.2742576599121094, 0.28269195556640625, 0.2911262512207031, 0.299560546875]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 2.0, 3.0, 6.0, 8.0, 8.0, 8.0, 12.0, 20.0, 19.0, 24.0, 22.0, 18.0, 30.0, 33.0, 33.0, 32.0, 29.0, 42.0, 44.0, 45.0, 58.0, 37.0, 43.0, 43.0, 43.0, 35.0, 33.0, 29.0, 21.0, 22.0, 29.0, 31.0, 18.0, 19.0, 20.0, 17.0, 8.0, 12.0, 7.0, 10.0, 10.0, 3.0, 4.0, 3.0, 1.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-26.682445526123047, -25.908300399780273, -25.1341552734375, -24.360010147094727, -23.585865020751953, -22.811717987060547, -22.037572860717773, -21.263427734375, -20.489282608032227, -19.715137481689453, -18.94099235534668, -18.166847229003906, -17.3927001953125, -16.618555068969727, -15.844409942626953, -15.07026481628418, -14.296119689941406, -13.521974563598633, -12.74782943725586, -11.97368335723877, -11.199538230895996, -10.425393104553223, -9.651247024536133, -8.87710189819336, -8.102956771850586, -7.3288116455078125, -6.554666042327881, -5.780520439147949, -5.006375312805176, -4.232230186462402, -3.4580845832824707, -2.683938980102539, -1.9097938537597656, -1.135648488998413, -0.36150312423706055, 0.412642240524292, 1.1867876052856445, 1.960932970046997, 2.7350783348083496, 3.5092239379882812, 4.283369064331055, 5.057514190673828, 5.83165979385376, 6.605805397033691, 7.379950523376465, 8.154095649719238, 8.928241729736328, 9.702386856079102, 10.476531982421875, 11.250677108764648, 12.024822235107422, 12.798968315124512, 13.573113441467285, 14.347258567810059, 15.121404647827148, 15.895549774169922, 16.669694900512695, 17.44384002685547, 18.217985153198242, 18.992130279541016, 19.766277313232422, 20.540422439575195, 21.31456756591797, 22.088712692260742, 22.862857818603516]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 7.0, 3.0, 11.0, 13.0, 2.0, 13.0, 14.0, 5.0, 9.0, 19.0, 17.0, 14.0, 21.0, 32.0, 34.0, 35.0, 22.0, 41.0, 33.0, 28.0, 32.0, 39.0, 49.0, 36.0, 42.0, 42.0, 32.0, 34.0, 36.0, 30.0, 25.0, 39.0, 27.0, 16.0, 29.0, 18.0, 18.0, 12.0, 15.0, 6.0, 10.0, 12.0, 8.0, 4.0, 2.0, 6.0, 3.0, 5.0, 4.0, 0.0, 1.0, 1.0], "bins": [-31.9002742767334, -30.98528289794922, -30.070293426513672, -29.155302047729492, -28.240312576293945, -27.325321197509766, -26.41033172607422, -25.49534034729004, -24.58034896850586, -23.66535758972168, -22.750368118286133, -21.835376739501953, -20.920387268066406, -20.005395889282227, -19.090404510498047, -18.1754150390625, -17.260425567626953, -16.345434188842773, -15.430444717407227, -14.515453338623047, -13.6004638671875, -12.68547248840332, -11.770482063293457, -10.855491638183594, -9.94050121307373, -9.025510787963867, -8.110520362854004, -7.195529460906982, -6.280539035797119, -5.365548610687256, -4.450557708740234, -3.535567283630371, -2.620576858520508, -1.705586314201355, -0.7905957698822021, 0.12439489364624023, 1.0393853187561035, 1.9543757438659668, 2.8693666458129883, 3.7843570709228516, 4.699347496032715, 5.614337921142578, 6.529328346252441, 7.444319248199463, 8.359310150146484, 9.274299621582031, 10.189291000366211, 11.104281425476074, 12.019271850585938, 12.9342622756958, 13.849252700805664, 14.764244079589844, 15.67923355102539, 16.59422492980957, 17.50921630859375, 18.424205780029297, 19.339195251464844, 20.254186630249023, 21.16917610168457, 22.08416748046875, 22.999156951904297, 23.914148330688477, 24.829139709472656, 25.744129180908203, 26.659120559692383]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 4.0, 6.0, 12.0, 16.0, 32.0, 33.0, 47.0, 77.0, 133.0, 210.0, 301.0, 481.0, 761.0, 1181.0, 1896.0, 2846.0, 4300.0, 6689.0, 10050.0, 14706.0, 21114.0, 30342.0, 41391.0, 55116.0, 69256.0, 83101.0, 93310.0, 99530.0, 98393.0, 91252.0, 79513.0, 65766.0, 51231.0, 38773.0, 27895.0, 19705.0, 13269.0, 9245.0, 5859.0, 3864.0, 2516.0, 1577.0, 981.0, 667.0, 445.0, 249.0, 151.0, 119.0, 52.0, 34.0, 28.0, 16.0, 7.0, 9.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.7421875, -14.2646484375, -13.787109375, -13.3095703125, -12.83203125, -12.3544921875, -11.876953125, -11.3994140625, -10.921875, -10.4443359375, -9.966796875, -9.4892578125, -9.01171875, -8.5341796875, -8.056640625, -7.5791015625, -7.1015625, -6.6240234375, -6.146484375, -5.6689453125, -5.19140625, -4.7138671875, -4.236328125, -3.7587890625, -3.28125, -2.8037109375, -2.326171875, -1.8486328125, -1.37109375, -0.8935546875, -0.416015625, 0.0615234375, 0.5390625, 1.0166015625, 1.494140625, 1.9716796875, 2.44921875, 2.9267578125, 3.404296875, 3.8818359375, 4.359375, 4.8369140625, 5.314453125, 5.7919921875, 6.26953125, 6.7470703125, 7.224609375, 7.7021484375, 8.1796875, 8.6572265625, 9.134765625, 9.6123046875, 10.08984375, 10.5673828125, 11.044921875, 11.5224609375, 12.0, 12.4775390625, 12.955078125, 13.4326171875, 13.91015625, 14.3876953125, 14.865234375, 15.3427734375, 15.8203125]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 6.0, 7.0, 16.0, 1.0, 12.0, 14.0, 6.0, 9.0, 18.0, 16.0, 16.0, 20.0, 35.0, 29.0, 38.0, 21.0, 37.0, 37.0, 23.0, 39.0, 38.0, 44.0, 40.0, 41.0, 42.0, 32.0, 36.0, 36.0, 28.0, 28.0, 38.0, 25.0, 17.0, 29.0, 22.0, 17.0, 11.0, 14.0, 7.0, 11.0, 9.0, 10.0, 4.0, 3.0, 5.0, 3.0, 4.0, 5.0, 0.0, 1.0, 1.0], "bins": [-31.328125, -30.431640625, -29.53515625, -28.638671875, -27.7421875, -26.845703125, -25.94921875, -25.052734375, -24.15625, -23.259765625, -22.36328125, -21.466796875, -20.5703125, -19.673828125, -18.77734375, -17.880859375, -16.984375, -16.087890625, -15.19140625, -14.294921875, -13.3984375, -12.501953125, -11.60546875, -10.708984375, -9.8125, -8.916015625, -8.01953125, -7.123046875, -6.2265625, -5.330078125, -4.43359375, -3.537109375, -2.640625, -1.744140625, -0.84765625, 0.048828125, 0.9453125, 1.841796875, 2.73828125, 3.634765625, 4.53125, 5.427734375, 6.32421875, 7.220703125, 8.1171875, 9.013671875, 9.91015625, 10.806640625, 11.703125, 12.599609375, 13.49609375, 14.392578125, 15.2890625, 16.185546875, 17.08203125, 17.978515625, 18.875, 19.771484375, 20.66796875, 21.564453125, 22.4609375, 23.357421875, 24.25390625, 25.150390625, 26.046875]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 3.0, 10.0, 18.0, 23.0, 54.0, 101.0, 140.0, 215.0, 356.0, 524.0, 791.0, 1221.0, 1986.0, 3129.0, 4884.0, 7560.0, 11856.0, 17232.0, 25024.0, 34938.0, 48199.0, 63548.0, 78639.0, 90887.0, 100409.0, 102695.0, 97738.0, 86936.0, 72878.0, 57373.0, 43387.0, 31285.0, 21739.0, 14946.0, 9855.0, 6409.0, 4199.0, 2677.0, 1719.0, 1081.0, 695.0, 477.0, 280.0, 168.0, 100.0, 56.0, 44.0, 38.0, 17.0, 7.0, 5.0, 5.0, 2.0, 2.0, 4.0], "bins": [-16.96875, -16.4742431640625, -15.979736328125, -15.4852294921875, -14.99072265625, -14.4962158203125, -14.001708984375, -13.5072021484375, -13.0126953125, -12.5181884765625, -12.023681640625, -11.5291748046875, -11.03466796875, -10.5401611328125, -10.045654296875, -9.5511474609375, -9.056640625, -8.5621337890625, -8.067626953125, -7.5731201171875, -7.07861328125, -6.5841064453125, -6.089599609375, -5.5950927734375, -5.1005859375, -4.6060791015625, -4.111572265625, -3.6170654296875, -3.12255859375, -2.6280517578125, -2.133544921875, -1.6390380859375, -1.14453125, -0.6500244140625, -0.155517578125, 0.3389892578125, 0.83349609375, 1.3280029296875, 1.822509765625, 2.3170166015625, 2.8115234375, 3.3060302734375, 3.800537109375, 4.2950439453125, 4.78955078125, 5.2840576171875, 5.778564453125, 6.2730712890625, 6.767578125, 7.2620849609375, 7.756591796875, 8.2510986328125, 8.74560546875, 9.2401123046875, 9.734619140625, 10.2291259765625, 10.7236328125, 11.2181396484375, 11.712646484375, 12.2071533203125, 12.70166015625, 13.1961669921875, 13.690673828125, 14.1851806640625, 14.6796875]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 6.0, 0.0, 8.0, 4.0, 6.0, 6.0, 11.0, 13.0, 12.0, 12.0, 24.0, 19.0, 26.0, 30.0, 29.0, 30.0, 37.0, 37.0, 39.0, 40.0, 42.0, 43.0, 38.0, 41.0, 44.0, 47.0, 31.0, 44.0, 33.0, 34.0, 25.0, 24.0, 32.0, 25.0, 16.0, 15.0, 16.0, 12.0, 12.0, 9.0, 6.0, 7.0, 6.0, 7.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.703125, -17.069580078125, -16.43603515625, -15.802490234375, -15.1689453125, -14.535400390625, -13.90185546875, -13.268310546875, -12.634765625, -12.001220703125, -11.36767578125, -10.734130859375, -10.1005859375, -9.467041015625, -8.83349609375, -8.199951171875, -7.56640625, -6.932861328125, -6.29931640625, -5.665771484375, -5.0322265625, -4.398681640625, -3.76513671875, -3.131591796875, -2.498046875, -1.864501953125, -1.23095703125, -0.597412109375, 0.0361328125, 0.669677734375, 1.30322265625, 1.936767578125, 2.5703125, 3.203857421875, 3.83740234375, 4.470947265625, 5.1044921875, 5.738037109375, 6.37158203125, 7.005126953125, 7.638671875, 8.272216796875, 8.90576171875, 9.539306640625, 10.1728515625, 10.806396484375, 11.43994140625, 12.073486328125, 12.70703125, 13.340576171875, 13.97412109375, 14.607666015625, 15.2412109375, 15.874755859375, 16.50830078125, 17.141845703125, 17.775390625, 18.408935546875, 19.04248046875, 19.676025390625, 20.3095703125, 20.943115234375, 21.57666015625, 22.210205078125, 22.84375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 8.0, 6.0, 16.0, 20.0, 26.0, 39.0, 48.0, 80.0, 103.0, 188.0, 303.0, 474.0, 689.0, 1131.0, 1936.0, 3144.0, 5183.0, 8879.0, 14957.0, 24762.0, 39290.0, 59518.0, 84717.0, 109123.0, 128050.0, 132613.0, 122336.0, 100326.0, 74901.0, 51375.0, 32920.0, 20530.0, 12226.0, 7381.0, 4451.0, 2647.0, 1552.0, 975.0, 584.0, 375.0, 236.0, 156.0, 101.0, 71.0, 48.0, 23.0, 15.0, 11.0, 8.0, 2.0, 7.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-5.66015625, -5.4849853515625, -5.309814453125, -5.1346435546875, -4.95947265625, -4.7843017578125, -4.609130859375, -4.4339599609375, -4.2587890625, -4.0836181640625, -3.908447265625, -3.7332763671875, -3.55810546875, -3.3829345703125, -3.207763671875, -3.0325927734375, -2.857421875, -2.6822509765625, -2.507080078125, -2.3319091796875, -2.15673828125, -1.9815673828125, -1.806396484375, -1.6312255859375, -1.4560546875, -1.2808837890625, -1.105712890625, -0.9305419921875, -0.75537109375, -0.5802001953125, -0.405029296875, -0.2298583984375, -0.0546875, 0.1204833984375, 0.295654296875, 0.4708251953125, 0.64599609375, 0.8211669921875, 0.996337890625, 1.1715087890625, 1.3466796875, 1.5218505859375, 1.697021484375, 1.8721923828125, 2.04736328125, 2.2225341796875, 2.397705078125, 2.5728759765625, 2.748046875, 2.9232177734375, 3.098388671875, 3.2735595703125, 3.44873046875, 3.6239013671875, 3.799072265625, 3.9742431640625, 4.1494140625, 4.3245849609375, 4.499755859375, 4.6749267578125, 4.85009765625, 5.0252685546875, 5.200439453125, 5.3756103515625, 5.55078125]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 4.0, 3.0, 7.0, 14.0, 9.0, 19.0, 18.0, 29.0, 26.0, 33.0, 45.0, 43.0, 42.0, 42.0, 56.0, 69.0, 69.0, 60.0, 50.0, 52.0, 48.0, 40.0, 45.0, 39.0, 27.0, 28.0, 23.0, 13.0, 7.0, 14.0, 10.0, 6.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007290840148925781, -0.0007071644067764282, -0.0006852447986602783, -0.0006633251905441284, -0.0006414055824279785, -0.0006194859743118286, -0.0005975663661956787, -0.0005756467580795288, -0.0005537271499633789, -0.000531807541847229, -0.0005098879337310791, -0.0004879683256149292, -0.0004660487174987793, -0.0004441291093826294, -0.0004222095012664795, -0.0004002898931503296, -0.0003783702850341797, -0.0003564506769180298, -0.0003345310688018799, -0.00031261146068573, -0.0002906918525695801, -0.0002687722444534302, -0.0002468526363372803, -0.00022493302822113037, -0.00020301342010498047, -0.00018109381198883057, -0.00015917420387268066, -0.00013725459575653076, -0.00011533498764038086, -9.341537952423096e-05, -7.149577140808105e-05, -4.957616329193115e-05, -2.765655517578125e-05, -5.736947059631348e-06, 1.6182661056518555e-05, 3.810226917266846e-05, 6.002187728881836e-05, 8.194148540496826e-05, 0.00010386109352111816, 0.00012578070163726807, 0.00014770030975341797, 0.00016961991786956787, 0.00019153952598571777, 0.00021345913410186768, 0.00023537874221801758, 0.0002572983503341675, 0.0002792179584503174, 0.0003011375665664673, 0.0003230571746826172, 0.0003449767827987671, 0.000366896390914917, 0.0003888159990310669, 0.0004107356071472168, 0.0004326552152633667, 0.0004545748233795166, 0.0004764944314956665, 0.0004984140396118164, 0.0005203336477279663, 0.0005422532558441162, 0.0005641728639602661, 0.000586092472076416, 0.0006080120801925659, 0.0006299316883087158, 0.0006518512964248657, 0.0006737709045410156]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 2.0, 15.0, 8.0, 6.0, 14.0, 23.0, 38.0, 51.0, 71.0, 120.0, 172.0, 246.0, 421.0, 751.0, 1280.0, 2217.0, 4232.0, 8254.0, 16209.0, 33415.0, 66689.0, 118343.0, 174143.0, 199706.0, 172568.0, 117215.0, 65621.0, 32980.0, 16146.0, 8022.0, 4189.0, 2174.0, 1288.0, 745.0, 429.0, 256.0, 179.0, 111.0, 69.0, 44.0, 35.0, 21.0, 14.0, 7.0, 9.0, 7.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-9.90625, -9.6190185546875, -9.331787109375, -9.0445556640625, -8.75732421875, -8.4700927734375, -8.182861328125, -7.8956298828125, -7.6083984375, -7.3211669921875, -7.033935546875, -6.7467041015625, -6.45947265625, -6.1722412109375, -5.885009765625, -5.5977783203125, -5.310546875, -5.0233154296875, -4.736083984375, -4.4488525390625, -4.16162109375, -3.8743896484375, -3.587158203125, -3.2999267578125, -3.0126953125, -2.7254638671875, -2.438232421875, -2.1510009765625, -1.86376953125, -1.5765380859375, -1.289306640625, -1.0020751953125, -0.71484375, -0.4276123046875, -0.140380859375, 0.1468505859375, 0.43408203125, 0.7213134765625, 1.008544921875, 1.2957763671875, 1.5830078125, 1.8702392578125, 2.157470703125, 2.4447021484375, 2.73193359375, 3.0191650390625, 3.306396484375, 3.5936279296875, 3.880859375, 4.1680908203125, 4.455322265625, 4.7425537109375, 5.02978515625, 5.3170166015625, 5.604248046875, 5.8914794921875, 6.1787109375, 6.4659423828125, 6.753173828125, 7.0404052734375, 7.32763671875, 7.6148681640625, 7.902099609375, 8.1893310546875, 8.4765625]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 6.0, 3.0, 2.0, 6.0, 9.0, 8.0, 6.0, 11.0, 16.0, 20.0, 17.0, 28.0, 31.0, 34.0, 52.0, 45.0, 50.0, 50.0, 59.0, 52.0, 58.0, 64.0, 57.0, 50.0, 53.0, 44.0, 37.0, 31.0, 29.0, 19.0, 12.0, 16.0, 7.0, 4.0, 9.0, 8.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.95703125, -2.861083984375, -2.76513671875, -2.669189453125, -2.5732421875, -2.477294921875, -2.38134765625, -2.285400390625, -2.189453125, -2.093505859375, -1.99755859375, -1.901611328125, -1.8056640625, -1.709716796875, -1.61376953125, -1.517822265625, -1.421875, -1.325927734375, -1.22998046875, -1.134033203125, -1.0380859375, -0.942138671875, -0.84619140625, -0.750244140625, -0.654296875, -0.558349609375, -0.46240234375, -0.366455078125, -0.2705078125, -0.174560546875, -0.07861328125, 0.017333984375, 0.11328125, 0.209228515625, 0.30517578125, 0.401123046875, 0.4970703125, 0.593017578125, 0.68896484375, 0.784912109375, 0.880859375, 0.976806640625, 1.07275390625, 1.168701171875, 1.2646484375, 1.360595703125, 1.45654296875, 1.552490234375, 1.6484375, 1.744384765625, 1.84033203125, 1.936279296875, 2.0322265625, 2.128173828125, 2.22412109375, 2.320068359375, 2.416015625, 2.511962890625, 2.60791015625, 2.703857421875, 2.7998046875, 2.895751953125, 2.99169921875, 3.087646484375, 3.18359375]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 4.0, 10.0, 6.0, 7.0, 6.0, 16.0, 13.0, 15.0, 18.0, 32.0, 24.0, 26.0, 26.0, 32.0, 34.0, 39.0, 39.0, 54.0, 41.0, 44.0, 38.0, 48.0, 38.0, 50.0, 38.0, 37.0, 40.0, 23.0, 29.0, 17.0, 25.0, 20.0, 30.0, 11.0, 18.0, 8.0, 6.0, 9.0, 5.0, 11.0, 2.0, 5.0, 5.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0], "bins": [-27.606557846069336, -26.806156158447266, -26.005752563476562, -25.205350875854492, -24.40494728088379, -23.60454559326172, -22.804141998291016, -22.003740310668945, -21.203336715698242, -20.402935028076172, -19.60253143310547, -18.8021297454834, -18.001726150512695, -17.201324462890625, -16.400920867919922, -15.600519180297852, -14.800116539001465, -13.999713897705078, -13.199311256408691, -12.398908615112305, -11.598505973815918, -10.798103332519531, -9.997701644897461, -9.197298049926758, -8.396896362304688, -7.596493721008301, -6.796091079711914, -5.995688438415527, -5.195285797119141, -4.394883632659912, -3.5944809913635254, -2.7940783500671387, -1.9936752319335938, -1.193272590637207, -0.39287006855010986, 0.4075324535369873, 1.207935094833374, 2.0083374977111816, 2.8087401390075684, 3.609142780303955, 4.409545421600342, 5.2099480628967285, 6.010350704193115, 6.810752868652344, 7.6111555099487305, 8.411558151245117, 9.211960792541504, 10.01236343383789, 10.812766075134277, 11.613168716430664, 12.41357135772705, 13.213973999023438, 14.014376640319824, 14.814779281616211, 15.615180969238281, 16.415584564208984, 17.215986251831055, 18.016387939453125, 18.816791534423828, 19.6171932220459, 20.4175968170166, 21.217998504638672, 22.018402099609375, 22.818803787231445, 23.61920738220215]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 11.0, 10.0, 2.0, 8.0, 12.0, 14.0, 21.0, 17.0, 23.0, 21.0, 25.0, 21.0, 24.0, 37.0, 43.0, 28.0, 38.0, 29.0, 30.0, 39.0, 37.0, 49.0, 40.0, 43.0, 45.0, 42.0, 31.0, 27.0, 33.0, 19.0, 32.0, 21.0, 25.0, 18.0, 14.0, 8.0, 13.0, 10.0, 7.0, 5.0, 7.0, 6.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-32.7548828125, -31.74823570251465, -30.741588592529297, -29.734943389892578, -28.728296279907227, -27.721649169921875, -26.715003967285156, -25.708356857299805, -24.701709747314453, -23.6950626373291, -22.68841552734375, -21.68177032470703, -20.67512321472168, -19.668476104736328, -18.66183090209961, -17.655183792114258, -16.648536682128906, -15.641889572143555, -14.63524341583252, -13.628597259521484, -12.621950149536133, -11.615303039550781, -10.608656883239746, -9.602010726928711, -8.59536361694336, -7.588716983795166, -6.582070350646973, -5.575423717498779, -4.568777084350586, -3.5621304512023926, -2.555483818054199, -1.5488371849060059, -0.5421924591064453, 0.46445417404174805, 1.4711008071899414, 2.4777474403381348, 3.484394073486328, 4.4910407066345215, 5.497687339782715, 6.504333972930908, 7.510980606079102, 8.517627716064453, 9.524273872375488, 10.530920028686523, 11.537567138671875, 12.544214248657227, 13.550860404968262, 14.557506561279297, 15.564153671264648, 16.57080078125, 17.57744598388672, 18.58409309387207, 19.590740203857422, 20.597387313842773, 21.604034423828125, 22.610679626464844, 23.617326736450195, 24.623973846435547, 25.630619049072266, 26.637266159057617, 27.64391326904297, 28.65056037902832, 29.657207489013672, 30.66385269165039, 31.670499801635742]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 10.0, 8.0, 17.0, 21.0, 54.0, 83.0, 147.0, 247.0, 395.0, 705.0, 1084.0, 1709.0, 2879.0, 4555.0, 7152.0, 11409.0, 18066.0, 27787.0, 41516.0, 62697.0, 90680.0, 129921.0, 178051.0, 233822.0, 293710.0, 349133.0, 387950.0, 405332.0, 395518.0, 360396.0, 308081.0, 249394.0, 191709.0, 140515.0, 99692.0, 69168.0, 46585.0, 30536.0, 19913.0, 12684.0, 8037.0, 5033.0, 3135.0, 1905.0, 1173.0, 711.0, 383.0, 235.0, 135.0, 98.0, 47.0, 32.0, 14.0, 10.0, 8.0, 4.0, 6.0, 1.0, 0.0, 1.0, 2.0], "bins": [-17.203125, -16.641357421875, -16.07958984375, -15.517822265625, -14.9560546875, -14.394287109375, -13.83251953125, -13.270751953125, -12.708984375, -12.147216796875, -11.58544921875, -11.023681640625, -10.4619140625, -9.900146484375, -9.33837890625, -8.776611328125, -8.21484375, -7.653076171875, -7.09130859375, -6.529541015625, -5.9677734375, -5.406005859375, -4.84423828125, -4.282470703125, -3.720703125, -3.158935546875, -2.59716796875, -2.035400390625, -1.4736328125, -0.911865234375, -0.35009765625, 0.211669921875, 0.7734375, 1.335205078125, 1.89697265625, 2.458740234375, 3.0205078125, 3.582275390625, 4.14404296875, 4.705810546875, 5.267578125, 5.829345703125, 6.39111328125, 6.952880859375, 7.5146484375, 8.076416015625, 8.63818359375, 9.199951171875, 9.76171875, 10.323486328125, 10.88525390625, 11.447021484375, 12.0087890625, 12.570556640625, 13.13232421875, 13.694091796875, 14.255859375, 14.817626953125, 15.37939453125, 15.941162109375, 16.5029296875, 17.064697265625, 17.62646484375, 18.188232421875, 18.75]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 6.0, 6.0, 14.0, 4.0, 7.0, 6.0, 15.0, 13.0, 20.0, 15.0, 27.0, 19.0, 28.0, 23.0, 19.0, 39.0, 38.0, 33.0, 32.0, 33.0, 31.0, 35.0, 43.0, 47.0, 36.0, 47.0, 42.0, 41.0, 30.0, 30.0, 29.0, 24.0, 27.0, 20.0, 25.0, 17.0, 15.0, 9.0, 13.0, 11.0, 6.0, 4.0, 9.0, 7.0, 3.0, 2.0, 1.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.65625, -25.832275390625, -25.00830078125, -24.184326171875, -23.3603515625, -22.536376953125, -21.71240234375, -20.888427734375, -20.064453125, -19.240478515625, -18.41650390625, -17.592529296875, -16.7685546875, -15.944580078125, -15.12060546875, -14.296630859375, -13.47265625, -12.648681640625, -11.82470703125, -11.000732421875, -10.1767578125, -9.352783203125, -8.52880859375, -7.704833984375, -6.880859375, -6.056884765625, -5.23291015625, -4.408935546875, -3.5849609375, -2.760986328125, -1.93701171875, -1.113037109375, -0.2890625, 0.534912109375, 1.35888671875, 2.182861328125, 3.0068359375, 3.830810546875, 4.65478515625, 5.478759765625, 6.302734375, 7.126708984375, 7.95068359375, 8.774658203125, 9.5986328125, 10.422607421875, 11.24658203125, 12.070556640625, 12.89453125, 13.718505859375, 14.54248046875, 15.366455078125, 16.1904296875, 17.014404296875, 17.83837890625, 18.662353515625, 19.486328125, 20.310302734375, 21.13427734375, 21.958251953125, 22.7822265625, 23.606201171875, 24.43017578125, 25.254150390625, 26.078125]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 2.0, 17.0, 25.0, 42.0, 63.0, 101.0, 221.0, 368.0, 619.0, 991.0, 1601.0, 2842.0, 4723.0, 7467.0, 11954.0, 19153.0, 29537.0, 44241.0, 65146.0, 93922.0, 129274.0, 172604.0, 218820.0, 267927.0, 312158.0, 347493.0, 366415.0, 365403.0, 347219.0, 312722.0, 267493.0, 219301.0, 171108.0, 129080.0, 93291.0, 65665.0, 44840.0, 29941.0, 19027.0, 12256.0, 7630.0, 4681.0, 2731.0, 1702.0, 1037.0, 588.0, 345.0, 210.0, 126.0, 68.0, 45.0, 22.0, 20.0, 10.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.9375, -15.40625, -14.875, -14.34375, -13.8125, -13.28125, -12.75, -12.21875, -11.6875, -11.15625, -10.625, -10.09375, -9.5625, -9.03125, -8.5, -7.96875, -7.4375, -6.90625, -6.375, -5.84375, -5.3125, -4.78125, -4.25, -3.71875, -3.1875, -2.65625, -2.125, -1.59375, -1.0625, -0.53125, 0.0, 0.53125, 1.0625, 1.59375, 2.125, 2.65625, 3.1875, 3.71875, 4.25, 4.78125, 5.3125, 5.84375, 6.375, 6.90625, 7.4375, 7.96875, 8.5, 9.03125, 9.5625, 10.09375, 10.625, 11.15625, 11.6875, 12.21875, 12.75, 13.28125, 13.8125, 14.34375, 14.875, 15.40625, 15.9375, 16.46875, 17.0, 17.53125, 18.0625]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 6.0, 11.0, 5.0, 12.0, 12.0, 28.0, 29.0, 44.0, 53.0, 64.0, 74.0, 68.0, 102.0, 109.0, 128.0, 146.0, 180.0, 158.0, 176.0, 197.0, 195.0, 204.0, 190.0, 202.0, 194.0, 169.0, 193.0, 161.0, 145.0, 138.0, 142.0, 96.0, 84.0, 75.0, 61.0, 43.0, 48.0, 43.0, 22.0, 25.0, 11.0, 19.0, 5.0, 6.0, 2.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.96875, -12.57763671875, -12.1865234375, -11.79541015625, -11.404296875, -11.01318359375, -10.6220703125, -10.23095703125, -9.83984375, -9.44873046875, -9.0576171875, -8.66650390625, -8.275390625, -7.88427734375, -7.4931640625, -7.10205078125, -6.7109375, -6.31982421875, -5.9287109375, -5.53759765625, -5.146484375, -4.75537109375, -4.3642578125, -3.97314453125, -3.58203125, -3.19091796875, -2.7998046875, -2.40869140625, -2.017578125, -1.62646484375, -1.2353515625, -0.84423828125, -0.453125, -0.06201171875, 0.3291015625, 0.72021484375, 1.111328125, 1.50244140625, 1.8935546875, 2.28466796875, 2.67578125, 3.06689453125, 3.4580078125, 3.84912109375, 4.240234375, 4.63134765625, 5.0224609375, 5.41357421875, 5.8046875, 6.19580078125, 6.5869140625, 6.97802734375, 7.369140625, 7.76025390625, 8.1513671875, 8.54248046875, 8.93359375, 9.32470703125, 9.7158203125, 10.10693359375, 10.498046875, 10.88916015625, 11.2802734375, 11.67138671875, 12.0625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 1.0, 3.0, 9.0, 5.0, 11.0, 12.0, 20.0, 17.0, 26.0, 20.0, 18.0, 30.0, 32.0, 33.0, 34.0, 44.0, 53.0, 46.0, 47.0, 55.0, 44.0, 41.0, 39.0, 38.0, 43.0, 52.0, 35.0, 38.0, 23.0, 17.0, 17.0, 14.0, 28.0, 12.0, 9.0, 4.0, 8.0, 6.0, 4.0, 5.0, 3.0, 7.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.915828704833984, -27.016340255737305, -26.116853713989258, -25.217365264892578, -24.31787872314453, -23.41839027404785, -22.518901824951172, -21.619415283203125, -20.719926834106445, -19.820438385009766, -18.92095184326172, -18.02146339416504, -17.12197494506836, -16.222488403320312, -15.322999954223633, -14.42351245880127, -13.524024963378906, -12.624537467956543, -11.72504997253418, -10.8255615234375, -9.926074028015137, -9.026586532592773, -8.127098083496094, -7.2276105880737305, -6.328123092651367, -5.428635597229004, -4.529147624969482, -3.62965989112854, -2.7301721572875977, -1.8306846618652344, -0.9311966896057129, -0.031708717346191406, 0.8677787780761719, 1.7672665119171143, 2.6667542457580566, 3.566241979598999, 4.465729713439941, 5.365217208862305, 6.264705181121826, 7.164193153381348, 8.063680648803711, 8.963168144226074, 9.862655639648438, 10.762144088745117, 11.66163158416748, 12.561119079589844, 13.460607528686523, 14.360095024108887, 15.25958251953125, 16.15907096862793, 17.058557510375977, 17.958045959472656, 18.857532501220703, 19.757020950317383, 20.656509399414062, 21.55599594116211, 22.45548439025879, 23.35497283935547, 24.254459381103516, 25.153947830200195, 26.053436279296875, 26.952922821044922, 27.8524112701416, 28.75189971923828, 29.651386260986328]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 5.0, 2.0, 2.0, 7.0, 1.0, 4.0, 6.0, 9.0, 8.0, 12.0, 7.0, 12.0, 16.0, 13.0, 23.0, 23.0, 25.0, 22.0, 18.0, 24.0, 25.0, 35.0, 36.0, 43.0, 45.0, 34.0, 18.0, 27.0, 35.0, 40.0, 41.0, 39.0, 31.0, 26.0, 20.0, 31.0, 39.0, 26.0, 22.0, 14.0, 31.0, 20.0, 10.0, 13.0, 9.0, 8.0, 6.0, 11.0, 12.0, 4.0, 4.0, 5.0, 4.0, 3.0, 4.0, 3.0, 1.0, 2.0], "bins": [-29.9938907623291, -29.104814529418945, -28.215740203857422, -27.326663970947266, -26.43758773803711, -25.548511505126953, -24.659435272216797, -23.770360946655273, -22.881284713745117, -21.99220848083496, -21.103134155273438, -20.21405792236328, -19.324981689453125, -18.43590545654297, -17.546829223632812, -16.65775489807129, -15.768678665161133, -14.879602432250977, -13.990527153015137, -13.101451873779297, -12.21237564086914, -11.323299407958984, -10.434224128723145, -9.545148849487305, -8.656072616577148, -7.76699686050415, -6.877921104431152, -5.988845348358154, -5.099769592285156, -4.210693836212158, -3.32161808013916, -2.432542324066162, -1.5434646606445312, -0.6543889045715332, 0.23468685150146484, 1.123762607574463, 2.012838363647461, 2.901914119720459, 3.790989875793457, 4.680065631866455, 5.569141387939453, 6.458217144012451, 7.347292900085449, 8.236368179321289, 9.125444412231445, 10.014520645141602, 10.903595924377441, 11.792671203613281, 12.681747436523438, 13.570823669433594, 14.459898948669434, 15.348974227905273, 16.23805046081543, 17.127126693725586, 18.01620101928711, 18.905277252197266, 19.794353485107422, 20.683429718017578, 21.572505950927734, 22.461580276489258, 23.350656509399414, 24.23973274230957, 25.128807067871094, 26.01788330078125, 26.906959533691406]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 6.0, 14.0, 19.0, 21.0, 39.0, 69.0, 99.0, 139.0, 210.0, 268.0, 477.0, 680.0, 1071.0, 1665.0, 2653.0, 3986.0, 6061.0, 9229.0, 13483.0, 20393.0, 29552.0, 42342.0, 58968.0, 78072.0, 98302.0, 114779.0, 120207.0, 110402.0, 92915.0, 71535.0, 53192.0, 37610.0, 26441.0, 18043.0, 11970.0, 8094.0, 5289.0, 3627.0, 2348.0, 1482.0, 956.0, 624.0, 424.0, 270.0, 182.0, 150.0, 63.0, 58.0, 33.0, 22.0, 11.0, 11.0, 3.0, 2.0, 3.0, 2.0, 1.0], "bins": [-7.75, -7.517578125, -7.28515625, -7.052734375, -6.8203125, -6.587890625, -6.35546875, -6.123046875, -5.890625, -5.658203125, -5.42578125, -5.193359375, -4.9609375, -4.728515625, -4.49609375, -4.263671875, -4.03125, -3.798828125, -3.56640625, -3.333984375, -3.1015625, -2.869140625, -2.63671875, -2.404296875, -2.171875, -1.939453125, -1.70703125, -1.474609375, -1.2421875, -1.009765625, -0.77734375, -0.544921875, -0.3125, -0.080078125, 0.15234375, 0.384765625, 0.6171875, 0.849609375, 1.08203125, 1.314453125, 1.546875, 1.779296875, 2.01171875, 2.244140625, 2.4765625, 2.708984375, 2.94140625, 3.173828125, 3.40625, 3.638671875, 3.87109375, 4.103515625, 4.3359375, 4.568359375, 4.80078125, 5.033203125, 5.265625, 5.498046875, 5.73046875, 5.962890625, 6.1953125, 6.427734375, 6.66015625, 6.892578125, 7.125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 5.0, 3.0, 1.0, 7.0, 1.0, 4.0, 6.0, 9.0, 8.0, 11.0, 8.0, 11.0, 15.0, 15.0, 22.0, 21.0, 27.0, 22.0, 18.0, 24.0, 25.0, 34.0, 35.0, 42.0, 46.0, 34.0, 20.0, 26.0, 34.0, 41.0, 42.0, 36.0, 32.0, 28.0, 19.0, 33.0, 37.0, 25.0, 23.0, 15.0, 31.0, 21.0, 10.0, 11.0, 10.0, 7.0, 7.0, 10.0, 12.0, 7.0, 3.0, 5.0, 4.0, 3.0, 3.0, 4.0, 1.0, 2.0], "bins": [-29.890625, -29.006591796875, -28.12255859375, -27.238525390625, -26.3544921875, -25.470458984375, -24.58642578125, -23.702392578125, -22.818359375, -21.934326171875, -21.05029296875, -20.166259765625, -19.2822265625, -18.398193359375, -17.51416015625, -16.630126953125, -15.74609375, -14.862060546875, -13.97802734375, -13.093994140625, -12.2099609375, -11.325927734375, -10.44189453125, -9.557861328125, -8.673828125, -7.789794921875, -6.90576171875, -6.021728515625, -5.1376953125, -4.253662109375, -3.36962890625, -2.485595703125, -1.6015625, -0.717529296875, 0.16650390625, 1.050537109375, 1.9345703125, 2.818603515625, 3.70263671875, 4.586669921875, 5.470703125, 6.354736328125, 7.23876953125, 8.122802734375, 9.0068359375, 9.890869140625, 10.77490234375, 11.658935546875, 12.54296875, 13.427001953125, 14.31103515625, 15.195068359375, 16.0791015625, 16.963134765625, 17.84716796875, 18.731201171875, 19.615234375, 20.499267578125, 21.38330078125, 22.267333984375, 23.1513671875, 24.035400390625, 24.91943359375, 25.803466796875, 26.6875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 4.0, 1.0, 4.0, 3.0, 7.0, 12.0, 16.0, 19.0, 30.0, 42.0, 61.0, 101.0, 123.0, 223.0, 303.0, 385.0, 552.0, 881.0, 1178.0, 1715.0, 2511.0, 3680.0, 5306.0, 7419.0, 11117.0, 17357.0, 32572.0, 847398.0, 48701.0, 23433.0, 13919.0, 9266.0, 6255.0, 4332.0, 3017.0, 2001.0, 1393.0, 947.0, 645.0, 520.0, 335.0, 243.0, 173.0, 99.0, 72.0, 69.0, 31.0, 31.0, 18.0, 14.0, 12.0, 5.0, 6.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0], "bins": [-18.375, -17.796142578125, -17.21728515625, -16.638427734375, -16.0595703125, -15.480712890625, -14.90185546875, -14.322998046875, -13.744140625, -13.165283203125, -12.58642578125, -12.007568359375, -11.4287109375, -10.849853515625, -10.27099609375, -9.692138671875, -9.11328125, -8.534423828125, -7.95556640625, -7.376708984375, -6.7978515625, -6.218994140625, -5.64013671875, -5.061279296875, -4.482421875, -3.903564453125, -3.32470703125, -2.745849609375, -2.1669921875, -1.588134765625, -1.00927734375, -0.430419921875, 0.1484375, 0.727294921875, 1.30615234375, 1.885009765625, 2.4638671875, 3.042724609375, 3.62158203125, 4.200439453125, 4.779296875, 5.358154296875, 5.93701171875, 6.515869140625, 7.0947265625, 7.673583984375, 8.25244140625, 8.831298828125, 9.41015625, 9.989013671875, 10.56787109375, 11.146728515625, 11.7255859375, 12.304443359375, 12.88330078125, 13.462158203125, 14.041015625, 14.619873046875, 15.19873046875, 15.777587890625, 16.3564453125, 16.935302734375, 17.51416015625, 18.093017578125, 18.671875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 1.0, 5.0, 7.0, 5.0, 10.0, 17.0, 12.0, 13.0, 12.0, 16.0, 18.0, 14.0, 27.0, 29.0, 35.0, 37.0, 32.0, 36.0, 28.0, 51.0, 45.0, 34.0, 43.0, 44.0, 41.0, 37.0, 34.0, 35.0, 41.0, 38.0, 31.0, 28.0, 17.0, 13.0, 13.0, 16.0, 20.0, 18.0, 10.0, 13.0, 10.0, 4.0, 6.0, 1.0, 4.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-23.0625, -22.376220703125, -21.68994140625, -21.003662109375, -20.3173828125, -19.631103515625, -18.94482421875, -18.258544921875, -17.572265625, -16.885986328125, -16.19970703125, -15.513427734375, -14.8271484375, -14.140869140625, -13.45458984375, -12.768310546875, -12.08203125, -11.395751953125, -10.70947265625, -10.023193359375, -9.3369140625, -8.650634765625, -7.96435546875, -7.278076171875, -6.591796875, -5.905517578125, -5.21923828125, -4.532958984375, -3.8466796875, -3.160400390625, -2.47412109375, -1.787841796875, -1.1015625, -0.415283203125, 0.27099609375, 0.957275390625, 1.6435546875, 2.329833984375, 3.01611328125, 3.702392578125, 4.388671875, 5.074951171875, 5.76123046875, 6.447509765625, 7.1337890625, 7.820068359375, 8.50634765625, 9.192626953125, 9.87890625, 10.565185546875, 11.25146484375, 11.937744140625, 12.6240234375, 13.310302734375, 13.99658203125, 14.682861328125, 15.369140625, 16.055419921875, 16.74169921875, 17.427978515625, 18.1142578125, 18.800537109375, 19.48681640625, 20.173095703125, 20.859375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 12.0, 11.0, 11.0, 22.0, 33.0, 52.0, 59.0, 108.0, 161.0, 245.0, 357.0, 559.0, 875.0, 1472.0, 2688.0, 5143.0, 10496.0, 23502.0, 71646.0, 876018.0, 29010.0, 12361.0, 5979.0, 3130.0, 1743.0, 1052.0, 639.0, 383.0, 254.0, 149.0, 123.0, 73.0, 70.0, 35.0, 27.0, 21.0, 9.0, 5.0, 3.0, 6.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.841796875, -0.8147430419921875, -0.787689208984375, -0.7606353759765625, -0.73358154296875, -0.7065277099609375, -0.679473876953125, -0.6524200439453125, -0.6253662109375, -0.5983123779296875, -0.571258544921875, -0.5442047119140625, -0.51715087890625, -0.4900970458984375, -0.463043212890625, -0.4359893798828125, -0.408935546875, -0.3818817138671875, -0.354827880859375, -0.3277740478515625, -0.30072021484375, -0.2736663818359375, -0.246612548828125, -0.2195587158203125, -0.1925048828125, -0.1654510498046875, -0.138397216796875, -0.1113433837890625, -0.08428955078125, -0.0572357177734375, -0.030181884765625, -0.0031280517578125, 0.02392578125, 0.0509796142578125, 0.078033447265625, 0.1050872802734375, 0.13214111328125, 0.1591949462890625, 0.186248779296875, 0.2133026123046875, 0.2403564453125, 0.2674102783203125, 0.294464111328125, 0.3215179443359375, 0.34857177734375, 0.3756256103515625, 0.402679443359375, 0.4297332763671875, 0.456787109375, 0.4838409423828125, 0.510894775390625, 0.5379486083984375, 0.56500244140625, 0.5920562744140625, 0.619110107421875, 0.6461639404296875, 0.6732177734375, 0.7002716064453125, 0.727325439453125, 0.7543792724609375, 0.78143310546875, 0.8084869384765625, 0.835540771484375, 0.8625946044921875, 0.8896484375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 4.0, 8.0, 6.0, 8.0, 13.0, 12.0, 8.0, 15.0, 24.0, 16.0, 19.0, 20.0, 27.0, 17.0, 33.0, 22.0, 35.0, 41.0, 40.0, 44.0, 45.0, 30.0, 43.0, 38.0, 40.0, 31.0, 35.0, 41.0, 27.0, 31.0, 29.0, 23.0, 29.0, 16.0, 22.0, 10.0, 9.0, 15.0, 14.0, 11.0, 11.0, 10.0, 7.0, 4.0, 3.0, 3.0, 2.0, 6.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.1265277862548828e-05, -1.0932795703411102e-05, -1.0600313544273376e-05, -1.026783138513565e-05, -9.935349225997925e-06, -9.602867066860199e-06, -9.270384907722473e-06, -8.937902748584747e-06, -8.605420589447021e-06, -8.272938430309296e-06, -7.94045627117157e-06, -7.607974112033844e-06, -7.275491952896118e-06, -6.943009793758392e-06, -6.6105276346206665e-06, -6.278045475482941e-06, -5.945563316345215e-06, -5.613081157207489e-06, -5.280598998069763e-06, -4.948116838932037e-06, -4.6156346797943115e-06, -4.283152520656586e-06, -3.95067036151886e-06, -3.618188202381134e-06, -3.285706043243408e-06, -2.9532238841056824e-06, -2.6207417249679565e-06, -2.2882595658302307e-06, -1.955777406692505e-06, -1.623295247554779e-06, -1.2908130884170532e-06, -9.583309292793274e-07, -6.258487701416016e-07, -2.9336661100387573e-07, 3.91155481338501e-08, 3.7159770727157593e-07, 7.040798664093018e-07, 1.0365620255470276e-06, 1.3690441846847534e-06, 1.7015263438224792e-06, 2.034008502960205e-06, 2.366490662097931e-06, 2.6989728212356567e-06, 3.0314549803733826e-06, 3.3639371395111084e-06, 3.6964192986488342e-06, 4.02890145778656e-06, 4.361383616924286e-06, 4.693865776062012e-06, 5.0263479351997375e-06, 5.358830094337463e-06, 5.691312253475189e-06, 6.023794412612915e-06, 6.356276571750641e-06, 6.688758730888367e-06, 7.0212408900260925e-06, 7.353723049163818e-06, 7.686205208301544e-06, 8.01868736743927e-06, 8.351169526576996e-06, 8.683651685714722e-06, 9.016133844852448e-06, 9.348616003990173e-06, 9.6810981631279e-06, 1.0013580322265625e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 7.0, 9.0, 6.0, 9.0, 18.0, 31.0, 48.0, 73.0, 126.0, 183.0, 261.0, 359.0, 653.0, 974.0, 1651.0, 2567.0, 4198.0, 6668.0, 11043.0, 18398.0, 32115.0, 56710.0, 100218.0, 166797.0, 212443.0, 176921.0, 109002.0, 61348.0, 34779.0, 20018.0, 11867.0, 7213.0, 4420.0, 2701.0, 1790.0, 1032.0, 690.0, 402.0, 303.0, 198.0, 109.0, 75.0, 52.0, 26.0, 20.0, 13.0, 8.0, 2.0, 4.0, 2.0, 0.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.334716796875, -0.3230018615722656, -0.31128692626953125, -0.2995719909667969, -0.2878570556640625, -0.2761421203613281, -0.26442718505859375, -0.2527122497558594, -0.240997314453125, -0.22928237915039062, -0.21756744384765625, -0.20585250854492188, -0.1941375732421875, -0.18242263793945312, -0.17070770263671875, -0.15899276733398438, -0.14727783203125, -0.13556289672851562, -0.12384796142578125, -0.11213302612304688, -0.1004180908203125, -0.08870315551757812, -0.07698822021484375, -0.06527328491210938, -0.053558349609375, -0.041843414306640625, -0.03012847900390625, -0.018413543701171875, -0.0066986083984375, 0.005016326904296875, 0.01673126220703125, 0.028446197509765625, 0.0401611328125, 0.051876068115234375, 0.06359100341796875, 0.07530593872070312, 0.0870208740234375, 0.09873580932617188, 0.11045074462890625, 0.12216567993164062, 0.133880615234375, 0.14559555053710938, 0.15731048583984375, 0.16902542114257812, 0.1807403564453125, 0.19245529174804688, 0.20417022705078125, 0.21588516235351562, 0.22760009765625, 0.23931503295898438, 0.25102996826171875, 0.2627449035644531, 0.2744598388671875, 0.2861747741699219, 0.29788970947265625, 0.3096046447753906, 0.321319580078125, 0.3330345153808594, 0.34474945068359375, 0.3564643859863281, 0.3681793212890625, 0.3798942565917969, 0.39160919189453125, 0.4033241271972656, 0.4150390625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 0.0, 3.0, 5.0, 3.0, 3.0, 3.0, 9.0, 12.0, 9.0, 14.0, 13.0, 18.0, 28.0, 30.0, 44.0, 44.0, 73.0, 86.0, 77.0, 91.0, 97.0, 71.0, 59.0, 42.0, 37.0, 25.0, 24.0, 15.0, 12.0, 13.0, 10.0, 7.0, 3.0, 6.0, 8.0, 0.0, 1.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2021484375, -0.1960773468017578, -0.19000625610351562, -0.18393516540527344, -0.17786407470703125, -0.17179298400878906, -0.16572189331054688, -0.1596508026123047, -0.1535797119140625, -0.1475086212158203, -0.14143753051757812, -0.13536643981933594, -0.12929534912109375, -0.12322425842285156, -0.11715316772460938, -0.11108207702636719, -0.105010986328125, -0.09893989562988281, -0.09286880493164062, -0.08679771423339844, -0.08072662353515625, -0.07465553283691406, -0.06858444213867188, -0.06251335144042969, -0.0564422607421875, -0.05037117004394531, -0.044300079345703125, -0.03822898864746094, -0.03215789794921875, -0.026086807250976562, -0.020015716552734375, -0.013944625854492188, -0.00787353515625, -0.0018024444580078125, 0.004268646240234375, 0.010339736938476562, 0.01641082763671875, 0.022481918334960938, 0.028553009033203125, 0.03462409973144531, 0.0406951904296875, 0.04676628112792969, 0.052837371826171875, 0.05890846252441406, 0.06497955322265625, 0.07105064392089844, 0.07712173461914062, 0.08319282531738281, 0.089263916015625, 0.09533500671386719, 0.10140609741210938, 0.10747718811035156, 0.11354827880859375, 0.11961936950683594, 0.12569046020507812, 0.1317615509033203, 0.1378326416015625, 0.1439037322998047, 0.14997482299804688, 0.15604591369628906, 0.16211700439453125, 0.16818809509277344, 0.17425918579101562, 0.1803302764892578, 0.1864013671875]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 8.0, 10.0, 5.0, 15.0, 19.0, 18.0, 19.0, 24.0, 28.0, 24.0, 33.0, 26.0, 41.0, 36.0, 48.0, 56.0, 51.0, 54.0, 37.0, 44.0, 41.0, 36.0, 40.0, 55.0, 42.0, 39.0, 20.0, 18.0, 15.0, 16.0, 20.0, 17.0, 7.0, 12.0, 4.0, 4.0, 3.0, 4.0, 8.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.99443817138672, -27.09003257751465, -26.185626983642578, -25.281221389770508, -24.376815795898438, -23.472410202026367, -22.568004608154297, -21.663599014282227, -20.759193420410156, -19.854787826538086, -18.950382232666016, -18.045976638793945, -17.141571044921875, -16.237165451049805, -15.332759857177734, -14.428354263305664, -13.523947715759277, -12.619542121887207, -11.715136528015137, -10.810730934143066, -9.906325340270996, -9.00191879272461, -8.097513198852539, -7.193108081817627, -6.288702487945557, -5.384296894073486, -4.479891300201416, -3.5754854679107666, -2.6710798740386963, -1.7666740417480469, -0.8622684478759766, 0.04213714599609375, 0.9465427398681641, 1.8509483337402344, 2.7553539276123047, 3.659759759902954, 4.564165115356445, 5.468571186065674, 6.372976779937744, 7.2773823738098145, 8.181787490844727, 9.086193084716797, 9.990598678588867, 10.895004272460938, 11.799409866333008, 12.703815460205078, 13.608221054077148, 14.512626647949219, 15.417033195495605, 16.321439743041992, 17.225845336914062, 18.130250930786133, 19.034656524658203, 19.939062118530273, 20.843467712402344, 21.747873306274414, 22.652278900146484, 23.556684494018555, 24.461090087890625, 25.365495681762695, 26.269901275634766, 27.174306869506836, 28.078712463378906, 28.983118057250977, 29.887523651123047]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 5.0, 2.0, 1.0, 8.0, 1.0, 4.0, 6.0, 7.0, 9.0, 12.0, 8.0, 10.0, 16.0, 15.0, 22.0, 20.0, 28.0, 21.0, 19.0, 23.0, 27.0, 32.0, 36.0, 43.0, 45.0, 32.0, 22.0, 25.0, 34.0, 42.0, 42.0, 34.0, 35.0, 26.0, 21.0, 30.0, 39.0, 24.0, 24.0, 15.0, 31.0, 20.0, 11.0, 11.0, 10.0, 7.0, 7.0, 11.0, 11.0, 7.0, 3.0, 5.0, 4.0, 3.0, 3.0, 4.0, 1.0, 2.0], "bins": [-29.910776138305664, -29.026519775390625, -28.142261505126953, -27.258005142211914, -26.373748779296875, -25.489492416381836, -24.605236053466797, -23.720977783203125, -22.836721420288086, -21.952465057373047, -21.068206787109375, -20.183950424194336, -19.299694061279297, -18.415437698364258, -17.53118133544922, -16.646923065185547, -15.762666702270508, -14.878410339355469, -13.994153022766113, -13.109895706176758, -12.225639343261719, -11.34138298034668, -10.457125663757324, -9.572868347167969, -8.68861198425293, -7.804355144500732, -6.920098304748535, -6.035841464996338, -5.151584625244141, -4.267327785491943, -3.383070945739746, -2.498814105987549, -1.6145553588867188, -0.7302985191345215, 0.15395832061767578, 1.038215160369873, 1.9224720001220703, 2.8067288398742676, 3.690985679626465, 4.575242519378662, 5.459499359130859, 6.343756198883057, 7.228013038635254, 8.11227035522461, 8.996526718139648, 9.880783081054688, 10.765040397644043, 11.649297714233398, 12.533554077148438, 13.417810440063477, 14.302067756652832, 15.186325073242188, 16.070581436157227, 16.954837799072266, 17.839096069335938, 18.723352432250977, 19.607608795166016, 20.491865158081055, 21.376121520996094, 22.260379791259766, 23.144636154174805, 24.028892517089844, 24.913150787353516, 25.797407150268555, 26.681663513183594]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 6.0, 14.0, 17.0, 24.0, 45.0, 81.0, 114.0, 181.0, 270.0, 474.0, 740.0, 1030.0, 1677.0, 2505.0, 3588.0, 5370.0, 7688.0, 11337.0, 16020.0, 22082.0, 29757.0, 39124.0, 50202.0, 61263.0, 72121.0, 80929.0, 86615.0, 87950.0, 85737.0, 78457.0, 69260.0, 57362.0, 46481.0, 36188.0, 27527.0, 20316.0, 14480.0, 10129.0, 7258.0, 4809.0, 3265.0, 2044.0, 1400.0, 945.0, 632.0, 419.0, 231.0, 174.0, 88.0, 59.0, 21.0, 28.0, 9.0, 7.0, 9.0, 1.0, 3.0, 1.0], "bins": [-13.4921875, -13.087646484375, -12.68310546875, -12.278564453125, -11.8740234375, -11.469482421875, -11.06494140625, -10.660400390625, -10.255859375, -9.851318359375, -9.44677734375, -9.042236328125, -8.6376953125, -8.233154296875, -7.82861328125, -7.424072265625, -7.01953125, -6.614990234375, -6.21044921875, -5.805908203125, -5.4013671875, -4.996826171875, -4.59228515625, -4.187744140625, -3.783203125, -3.378662109375, -2.97412109375, -2.569580078125, -2.1650390625, -1.760498046875, -1.35595703125, -0.951416015625, -0.546875, -0.142333984375, 0.26220703125, 0.666748046875, 1.0712890625, 1.475830078125, 1.88037109375, 2.284912109375, 2.689453125, 3.093994140625, 3.49853515625, 3.903076171875, 4.3076171875, 4.712158203125, 5.11669921875, 5.521240234375, 5.92578125, 6.330322265625, 6.73486328125, 7.139404296875, 7.5439453125, 7.948486328125, 8.35302734375, 8.757568359375, 9.162109375, 9.566650390625, 9.97119140625, 10.375732421875, 10.7802734375, 11.184814453125, 11.58935546875, 11.993896484375, 12.3984375]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 1.0, 5.0, 4.0, 3.0, 5.0, 7.0, 9.0, 11.0, 10.0, 7.0, 10.0, 21.0, 17.0, 25.0, 22.0, 21.0, 22.0, 22.0, 28.0, 27.0, 39.0, 37.0, 47.0, 34.0, 25.0, 24.0, 32.0, 42.0, 40.0, 33.0, 42.0, 27.0, 17.0, 32.0, 30.0, 31.0, 31.0, 13.0, 24.0, 25.0, 16.0, 8.0, 15.0, 4.0, 9.0, 8.0, 13.0, 6.0, 4.0, 5.0, 5.0, 3.0, 4.0, 4.0, 1.0, 2.0], "bins": [-29.703125, -28.833251953125, -27.96337890625, -27.093505859375, -26.2236328125, -25.353759765625, -24.48388671875, -23.614013671875, -22.744140625, -21.874267578125, -21.00439453125, -20.134521484375, -19.2646484375, -18.394775390625, -17.52490234375, -16.655029296875, -15.78515625, -14.915283203125, -14.04541015625, -13.175537109375, -12.3056640625, -11.435791015625, -10.56591796875, -9.696044921875, -8.826171875, -7.956298828125, -7.08642578125, -6.216552734375, -5.3466796875, -4.476806640625, -3.60693359375, -2.737060546875, -1.8671875, -0.997314453125, -0.12744140625, 0.742431640625, 1.6123046875, 2.482177734375, 3.35205078125, 4.221923828125, 5.091796875, 5.961669921875, 6.83154296875, 7.701416015625, 8.5712890625, 9.441162109375, 10.31103515625, 11.180908203125, 12.05078125, 12.920654296875, 13.79052734375, 14.660400390625, 15.5302734375, 16.400146484375, 17.27001953125, 18.139892578125, 19.009765625, 19.879638671875, 20.74951171875, 21.619384765625, 22.4892578125, 23.359130859375, 24.22900390625, 25.098876953125, 25.96875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 3.0, 8.0, 7.0, 18.0, 30.0, 41.0, 63.0, 120.0, 164.0, 274.0, 475.0, 739.0, 1236.0, 2092.0, 3164.0, 5110.0, 7889.0, 12091.0, 18186.0, 26552.0, 36975.0, 50267.0, 65276.0, 79737.0, 91952.0, 99600.0, 101043.0, 96128.0, 85228.0, 71679.0, 56801.0, 42523.0, 30936.0, 21393.0, 14487.0, 9547.0, 6169.0, 3998.0, 2440.0, 1603.0, 969.0, 642.0, 359.0, 194.0, 142.0, 89.0, 53.0, 23.0, 23.0, 12.0, 6.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-14.2578125, -13.7860107421875, -13.314208984375, -12.8424072265625, -12.37060546875, -11.8988037109375, -11.427001953125, -10.9552001953125, -10.4833984375, -10.0115966796875, -9.539794921875, -9.0679931640625, -8.59619140625, -8.1243896484375, -7.652587890625, -7.1807861328125, -6.708984375, -6.2371826171875, -5.765380859375, -5.2935791015625, -4.82177734375, -4.3499755859375, -3.878173828125, -3.4063720703125, -2.9345703125, -2.4627685546875, -1.990966796875, -1.5191650390625, -1.04736328125, -0.5755615234375, -0.103759765625, 0.3680419921875, 0.83984375, 1.3116455078125, 1.783447265625, 2.2552490234375, 2.72705078125, 3.1988525390625, 3.670654296875, 4.1424560546875, 4.6142578125, 5.0860595703125, 5.557861328125, 6.0296630859375, 6.50146484375, 6.9732666015625, 7.445068359375, 7.9168701171875, 8.388671875, 8.8604736328125, 9.332275390625, 9.8040771484375, 10.27587890625, 10.7476806640625, 11.219482421875, 11.6912841796875, 12.1630859375, 12.6348876953125, 13.106689453125, 13.5784912109375, 14.05029296875, 14.5220947265625, 14.993896484375, 15.4656982421875, 15.9375]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 6.0, 10.0, 8.0, 12.0, 13.0, 11.0, 15.0, 20.0, 17.0, 17.0, 23.0, 23.0, 31.0, 29.0, 41.0, 28.0, 40.0, 40.0, 34.0, 39.0, 38.0, 34.0, 34.0, 36.0, 35.0, 37.0, 26.0, 20.0, 33.0, 24.0, 27.0, 40.0, 17.0, 17.0, 21.0, 23.0, 13.0, 13.0, 8.0, 17.0, 12.0, 5.0, 3.0, 4.0, 2.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-18.359375, -17.772216796875, -17.18505859375, -16.597900390625, -16.0107421875, -15.423583984375, -14.83642578125, -14.249267578125, -13.662109375, -13.074951171875, -12.48779296875, -11.900634765625, -11.3134765625, -10.726318359375, -10.13916015625, -9.552001953125, -8.96484375, -8.377685546875, -7.79052734375, -7.203369140625, -6.6162109375, -6.029052734375, -5.44189453125, -4.854736328125, -4.267578125, -3.680419921875, -3.09326171875, -2.506103515625, -1.9189453125, -1.331787109375, -0.74462890625, -0.157470703125, 0.4296875, 1.016845703125, 1.60400390625, 2.191162109375, 2.7783203125, 3.365478515625, 3.95263671875, 4.539794921875, 5.126953125, 5.714111328125, 6.30126953125, 6.888427734375, 7.4755859375, 8.062744140625, 8.64990234375, 9.237060546875, 9.82421875, 10.411376953125, 10.99853515625, 11.585693359375, 12.1728515625, 12.760009765625, 13.34716796875, 13.934326171875, 14.521484375, 15.108642578125, 15.69580078125, 16.282958984375, 16.8701171875, 17.457275390625, 18.04443359375, 18.631591796875, 19.21875]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 8.0, 6.0, 9.0, 20.0, 35.0, 55.0, 103.0, 156.0, 214.0, 339.0, 568.0, 866.0, 1386.0, 2290.0, 3769.0, 6049.0, 9632.0, 15214.0, 23747.0, 34759.0, 50486.0, 67902.0, 86457.0, 101676.0, 111688.0, 111706.0, 103181.0, 88214.0, 70265.0, 52738.0, 36735.0, 24952.0, 16277.0, 10288.0, 6377.0, 3925.0, 2472.0, 1501.0, 895.0, 597.0, 343.0, 243.0, 150.0, 107.0, 46.0, 40.0, 30.0, 13.0, 17.0, 3.0, 9.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-4.86328125, -4.71160888671875, -4.5599365234375, -4.40826416015625, -4.256591796875, -4.10491943359375, -3.9532470703125, -3.80157470703125, -3.64990234375, -3.49822998046875, -3.3465576171875, -3.19488525390625, -3.043212890625, -2.89154052734375, -2.7398681640625, -2.58819580078125, -2.4365234375, -2.28485107421875, -2.1331787109375, -1.98150634765625, -1.829833984375, -1.67816162109375, -1.5264892578125, -1.37481689453125, -1.22314453125, -1.07147216796875, -0.9197998046875, -0.76812744140625, -0.616455078125, -0.46478271484375, -0.3131103515625, -0.16143798828125, -0.009765625, 0.14190673828125, 0.2935791015625, 0.44525146484375, 0.596923828125, 0.74859619140625, 0.9002685546875, 1.05194091796875, 1.20361328125, 1.35528564453125, 1.5069580078125, 1.65863037109375, 1.810302734375, 1.96197509765625, 2.1136474609375, 2.26531982421875, 2.4169921875, 2.56866455078125, 2.7203369140625, 2.87200927734375, 3.023681640625, 3.17535400390625, 3.3270263671875, 3.47869873046875, 3.63037109375, 3.78204345703125, 3.9337158203125, 4.08538818359375, 4.237060546875, 4.38873291015625, 4.5404052734375, 4.69207763671875, 4.84375]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 0.0, 3.0, 5.0, 4.0, 8.0, 11.0, 7.0, 11.0, 17.0, 10.0, 17.0, 26.0, 32.0, 25.0, 18.0, 30.0, 31.0, 35.0, 46.0, 43.0, 34.0, 49.0, 39.0, 50.0, 37.0, 40.0, 48.0, 42.0, 43.0, 33.0, 36.0, 32.0, 21.0, 21.0, 19.0, 13.0, 10.0, 12.0, 18.0, 7.0, 6.0, 3.0, 7.0, 0.0, 5.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.000537872314453125, -0.0005209445953369141, -0.0005040168762207031, -0.0004870891571044922, -0.00047016143798828125, -0.0004532337188720703, -0.0004363059997558594, -0.00041937828063964844, -0.0004024505615234375, -0.00038552284240722656, -0.0003685951232910156, -0.0003516674041748047, -0.00033473968505859375, -0.0003178119659423828, -0.0003008842468261719, -0.00028395652770996094, -0.00026702880859375, -0.00025010108947753906, -0.00023317337036132812, -0.0002162456512451172, -0.00019931793212890625, -0.0001823902130126953, -0.00016546249389648438, -0.00014853477478027344, -0.0001316070556640625, -0.00011467933654785156, -9.775161743164062e-05, -8.082389831542969e-05, -6.389617919921875e-05, -4.696846008300781e-05, -3.0040740966796875e-05, -1.3113021850585938e-05, 3.814697265625e-06, 2.0742416381835938e-05, 3.7670135498046875e-05, 5.459785461425781e-05, 7.152557373046875e-05, 8.845329284667969e-05, 0.00010538101196289062, 0.00012230873107910156, 0.0001392364501953125, 0.00015616416931152344, 0.00017309188842773438, 0.0001900196075439453, 0.00020694732666015625, 0.0002238750457763672, 0.00024080276489257812, 0.00025773048400878906, 0.000274658203125, 0.00029158592224121094, 0.0003085136413574219, 0.0003254413604736328, 0.00034236907958984375, 0.0003592967987060547, 0.0003762245178222656, 0.00039315223693847656, 0.0004100799560546875, 0.00042700767517089844, 0.0004439353942871094, 0.0004608631134033203, 0.00047779083251953125, 0.0004947185516357422, 0.0005116462707519531, 0.0005285739898681641, 0.000545501708984375]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [5.0, 1.0, 4.0, 5.0, 4.0, 15.0, 23.0, 26.0, 39.0, 61.0, 106.0, 147.0, 220.0, 347.0, 541.0, 899.0, 1392.0, 2192.0, 3379.0, 5282.0, 8067.0, 12434.0, 18934.0, 27725.0, 39888.0, 55371.0, 72277.0, 89669.0, 103042.0, 109139.0, 107626.0, 96769.0, 81372.0, 64101.0, 47470.0, 33805.0, 22686.0, 15200.0, 10151.0, 6452.0, 4293.0, 2623.0, 1762.0, 1127.0, 689.0, 428.0, 290.0, 154.0, 126.0, 79.0, 51.0, 24.0, 22.0, 14.0, 10.0, 6.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.703125, -4.5450439453125, -4.386962890625, -4.2288818359375, -4.07080078125, -3.9127197265625, -3.754638671875, -3.5965576171875, -3.4384765625, -3.2803955078125, -3.122314453125, -2.9642333984375, -2.80615234375, -2.6480712890625, -2.489990234375, -2.3319091796875, -2.173828125, -2.0157470703125, -1.857666015625, -1.6995849609375, -1.54150390625, -1.3834228515625, -1.225341796875, -1.0672607421875, -0.9091796875, -0.7510986328125, -0.593017578125, -0.4349365234375, -0.27685546875, -0.1187744140625, 0.039306640625, 0.1973876953125, 0.35546875, 0.5135498046875, 0.671630859375, 0.8297119140625, 0.98779296875, 1.1458740234375, 1.303955078125, 1.4620361328125, 1.6201171875, 1.7781982421875, 1.936279296875, 2.0943603515625, 2.25244140625, 2.4105224609375, 2.568603515625, 2.7266845703125, 2.884765625, 3.0428466796875, 3.200927734375, 3.3590087890625, 3.51708984375, 3.6751708984375, 3.833251953125, 3.9913330078125, 4.1494140625, 4.3074951171875, 4.465576171875, 4.6236572265625, 4.78173828125, 4.9398193359375, 5.097900390625, 5.2559814453125, 5.4140625]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 7.0, 2.0, 13.0, 6.0, 10.0, 10.0, 9.0, 14.0, 18.0, 14.0, 21.0, 21.0, 28.0, 27.0, 43.0, 40.0, 35.0, 32.0, 51.0, 45.0, 48.0, 47.0, 46.0, 40.0, 41.0, 28.0, 34.0, 43.0, 35.0, 27.0, 34.0, 15.0, 19.0, 14.0, 14.0, 12.0, 14.0, 14.0, 10.0, 3.0, 2.0, 4.0, 7.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-2.646484375, -2.5615234375, -2.4765625, -2.3916015625, -2.306640625, -2.2216796875, -2.13671875, -2.0517578125, -1.966796875, -1.8818359375, -1.796875, -1.7119140625, -1.626953125, -1.5419921875, -1.45703125, -1.3720703125, -1.287109375, -1.2021484375, -1.1171875, -1.0322265625, -0.947265625, -0.8623046875, -0.77734375, -0.6923828125, -0.607421875, -0.5224609375, -0.4375, -0.3525390625, -0.267578125, -0.1826171875, -0.09765625, -0.0126953125, 0.072265625, 0.1572265625, 0.2421875, 0.3271484375, 0.412109375, 0.4970703125, 0.58203125, 0.6669921875, 0.751953125, 0.8369140625, 0.921875, 1.0068359375, 1.091796875, 1.1767578125, 1.26171875, 1.3466796875, 1.431640625, 1.5166015625, 1.6015625, 1.6865234375, 1.771484375, 1.8564453125, 1.94140625, 2.0263671875, 2.111328125, 2.1962890625, 2.28125, 2.3662109375, 2.451171875, 2.5361328125, 2.62109375, 2.7060546875, 2.791015625]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 2.0, 11.0, 13.0, 13.0, 14.0, 16.0, 23.0, 19.0, 27.0, 28.0, 21.0, 27.0, 43.0, 38.0, 44.0, 46.0, 49.0, 55.0, 49.0, 35.0, 47.0, 41.0, 48.0, 42.0, 38.0, 45.0, 33.0, 25.0, 19.0, 15.0, 12.0, 12.0, 10.0, 7.0, 8.0, 5.0, 8.0, 6.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.380844116210938, -27.474355697631836, -26.567867279052734, -25.661378860473633, -24.75489044189453, -23.848403930664062, -22.94191551208496, -22.03542709350586, -21.128938674926758, -20.222450256347656, -19.315961837768555, -18.409473419189453, -17.502986907958984, -16.59649658203125, -15.690010070800781, -14.78352165222168, -13.877033233642578, -12.970544815063477, -12.064056396484375, -11.15756893157959, -10.251080513000488, -9.344592094421387, -8.438104629516602, -7.5316162109375, -6.625127792358398, -5.718639373779297, -4.8121514320373535, -3.905663251876831, -2.9991750717163086, -2.092686653137207, -1.1861987113952637, -0.2797107696533203, 0.6267757415771484, 1.533263921737671, 2.4397521018981934, 3.346240282058716, 4.252728462219238, 5.15921688079834, 6.065704822540283, 6.972192764282227, 7.878681182861328, 8.78516960144043, 9.691658020019531, 10.598145484924316, 11.504633903503418, 12.41112232208252, 13.317609786987305, 14.224098205566406, 15.130586624145508, 16.03707504272461, 16.94356346130371, 17.850051879882812, 18.75653839111328, 19.663028717041016, 20.569515228271484, 21.476003646850586, 22.382492065429688, 23.28898048400879, 24.19546890258789, 25.101957321166992, 26.008445739746094, 26.914932250976562, 27.821420669555664, 28.727909088134766, 29.634397506713867]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 10.0, 2.0, 8.0, 6.0, 7.0, 11.0, 16.0, 15.0, 15.0, 19.0, 19.0, 36.0, 24.0, 25.0, 36.0, 26.0, 34.0, 39.0, 37.0, 29.0, 32.0, 42.0, 46.0, 48.0, 47.0, 38.0, 27.0, 39.0, 30.0, 24.0, 25.0, 19.0, 23.0, 15.0, 22.0, 23.0, 15.0, 12.0, 8.0, 12.0, 12.0, 6.0, 4.0, 3.0, 2.0, 3.0, 5.0, 3.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.9967155456543, -31.970258712768555, -30.943801879882812, -29.917343139648438, -28.890886306762695, -27.864429473876953, -26.837970733642578, -25.811513900756836, -24.785057067871094, -23.75860023498535, -22.73214340209961, -21.705684661865234, -20.679227828979492, -19.65277099609375, -18.626312255859375, -17.599855422973633, -16.57339859008789, -15.546941757202148, -14.52048397064209, -13.494026184082031, -12.467569351196289, -11.441112518310547, -10.414654731750488, -9.38819694519043, -8.361740112304688, -7.335282802581787, -6.308825492858887, -5.282368183135986, -4.255910873413086, -3.2294535636901855, -2.202996253967285, -1.1765389442443848, -0.15008544921875, 0.8763718605041504, 1.9028291702270508, 2.929286479949951, 3.9557437896728516, 4.982201099395752, 6.008658409118652, 7.035115718841553, 8.061573028564453, 9.088029861450195, 10.114487648010254, 11.140945434570312, 12.167402267456055, 13.193859100341797, 14.220316886901855, 15.246774673461914, 16.273231506347656, 17.2996883392334, 18.32614517211914, 19.352603912353516, 20.379060745239258, 21.405517578125, 22.431976318359375, 23.458433151245117, 24.48488998413086, 25.5113468170166, 26.537803649902344, 27.56426239013672, 28.59071922302246, 29.617176055908203, 30.643634796142578, 31.67009162902832, 32.69654846191406]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 4.0, 6.0, 4.0, 9.0, 14.0, 27.0, 41.0, 74.0, 111.0, 211.0, 384.0, 552.0, 986.0, 1516.0, 2393.0, 3825.0, 6071.0, 9254.0, 14551.0, 21763.0, 33099.0, 47498.0, 67740.0, 95499.0, 129254.0, 169904.0, 213865.0, 262090.0, 305818.0, 339392.0, 357437.0, 357496.0, 340938.0, 308069.0, 265194.0, 218853.0, 172522.0, 132271.0, 97545.0, 70049.0, 48870.0, 34130.0, 22554.0, 15132.0, 9952.0, 6358.0, 4152.0, 2574.0, 1666.0, 990.0, 596.0, 392.0, 231.0, 150.0, 90.0, 50.0, 31.0, 18.0, 23.0, 3.0, 6.0, 2.0, 4.0], "bins": [-17.59375, -17.044677734375, -16.49560546875, -15.946533203125, -15.3974609375, -14.848388671875, -14.29931640625, -13.750244140625, -13.201171875, -12.652099609375, -12.10302734375, -11.553955078125, -11.0048828125, -10.455810546875, -9.90673828125, -9.357666015625, -8.80859375, -8.259521484375, -7.71044921875, -7.161376953125, -6.6123046875, -6.063232421875, -5.51416015625, -4.965087890625, -4.416015625, -3.866943359375, -3.31787109375, -2.768798828125, -2.2197265625, -1.670654296875, -1.12158203125, -0.572509765625, -0.0234375, 0.525634765625, 1.07470703125, 1.623779296875, 2.1728515625, 2.721923828125, 3.27099609375, 3.820068359375, 4.369140625, 4.918212890625, 5.46728515625, 6.016357421875, 6.5654296875, 7.114501953125, 7.66357421875, 8.212646484375, 8.76171875, 9.310791015625, 9.85986328125, 10.408935546875, 10.9580078125, 11.507080078125, 12.05615234375, 12.605224609375, 13.154296875, 13.703369140625, 14.25244140625, 14.801513671875, 15.3505859375, 15.899658203125, 16.44873046875, 16.997802734375, 17.546875]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 4.0, 6.0, 7.0, 8.0, 7.0, 5.0, 16.0, 10.0, 16.0, 15.0, 20.0, 25.0, 29.0, 29.0, 26.0, 27.0, 31.0, 32.0, 39.0, 33.0, 32.0, 35.0, 41.0, 46.0, 51.0, 39.0, 38.0, 29.0, 31.0, 31.0, 28.0, 24.0, 17.0, 25.0, 14.0, 27.0, 19.0, 15.0, 16.0, 9.0, 8.0, 15.0, 6.0, 3.0, 3.0, 2.0, 4.0, 3.0, 2.0, 6.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.84375, -26.97119140625, -26.0986328125, -25.22607421875, -24.353515625, -23.48095703125, -22.6083984375, -21.73583984375, -20.86328125, -19.99072265625, -19.1181640625, -18.24560546875, -17.373046875, -16.50048828125, -15.6279296875, -14.75537109375, -13.8828125, -13.01025390625, -12.1376953125, -11.26513671875, -10.392578125, -9.52001953125, -8.6474609375, -7.77490234375, -6.90234375, -6.02978515625, -5.1572265625, -4.28466796875, -3.412109375, -2.53955078125, -1.6669921875, -0.79443359375, 0.078125, 0.95068359375, 1.8232421875, 2.69580078125, 3.568359375, 4.44091796875, 5.3134765625, 6.18603515625, 7.05859375, 7.93115234375, 8.8037109375, 9.67626953125, 10.548828125, 11.42138671875, 12.2939453125, 13.16650390625, 14.0390625, 14.91162109375, 15.7841796875, 16.65673828125, 17.529296875, 18.40185546875, 19.2744140625, 20.14697265625, 21.01953125, 21.89208984375, 22.7646484375, 23.63720703125, 24.509765625, 25.38232421875, 26.2548828125, 27.12744140625, 28.0]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 6.0, 15.0, 39.0, 48.0, 105.0, 160.0, 275.0, 505.0, 882.0, 1362.0, 2275.0, 3877.0, 6147.0, 9678.0, 15348.0, 23214.0, 35690.0, 51409.0, 73924.0, 102106.0, 137762.0, 179032.0, 222763.0, 266490.0, 306049.0, 335768.0, 349468.0, 348963.0, 332865.0, 300315.0, 260172.0, 215325.0, 171589.0, 131859.0, 97360.0, 69722.0, 49055.0, 32833.0, 21817.0, 14060.0, 9206.0, 5734.0, 3545.0, 2178.0, 1372.0, 831.0, 437.0, 256.0, 166.0, 105.0, 48.0, 27.0, 22.0, 16.0, 10.0, 0.0, 3.0, 2.0], "bins": [-18.453125, -17.892578125, -17.33203125, -16.771484375, -16.2109375, -15.650390625, -15.08984375, -14.529296875, -13.96875, -13.408203125, -12.84765625, -12.287109375, -11.7265625, -11.166015625, -10.60546875, -10.044921875, -9.484375, -8.923828125, -8.36328125, -7.802734375, -7.2421875, -6.681640625, -6.12109375, -5.560546875, -5.0, -4.439453125, -3.87890625, -3.318359375, -2.7578125, -2.197265625, -1.63671875, -1.076171875, -0.515625, 0.044921875, 0.60546875, 1.166015625, 1.7265625, 2.287109375, 2.84765625, 3.408203125, 3.96875, 4.529296875, 5.08984375, 5.650390625, 6.2109375, 6.771484375, 7.33203125, 7.892578125, 8.453125, 9.013671875, 9.57421875, 10.134765625, 10.6953125, 11.255859375, 11.81640625, 12.376953125, 12.9375, 13.498046875, 14.05859375, 14.619140625, 15.1796875, 15.740234375, 16.30078125, 16.861328125, 17.421875]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 6.0, 8.0, 8.0, 10.0, 14.0, 22.0, 18.0, 33.0, 36.0, 51.0, 55.0, 56.0, 87.0, 119.0, 116.0, 142.0, 125.0, 128.0, 169.0, 170.0, 192.0, 191.0, 195.0, 199.0, 206.0, 216.0, 190.0, 185.0, 176.0, 149.0, 145.0, 104.0, 105.0, 85.0, 79.0, 53.0, 34.0, 51.0, 33.0, 29.0, 27.0, 15.0, 7.0, 12.0, 9.0, 5.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.28125, -11.8575439453125, -11.433837890625, -11.0101318359375, -10.58642578125, -10.1627197265625, -9.739013671875, -9.3153076171875, -8.8916015625, -8.4678955078125, -8.044189453125, -7.6204833984375, -7.19677734375, -6.7730712890625, -6.349365234375, -5.9256591796875, -5.501953125, -5.0782470703125, -4.654541015625, -4.2308349609375, -3.80712890625, -3.3834228515625, -2.959716796875, -2.5360107421875, -2.1123046875, -1.6885986328125, -1.264892578125, -0.8411865234375, -0.41748046875, 0.0062255859375, 0.429931640625, 0.8536376953125, 1.27734375, 1.7010498046875, 2.124755859375, 2.5484619140625, 2.97216796875, 3.3958740234375, 3.819580078125, 4.2432861328125, 4.6669921875, 5.0906982421875, 5.514404296875, 5.9381103515625, 6.36181640625, 6.7855224609375, 7.209228515625, 7.6329345703125, 8.056640625, 8.4803466796875, 8.904052734375, 9.3277587890625, 9.75146484375, 10.1751708984375, 10.598876953125, 11.0225830078125, 11.4462890625, 11.8699951171875, 12.293701171875, 12.7174072265625, 13.14111328125, 13.5648193359375, 13.988525390625, 14.4122314453125, 14.8359375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 3.0, 4.0, 9.0, 17.0, 12.0, 15.0, 14.0, 16.0, 20.0, 25.0, 26.0, 32.0, 34.0, 38.0, 37.0, 28.0, 47.0, 47.0, 45.0, 33.0, 30.0, 38.0, 40.0, 43.0, 48.0, 40.0, 27.0, 32.0, 32.0, 25.0, 24.0, 12.0, 16.0, 12.0, 15.0, 10.0, 11.0, 12.0, 10.0, 8.0, 3.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.514690399169922, -28.615232467651367, -27.715774536132812, -26.816316604614258, -25.916858673095703, -25.01740074157715, -24.117942810058594, -23.21848487854004, -22.319026947021484, -21.41956901550293, -20.520111083984375, -19.62065315246582, -18.721195220947266, -17.82173728942871, -16.922279357910156, -16.0228214263916, -15.12336254119873, -14.223904609680176, -13.324446678161621, -12.424988746643066, -11.525530815124512, -10.62607192993164, -9.726613998413086, -8.827156066894531, -7.927698612213135, -7.02824068069458, -6.128782749176025, -5.2293243408203125, -4.329866409301758, -3.430408477783203, -2.5309505462646484, -1.6314926147460938, -0.7320346832275391, 0.1674233078956604, 1.0668812990188599, 1.966339349746704, 2.865797281265259, 3.7652554512023926, 4.664713382720947, 5.564171314239502, 6.463629245758057, 7.363087177276611, 8.262545585632324, 9.162003517150879, 10.061461448669434, 10.960919380187988, 11.860377311706543, 12.759835243225098, 13.659293174743652, 14.558751106262207, 15.458209037780762, 16.357667922973633, 17.257125854492188, 18.156583786010742, 19.056041717529297, 19.95549964904785, 20.854957580566406, 21.75441551208496, 22.653873443603516, 23.55333137512207, 24.452789306640625, 25.35224723815918, 26.251705169677734, 27.15116310119629, 28.050621032714844]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 5.0, 5.0, 9.0, 13.0, 7.0, 14.0, 11.0, 24.0, 13.0, 25.0, 34.0, 40.0, 31.0, 39.0, 41.0, 32.0, 38.0, 43.0, 37.0, 48.0, 31.0, 41.0, 45.0, 32.0, 32.0, 35.0, 33.0, 39.0, 31.0, 25.0, 15.0, 23.0, 14.0, 13.0, 18.0, 8.0, 10.0, 8.0, 17.0, 6.0, 6.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-40.902427673339844, -39.76179885864258, -38.62117004394531, -37.48053741455078, -36.339908599853516, -35.19927978515625, -34.05864715576172, -32.91801834106445, -31.777389526367188, -30.636760711669922, -29.496129989624023, -28.355499267578125, -27.21487045288086, -26.074241638183594, -24.933610916137695, -23.792980194091797, -22.65235137939453, -21.511722564697266, -20.371091842651367, -19.23046112060547, -18.089832305908203, -16.949203491210938, -15.808572769165039, -14.667943000793457, -13.527313232421875, -12.386683464050293, -11.246053695678711, -10.105423927307129, -8.964794158935547, -7.824164390563965, -6.683534622192383, -5.542904853820801, -4.402278900146484, -3.2616491317749023, -2.1210193634033203, -0.9803895950317383, 0.16024017333984375, 1.3008699417114258, 2.441499710083008, 3.58212947845459, 4.722759246826172, 5.863389015197754, 7.004018783569336, 8.144648551940918, 9.2852783203125, 10.425908088684082, 11.566537857055664, 12.707167625427246, 13.847797393798828, 14.98842716217041, 16.129056930541992, 17.26968765258789, 18.410316467285156, 19.550945281982422, 20.69157600402832, 21.83220672607422, 22.972835540771484, 24.11346435546875, 25.25409507751465, 26.394725799560547, 27.535354614257812, 28.675983428955078, 29.816614151000977, 30.957244873046875, 32.09787368774414]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 9.0, 5.0, 34.0, 37.0, 59.0, 87.0, 114.0, 167.0, 277.0, 457.0, 705.0, 1119.0, 1697.0, 2586.0, 3852.0, 5991.0, 9499.0, 13952.0, 20744.0, 30281.0, 42871.0, 59990.0, 80219.0, 99932.0, 114780.0, 118795.0, 109649.0, 92257.0, 70978.0, 52643.0, 37206.0, 25562.0, 17691.0, 11658.0, 7869.0, 5238.0, 3342.0, 2209.0, 1426.0, 849.0, 634.0, 355.0, 264.0, 162.0, 107.0, 66.0, 52.0, 31.0, 18.0, 13.0, 5.0, 8.0, 2.0, 4.0, 4.0, 0.0, 2.0, 1.0], "bins": [-7.86328125, -7.61199951171875, -7.3607177734375, -7.10943603515625, -6.858154296875, -6.60687255859375, -6.3555908203125, -6.10430908203125, -5.85302734375, -5.60174560546875, -5.3504638671875, -5.09918212890625, -4.847900390625, -4.59661865234375, -4.3453369140625, -4.09405517578125, -3.8427734375, -3.59149169921875, -3.3402099609375, -3.08892822265625, -2.837646484375, -2.58636474609375, -2.3350830078125, -2.08380126953125, -1.83251953125, -1.58123779296875, -1.3299560546875, -1.07867431640625, -0.827392578125, -0.57611083984375, -0.3248291015625, -0.07354736328125, 0.177734375, 0.42901611328125, 0.6802978515625, 0.93157958984375, 1.182861328125, 1.43414306640625, 1.6854248046875, 1.93670654296875, 2.18798828125, 2.43927001953125, 2.6905517578125, 2.94183349609375, 3.193115234375, 3.44439697265625, 3.6956787109375, 3.94696044921875, 4.1982421875, 4.44952392578125, 4.7008056640625, 4.95208740234375, 5.203369140625, 5.45465087890625, 5.7059326171875, 5.95721435546875, 6.20849609375, 6.45977783203125, 6.7110595703125, 6.96234130859375, 7.213623046875, 7.46490478515625, 7.7161865234375, 7.96746826171875, 8.21875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 5.0, 5.0, 9.0, 13.0, 7.0, 14.0, 12.0, 23.0, 12.0, 26.0, 33.0, 39.0, 33.0, 39.0, 40.0, 33.0, 38.0, 42.0, 39.0, 45.0, 34.0, 40.0, 45.0, 31.0, 33.0, 35.0, 33.0, 38.0, 32.0, 24.0, 16.0, 23.0, 14.0, 13.0, 18.0, 8.0, 10.0, 9.0, 16.0, 6.0, 6.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-40.6875, -39.55126953125, -38.4150390625, -37.27880859375, -36.142578125, -35.00634765625, -33.8701171875, -32.73388671875, -31.59765625, -30.46142578125, -29.3251953125, -28.18896484375, -27.052734375, -25.91650390625, -24.7802734375, -23.64404296875, -22.5078125, -21.37158203125, -20.2353515625, -19.09912109375, -17.962890625, -16.82666015625, -15.6904296875, -14.55419921875, -13.41796875, -12.28173828125, -11.1455078125, -10.00927734375, -8.873046875, -7.73681640625, -6.6005859375, -5.46435546875, -4.328125, -3.19189453125, -2.0556640625, -0.91943359375, 0.216796875, 1.35302734375, 2.4892578125, 3.62548828125, 4.76171875, 5.89794921875, 7.0341796875, 8.17041015625, 9.306640625, 10.44287109375, 11.5791015625, 12.71533203125, 13.8515625, 14.98779296875, 16.1240234375, 17.26025390625, 18.396484375, 19.53271484375, 20.6689453125, 21.80517578125, 22.94140625, 24.07763671875, 25.2138671875, 26.35009765625, 27.486328125, 28.62255859375, 29.7587890625, 30.89501953125, 32.03125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 5.0, 4.0, 11.0, 19.0, 15.0, 33.0, 47.0, 75.0, 106.0, 180.0, 246.0, 409.0, 660.0, 940.0, 1513.0, 2469.0, 3836.0, 6224.0, 9758.0, 16398.0, 31765.0, 857196.0, 57513.0, 23521.0, 13324.0, 8224.0, 5122.0, 3269.0, 2112.0, 1323.0, 773.0, 531.0, 335.0, 208.0, 131.0, 104.0, 61.0, 39.0, 21.0, 7.0, 13.0, 11.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.125, -23.342041015625, -22.55908203125, -21.776123046875, -20.9931640625, -20.210205078125, -19.42724609375, -18.644287109375, -17.861328125, -17.078369140625, -16.29541015625, -15.512451171875, -14.7294921875, -13.946533203125, -13.16357421875, -12.380615234375, -11.59765625, -10.814697265625, -10.03173828125, -9.248779296875, -8.4658203125, -7.682861328125, -6.89990234375, -6.116943359375, -5.333984375, -4.551025390625, -3.76806640625, -2.985107421875, -2.2021484375, -1.419189453125, -0.63623046875, 0.146728515625, 0.9296875, 1.712646484375, 2.49560546875, 3.278564453125, 4.0615234375, 4.844482421875, 5.62744140625, 6.410400390625, 7.193359375, 7.976318359375, 8.75927734375, 9.542236328125, 10.3251953125, 11.108154296875, 11.89111328125, 12.674072265625, 13.45703125, 14.239990234375, 15.02294921875, 15.805908203125, 16.5888671875, 17.371826171875, 18.15478515625, 18.937744140625, 19.720703125, 20.503662109375, 21.28662109375, 22.069580078125, 22.8525390625, 23.635498046875, 24.41845703125, 25.201416015625, 25.984375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 4.0, 7.0, 2.0, 4.0, 6.0, 6.0, 4.0, 16.0, 12.0, 11.0, 9.0, 7.0, 21.0, 19.0, 23.0, 25.0, 32.0, 39.0, 35.0, 28.0, 33.0, 54.0, 39.0, 36.0, 33.0, 36.0, 33.0, 36.0, 40.0, 39.0, 34.0, 36.0, 27.0, 31.0, 30.0, 19.0, 26.0, 24.0, 17.0, 15.0, 15.0, 8.0, 6.0, 9.0, 9.0, 6.0, 3.0, 1.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.515625, -19.79931640625, -19.0830078125, -18.36669921875, -17.650390625, -16.93408203125, -16.2177734375, -15.50146484375, -14.78515625, -14.06884765625, -13.3525390625, -12.63623046875, -11.919921875, -11.20361328125, -10.4873046875, -9.77099609375, -9.0546875, -8.33837890625, -7.6220703125, -6.90576171875, -6.189453125, -5.47314453125, -4.7568359375, -4.04052734375, -3.32421875, -2.60791015625, -1.8916015625, -1.17529296875, -0.458984375, 0.25732421875, 0.9736328125, 1.68994140625, 2.40625, 3.12255859375, 3.8388671875, 4.55517578125, 5.271484375, 5.98779296875, 6.7041015625, 7.42041015625, 8.13671875, 8.85302734375, 9.5693359375, 10.28564453125, 11.001953125, 11.71826171875, 12.4345703125, 13.15087890625, 13.8671875, 14.58349609375, 15.2998046875, 16.01611328125, 16.732421875, 17.44873046875, 18.1650390625, 18.88134765625, 19.59765625, 20.31396484375, 21.0302734375, 21.74658203125, 22.462890625, 23.17919921875, 23.8955078125, 24.61181640625, 25.328125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 5.0, 3.0, 3.0, 7.0, 8.0, 9.0, 21.0, 25.0, 36.0, 45.0, 48.0, 67.0, 98.0, 114.0, 172.0, 197.0, 286.0, 382.0, 546.0, 798.0, 1150.0, 1887.0, 2908.0, 4980.0, 8932.0, 16862.0, 35891.0, 876193.0, 49058.0, 21050.0, 10979.0, 5842.0, 3368.0, 2086.0, 1340.0, 882.0, 626.0, 415.0, 323.0, 218.0, 185.0, 130.0, 103.0, 57.0, 56.0, 55.0, 28.0, 27.0, 14.0, 16.0, 10.0, 8.0, 4.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.74072265625, -0.7165603637695312, -0.6923980712890625, -0.6682357788085938, -0.644073486328125, -0.6199111938476562, -0.5957489013671875, -0.5715866088867188, -0.54742431640625, -0.5232620239257812, -0.4990997314453125, -0.47493743896484375, -0.450775146484375, -0.42661285400390625, -0.4024505615234375, -0.37828826904296875, -0.3541259765625, -0.32996368408203125, -0.3058013916015625, -0.28163909912109375, -0.257476806640625, -0.23331451416015625, -0.2091522216796875, -0.18498992919921875, -0.16082763671875, -0.13666534423828125, -0.1125030517578125, -0.08834075927734375, -0.064178466796875, -0.04001617431640625, -0.0158538818359375, 0.00830841064453125, 0.032470703125, 0.05663299560546875, 0.0807952880859375, 0.10495758056640625, 0.129119873046875, 0.15328216552734375, 0.1774444580078125, 0.20160675048828125, 0.22576904296875, 0.24993133544921875, 0.2740936279296875, 0.29825592041015625, 0.322418212890625, 0.34658050537109375, 0.3707427978515625, 0.39490509033203125, 0.4190673828125, 0.44322967529296875, 0.4673919677734375, 0.49155426025390625, 0.515716552734375, 0.5398788452148438, 0.5640411376953125, 0.5882034301757812, 0.61236572265625, 0.6365280151367188, 0.6606903076171875, 0.6848526000976562, 0.709014892578125, 0.7331771850585938, 0.7573394775390625, 0.7815017700195312, 0.8056640625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 3.0, 5.0, 5.0, 7.0, 5.0, 11.0, 13.0, 19.0, 18.0, 13.0, 16.0, 22.0, 20.0, 41.0, 31.0, 28.0, 36.0, 44.0, 45.0, 37.0, 41.0, 44.0, 33.0, 29.0, 38.0, 38.0, 40.0, 35.0, 34.0, 38.0, 25.0, 37.0, 20.0, 28.0, 20.0, 19.0, 10.0, 13.0, 13.0, 6.0, 6.0, 2.0, 4.0, 5.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 4.0], "bins": [-1.2516975402832031e-05, -1.215469092130661e-05, -1.1792406439781189e-05, -1.1430121958255768e-05, -1.1067837476730347e-05, -1.0705552995204926e-05, -1.0343268513679504e-05, -9.980984032154083e-06, -9.618699550628662e-06, -9.256415069103241e-06, -8.89413058757782e-06, -8.531846106052399e-06, -8.169561624526978e-06, -7.807277143001556e-06, -7.444992661476135e-06, -7.082708179950714e-06, -6.720423698425293e-06, -6.358139216899872e-06, -5.995854735374451e-06, -5.6335702538490295e-06, -5.271285772323608e-06, -4.909001290798187e-06, -4.546716809272766e-06, -4.184432327747345e-06, -3.822147846221924e-06, -3.4598633646965027e-06, -3.0975788831710815e-06, -2.7352944016456604e-06, -2.3730099201202393e-06, -2.010725438594818e-06, -1.648440957069397e-06, -1.2861564755439758e-06, -9.238719940185547e-07, -5.615875124931335e-07, -1.993030309677124e-07, 1.6298145055770874e-07, 5.252659320831299e-07, 8.87550413608551e-07, 1.2498348951339722e-06, 1.6121193766593933e-06, 1.9744038581848145e-06, 2.3366883397102356e-06, 2.6989728212356567e-06, 3.061257302761078e-06, 3.423541784286499e-06, 3.78582626581192e-06, 4.148110747337341e-06, 4.5103952288627625e-06, 4.872679710388184e-06, 5.234964191913605e-06, 5.597248673439026e-06, 5.959533154964447e-06, 6.321817636489868e-06, 6.684102118015289e-06, 7.0463865995407104e-06, 7.408671081066132e-06, 7.770955562591553e-06, 8.133240044116974e-06, 8.495524525642395e-06, 8.857809007167816e-06, 9.220093488693237e-06, 9.582377970218658e-06, 9.94466245174408e-06, 1.03069469332695e-05, 1.0669231414794922e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 14.0, 13.0, 12.0, 24.0, 26.0, 43.0, 48.0, 96.0, 170.0, 244.0, 385.0, 581.0, 821.0, 1317.0, 2117.0, 3277.0, 5248.0, 8547.0, 13517.0, 22140.0, 38202.0, 66359.0, 119156.0, 191985.0, 213387.0, 151379.0, 86923.0, 48816.0, 28283.0, 17225.0, 10479.0, 6512.0, 3936.0, 2597.0, 1642.0, 1043.0, 673.0, 478.0, 280.0, 206.0, 114.0, 85.0, 49.0, 39.0, 19.0, 21.0, 10.0, 12.0, 6.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.45263671875, -0.4390144348144531, -0.42539215087890625, -0.4117698669433594, -0.3981475830078125, -0.3845252990722656, -0.37090301513671875, -0.3572807312011719, -0.343658447265625, -0.3300361633300781, -0.31641387939453125, -0.3027915954589844, -0.2891693115234375, -0.2755470275878906, -0.26192474365234375, -0.24830245971679688, -0.23468017578125, -0.22105789184570312, -0.20743560791015625, -0.19381332397460938, -0.1801910400390625, -0.16656875610351562, -0.15294647216796875, -0.13932418823242188, -0.125701904296875, -0.11207962036132812, -0.09845733642578125, -0.08483505249023438, -0.0712127685546875, -0.057590484619140625, -0.04396820068359375, -0.030345916748046875, -0.0167236328125, -0.003101348876953125, 0.01052093505859375, 0.024143218994140625, 0.0377655029296875, 0.051387786865234375, 0.06501007080078125, 0.07863235473632812, 0.092254638671875, 0.10587692260742188, 0.11949920654296875, 0.13312149047851562, 0.1467437744140625, 0.16036605834960938, 0.17398834228515625, 0.18761062622070312, 0.20123291015625, 0.21485519409179688, 0.22847747802734375, 0.24209976196289062, 0.2557220458984375, 0.2693443298339844, 0.28296661376953125, 0.2965888977050781, 0.310211181640625, 0.3238334655761719, 0.33745574951171875, 0.3510780334472656, 0.3647003173828125, 0.3783226013183594, 0.39194488525390625, 0.4055671691894531, 0.419189453125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 6.0, 16.0, 8.0, 15.0, 16.0, 19.0, 25.0, 30.0, 35.0, 42.0, 42.0, 61.0, 67.0, 65.0, 71.0, 71.0, 59.0, 54.0, 51.0, 36.0, 33.0, 31.0, 22.0, 22.0, 18.0, 11.0, 10.0, 14.0, 7.0, 11.0, 6.0, 6.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.148193359375, -0.14349365234375, -0.1387939453125, -0.13409423828125, -0.12939453125, -0.12469482421875, -0.1199951171875, -0.11529541015625, -0.110595703125, -0.10589599609375, -0.1011962890625, -0.09649658203125, -0.091796875, -0.08709716796875, -0.0823974609375, -0.07769775390625, -0.072998046875, -0.06829833984375, -0.0635986328125, -0.05889892578125, -0.05419921875, -0.04949951171875, -0.0447998046875, -0.04010009765625, -0.035400390625, -0.03070068359375, -0.0260009765625, -0.02130126953125, -0.0166015625, -0.01190185546875, -0.0072021484375, -0.00250244140625, 0.002197265625, 0.00689697265625, 0.0115966796875, 0.01629638671875, 0.02099609375, 0.02569580078125, 0.0303955078125, 0.03509521484375, 0.039794921875, 0.04449462890625, 0.0491943359375, 0.05389404296875, 0.05859375, 0.06329345703125, 0.0679931640625, 0.07269287109375, 0.077392578125, 0.08209228515625, 0.0867919921875, 0.09149169921875, 0.09619140625, 0.10089111328125, 0.1055908203125, 0.11029052734375, 0.114990234375, 0.11968994140625, 0.1243896484375, 0.12908935546875, 0.1337890625, 0.13848876953125, 0.1431884765625, 0.14788818359375, 0.152587890625]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 5.0, 4.0, 5.0, 6.0, 15.0, 15.0, 12.0, 17.0, 19.0, 24.0, 24.0, 27.0, 30.0, 27.0, 39.0, 43.0, 34.0, 40.0, 48.0, 47.0, 27.0, 38.0, 37.0, 44.0, 41.0, 46.0, 31.0, 36.0, 27.0, 38.0, 25.0, 22.0, 18.0, 12.0, 12.0, 15.0, 11.0, 12.0, 12.0, 4.0, 7.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-30.088132858276367, -29.171817779541016, -28.255504608154297, -27.339189529418945, -26.422874450683594, -25.506559371948242, -24.59024429321289, -23.673931121826172, -22.75761604309082, -21.84130096435547, -20.92498779296875, -20.0086727142334, -19.092357635498047, -18.176042556762695, -17.259727478027344, -16.343414306640625, -15.427099227905273, -14.510784149169922, -13.594470024108887, -12.678155899047852, -11.7618408203125, -10.845525741577148, -9.929211616516113, -9.012897491455078, -8.096582412719727, -7.180267810821533, -6.26395320892334, -5.3476386070251465, -4.431324005126953, -3.5150094032287598, -2.5986948013305664, -1.682380199432373, -0.7660655975341797, 0.15024900436401367, 1.066563606262207, 1.9828782081604004, 2.8991928100585938, 3.815507411956787, 4.7318220138549805, 5.648136615753174, 6.564451217651367, 7.4807658195495605, 8.397080421447754, 9.313394546508789, 10.22970962524414, 11.146024703979492, 12.062338829040527, 12.978652954101562, 13.894968032836914, 14.811283111572266, 15.7275972366333, 16.643911361694336, 17.560226440429688, 18.47654151916504, 19.39285659790039, 20.30916976928711, 21.22548484802246, 22.141799926757812, 23.05811309814453, 23.974428176879883, 24.890743255615234, 25.807058334350586, 26.723373413085938, 27.639686584472656, 28.556001663208008]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 5.0, 5.0, 7.0, 13.0, 9.0, 14.0, 11.0, 24.0, 10.0, 26.0, 34.0, 40.0, 32.0, 40.0, 40.0, 33.0, 35.0, 43.0, 40.0, 45.0, 34.0, 41.0, 45.0, 32.0, 31.0, 35.0, 34.0, 37.0, 33.0, 24.0, 16.0, 23.0, 14.0, 13.0, 16.0, 10.0, 10.0, 8.0, 17.0, 6.0, 6.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-40.73759078979492, -39.60079574584961, -38.46399688720703, -37.32720184326172, -36.190406799316406, -35.05360794067383, -33.916812896728516, -32.78001403808594, -31.643218994140625, -30.50642204284668, -29.369625091552734, -28.232830047607422, -27.096033096313477, -25.95923614501953, -24.82244110107422, -23.685644149780273, -22.548847198486328, -21.412050247192383, -20.275253295898438, -19.138458251953125, -18.00166130065918, -16.864864349365234, -15.728068351745605, -14.591272354125977, -13.454475402832031, -12.317678451538086, -11.180882453918457, -10.044086456298828, -8.907289505004883, -7.770493030548096, -6.633696556091309, -5.4969000816345215, -4.360103607177734, -3.2233071327209473, -2.08651065826416, -0.949714183807373, 0.18708229064941406, 1.3238787651062012, 2.4606752395629883, 3.5974717140197754, 4.7342681884765625, 5.87106466293335, 7.007861137390137, 8.144657135009766, 9.281454086303711, 10.418251037597656, 11.555047035217285, 12.691843032836914, 13.82863998413086, 14.965436935424805, 16.10223388671875, 17.239028930664062, 18.375825881958008, 19.512622833251953, 20.649417877197266, 21.78621482849121, 22.923011779785156, 24.0598087310791, 25.196605682373047, 26.33340072631836, 27.470197677612305, 28.60699462890625, 29.743789672851562, 30.880586624145508, 32.01738357543945]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 3.0, 8.0, 11.0, 17.0, 30.0, 39.0, 71.0, 103.0, 166.0, 301.0, 423.0, 751.0, 1091.0, 1796.0, 2804.0, 4139.0, 6338.0, 9161.0, 13388.0, 18957.0, 26702.0, 35545.0, 46350.0, 58191.0, 69607.0, 80684.0, 87853.0, 91240.0, 88846.0, 83223.0, 73540.0, 61828.0, 50005.0, 38829.0, 28928.0, 21504.0, 15252.0, 10354.0, 7143.0, 4780.0, 3036.0, 1979.0, 1303.0, 855.0, 548.0, 315.0, 216.0, 107.0, 88.0, 50.0, 31.0, 16.0, 11.0, 6.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-13.3984375, -12.9752197265625, -12.552001953125, -12.1287841796875, -11.70556640625, -11.2823486328125, -10.859130859375, -10.4359130859375, -10.0126953125, -9.5894775390625, -9.166259765625, -8.7430419921875, -8.31982421875, -7.8966064453125, -7.473388671875, -7.0501708984375, -6.626953125, -6.2037353515625, -5.780517578125, -5.3572998046875, -4.93408203125, -4.5108642578125, -4.087646484375, -3.6644287109375, -3.2412109375, -2.8179931640625, -2.394775390625, -1.9715576171875, -1.54833984375, -1.1251220703125, -0.701904296875, -0.2786865234375, 0.14453125, 0.5677490234375, 0.990966796875, 1.4141845703125, 1.83740234375, 2.2606201171875, 2.683837890625, 3.1070556640625, 3.5302734375, 3.9534912109375, 4.376708984375, 4.7999267578125, 5.22314453125, 5.6463623046875, 6.069580078125, 6.4927978515625, 6.916015625, 7.3392333984375, 7.762451171875, 8.1856689453125, 8.60888671875, 9.0321044921875, 9.455322265625, 9.8785400390625, 10.3017578125, 10.7249755859375, 11.148193359375, 11.5714111328125, 11.99462890625, 12.4178466796875, 12.841064453125, 13.2642822265625, 13.6875]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 4.0, 6.0, 4.0, 8.0, 10.0, 10.0, 12.0, 15.0, 23.0, 10.0, 27.0, 41.0, 36.0, 31.0, 39.0, 33.0, 38.0, 37.0, 43.0, 36.0, 48.0, 32.0, 42.0, 43.0, 34.0, 29.0, 38.0, 35.0, 39.0, 28.0, 26.0, 18.0, 19.0, 15.0, 14.0, 17.0, 9.0, 9.0, 11.0, 14.0, 6.0, 6.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-40.125, -39.00439453125, -37.8837890625, -36.76318359375, -35.642578125, -34.52197265625, -33.4013671875, -32.28076171875, -31.16015625, -30.03955078125, -28.9189453125, -27.79833984375, -26.677734375, -25.55712890625, -24.4365234375, -23.31591796875, -22.1953125, -21.07470703125, -19.9541015625, -18.83349609375, -17.712890625, -16.59228515625, -15.4716796875, -14.35107421875, -13.23046875, -12.10986328125, -10.9892578125, -9.86865234375, -8.748046875, -7.62744140625, -6.5068359375, -5.38623046875, -4.265625, -3.14501953125, -2.0244140625, -0.90380859375, 0.216796875, 1.33740234375, 2.4580078125, 3.57861328125, 4.69921875, 5.81982421875, 6.9404296875, 8.06103515625, 9.181640625, 10.30224609375, 11.4228515625, 12.54345703125, 13.6640625, 14.78466796875, 15.9052734375, 17.02587890625, 18.146484375, 19.26708984375, 20.3876953125, 21.50830078125, 22.62890625, 23.74951171875, 24.8701171875, 25.99072265625, 27.111328125, 28.23193359375, 29.3525390625, 30.47314453125, 31.59375]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 8.0, 6.0, 17.0, 30.0, 45.0, 85.0, 148.0, 262.0, 345.0, 632.0, 1034.0, 1679.0, 2715.0, 4264.0, 6767.0, 10502.0, 15635.0, 22719.0, 32307.0, 44199.0, 58326.0, 71948.0, 84744.0, 93916.0, 99174.0, 97044.0, 89481.0, 78163.0, 63854.0, 50413.0, 37533.0, 26781.0, 18730.0, 12660.0, 8227.0, 5364.0, 3408.0, 2086.0, 1290.0, 808.0, 484.0, 297.0, 197.0, 95.0, 61.0, 36.0, 20.0, 5.0, 5.0, 3.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-15.0546875, -14.5802001953125, -14.105712890625, -13.6312255859375, -13.15673828125, -12.6822509765625, -12.207763671875, -11.7332763671875, -11.2587890625, -10.7843017578125, -10.309814453125, -9.8353271484375, -9.36083984375, -8.8863525390625, -8.411865234375, -7.9373779296875, -7.462890625, -6.9884033203125, -6.513916015625, -6.0394287109375, -5.56494140625, -5.0904541015625, -4.615966796875, -4.1414794921875, -3.6669921875, -3.1925048828125, -2.718017578125, -2.2435302734375, -1.76904296875, -1.2945556640625, -0.820068359375, -0.3455810546875, 0.12890625, 0.6033935546875, 1.077880859375, 1.5523681640625, 2.02685546875, 2.5013427734375, 2.975830078125, 3.4503173828125, 3.9248046875, 4.3992919921875, 4.873779296875, 5.3482666015625, 5.82275390625, 6.2972412109375, 6.771728515625, 7.2462158203125, 7.720703125, 8.1951904296875, 8.669677734375, 9.1441650390625, 9.61865234375, 10.0931396484375, 10.567626953125, 11.0421142578125, 11.5166015625, 11.9910888671875, 12.465576171875, 12.9400634765625, 13.41455078125, 13.8890380859375, 14.363525390625, 14.8380126953125, 15.3125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 3.0, 4.0, 5.0, 10.0, 9.0, 9.0, 7.0, 12.0, 18.0, 19.0, 17.0, 29.0, 30.0, 24.0, 30.0, 24.0, 30.0, 29.0, 52.0, 32.0, 37.0, 31.0, 38.0, 44.0, 42.0, 38.0, 29.0, 33.0, 33.0, 35.0, 27.0, 29.0, 28.0, 28.0, 14.0, 24.0, 17.0, 14.0, 14.0, 15.0, 6.0, 7.0, 7.0, 3.0, 5.0, 2.0, 6.0, 0.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.390625, -18.70263671875, -18.0146484375, -17.32666015625, -16.638671875, -15.95068359375, -15.2626953125, -14.57470703125, -13.88671875, -13.19873046875, -12.5107421875, -11.82275390625, -11.134765625, -10.44677734375, -9.7587890625, -9.07080078125, -8.3828125, -7.69482421875, -7.0068359375, -6.31884765625, -5.630859375, -4.94287109375, -4.2548828125, -3.56689453125, -2.87890625, -2.19091796875, -1.5029296875, -0.81494140625, -0.126953125, 0.56103515625, 1.2490234375, 1.93701171875, 2.625, 3.31298828125, 4.0009765625, 4.68896484375, 5.376953125, 6.06494140625, 6.7529296875, 7.44091796875, 8.12890625, 8.81689453125, 9.5048828125, 10.19287109375, 10.880859375, 11.56884765625, 12.2568359375, 12.94482421875, 13.6328125, 14.32080078125, 15.0087890625, 15.69677734375, 16.384765625, 17.07275390625, 17.7607421875, 18.44873046875, 19.13671875, 19.82470703125, 20.5126953125, 21.20068359375, 21.888671875, 22.57666015625, 23.2646484375, 23.95263671875, 24.640625]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 7.0, 11.0, 14.0, 29.0, 39.0, 42.0, 77.0, 126.0, 180.0, 272.0, 387.0, 605.0, 985.0, 1489.0, 2224.0, 3352.0, 5203.0, 7972.0, 11653.0, 16885.0, 23678.0, 33227.0, 44032.0, 56687.0, 69141.0, 80656.0, 88828.0, 93389.0, 92247.0, 86523.0, 76821.0, 64561.0, 52110.0, 39992.0, 29689.0, 21186.0, 14861.0, 10105.0, 6570.0, 4402.0, 2853.0, 1889.0, 1213.0, 783.0, 525.0, 353.0, 246.0, 163.0, 95.0, 55.0, 38.0, 33.0, 16.0, 20.0, 12.0, 6.0, 2.0, 6.0, 2.0, 1.0], "bins": [-4.421875, -4.28289794921875, -4.1439208984375, -4.00494384765625, -3.865966796875, -3.72698974609375, -3.5880126953125, -3.44903564453125, -3.31005859375, -3.17108154296875, -3.0321044921875, -2.89312744140625, -2.754150390625, -2.61517333984375, -2.4761962890625, -2.33721923828125, -2.1982421875, -2.05926513671875, -1.9202880859375, -1.78131103515625, -1.642333984375, -1.50335693359375, -1.3643798828125, -1.22540283203125, -1.08642578125, -0.94744873046875, -0.8084716796875, -0.66949462890625, -0.530517578125, -0.39154052734375, -0.2525634765625, -0.11358642578125, 0.025390625, 0.16436767578125, 0.3033447265625, 0.44232177734375, 0.581298828125, 0.72027587890625, 0.8592529296875, 0.99822998046875, 1.13720703125, 1.27618408203125, 1.4151611328125, 1.55413818359375, 1.693115234375, 1.83209228515625, 1.9710693359375, 2.11004638671875, 2.2490234375, 2.38800048828125, 2.5269775390625, 2.66595458984375, 2.804931640625, 2.94390869140625, 3.0828857421875, 3.22186279296875, 3.36083984375, 3.49981689453125, 3.6387939453125, 3.77777099609375, 3.916748046875, 4.05572509765625, 4.1947021484375, 4.33367919921875, 4.47265625]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 7.0, 3.0, 4.0, 2.0, 3.0, 4.0, 7.0, 10.0, 13.0, 17.0, 11.0, 15.0, 15.0, 20.0, 24.0, 25.0, 20.0, 25.0, 17.0, 44.0, 24.0, 37.0, 30.0, 42.0, 31.0, 36.0, 40.0, 37.0, 43.0, 39.0, 40.0, 29.0, 41.0, 25.0, 32.0, 22.0, 16.0, 22.0, 19.0, 20.0, 15.0, 6.0, 10.0, 9.0, 15.0, 8.0, 11.0, 1.0, 4.0, 6.0, 4.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.0005574226379394531, -0.0005406886339187622, -0.0005239546298980713, -0.0005072206258773804, -0.0004904866218566895, -0.00047375261783599854, -0.0004570186138153076, -0.0004402846097946167, -0.0004235506057739258, -0.00040681660175323486, -0.00039008259773254395, -0.00037334859371185303, -0.0003566145896911621, -0.0003398805856704712, -0.0003231465816497803, -0.00030641257762908936, -0.00028967857360839844, -0.0002729445695877075, -0.0002562105655670166, -0.00023947656154632568, -0.00022274255752563477, -0.00020600855350494385, -0.00018927454948425293, -0.000172540545463562, -0.0001558065414428711, -0.00013907253742218018, -0.00012233853340148926, -0.00010560452938079834, -8.887052536010742e-05, -7.21365213394165e-05, -5.5402517318725586e-05, -3.866851329803467e-05, -2.193450927734375e-05, -5.200505256652832e-06, 1.1533498764038086e-05, 2.8267502784729004e-05, 4.500150680541992e-05, 6.173551082611084e-05, 7.846951484680176e-05, 9.520351886749268e-05, 0.0001119375228881836, 0.0001286715269088745, 0.00014540553092956543, 0.00016213953495025635, 0.00017887353897094727, 0.00019560754299163818, 0.0002123415470123291, 0.00022907555103302002, 0.00024580955505371094, 0.00026254355907440186, 0.0002792775630950928, 0.0002960115671157837, 0.0003127455711364746, 0.00032947957515716553, 0.00034621357917785645, 0.00036294758319854736, 0.0003796815872192383, 0.0003964155912399292, 0.0004131495952606201, 0.00042988359928131104, 0.00044661760330200195, 0.00046335160732269287, 0.0004800856113433838, 0.0004968196153640747, 0.0005135536193847656]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 6.0, 2.0, 14.0, 13.0, 20.0, 29.0, 45.0, 81.0, 109.0, 197.0, 280.0, 436.0, 711.0, 1029.0, 1704.0, 2933.0, 4737.0, 7665.0, 12426.0, 19636.0, 30012.0, 44804.0, 62742.0, 81914.0, 100282.0, 112663.0, 116615.0, 109627.0, 94927.0, 75623.0, 56672.0, 39609.0, 26234.0, 16989.0, 10716.0, 6578.0, 3953.0, 2458.0, 1538.0, 944.0, 599.0, 348.0, 250.0, 138.0, 90.0, 63.0, 44.0, 20.0, 17.0, 9.0, 4.0, 6.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.24609375, -5.06097412109375, -4.8758544921875, -4.69073486328125, -4.505615234375, -4.32049560546875, -4.1353759765625, -3.95025634765625, -3.76513671875, -3.58001708984375, -3.3948974609375, -3.20977783203125, -3.024658203125, -2.83953857421875, -2.6544189453125, -2.46929931640625, -2.2841796875, -2.09906005859375, -1.9139404296875, -1.72882080078125, -1.543701171875, -1.35858154296875, -1.1734619140625, -0.98834228515625, -0.80322265625, -0.61810302734375, -0.4329833984375, -0.24786376953125, -0.062744140625, 0.12237548828125, 0.3074951171875, 0.49261474609375, 0.677734375, 0.86285400390625, 1.0479736328125, 1.23309326171875, 1.418212890625, 1.60333251953125, 1.7884521484375, 1.97357177734375, 2.15869140625, 2.34381103515625, 2.5289306640625, 2.71405029296875, 2.899169921875, 3.08428955078125, 3.2694091796875, 3.45452880859375, 3.6396484375, 3.82476806640625, 4.0098876953125, 4.19500732421875, 4.380126953125, 4.56524658203125, 4.7503662109375, 4.93548583984375, 5.12060546875, 5.30572509765625, 5.4908447265625, 5.67596435546875, 5.861083984375, 6.04620361328125, 6.2313232421875, 6.41644287109375, 6.6015625]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 1.0, 5.0, 2.0, 6.0, 11.0, 8.0, 9.0, 15.0, 21.0, 10.0, 21.0, 38.0, 27.0, 32.0, 61.0, 49.0, 42.0, 57.0, 58.0, 61.0, 68.0, 47.0, 51.0, 48.0, 34.0, 42.0, 26.0, 41.0, 28.0, 19.0, 10.0, 12.0, 4.0, 6.0, 12.0, 3.0, 6.0, 5.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.17578125, -3.06024169921875, -2.9447021484375, -2.82916259765625, -2.713623046875, -2.59808349609375, -2.4825439453125, -2.36700439453125, -2.25146484375, -2.13592529296875, -2.0203857421875, -1.90484619140625, -1.789306640625, -1.67376708984375, -1.5582275390625, -1.44268798828125, -1.3271484375, -1.21160888671875, -1.0960693359375, -0.98052978515625, -0.864990234375, -0.74945068359375, -0.6339111328125, -0.51837158203125, -0.40283203125, -0.28729248046875, -0.1717529296875, -0.05621337890625, 0.059326171875, 0.17486572265625, 0.2904052734375, 0.40594482421875, 0.521484375, 0.63702392578125, 0.7525634765625, 0.86810302734375, 0.983642578125, 1.09918212890625, 1.2147216796875, 1.33026123046875, 1.44580078125, 1.56134033203125, 1.6768798828125, 1.79241943359375, 1.907958984375, 2.02349853515625, 2.1390380859375, 2.25457763671875, 2.3701171875, 2.48565673828125, 2.6011962890625, 2.71673583984375, 2.832275390625, 2.94781494140625, 3.0633544921875, 3.17889404296875, 3.29443359375, 3.40997314453125, 3.5255126953125, 3.64105224609375, 3.756591796875, 3.87213134765625, 3.9876708984375, 4.10321044921875, 4.21875]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 4.0, 6.0, 4.0, 8.0, 9.0, 19.0, 15.0, 24.0, 22.0, 20.0, 24.0, 34.0, 32.0, 26.0, 38.0, 40.0, 47.0, 45.0, 39.0, 52.0, 38.0, 40.0, 42.0, 35.0, 31.0, 42.0, 31.0, 37.0, 33.0, 24.0, 25.0, 24.0, 13.0, 11.0, 16.0, 11.0, 10.0, 6.0, 6.0, 6.0, 5.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-30.847383499145508, -29.910114288330078, -28.97284698486328, -28.03557777404785, -27.098308563232422, -26.161041259765625, -25.223772048950195, -24.286502838134766, -23.34923553466797, -22.41196632385254, -21.474699020385742, -20.537429809570312, -19.600160598754883, -18.662891387939453, -17.725624084472656, -16.788354873657227, -15.851085662841797, -14.913817405700684, -13.976548194885254, -13.03927993774414, -12.102010726928711, -11.164742469787598, -10.227474212646484, -9.290205001831055, -8.352936744689941, -7.41566801071167, -6.478399276733398, -5.541131019592285, -4.603862285614014, -3.666593551635742, -2.729325294494629, -1.7920565605163574, -0.8547897338867188, 0.08247888088226318, 1.0197474956512451, 1.9570159912109375, 2.894284725189209, 3.8315534591674805, 4.768821716308594, 5.706090450286865, 6.643359184265137, 7.580627918243408, 8.51789665222168, 9.455164909362793, 10.392433166503906, 11.329702377319336, 12.26697063446045, 13.204238891601562, 14.141508102416992, 15.078776359558105, 16.01604461669922, 16.95331382751465, 17.890583038330078, 18.827850341796875, 19.765119552612305, 20.702388763427734, 21.63965606689453, 22.57692527770996, 23.514192581176758, 24.451461791992188, 25.388731002807617, 26.326000213623047, 27.263267517089844, 28.200536727905273, 29.137805938720703]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 7.0, 10.0, 6.0, 5.0, 14.0, 11.0, 17.0, 19.0, 24.0, 25.0, 30.0, 30.0, 25.0, 43.0, 31.0, 33.0, 35.0, 42.0, 35.0, 42.0, 47.0, 38.0, 46.0, 31.0, 27.0, 37.0, 34.0, 34.0, 28.0, 34.0, 14.0, 19.0, 21.0, 23.0, 9.0, 17.0, 20.0, 10.0, 7.0, 5.0, 6.0, 6.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-40.07436752319336, -38.872161865234375, -37.669960021972656, -36.46775436401367, -35.26554870605469, -34.0633430480957, -32.86113739013672, -31.658935546875, -30.456729888916016, -29.25452423095703, -28.05232048034668, -26.850116729736328, -25.647911071777344, -24.44570541381836, -23.243501663208008, -22.041297912597656, -20.839092254638672, -19.636886596679688, -18.434682846069336, -17.232479095458984, -16.0302734375, -14.828068733215332, -13.625864028930664, -12.423659324645996, -11.221454620361328, -10.01924991607666, -8.817045211791992, -7.614840507507324, -6.412635803222656, -5.210431098937988, -4.00822639465332, -2.8060216903686523, -1.60382080078125, -0.40161609649658203, 0.8005886077880859, 2.002793312072754, 3.204998016357422, 4.40720272064209, 5.609407424926758, 6.811612129211426, 8.013816833496094, 9.216021537780762, 10.41822624206543, 11.620430946350098, 12.822635650634766, 14.024840354919434, 15.227045059204102, 16.429248809814453, 17.631454467773438, 18.833660125732422, 20.035863876342773, 21.238067626953125, 22.44027328491211, 23.642478942871094, 24.844682693481445, 26.046886444091797, 27.24909210205078, 28.451297760009766, 29.653501510620117, 30.85570526123047, 32.05791091918945, 33.26011657714844, 34.462318420410156, 35.66452407836914, 36.866729736328125]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [4.0, 0.0, 9.0, 10.0, 21.0, 38.0, 58.0, 96.0, 189.0, 267.0, 460.0, 758.0, 1233.0, 2045.0, 3226.0, 4981.0, 8021.0, 11883.0, 18616.0, 27625.0, 40515.0, 58263.0, 81421.0, 109543.0, 144902.0, 186061.0, 229755.0, 272080.0, 308631.0, 334476.0, 346493.0, 342276.0, 322544.0, 289226.0, 250188.0, 206623.0, 163630.0, 125756.0, 93490.0, 67741.0, 47472.0, 32544.0, 21759.0, 14215.0, 9322.0, 6033.0, 3804.0, 2343.0, 1466.0, 930.0, 504.0, 302.0, 201.0, 105.0, 63.0, 37.0, 19.0, 13.0, 9.0, 2.0, 1.0, 1.0, 1.0, 4.0], "bins": [-18.953125, -18.336181640625, -17.71923828125, -17.102294921875, -16.4853515625, -15.868408203125, -15.25146484375, -14.634521484375, -14.017578125, -13.400634765625, -12.78369140625, -12.166748046875, -11.5498046875, -10.932861328125, -10.31591796875, -9.698974609375, -9.08203125, -8.465087890625, -7.84814453125, -7.231201171875, -6.6142578125, -5.997314453125, -5.38037109375, -4.763427734375, -4.146484375, -3.529541015625, -2.91259765625, -2.295654296875, -1.6787109375, -1.061767578125, -0.44482421875, 0.172119140625, 0.7890625, 1.406005859375, 2.02294921875, 2.639892578125, 3.2568359375, 3.873779296875, 4.49072265625, 5.107666015625, 5.724609375, 6.341552734375, 6.95849609375, 7.575439453125, 8.1923828125, 8.809326171875, 9.42626953125, 10.043212890625, 10.66015625, 11.277099609375, 11.89404296875, 12.510986328125, 13.1279296875, 13.744873046875, 14.36181640625, 14.978759765625, 15.595703125, 16.212646484375, 16.82958984375, 17.446533203125, 18.0634765625, 18.680419921875, 19.29736328125, 19.914306640625, 20.53125]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 0.0, 3.0, 1.0, 3.0, 3.0, 8.0, 10.0, 7.0, 4.0, 12.0, 13.0, 16.0, 17.0, 23.0, 28.0, 26.0, 27.0, 26.0, 45.0, 32.0, 31.0, 35.0, 50.0, 35.0, 39.0, 43.0, 35.0, 49.0, 35.0, 24.0, 40.0, 35.0, 27.0, 34.0, 29.0, 21.0, 14.0, 20.0, 26.0, 11.0, 16.0, 20.0, 12.0, 5.0, 6.0, 5.0, 7.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-35.9375, -34.8564453125, -33.775390625, -32.6943359375, -31.61328125, -30.5322265625, -29.451171875, -28.3701171875, -27.2890625, -26.2080078125, -25.126953125, -24.0458984375, -22.96484375, -21.8837890625, -20.802734375, -19.7216796875, -18.640625, -17.5595703125, -16.478515625, -15.3974609375, -14.31640625, -13.2353515625, -12.154296875, -11.0732421875, -9.9921875, -8.9111328125, -7.830078125, -6.7490234375, -5.66796875, -4.5869140625, -3.505859375, -2.4248046875, -1.34375, -0.2626953125, 0.818359375, 1.8994140625, 2.98046875, 4.0615234375, 5.142578125, 6.2236328125, 7.3046875, 8.3857421875, 9.466796875, 10.5478515625, 11.62890625, 12.7099609375, 13.791015625, 14.8720703125, 15.953125, 17.0341796875, 18.115234375, 19.1962890625, 20.27734375, 21.3583984375, 22.439453125, 23.5205078125, 24.6015625, 25.6826171875, 26.763671875, 27.8447265625, 28.92578125, 30.0068359375, 31.087890625, 32.1689453125, 33.25]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 11.0, 16.0, 42.0, 90.0, 141.0, 218.0, 432.0, 834.0, 1490.0, 2648.0, 4662.0, 8182.0, 14185.0, 23170.0, 38692.0, 61781.0, 94063.0, 138354.0, 193209.0, 255807.0, 319287.0, 374621.0, 412262.0, 422585.0, 405244.0, 360408.0, 302431.0, 237574.0, 177339.0, 123360.0, 84095.0, 54244.0, 34036.0, 20470.0, 12059.0, 7070.0, 3994.0, 2217.0, 1314.0, 724.0, 429.0, 235.0, 115.0, 67.0, 40.0, 15.0, 16.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-26.4375, -25.64501953125, -24.8525390625, -24.06005859375, -23.267578125, -22.47509765625, -21.6826171875, -20.89013671875, -20.09765625, -19.30517578125, -18.5126953125, -17.72021484375, -16.927734375, -16.13525390625, -15.3427734375, -14.55029296875, -13.7578125, -12.96533203125, -12.1728515625, -11.38037109375, -10.587890625, -9.79541015625, -9.0029296875, -8.21044921875, -7.41796875, -6.62548828125, -5.8330078125, -5.04052734375, -4.248046875, -3.45556640625, -2.6630859375, -1.87060546875, -1.078125, -0.28564453125, 0.5068359375, 1.29931640625, 2.091796875, 2.88427734375, 3.6767578125, 4.46923828125, 5.26171875, 6.05419921875, 6.8466796875, 7.63916015625, 8.431640625, 9.22412109375, 10.0166015625, 10.80908203125, 11.6015625, 12.39404296875, 13.1865234375, 13.97900390625, 14.771484375, 15.56396484375, 16.3564453125, 17.14892578125, 17.94140625, 18.73388671875, 19.5263671875, 20.31884765625, 21.111328125, 21.90380859375, 22.6962890625, 23.48876953125, 24.28125]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 6.0, 8.0, 11.0, 19.0, 17.0, 25.0, 34.0, 36.0, 45.0, 56.0, 82.0, 99.0, 108.0, 126.0, 145.0, 156.0, 191.0, 166.0, 204.0, 206.0, 214.0, 217.0, 233.0, 201.0, 180.0, 172.0, 177.0, 145.0, 135.0, 121.0, 109.0, 99.0, 61.0, 65.0, 48.0, 42.0, 27.0, 24.0, 23.0, 21.0, 5.0, 12.0, 3.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.203125, -15.687255859375, -15.17138671875, -14.655517578125, -14.1396484375, -13.623779296875, -13.10791015625, -12.592041015625, -12.076171875, -11.560302734375, -11.04443359375, -10.528564453125, -10.0126953125, -9.496826171875, -8.98095703125, -8.465087890625, -7.94921875, -7.433349609375, -6.91748046875, -6.401611328125, -5.8857421875, -5.369873046875, -4.85400390625, -4.338134765625, -3.822265625, -3.306396484375, -2.79052734375, -2.274658203125, -1.7587890625, -1.242919921875, -0.72705078125, -0.211181640625, 0.3046875, 0.820556640625, 1.33642578125, 1.852294921875, 2.3681640625, 2.884033203125, 3.39990234375, 3.915771484375, 4.431640625, 4.947509765625, 5.46337890625, 5.979248046875, 6.4951171875, 7.010986328125, 7.52685546875, 8.042724609375, 8.55859375, 9.074462890625, 9.59033203125, 10.106201171875, 10.6220703125, 11.137939453125, 11.65380859375, 12.169677734375, 12.685546875, 13.201416015625, 13.71728515625, 14.233154296875, 14.7490234375, 15.264892578125, 15.78076171875, 16.296630859375, 16.8125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 6.0, 4.0, 7.0, 9.0, 11.0, 8.0, 13.0, 21.0, 23.0, 23.0, 30.0, 26.0, 29.0, 28.0, 37.0, 45.0, 37.0, 27.0, 40.0, 49.0, 54.0, 39.0, 42.0, 40.0, 38.0, 35.0, 37.0, 35.0, 30.0, 33.0, 22.0, 17.0, 18.0, 18.0, 21.0, 10.0, 7.0, 5.0, 2.0, 7.0, 6.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-35.20836639404297, -34.11933898925781, -33.03031539916992, -31.9412899017334, -30.852264404296875, -29.76323699951172, -28.674211502075195, -27.585186004638672, -26.49616050720215, -25.407135009765625, -24.3181095123291, -23.229084014892578, -22.140056610107422, -21.05103302001953, -19.962005615234375, -18.87298011779785, -17.783954620361328, -16.694929122924805, -15.605903625488281, -14.516877174377441, -13.427851676940918, -12.338826179504395, -11.249799728393555, -10.160774230957031, -9.071748733520508, -7.982723236083984, -6.893697261810303, -5.804671287536621, -4.715645790100098, -3.626620292663574, -2.5375943183898926, -1.448568344116211, -0.3595428466796875, 0.729482889175415, 1.8185086250305176, 2.90753436088562, 3.9965600967407227, 5.085585594177246, 6.174611568450928, 7.263637542724609, 8.352663040161133, 9.441688537597656, 10.53071403503418, 11.61974048614502, 12.708765983581543, 13.797791481018066, 14.886817932128906, 15.97584342956543, 17.064868927001953, 18.153894424438477, 19.242919921875, 20.331945419311523, 21.420970916748047, 22.509998321533203, 23.599023818969727, 24.68804931640625, 25.777074813842773, 26.866100311279297, 27.95512580871582, 29.044151306152344, 30.1331787109375, 31.22220230102539, 32.31122970581055, 33.40025329589844, 34.489280700683594]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 4.0, 6.0, 6.0, 8.0, 11.0, 18.0, 13.0, 20.0, 18.0, 26.0, 39.0, 27.0, 31.0, 34.0, 41.0, 35.0, 31.0, 34.0, 38.0, 54.0, 44.0, 43.0, 36.0, 36.0, 42.0, 44.0, 31.0, 33.0, 30.0, 27.0, 22.0, 21.0, 19.0, 16.0, 14.0, 6.0, 9.0, 11.0, 7.0, 8.0, 3.0, 0.0, 3.0, 2.0, 2.0], "bins": [-53.80036926269531, -52.41516876220703, -51.029964447021484, -49.6447639465332, -48.259559631347656, -46.874359130859375, -45.489158630371094, -44.10395431518555, -42.71875, -41.33354949951172, -39.94834518432617, -38.56314468383789, -37.177940368652344, -35.79273986816406, -34.40753936767578, -33.022335052490234, -31.637134552001953, -30.25193214416504, -28.866729736328125, -27.481529235839844, -26.096324920654297, -24.711124420166016, -23.3259220123291, -21.940719604492188, -20.555517196655273, -19.17031478881836, -17.785112380981445, -16.39990997314453, -15.014708518981934, -13.62950611114502, -12.244304656982422, -10.859102249145508, -9.473899841308594, -8.08869743347168, -6.703495502471924, -5.318293571472168, -3.933091163635254, -2.54788875579834, -1.1626873016357422, 0.22251510620117188, 1.607717514038086, 2.992919683456421, 4.378121852874756, 5.763323783874512, 7.148526191711426, 8.53372859954834, 9.918930053710938, 11.304132461547852, 12.689334869384766, 14.07453727722168, 15.459739685058594, 16.844940185546875, 18.230144500732422, 19.615345001220703, 21.000547409057617, 22.38574981689453, 23.770952224731445, 25.15615463256836, 26.541357040405273, 27.926559448242188, 29.31175994873047, 30.696964263916016, 32.0821647644043, 33.467369079589844, 34.852569580078125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 7.0, 9.0, 13.0, 24.0, 21.0, 38.0, 79.0, 127.0, 189.0, 316.0, 470.0, 700.0, 1155.0, 1813.0, 2812.0, 4532.0, 7112.0, 10993.0, 16779.0, 25789.0, 38201.0, 55563.0, 76560.0, 100017.0, 119462.0, 127249.0, 119288.0, 98928.0, 76015.0, 54776.0, 37836.0, 25249.0, 16639.0, 10841.0, 6851.0, 4350.0, 2770.0, 1808.0, 1131.0, 739.0, 464.0, 295.0, 193.0, 123.0, 81.0, 67.0, 28.0, 28.0, 13.0, 11.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-9.96875, -9.652099609375, -9.33544921875, -9.018798828125, -8.7021484375, -8.385498046875, -8.06884765625, -7.752197265625, -7.435546875, -7.118896484375, -6.80224609375, -6.485595703125, -6.1689453125, -5.852294921875, -5.53564453125, -5.218994140625, -4.90234375, -4.585693359375, -4.26904296875, -3.952392578125, -3.6357421875, -3.319091796875, -3.00244140625, -2.685791015625, -2.369140625, -2.052490234375, -1.73583984375, -1.419189453125, -1.1025390625, -0.785888671875, -0.46923828125, -0.152587890625, 0.1640625, 0.480712890625, 0.79736328125, 1.114013671875, 1.4306640625, 1.747314453125, 2.06396484375, 2.380615234375, 2.697265625, 3.013916015625, 3.33056640625, 3.647216796875, 3.9638671875, 4.280517578125, 4.59716796875, 4.913818359375, 5.23046875, 5.547119140625, 5.86376953125, 6.180419921875, 6.4970703125, 6.813720703125, 7.13037109375, 7.447021484375, 7.763671875, 8.080322265625, 8.39697265625, 8.713623046875, 9.0302734375, 9.346923828125, 9.66357421875, 9.980224609375, 10.296875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 4.0, 6.0, 5.0, 9.0, 11.0, 18.0, 13.0, 21.0, 17.0, 26.0, 39.0, 26.0, 32.0, 33.0, 43.0, 33.0, 32.0, 33.0, 39.0, 56.0, 44.0, 42.0, 37.0, 34.0, 42.0, 46.0, 31.0, 31.0, 31.0, 26.0, 22.0, 23.0, 17.0, 18.0, 12.0, 7.0, 10.0, 9.0, 8.0, 8.0, 2.0, 2.0, 1.0, 2.0, 2.0], "bins": [-53.6875, -52.302734375, -50.91796875, -49.533203125, -48.1484375, -46.763671875, -45.37890625, -43.994140625, -42.609375, -41.224609375, -39.83984375, -38.455078125, -37.0703125, -35.685546875, -34.30078125, -32.916015625, -31.53125, -30.146484375, -28.76171875, -27.376953125, -25.9921875, -24.607421875, -23.22265625, -21.837890625, -20.453125, -19.068359375, -17.68359375, -16.298828125, -14.9140625, -13.529296875, -12.14453125, -10.759765625, -9.375, -7.990234375, -6.60546875, -5.220703125, -3.8359375, -2.451171875, -1.06640625, 0.318359375, 1.703125, 3.087890625, 4.47265625, 5.857421875, 7.2421875, 8.626953125, 10.01171875, 11.396484375, 12.78125, 14.166015625, 15.55078125, 16.935546875, 18.3203125, 19.705078125, 21.08984375, 22.474609375, 23.859375, 25.244140625, 26.62890625, 28.013671875, 29.3984375, 30.783203125, 32.16796875, 33.552734375, 34.9375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 10.0, 5.0, 13.0, 9.0, 24.0, 30.0, 40.0, 86.0, 114.0, 172.0, 229.0, 337.0, 523.0, 846.0, 1268.0, 1845.0, 2803.0, 4304.0, 6376.0, 9420.0, 15216.0, 27492.0, 713930.0, 192931.0, 27127.0, 15419.0, 9456.0, 6106.0, 4214.0, 2761.0, 1750.0, 1182.0, 791.0, 567.0, 369.0, 257.0, 177.0, 118.0, 91.0, 47.0, 33.0, 17.0, 15.0, 12.0, 8.0, 8.0, 6.0, 3.0, 1.0, 4.0, 1.0, 2.0], "bins": [-29.3125, -28.474609375, -27.63671875, -26.798828125, -25.9609375, -25.123046875, -24.28515625, -23.447265625, -22.609375, -21.771484375, -20.93359375, -20.095703125, -19.2578125, -18.419921875, -17.58203125, -16.744140625, -15.90625, -15.068359375, -14.23046875, -13.392578125, -12.5546875, -11.716796875, -10.87890625, -10.041015625, -9.203125, -8.365234375, -7.52734375, -6.689453125, -5.8515625, -5.013671875, -4.17578125, -3.337890625, -2.5, -1.662109375, -0.82421875, 0.013671875, 0.8515625, 1.689453125, 2.52734375, 3.365234375, 4.203125, 5.041015625, 5.87890625, 6.716796875, 7.5546875, 8.392578125, 9.23046875, 10.068359375, 10.90625, 11.744140625, 12.58203125, 13.419921875, 14.2578125, 15.095703125, 15.93359375, 16.771484375, 17.609375, 18.447265625, 19.28515625, 20.123046875, 20.9609375, 21.798828125, 22.63671875, 23.474609375, 24.3125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 8.0, 3.0, 3.0, 7.0, 9.0, 13.0, 15.0, 13.0, 19.0, 20.0, 19.0, 31.0, 24.0, 26.0, 30.0, 37.0, 21.0, 39.0, 34.0, 39.0, 42.0, 34.0, 39.0, 23.0, 50.0, 34.0, 41.0, 44.0, 29.0, 29.0, 26.0, 24.0, 24.0, 26.0, 22.0, 12.0, 17.0, 11.0, 11.0, 14.0, 5.0, 7.0, 11.0, 5.0, 7.0, 5.0, 1.0, 1.0, 1.0, 1.0, 3.0], "bins": [-29.5625, -28.736328125, -27.91015625, -27.083984375, -26.2578125, -25.431640625, -24.60546875, -23.779296875, -22.953125, -22.126953125, -21.30078125, -20.474609375, -19.6484375, -18.822265625, -17.99609375, -17.169921875, -16.34375, -15.517578125, -14.69140625, -13.865234375, -13.0390625, -12.212890625, -11.38671875, -10.560546875, -9.734375, -8.908203125, -8.08203125, -7.255859375, -6.4296875, -5.603515625, -4.77734375, -3.951171875, -3.125, -2.298828125, -1.47265625, -0.646484375, 0.1796875, 1.005859375, 1.83203125, 2.658203125, 3.484375, 4.310546875, 5.13671875, 5.962890625, 6.7890625, 7.615234375, 8.44140625, 9.267578125, 10.09375, 10.919921875, 11.74609375, 12.572265625, 13.3984375, 14.224609375, 15.05078125, 15.876953125, 16.703125, 17.529296875, 18.35546875, 19.181640625, 20.0078125, 20.833984375, 21.66015625, 22.486328125, 23.3125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 4.0, 6.0, 13.0, 17.0, 28.0, 19.0, 31.0, 54.0, 66.0, 99.0, 145.0, 186.0, 231.0, 333.0, 512.0, 733.0, 1163.0, 1862.0, 3133.0, 5458.0, 9939.0, 19847.0, 46198.0, 880764.0, 38411.0, 17671.0, 8742.0, 4970.0, 2791.0, 1671.0, 1085.0, 713.0, 527.0, 299.0, 221.0, 171.0, 119.0, 77.0, 64.0, 50.0, 35.0, 19.0, 19.0, 13.0, 10.0, 10.0, 11.0, 8.0, 5.0, 0.0, 6.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.025390625, -0.9937515258789062, -0.9621124267578125, -0.9304733276367188, -0.898834228515625, -0.8671951293945312, -0.8355560302734375, -0.8039169311523438, -0.77227783203125, -0.7406387329101562, -0.7089996337890625, -0.6773605346679688, -0.645721435546875, -0.6140823364257812, -0.5824432373046875, -0.5508041381835938, -0.5191650390625, -0.48752593994140625, -0.4558868408203125, -0.42424774169921875, -0.392608642578125, -0.36096954345703125, -0.3293304443359375, -0.29769134521484375, -0.26605224609375, -0.23441314697265625, -0.2027740478515625, -0.17113494873046875, -0.139495849609375, -0.10785675048828125, -0.0762176513671875, -0.04457855224609375, -0.012939453125, 0.01869964599609375, 0.0503387451171875, 0.08197784423828125, 0.113616943359375, 0.14525604248046875, 0.1768951416015625, 0.20853424072265625, 0.24017333984375, 0.27181243896484375, 0.3034515380859375, 0.33509063720703125, 0.366729736328125, 0.39836883544921875, 0.4300079345703125, 0.46164703369140625, 0.4932861328125, 0.5249252319335938, 0.5565643310546875, 0.5882034301757812, 0.619842529296875, 0.6514816284179688, 0.6831207275390625, 0.7147598266601562, 0.74639892578125, 0.7780380249023438, 0.8096771240234375, 0.8413162231445312, 0.872955322265625, 0.9045944213867188, 0.9362335205078125, 0.9678726196289062, 0.99951171875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 6.0, 4.0, 6.0, 7.0, 6.0, 9.0, 10.0, 15.0, 23.0, 16.0, 20.0, 31.0, 25.0, 33.0, 38.0, 32.0, 45.0, 47.0, 38.0, 44.0, 39.0, 64.0, 51.0, 41.0, 45.0, 41.0, 42.0, 32.0, 24.0, 31.0, 28.0, 27.0, 11.0, 16.0, 11.0, 8.0, 13.0, 8.0, 5.0, 3.0, 5.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4662742614746094e-05, -1.4151446521282196e-05, -1.3640150427818298e-05, -1.31288543343544e-05, -1.2617558240890503e-05, -1.2106262147426605e-05, -1.1594966053962708e-05, -1.108366996049881e-05, -1.0572373867034912e-05, -1.0061077773571014e-05, -9.549781680107117e-06, -9.038485586643219e-06, -8.527189493179321e-06, -8.015893399715424e-06, -7.504597306251526e-06, -6.993301212787628e-06, -6.4820051193237305e-06, -5.970709025859833e-06, -5.459412932395935e-06, -4.948116838932037e-06, -4.43682074546814e-06, -3.925524652004242e-06, -3.4142285585403442e-06, -2.9029324650764465e-06, -2.391636371612549e-06, -1.8803402781486511e-06, -1.3690441846847534e-06, -8.577480912208557e-07, -3.46451997756958e-07, 1.648440957069397e-07, 6.761401891708374e-07, 1.1874362826347351e-06, 1.6987323760986328e-06, 2.2100284695625305e-06, 2.7213245630264282e-06, 3.232620656490326e-06, 3.7439167499542236e-06, 4.255212843418121e-06, 4.766508936882019e-06, 5.277805030345917e-06, 5.7891011238098145e-06, 6.300397217273712e-06, 6.81169331073761e-06, 7.3229894042015076e-06, 7.834285497665405e-06, 8.345581591129303e-06, 8.8568776845932e-06, 9.368173778057098e-06, 9.879469871520996e-06, 1.0390765964984894e-05, 1.0902062058448792e-05, 1.141335815191269e-05, 1.1924654245376587e-05, 1.2435950338840485e-05, 1.2947246432304382e-05, 1.345854252576828e-05, 1.3969838619232178e-05, 1.4481134712696075e-05, 1.4992430806159973e-05, 1.550372689962387e-05, 1.601502299308777e-05, 1.6526319086551666e-05, 1.7037615180015564e-05, 1.754891127347946e-05, 1.806020736694336e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 3.0, 7.0, 10.0, 13.0, 14.0, 21.0, 19.0, 44.0, 64.0, 93.0, 141.0, 220.0, 326.0, 512.0, 768.0, 1165.0, 1794.0, 2892.0, 4513.0, 7406.0, 12282.0, 21486.0, 38345.0, 71441.0, 131489.0, 206107.0, 217655.0, 146255.0, 80474.0, 43487.0, 23834.0, 13521.0, 8284.0, 5027.0, 3196.0, 2005.0, 1274.0, 825.0, 502.0, 383.0, 231.0, 137.0, 104.0, 59.0, 45.0, 28.0, 21.0, 12.0, 11.0, 6.0, 6.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.5595703125, -0.54266357421875, -0.5257568359375, -0.50885009765625, -0.491943359375, -0.47503662109375, -0.4581298828125, -0.44122314453125, -0.42431640625, -0.40740966796875, -0.3905029296875, -0.37359619140625, -0.356689453125, -0.33978271484375, -0.3228759765625, -0.30596923828125, -0.2890625, -0.27215576171875, -0.2552490234375, -0.23834228515625, -0.221435546875, -0.20452880859375, -0.1876220703125, -0.17071533203125, -0.15380859375, -0.13690185546875, -0.1199951171875, -0.10308837890625, -0.086181640625, -0.06927490234375, -0.0523681640625, -0.03546142578125, -0.0185546875, -0.00164794921875, 0.0152587890625, 0.03216552734375, 0.049072265625, 0.06597900390625, 0.0828857421875, 0.09979248046875, 0.11669921875, 0.13360595703125, 0.1505126953125, 0.16741943359375, 0.184326171875, 0.20123291015625, 0.2181396484375, 0.23504638671875, 0.251953125, 0.26885986328125, 0.2857666015625, 0.30267333984375, 0.319580078125, 0.33648681640625, 0.3533935546875, 0.37030029296875, 0.38720703125, 0.40411376953125, 0.4210205078125, 0.43792724609375, 0.454833984375, 0.47174072265625, 0.4886474609375, 0.50555419921875, 0.5224609375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 3.0, 7.0, 7.0, 10.0, 7.0, 19.0, 26.0, 21.0, 29.0, 26.0, 44.0, 61.0, 60.0, 68.0, 65.0, 92.0, 76.0, 75.0, 58.0, 54.0, 49.0, 29.0, 21.0, 19.0, 14.0, 11.0, 10.0, 9.0, 4.0, 5.0, 6.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.28173828125, -0.27376365661621094, -0.2657890319824219, -0.2578144073486328, -0.24983978271484375, -0.2418651580810547, -0.23389053344726562, -0.22591590881347656, -0.2179412841796875, -0.20996665954589844, -0.20199203491210938, -0.1940174102783203, -0.18604278564453125, -0.1780681610107422, -0.17009353637695312, -0.16211891174316406, -0.154144287109375, -0.14616966247558594, -0.13819503784179688, -0.1302204132080078, -0.12224578857421875, -0.11427116394042969, -0.10629653930664062, -0.09832191467285156, -0.0903472900390625, -0.08237266540527344, -0.07439804077148438, -0.06642341613769531, -0.05844879150390625, -0.05047416687011719, -0.042499542236328125, -0.03452491760253906, -0.02655029296875, -0.018575668334960938, -0.010601043701171875, -0.0026264190673828125, 0.00534820556640625, 0.013322830200195312, 0.021297454833984375, 0.029272079467773438, 0.0372467041015625, 0.04522132873535156, 0.053195953369140625, 0.06117057800292969, 0.06914520263671875, 0.07711982727050781, 0.08509445190429688, 0.09306907653808594, 0.101043701171875, 0.10901832580566406, 0.11699295043945312, 0.12496757507324219, 0.13294219970703125, 0.1409168243408203, 0.14889144897460938, 0.15686607360839844, 0.1648406982421875, 0.17281532287597656, 0.18078994750976562, 0.1887645721435547, 0.19673919677734375, 0.2047138214111328, 0.21268844604492188, 0.22066307067871094, 0.2286376953125]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 6.0, 5.0, 2.0, 9.0, 8.0, 10.0, 11.0, 13.0, 21.0, 19.0, 30.0, 26.0, 31.0, 35.0, 32.0, 33.0, 42.0, 36.0, 33.0, 43.0, 56.0, 52.0, 37.0, 39.0, 43.0, 41.0, 32.0, 33.0, 39.0, 29.0, 26.0, 22.0, 17.0, 21.0, 16.0, 19.0, 7.0, 3.0, 7.0, 3.0, 6.0, 4.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-35.50404739379883, -34.39483642578125, -33.285621643066406, -32.17641067504883, -31.067197799682617, -29.957984924316406, -28.848773956298828, -27.739561080932617, -26.630348205566406, -25.521135330200195, -24.411924362182617, -23.302711486816406, -22.193498611450195, -21.084285736083984, -19.975074768066406, -18.865861892700195, -17.756650924682617, -16.647438049316406, -15.538226127624512, -14.429014205932617, -13.319801330566406, -12.210589408874512, -11.101377487182617, -9.992164611816406, -8.882952690124512, -7.773740291595459, -6.664527893066406, -5.555315971374512, -4.446103572845459, -3.3368911743164062, -2.2276792526245117, -1.118466854095459, -0.00925445556640625, 1.099957823753357, 2.20917010307312, 3.3183822631835938, 4.4275946617126465, 5.536807060241699, 6.646018981933594, 7.7552313804626465, 8.8644437789917, 9.973655700683594, 11.082868576049805, 12.1920804977417, 13.301292419433594, 14.410505294799805, 15.5197172164917, 16.628929138183594, 17.738142013549805, 18.847354888916016, 19.956565856933594, 21.065778732299805, 22.174991607666016, 23.284202575683594, 24.393415451049805, 25.502628326416016, 26.611839294433594, 27.721052169799805, 28.830263137817383, 29.939476013183594, 31.048688888549805, 32.157901763916016, 33.267112731933594, 34.37632369995117, 35.485538482666016]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 5.0, 5.0, 5.0, 9.0, 11.0, 18.0, 13.0, 21.0, 17.0, 26.0, 39.0, 25.0, 32.0, 35.0, 41.0, 34.0, 32.0, 33.0, 39.0, 56.0, 44.0, 44.0, 33.0, 39.0, 41.0, 46.0, 29.0, 31.0, 33.0, 24.0, 22.0, 23.0, 18.0, 17.0, 12.0, 7.0, 11.0, 8.0, 8.0, 8.0, 2.0, 2.0, 1.0, 2.0, 2.0], "bins": [-53.72690200805664, -52.34080123901367, -50.9547004699707, -49.568599700927734, -48.182498931884766, -46.79640197753906, -45.410301208496094, -44.024200439453125, -42.638099670410156, -41.25199890136719, -39.86589813232422, -38.47979736328125, -37.09369659423828, -35.70759582519531, -34.321495056152344, -32.93539810180664, -31.54929542541504, -30.16319465637207, -28.7770938873291, -27.390995025634766, -26.004894256591797, -24.618793487548828, -23.23269271850586, -21.84659194946289, -20.460491180419922, -19.074390411376953, -17.688289642333984, -16.302188873291016, -14.91609001159668, -13.529989242553711, -12.143888473510742, -10.75778865814209, -9.371688842773438, -7.985588550567627, -6.599488258361816, -5.213387489318848, -3.827287197113037, -2.4411869049072266, -1.0550861358642578, 0.33101367950439453, 1.7171144485473633, 3.103214740753174, 4.489315032958984, 5.875415802001953, 7.261516094207764, 8.647616386413574, 10.033717155456543, 11.419816970825195, 12.805917739868164, 14.192018508911133, 15.578118324279785, 16.964218139648438, 18.350318908691406, 19.736419677734375, 21.122520446777344, 22.508621215820312, 23.89472198486328, 25.28082275390625, 26.66692352294922, 28.053024291992188, 29.439123153686523, 30.825223922729492, 32.211326599121094, 33.5974235534668, 34.983524322509766]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [5.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 12.0, 11.0, 13.0, 35.0, 55.0, 83.0, 135.0, 187.0, 325.0, 501.0, 761.0, 1295.0, 2123.0, 3268.0, 5131.0, 7825.0, 11843.0, 17423.0, 24771.0, 34538.0, 46498.0, 59000.0, 71773.0, 84150.0, 92335.0, 94939.0, 93136.0, 86556.0, 75515.0, 62891.0, 49203.0, 37592.0, 27384.0, 19249.0, 13222.0, 8764.0, 5765.0, 3743.0, 2426.0, 1532.0, 983.0, 601.0, 339.0, 235.0, 153.0, 90.0, 57.0, 26.0, 21.0, 12.0, 16.0, 7.0, 5.0, 1.0, 1.0, 1.0, 2.0], "bins": [-15.9765625, -15.487060546875, -14.99755859375, -14.508056640625, -14.0185546875, -13.529052734375, -13.03955078125, -12.550048828125, -12.060546875, -11.571044921875, -11.08154296875, -10.592041015625, -10.1025390625, -9.613037109375, -9.12353515625, -8.634033203125, -8.14453125, -7.655029296875, -7.16552734375, -6.676025390625, -6.1865234375, -5.697021484375, -5.20751953125, -4.718017578125, -4.228515625, -3.739013671875, -3.24951171875, -2.760009765625, -2.2705078125, -1.781005859375, -1.29150390625, -0.802001953125, -0.3125, 0.177001953125, 0.66650390625, 1.156005859375, 1.6455078125, 2.135009765625, 2.62451171875, 3.114013671875, 3.603515625, 4.093017578125, 4.58251953125, 5.072021484375, 5.5615234375, 6.051025390625, 6.54052734375, 7.030029296875, 7.51953125, 8.009033203125, 8.49853515625, 8.988037109375, 9.4775390625, 9.967041015625, 10.45654296875, 10.946044921875, 11.435546875, 11.925048828125, 12.41455078125, 12.904052734375, 13.3935546875, 13.883056640625, 14.37255859375, 14.862060546875, 15.3515625]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 6.0, 4.0, 6.0, 9.0, 11.0, 15.0, 17.0, 19.0, 12.0, 31.0, 40.0, 20.0, 37.0, 31.0, 43.0, 32.0, 35.0, 34.0, 37.0, 56.0, 45.0, 43.0, 32.0, 40.0, 38.0, 46.0, 29.0, 37.0, 30.0, 24.0, 25.0, 20.0, 19.0, 16.0, 14.0, 6.0, 11.0, 9.0, 7.0, 8.0, 3.0, 1.0, 2.0, 2.0, 2.0], "bins": [-53.21875, -51.84814453125, -50.4775390625, -49.10693359375, -47.736328125, -46.36572265625, -44.9951171875, -43.62451171875, -42.25390625, -40.88330078125, -39.5126953125, -38.14208984375, -36.771484375, -35.40087890625, -34.0302734375, -32.65966796875, -31.2890625, -29.91845703125, -28.5478515625, -27.17724609375, -25.806640625, -24.43603515625, -23.0654296875, -21.69482421875, -20.32421875, -18.95361328125, -17.5830078125, -16.21240234375, -14.841796875, -13.47119140625, -12.1005859375, -10.72998046875, -9.359375, -7.98876953125, -6.6181640625, -5.24755859375, -3.876953125, -2.50634765625, -1.1357421875, 0.23486328125, 1.60546875, 2.97607421875, 4.3466796875, 5.71728515625, 7.087890625, 8.45849609375, 9.8291015625, 11.19970703125, 12.5703125, 13.94091796875, 15.3115234375, 16.68212890625, 18.052734375, 19.42333984375, 20.7939453125, 22.16455078125, 23.53515625, 24.90576171875, 26.2763671875, 27.64697265625, 29.017578125, 30.38818359375, 31.7587890625, 33.12939453125, 34.5]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 7.0, 7.0, 19.0, 27.0, 44.0, 57.0, 113.0, 156.0, 310.0, 490.0, 747.0, 1234.0, 2055.0, 3302.0, 5102.0, 7929.0, 12564.0, 18386.0, 26538.0, 37237.0, 50387.0, 64859.0, 78628.0, 91073.0, 98131.0, 99618.0, 95278.0, 85028.0, 72263.0, 57267.0, 43694.0, 31601.0, 22234.0, 14935.0, 9973.0, 6403.0, 3991.0, 2552.0, 1620.0, 1055.0, 607.0, 410.0, 243.0, 134.0, 90.0, 59.0, 35.0, 23.0, 18.0, 5.0, 13.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.203125, -16.669677734375, -16.13623046875, -15.602783203125, -15.0693359375, -14.535888671875, -14.00244140625, -13.468994140625, -12.935546875, -12.402099609375, -11.86865234375, -11.335205078125, -10.8017578125, -10.268310546875, -9.73486328125, -9.201416015625, -8.66796875, -8.134521484375, -7.60107421875, -7.067626953125, -6.5341796875, -6.000732421875, -5.46728515625, -4.933837890625, -4.400390625, -3.866943359375, -3.33349609375, -2.800048828125, -2.2666015625, -1.733154296875, -1.19970703125, -0.666259765625, -0.1328125, 0.400634765625, 0.93408203125, 1.467529296875, 2.0009765625, 2.534423828125, 3.06787109375, 3.601318359375, 4.134765625, 4.668212890625, 5.20166015625, 5.735107421875, 6.2685546875, 6.802001953125, 7.33544921875, 7.868896484375, 8.40234375, 8.935791015625, 9.46923828125, 10.002685546875, 10.5361328125, 11.069580078125, 11.60302734375, 12.136474609375, 12.669921875, 13.203369140625, 13.73681640625, 14.270263671875, 14.8037109375, 15.337158203125, 15.87060546875, 16.404052734375, 16.9375]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 5.0, 3.0, 3.0, 14.0, 11.0, 16.0, 21.0, 12.0, 25.0, 25.0, 25.0, 25.0, 30.0, 38.0, 33.0, 49.0, 44.0, 49.0, 45.0, 29.0, 55.0, 35.0, 43.0, 48.0, 41.0, 34.0, 29.0, 25.0, 31.0, 26.0, 22.0, 19.0, 14.0, 19.0, 11.0, 10.0, 6.0, 11.0, 8.0, 5.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.046875, -25.15869140625, -24.2705078125, -23.38232421875, -22.494140625, -21.60595703125, -20.7177734375, -19.82958984375, -18.94140625, -18.05322265625, -17.1650390625, -16.27685546875, -15.388671875, -14.50048828125, -13.6123046875, -12.72412109375, -11.8359375, -10.94775390625, -10.0595703125, -9.17138671875, -8.283203125, -7.39501953125, -6.5068359375, -5.61865234375, -4.73046875, -3.84228515625, -2.9541015625, -2.06591796875, -1.177734375, -0.28955078125, 0.5986328125, 1.48681640625, 2.375, 3.26318359375, 4.1513671875, 5.03955078125, 5.927734375, 6.81591796875, 7.7041015625, 8.59228515625, 9.48046875, 10.36865234375, 11.2568359375, 12.14501953125, 13.033203125, 13.92138671875, 14.8095703125, 15.69775390625, 16.5859375, 17.47412109375, 18.3623046875, 19.25048828125, 20.138671875, 21.02685546875, 21.9150390625, 22.80322265625, 23.69140625, 24.57958984375, 25.4677734375, 26.35595703125, 27.244140625, 28.13232421875, 29.0205078125, 29.90869140625, 30.796875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 7.0, 4.0, 7.0, 15.0, 17.0, 26.0, 47.0, 65.0, 83.0, 153.0, 227.0, 387.0, 696.0, 1181.0, 2041.0, 3665.0, 6547.0, 11693.0, 20634.0, 34020.0, 52826.0, 77988.0, 104088.0, 125384.0, 134468.0, 128573.0, 109532.0, 83884.0, 58389.0, 38127.0, 22944.0, 13461.0, 7426.0, 4208.0, 2447.0, 1340.0, 739.0, 476.0, 282.0, 145.0, 101.0, 70.0, 60.0, 29.0, 23.0, 13.0, 11.0, 4.0, 5.0, 3.0, 2.0, 5.0, 1.0], "bins": [-9.1953125, -8.9371337890625, -8.678955078125, -8.4207763671875, -8.16259765625, -7.9044189453125, -7.646240234375, -7.3880615234375, -7.1298828125, -6.8717041015625, -6.613525390625, -6.3553466796875, -6.09716796875, -5.8389892578125, -5.580810546875, -5.3226318359375, -5.064453125, -4.8062744140625, -4.548095703125, -4.2899169921875, -4.03173828125, -3.7735595703125, -3.515380859375, -3.2572021484375, -2.9990234375, -2.7408447265625, -2.482666015625, -2.2244873046875, -1.96630859375, -1.7081298828125, -1.449951171875, -1.1917724609375, -0.93359375, -0.6754150390625, -0.417236328125, -0.1590576171875, 0.09912109375, 0.3572998046875, 0.615478515625, 0.8736572265625, 1.1318359375, 1.3900146484375, 1.648193359375, 1.9063720703125, 2.16455078125, 2.4227294921875, 2.680908203125, 2.9390869140625, 3.197265625, 3.4554443359375, 3.713623046875, 3.9718017578125, 4.22998046875, 4.4881591796875, 4.746337890625, 5.0045166015625, 5.2626953125, 5.5208740234375, 5.779052734375, 6.0372314453125, 6.29541015625, 6.5535888671875, 6.811767578125, 7.0699462890625, 7.328125]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 7.0, 5.0, 7.0, 8.0, 6.0, 16.0, 12.0, 21.0, 19.0, 26.0, 29.0, 27.0, 30.0, 32.0, 35.0, 48.0, 44.0, 50.0, 52.0, 36.0, 38.0, 48.0, 41.0, 54.0, 37.0, 45.0, 26.0, 34.0, 25.0, 30.0, 17.0, 21.0, 18.0, 8.0, 11.0, 12.0, 8.0, 8.0, 6.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006899833679199219, -0.0006648823618888855, -0.0006397813558578491, -0.0006146803498268127, -0.0005895793437957764, -0.00056447833776474, -0.0005393773317337036, -0.0005142763257026672, -0.0004891753196716309, -0.0004640743136405945, -0.0004389733076095581, -0.00041387230157852173, -0.00038877129554748535, -0.000363670289516449, -0.0003385692834854126, -0.0003134682774543762, -0.00028836727142333984, -0.00026326626539230347, -0.0002381652593612671, -0.0002130642533302307, -0.00018796324729919434, -0.00016286224126815796, -0.00013776123523712158, -0.0001126602292060852, -8.755922317504883e-05, -6.245821714401245e-05, -3.7357211112976074e-05, -1.2256205081939697e-05, 1.284480094909668e-05, 3.794580698013306e-05, 6.304681301116943e-05, 8.814781904220581e-05, 0.00011324882507324219, 0.00013834983110427856, 0.00016345083713531494, 0.00018855184316635132, 0.0002136528491973877, 0.00023875385522842407, 0.00026385486125946045, 0.0002889558672904968, 0.0003140568733215332, 0.0003391578793525696, 0.00036425888538360596, 0.00038935989141464233, 0.0004144608974456787, 0.0004395619034767151, 0.00046466290950775146, 0.0004897639155387878, 0.0005148649215698242, 0.0005399659276008606, 0.000565066933631897, 0.0005901679396629333, 0.0006152689456939697, 0.0006403699517250061, 0.0006654709577560425, 0.0006905719637870789, 0.0007156729698181152, 0.0007407739758491516, 0.000765874981880188, 0.0007909759879112244, 0.0008160769939422607, 0.0008411779999732971, 0.0008662790060043335, 0.0008913800120353699, 0.0009164810180664062]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 6.0, 8.0, 7.0, 16.0, 18.0, 33.0, 47.0, 52.0, 84.0, 149.0, 225.0, 452.0, 793.0, 1500.0, 2693.0, 4888.0, 9231.0, 16798.0, 29890.0, 48584.0, 75397.0, 105910.0, 131392.0, 143805.0, 136874.0, 115478.0, 85783.0, 57478.0, 35644.0, 20319.0, 11587.0, 6001.0, 3379.0, 1783.0, 972.0, 520.0, 300.0, 175.0, 102.0, 48.0, 44.0, 25.0, 25.0, 13.0, 6.0, 6.0, 8.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.0234375, -8.738525390625, -8.45361328125, -8.168701171875, -7.8837890625, -7.598876953125, -7.31396484375, -7.029052734375, -6.744140625, -6.459228515625, -6.17431640625, -5.889404296875, -5.6044921875, -5.319580078125, -5.03466796875, -4.749755859375, -4.46484375, -4.179931640625, -3.89501953125, -3.610107421875, -3.3251953125, -3.040283203125, -2.75537109375, -2.470458984375, -2.185546875, -1.900634765625, -1.61572265625, -1.330810546875, -1.0458984375, -0.760986328125, -0.47607421875, -0.191162109375, 0.09375, 0.378662109375, 0.66357421875, 0.948486328125, 1.2333984375, 1.518310546875, 1.80322265625, 2.088134765625, 2.373046875, 2.657958984375, 2.94287109375, 3.227783203125, 3.5126953125, 3.797607421875, 4.08251953125, 4.367431640625, 4.65234375, 4.937255859375, 5.22216796875, 5.507080078125, 5.7919921875, 6.076904296875, 6.36181640625, 6.646728515625, 6.931640625, 7.216552734375, 7.50146484375, 7.786376953125, 8.0712890625, 8.356201171875, 8.64111328125, 8.926025390625, 9.2109375]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 4.0, 16.0, 10.0, 15.0, 21.0, 21.0, 33.0, 29.0, 39.0, 39.0, 41.0, 42.0, 46.0, 56.0, 56.0, 55.0, 53.0, 54.0, 48.0, 63.0, 44.0, 44.0, 31.0, 28.0, 19.0, 21.0, 9.0, 9.0, 12.0, 8.0, 8.0, 10.0, 6.0, 2.0, 1.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.759765625, -3.637603759765625, -3.51544189453125, -3.393280029296875, -3.2711181640625, -3.148956298828125, -3.02679443359375, -2.904632568359375, -2.782470703125, -2.660308837890625, -2.53814697265625, -2.415985107421875, -2.2938232421875, -2.171661376953125, -2.04949951171875, -1.927337646484375, -1.80517578125, -1.683013916015625, -1.56085205078125, -1.438690185546875, -1.3165283203125, -1.194366455078125, -1.07220458984375, -0.950042724609375, -0.827880859375, -0.705718994140625, -0.58355712890625, -0.461395263671875, -0.3392333984375, -0.217071533203125, -0.09490966796875, 0.027252197265625, 0.1494140625, 0.271575927734375, 0.39373779296875, 0.515899658203125, 0.6380615234375, 0.760223388671875, 0.88238525390625, 1.004547119140625, 1.126708984375, 1.248870849609375, 1.37103271484375, 1.493194580078125, 1.6153564453125, 1.737518310546875, 1.85968017578125, 1.981842041015625, 2.10400390625, 2.226165771484375, 2.34832763671875, 2.470489501953125, 2.5926513671875, 2.714813232421875, 2.83697509765625, 2.959136962890625, 3.081298828125, 3.203460693359375, 3.32562255859375, 3.447784423828125, 3.5699462890625, 3.692108154296875, 3.81427001953125, 3.936431884765625, 4.05859375]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 3.0, 3.0, 4.0, 7.0, 6.0, 4.0, 12.0, 15.0, 16.0, 18.0, 23.0, 23.0, 26.0, 33.0, 24.0, 28.0, 37.0, 41.0, 33.0, 39.0, 40.0, 42.0, 39.0, 38.0, 41.0, 37.0, 43.0, 34.0, 34.0, 29.0, 38.0, 31.0, 30.0, 20.0, 14.0, 12.0, 12.0, 20.0, 12.0, 14.0, 5.0, 5.0, 9.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-32.835514068603516, -31.792724609375, -30.749935150146484, -29.70714569091797, -28.664356231689453, -27.621566772460938, -26.57877540588379, -25.535985946655273, -24.493196487426758, -23.450407028198242, -22.407617568969727, -21.36482810974121, -20.322036743164062, -19.279247283935547, -18.23645782470703, -17.193668365478516, -16.15087890625, -15.108089447021484, -14.065299987792969, -13.022509574890137, -11.979720115661621, -10.936930656433105, -9.894140243530273, -8.851350784301758, -7.808561325073242, -6.765771865844727, -5.722981929779053, -4.680191993713379, -3.6374025344848633, -2.5946130752563477, -1.5518231391906738, -0.509033203125, 0.5337562561035156, 1.5765459537506104, 2.619335651397705, 3.6621253490448, 4.7049150466918945, 5.74770450592041, 6.790494441986084, 7.833284378051758, 8.876073837280273, 9.918863296508789, 10.961652755737305, 12.004443168640137, 13.047232627868652, 14.090022087097168, 15.1328125, 16.175601959228516, 17.21839141845703, 18.261180877685547, 19.303970336914062, 20.346759796142578, 21.389549255371094, 22.43233871459961, 23.475130081176758, 24.517919540405273, 25.56070899963379, 26.603498458862305, 27.64628791809082, 28.689077377319336, 29.731868743896484, 30.774658203125, 31.817447662353516, 32.86023712158203, 33.90302658081055]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 4.0, 3.0, 3.0, 5.0, 8.0, 7.0, 14.0, 12.0, 14.0, 18.0, 21.0, 23.0, 15.0, 24.0, 18.0, 26.0, 26.0, 41.0, 30.0, 40.0, 43.0, 39.0, 36.0, 32.0, 31.0, 42.0, 39.0, 31.0, 33.0, 41.0, 33.0, 44.0, 26.0, 27.0, 22.0, 15.0, 10.0, 18.0, 20.0, 15.0, 6.0, 8.0, 13.0, 6.0, 5.0, 9.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0], "bins": [-50.01160430908203, -48.61640930175781, -47.221214294433594, -45.826019287109375, -44.430824279785156, -43.03562927246094, -41.64043426513672, -40.245243072509766, -38.85004806518555, -37.45485305786133, -36.05965805053711, -34.66446304321289, -33.26926803588867, -31.874074935913086, -30.478879928588867, -29.08368682861328, -27.68848991394043, -26.29329490661621, -24.898099899291992, -23.502906799316406, -22.107711791992188, -20.71251678466797, -19.31732177734375, -17.92212677001953, -16.526931762695312, -15.131736755371094, -13.736542701721191, -12.341347694396973, -10.94615364074707, -9.550958633422852, -8.155763626098633, -6.7605695724487305, -5.365375518798828, -3.9701809883117676, -2.574986219406128, -1.1797914505004883, 0.21540307998657227, 1.6105976104736328, 3.0057926177978516, 4.400986671447754, 5.796181678771973, 7.191376209259033, 8.586570739746094, 9.981765747070312, 11.376960754394531, 12.772154808044434, 14.167349815368652, 15.562543869018555, 16.957738876342773, 18.352933883666992, 19.74812889099121, 21.143321990966797, 22.538516998291016, 23.933712005615234, 25.328907012939453, 26.724102020263672, 28.11929702758789, 29.51449203491211, 30.909687042236328, 32.30488204956055, 33.700077056884766, 35.09526824951172, 36.49046325683594, 37.885658264160156, 39.280853271484375]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 6.0, 12.0, 16.0, 20.0, 48.0, 50.0, 107.0, 149.0, 262.0, 482.0, 743.0, 1162.0, 1808.0, 3016.0, 4738.0, 7412.0, 11390.0, 17414.0, 26322.0, 38462.0, 56296.0, 80839.0, 110665.0, 150078.0, 193740.0, 241458.0, 290291.0, 330646.0, 358712.0, 367577.0, 356017.0, 329162.0, 287779.0, 240339.0, 191130.0, 147393.0, 108410.0, 78359.0, 54603.0, 37155.0, 25038.0, 16574.0, 10438.0, 6797.0, 4326.0, 2685.0, 1666.0, 1014.0, 576.0, 382.0, 207.0, 135.0, 77.0, 50.0, 23.0, 22.0, 11.0, 5.0, 1.0, 1.0, 3.0], "bins": [-26.6875, -25.865234375, -25.04296875, -24.220703125, -23.3984375, -22.576171875, -21.75390625, -20.931640625, -20.109375, -19.287109375, -18.46484375, -17.642578125, -16.8203125, -15.998046875, -15.17578125, -14.353515625, -13.53125, -12.708984375, -11.88671875, -11.064453125, -10.2421875, -9.419921875, -8.59765625, -7.775390625, -6.953125, -6.130859375, -5.30859375, -4.486328125, -3.6640625, -2.841796875, -2.01953125, -1.197265625, -0.375, 0.447265625, 1.26953125, 2.091796875, 2.9140625, 3.736328125, 4.55859375, 5.380859375, 6.203125, 7.025390625, 7.84765625, 8.669921875, 9.4921875, 10.314453125, 11.13671875, 11.958984375, 12.78125, 13.603515625, 14.42578125, 15.248046875, 16.0703125, 16.892578125, 17.71484375, 18.537109375, 19.359375, 20.181640625, 21.00390625, 21.826171875, 22.6484375, 23.470703125, 24.29296875, 25.115234375, 25.9375]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 5.0, 2.0, 2.0, 3.0, 9.0, 6.0, 15.0, 10.0, 11.0, 18.0, 19.0, 20.0, 20.0, 21.0, 23.0, 18.0, 32.0, 27.0, 41.0, 34.0, 44.0, 41.0, 34.0, 35.0, 31.0, 39.0, 42.0, 29.0, 40.0, 35.0, 34.0, 42.0, 31.0, 27.0, 19.0, 23.0, 9.0, 19.0, 20.0, 17.0, 8.0, 6.0, 14.0, 6.0, 6.0, 8.0, 5.0, 5.0, 1.0, 2.0, 2.0, 2.0], "bins": [-48.0625, -46.7353515625, -45.408203125, -44.0810546875, -42.75390625, -41.4267578125, -40.099609375, -38.7724609375, -37.4453125, -36.1181640625, -34.791015625, -33.4638671875, -32.13671875, -30.8095703125, -29.482421875, -28.1552734375, -26.828125, -25.5009765625, -24.173828125, -22.8466796875, -21.51953125, -20.1923828125, -18.865234375, -17.5380859375, -16.2109375, -14.8837890625, -13.556640625, -12.2294921875, -10.90234375, -9.5751953125, -8.248046875, -6.9208984375, -5.59375, -4.2666015625, -2.939453125, -1.6123046875, -0.28515625, 1.0419921875, 2.369140625, 3.6962890625, 5.0234375, 6.3505859375, 7.677734375, 9.0048828125, 10.33203125, 11.6591796875, 12.986328125, 14.3134765625, 15.640625, 16.9677734375, 18.294921875, 19.6220703125, 20.94921875, 22.2763671875, 23.603515625, 24.9306640625, 26.2578125, 27.5849609375, 28.912109375, 30.2392578125, 31.56640625, 32.8935546875, 34.220703125, 35.5478515625, 36.875]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 6.0, 4.0, 13.0, 23.0, 42.0, 45.0, 103.0, 177.0, 246.0, 385.0, 723.0, 1008.0, 1676.0, 2719.0, 4355.0, 6990.0, 11178.0, 17764.0, 27059.0, 41482.0, 62135.0, 89205.0, 126135.0, 170828.0, 223160.0, 277377.0, 326556.0, 364033.0, 383278.0, 381841.0, 357329.0, 316409.0, 265468.0, 211636.0, 160239.0, 117513.0, 82750.0, 56659.0, 38080.0, 24808.0, 15813.0, 10078.0, 6407.0, 3988.0, 2458.0, 1599.0, 947.0, 619.0, 380.0, 226.0, 130.0, 67.0, 46.0, 45.0, 26.0, 18.0, 6.0, 2.0, 4.0, 0.0, 3.0], "bins": [-29.828125, -28.892822265625, -27.95751953125, -27.022216796875, -26.0869140625, -25.151611328125, -24.21630859375, -23.281005859375, -22.345703125, -21.410400390625, -20.47509765625, -19.539794921875, -18.6044921875, -17.669189453125, -16.73388671875, -15.798583984375, -14.86328125, -13.927978515625, -12.99267578125, -12.057373046875, -11.1220703125, -10.186767578125, -9.25146484375, -8.316162109375, -7.380859375, -6.445556640625, -5.51025390625, -4.574951171875, -3.6396484375, -2.704345703125, -1.76904296875, -0.833740234375, 0.1015625, 1.036865234375, 1.97216796875, 2.907470703125, 3.8427734375, 4.778076171875, 5.71337890625, 6.648681640625, 7.583984375, 8.519287109375, 9.45458984375, 10.389892578125, 11.3251953125, 12.260498046875, 13.19580078125, 14.131103515625, 15.06640625, 16.001708984375, 16.93701171875, 17.872314453125, 18.8076171875, 19.742919921875, 20.67822265625, 21.613525390625, 22.548828125, 23.484130859375, 24.41943359375, 25.354736328125, 26.2900390625, 27.225341796875, 28.16064453125, 29.095947265625, 30.03125]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 8.0, 9.0, 8.0, 3.0, 15.0, 23.0, 22.0, 25.0, 29.0, 38.0, 46.0, 62.0, 88.0, 94.0, 100.0, 121.0, 144.0, 162.0, 150.0, 178.0, 195.0, 185.0, 202.0, 166.0, 185.0, 191.0, 188.0, 182.0, 151.0, 173.0, 160.0, 133.0, 97.0, 94.0, 76.0, 79.0, 59.0, 54.0, 48.0, 34.0, 19.0, 18.0, 15.0, 13.0, 14.0, 7.0, 5.0, 5.0, 5.0, 1.0, 5.0, 1.0, 1.0, 1.0], "bins": [-20.75, -20.132080078125, -19.51416015625, -18.896240234375, -18.2783203125, -17.660400390625, -17.04248046875, -16.424560546875, -15.806640625, -15.188720703125, -14.57080078125, -13.952880859375, -13.3349609375, -12.717041015625, -12.09912109375, -11.481201171875, -10.86328125, -10.245361328125, -9.62744140625, -9.009521484375, -8.3916015625, -7.773681640625, -7.15576171875, -6.537841796875, -5.919921875, -5.302001953125, -4.68408203125, -4.066162109375, -3.4482421875, -2.830322265625, -2.21240234375, -1.594482421875, -0.9765625, -0.358642578125, 0.25927734375, 0.877197265625, 1.4951171875, 2.113037109375, 2.73095703125, 3.348876953125, 3.966796875, 4.584716796875, 5.20263671875, 5.820556640625, 6.4384765625, 7.056396484375, 7.67431640625, 8.292236328125, 8.91015625, 9.528076171875, 10.14599609375, 10.763916015625, 11.3818359375, 11.999755859375, 12.61767578125, 13.235595703125, 13.853515625, 14.471435546875, 15.08935546875, 15.707275390625, 16.3251953125, 16.943115234375, 17.56103515625, 18.178955078125, 18.796875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 6.0, 8.0, 6.0, 12.0, 12.0, 12.0, 16.0, 18.0, 18.0, 22.0, 27.0, 34.0, 38.0, 43.0, 43.0, 34.0, 47.0, 65.0, 49.0, 57.0, 51.0, 52.0, 39.0, 40.0, 33.0, 41.0, 30.0, 37.0, 12.0, 21.0, 22.0, 16.0, 14.0, 6.0, 5.0, 6.0, 5.0, 3.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-57.26791763305664, -55.61261749267578, -53.957313537597656, -52.3020133972168, -50.64671325683594, -48.99141311645508, -47.33611297607422, -45.680809020996094, -44.025508880615234, -42.370208740234375, -40.71490478515625, -39.05960464477539, -37.40430450439453, -35.74900436401367, -34.09370422363281, -32.43840026855469, -30.783100128173828, -29.12779998779297, -27.472497940063477, -25.817195892333984, -24.161895751953125, -22.506595611572266, -20.851293563842773, -19.19599151611328, -17.540691375732422, -15.885390281677246, -14.23008918762207, -12.574788093566895, -10.919486999511719, -9.264185905456543, -7.608884811401367, -5.953583717346191, -4.29827880859375, -2.642977714538574, -0.9876766204833984, 0.6676244735717773, 2.322925567626953, 3.978226661682129, 5.633527755737305, 7.2888288497924805, 8.944129943847656, 10.599431037902832, 12.254732131958008, 13.910033226013184, 15.56533432006836, 17.22063446044922, 18.87593650817871, 20.531238555908203, 22.186538696289062, 23.841838836669922, 25.497140884399414, 27.152442932128906, 28.807743072509766, 30.463043212890625, 32.11834716796875, 33.77364730834961, 35.42894744873047, 37.08424758911133, 38.73954772949219, 40.39485168457031, 42.05015182495117, 43.70545196533203, 45.360755920410156, 47.016056060791016, 48.671356201171875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 5.0, 5.0, 7.0, 5.0, 7.0, 12.0, 7.0, 9.0, 16.0, 10.0, 9.0, 20.0, 26.0, 24.0, 26.0, 19.0, 28.0, 28.0, 48.0, 26.0, 33.0, 39.0, 33.0, 43.0, 43.0, 42.0, 37.0, 37.0, 32.0, 36.0, 39.0, 35.0, 26.0, 22.0, 21.0, 24.0, 18.0, 16.0, 11.0, 20.0, 13.0, 9.0, 7.0, 7.0, 6.0, 7.0, 6.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0], "bins": [-54.954036712646484, -53.337615966796875, -51.721195220947266, -50.104774475097656, -48.48835372924805, -46.87193298339844, -45.255516052246094, -43.63909149169922, -42.022674560546875, -40.406253814697266, -38.789833068847656, -37.17341232299805, -35.55699157714844, -33.94057083129883, -32.32415008544922, -30.707731246948242, -29.09130859375, -27.47488784790039, -25.85846710205078, -24.242046356201172, -22.625625610351562, -21.009204864501953, -19.392786026000977, -17.776365280151367, -16.159944534301758, -14.543523788452148, -12.927103042602539, -11.310683250427246, -9.694262504577637, -8.077841758728027, -6.461421966552734, -4.845001220703125, -3.2285804748535156, -1.6121599674224854, 0.004260540008544922, 1.620680809020996, 3.2371015548706055, 4.853522300720215, 6.469942092895508, 8.086362838745117, 9.702783584594727, 11.319204330444336, 12.935625076293945, 14.552044868469238, 16.16846466064453, 17.78488540649414, 19.40130615234375, 21.01772689819336, 22.63414764404297, 24.250568389892578, 25.866989135742188, 27.483409881591797, 29.099830627441406, 30.716251373291016, 32.332672119140625, 33.94908905029297, 35.565513610839844, 37.18193435668945, 38.79835510253906, 40.41477584838867, 42.03119659423828, 43.64761734008789, 45.2640380859375, 46.880455017089844, 48.49687576293945]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 2.0, 3.0, 9.0, 7.0, 11.0, 21.0, 34.0, 50.0, 86.0, 147.0, 238.0, 403.0, 604.0, 1001.0, 1574.0, 2435.0, 3962.0, 6195.0, 9804.0, 15205.0, 23465.0, 36136.0, 53555.0, 76723.0, 102609.0, 124803.0, 134427.0, 124615.0, 101811.0, 76042.0, 53088.0, 35236.0, 23083.0, 15183.0, 9639.0, 6044.0, 3892.0, 2368.0, 1565.0, 936.0, 563.0, 375.0, 243.0, 144.0, 95.0, 61.0, 28.0, 24.0, 12.0, 6.0, 6.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.171875, -12.72509765625, -12.2783203125, -11.83154296875, -11.384765625, -10.93798828125, -10.4912109375, -10.04443359375, -9.59765625, -9.15087890625, -8.7041015625, -8.25732421875, -7.810546875, -7.36376953125, -6.9169921875, -6.47021484375, -6.0234375, -5.57666015625, -5.1298828125, -4.68310546875, -4.236328125, -3.78955078125, -3.3427734375, -2.89599609375, -2.44921875, -2.00244140625, -1.5556640625, -1.10888671875, -0.662109375, -0.21533203125, 0.2314453125, 0.67822265625, 1.125, 1.57177734375, 2.0185546875, 2.46533203125, 2.912109375, 3.35888671875, 3.8056640625, 4.25244140625, 4.69921875, 5.14599609375, 5.5927734375, 6.03955078125, 6.486328125, 6.93310546875, 7.3798828125, 7.82666015625, 8.2734375, 8.72021484375, 9.1669921875, 9.61376953125, 10.060546875, 10.50732421875, 10.9541015625, 11.40087890625, 11.84765625, 12.29443359375, 12.7412109375, 13.18798828125, 13.634765625, 14.08154296875, 14.5283203125, 14.97509765625, 15.421875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 5.0, 3.0, 5.0, 7.0, 5.0, 8.0, 12.0, 5.0, 8.0, 17.0, 10.0, 9.0, 21.0, 28.0, 23.0, 25.0, 22.0, 28.0, 28.0, 47.0, 25.0, 33.0, 37.0, 35.0, 42.0, 46.0, 40.0, 36.0, 38.0, 31.0, 36.0, 42.0, 33.0, 25.0, 22.0, 22.0, 23.0, 20.0, 15.0, 12.0, 20.0, 12.0, 8.0, 7.0, 7.0, 6.0, 6.0, 8.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0], "bins": [-54.96875, -53.35595703125, -51.7431640625, -50.13037109375, -48.517578125, -46.90478515625, -45.2919921875, -43.67919921875, -42.06640625, -40.45361328125, -38.8408203125, -37.22802734375, -35.615234375, -34.00244140625, -32.3896484375, -30.77685546875, -29.1640625, -27.55126953125, -25.9384765625, -24.32568359375, -22.712890625, -21.10009765625, -19.4873046875, -17.87451171875, -16.26171875, -14.64892578125, -13.0361328125, -11.42333984375, -9.810546875, -8.19775390625, -6.5849609375, -4.97216796875, -3.359375, -1.74658203125, -0.1337890625, 1.47900390625, 3.091796875, 4.70458984375, 6.3173828125, 7.93017578125, 9.54296875, 11.15576171875, 12.7685546875, 14.38134765625, 15.994140625, 17.60693359375, 19.2197265625, 20.83251953125, 22.4453125, 24.05810546875, 25.6708984375, 27.28369140625, 28.896484375, 30.50927734375, 32.1220703125, 33.73486328125, 35.34765625, 36.96044921875, 38.5732421875, 40.18603515625, 41.798828125, 43.41162109375, 45.0244140625, 46.63720703125, 48.25]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 8.0, 8.0, 12.0, 7.0, 23.0, 37.0, 44.0, 71.0, 105.0, 128.0, 230.0, 338.0, 459.0, 671.0, 942.0, 1450.0, 2148.0, 3148.0, 4838.0, 7415.0, 11306.0, 18292.0, 36433.0, 856657.0, 45019.0, 21329.0, 12817.0, 8244.0, 5426.0, 3648.0, 2359.0, 1544.0, 1147.0, 698.0, 498.0, 335.0, 226.0, 150.0, 108.0, 82.0, 64.0, 24.0, 19.0, 16.0, 14.0, 4.0, 7.0, 5.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.75, -32.61083984375, -31.4716796875, -30.33251953125, -29.193359375, -28.05419921875, -26.9150390625, -25.77587890625, -24.63671875, -23.49755859375, -22.3583984375, -21.21923828125, -20.080078125, -18.94091796875, -17.8017578125, -16.66259765625, -15.5234375, -14.38427734375, -13.2451171875, -12.10595703125, -10.966796875, -9.82763671875, -8.6884765625, -7.54931640625, -6.41015625, -5.27099609375, -4.1318359375, -2.99267578125, -1.853515625, -0.71435546875, 0.4248046875, 1.56396484375, 2.703125, 3.84228515625, 4.9814453125, 6.12060546875, 7.259765625, 8.39892578125, 9.5380859375, 10.67724609375, 11.81640625, 12.95556640625, 14.0947265625, 15.23388671875, 16.373046875, 17.51220703125, 18.6513671875, 19.79052734375, 20.9296875, 22.06884765625, 23.2080078125, 24.34716796875, 25.486328125, 26.62548828125, 27.7646484375, 28.90380859375, 30.04296875, 31.18212890625, 32.3212890625, 33.46044921875, 34.599609375, 35.73876953125, 36.8779296875, 38.01708984375, 39.15625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 8.0, 13.0, 7.0, 9.0, 15.0, 12.0, 13.0, 21.0, 23.0, 18.0, 19.0, 19.0, 31.0, 24.0, 31.0, 39.0, 43.0, 43.0, 41.0, 42.0, 31.0, 39.0, 36.0, 35.0, 38.0, 34.0, 31.0, 29.0, 31.0, 30.0, 29.0, 21.0, 21.0, 27.0, 13.0, 15.0, 14.0, 6.0, 9.0, 9.0, 8.0, 4.0, 2.0, 8.0, 3.0, 4.0, 4.0, 1.0, 0.0, 2.0], "bins": [-38.71875, -37.6064453125, -36.494140625, -35.3818359375, -34.26953125, -33.1572265625, -32.044921875, -30.9326171875, -29.8203125, -28.7080078125, -27.595703125, -26.4833984375, -25.37109375, -24.2587890625, -23.146484375, -22.0341796875, -20.921875, -19.8095703125, -18.697265625, -17.5849609375, -16.47265625, -15.3603515625, -14.248046875, -13.1357421875, -12.0234375, -10.9111328125, -9.798828125, -8.6865234375, -7.57421875, -6.4619140625, -5.349609375, -4.2373046875, -3.125, -2.0126953125, -0.900390625, 0.2119140625, 1.32421875, 2.4365234375, 3.548828125, 4.6611328125, 5.7734375, 6.8857421875, 7.998046875, 9.1103515625, 10.22265625, 11.3349609375, 12.447265625, 13.5595703125, 14.671875, 15.7841796875, 16.896484375, 18.0087890625, 19.12109375, 20.2333984375, 21.345703125, 22.4580078125, 23.5703125, 24.6826171875, 25.794921875, 26.9072265625, 28.01953125, 29.1318359375, 30.244140625, 31.3564453125, 32.46875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 0.0, 3.0, 5.0, 4.0, 6.0, 13.0, 12.0, 16.0, 21.0, 32.0, 49.0, 64.0, 67.0, 91.0, 129.0, 137.0, 227.0, 275.0, 394.0, 538.0, 816.0, 1284.0, 2052.0, 3441.0, 5771.0, 10791.0, 21702.0, 54762.0, 876507.0, 33399.0, 15569.0, 8090.0, 4540.0, 2651.0, 1556.0, 1052.0, 675.0, 485.0, 335.0, 245.0, 199.0, 144.0, 98.0, 77.0, 46.0, 47.0, 34.0, 34.0, 15.0, 19.0, 12.0, 15.0, 5.0, 3.0, 2.0, 4.0, 2.0, 4.0, 0.0, 2.0], "bins": [-1.29296875, -1.252899169921875, -1.21282958984375, -1.172760009765625, -1.1326904296875, -1.092620849609375, -1.05255126953125, -1.012481689453125, -0.972412109375, -0.932342529296875, -0.89227294921875, -0.852203369140625, -0.8121337890625, -0.772064208984375, -0.73199462890625, -0.691925048828125, -0.65185546875, -0.611785888671875, -0.57171630859375, -0.531646728515625, -0.4915771484375, -0.451507568359375, -0.41143798828125, -0.371368408203125, -0.331298828125, -0.291229248046875, -0.25115966796875, -0.211090087890625, -0.1710205078125, -0.130950927734375, -0.09088134765625, -0.050811767578125, -0.0107421875, 0.029327392578125, 0.06939697265625, 0.109466552734375, 0.1495361328125, 0.189605712890625, 0.22967529296875, 0.269744873046875, 0.309814453125, 0.349884033203125, 0.38995361328125, 0.430023193359375, 0.4700927734375, 0.510162353515625, 0.55023193359375, 0.590301513671875, 0.63037109375, 0.670440673828125, 0.71051025390625, 0.750579833984375, 0.7906494140625, 0.830718994140625, 0.87078857421875, 0.910858154296875, 0.950927734375, 0.990997314453125, 1.03106689453125, 1.071136474609375, 1.1112060546875, 1.151275634765625, 1.19134521484375, 1.231414794921875, 1.271484375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 0.0, 8.0, 13.0, 8.0, 10.0, 12.0, 16.0, 18.0, 32.0, 23.0, 31.0, 41.0, 32.0, 46.0, 42.0, 28.0, 49.0, 49.0, 58.0, 52.0, 43.0, 54.0, 53.0, 37.0, 28.0, 28.0, 44.0, 20.0, 25.0, 22.0, 15.0, 14.0, 13.0, 8.0, 7.0, 7.0, 4.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9788742065429688e-05, -1.9076280295848846e-05, -1.8363818526268005e-05, -1.7651356756687164e-05, -1.6938894987106323e-05, -1.6226433217525482e-05, -1.551397144794464e-05, -1.48015096783638e-05, -1.4089047908782959e-05, -1.3376586139202118e-05, -1.2664124369621277e-05, -1.1951662600040436e-05, -1.1239200830459595e-05, -1.0526739060878754e-05, -9.814277291297913e-06, -9.101815521717072e-06, -8.38935375213623e-06, -7.67689198255539e-06, -6.964430212974548e-06, -6.251968443393707e-06, -5.539506673812866e-06, -4.827044904232025e-06, -4.114583134651184e-06, -3.402121365070343e-06, -2.689659595489502e-06, -1.977197825908661e-06, -1.2647360563278198e-06, -5.522742867469788e-07, 1.601874828338623e-07, 8.726492524147034e-07, 1.5851110219955444e-06, 2.2975727915763855e-06, 3.0100345611572266e-06, 3.7224963307380676e-06, 4.434958100318909e-06, 5.14741986989975e-06, 5.859881639480591e-06, 6.572343409061432e-06, 7.284805178642273e-06, 7.997266948223114e-06, 8.709728717803955e-06, 9.422190487384796e-06, 1.0134652256965637e-05, 1.0847114026546478e-05, 1.155957579612732e-05, 1.227203756570816e-05, 1.2984499335289001e-05, 1.3696961104869843e-05, 1.4409422874450684e-05, 1.5121884644031525e-05, 1.5834346413612366e-05, 1.6546808183193207e-05, 1.7259269952774048e-05, 1.797173172235489e-05, 1.868419349193573e-05, 1.939665526151657e-05, 2.0109117031097412e-05, 2.0821578800678253e-05, 2.1534040570259094e-05, 2.2246502339839935e-05, 2.2958964109420776e-05, 2.3671425879001617e-05, 2.438388764858246e-05, 2.50963494181633e-05, 2.580881118774414e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 6.0, 10.0, 16.0, 15.0, 11.0, 46.0, 63.0, 85.0, 143.0, 186.0, 291.0, 432.0, 687.0, 1054.0, 1727.0, 2708.0, 4220.0, 6759.0, 11396.0, 19094.0, 32435.0, 58262.0, 107631.0, 185811.0, 227363.0, 169186.0, 94407.0, 51757.0, 28646.0, 16963.0, 10308.0, 6222.0, 3901.0, 2361.0, 1594.0, 932.0, 575.0, 443.0, 258.0, 177.0, 131.0, 86.0, 47.0, 44.0, 22.0, 20.0, 8.0, 9.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.7421875, -0.7199630737304688, -0.6977386474609375, -0.6755142211914062, -0.653289794921875, -0.6310653686523438, -0.6088409423828125, -0.5866165161132812, -0.56439208984375, -0.5421676635742188, -0.5199432373046875, -0.49771881103515625, -0.475494384765625, -0.45326995849609375, -0.4310455322265625, -0.40882110595703125, -0.3865966796875, -0.36437225341796875, -0.3421478271484375, -0.31992340087890625, -0.297698974609375, -0.27547454833984375, -0.2532501220703125, -0.23102569580078125, -0.20880126953125, -0.18657684326171875, -0.1643524169921875, -0.14212799072265625, -0.119903564453125, -0.09767913818359375, -0.0754547119140625, -0.05323028564453125, -0.031005859375, -0.00878143310546875, 0.0134429931640625, 0.03566741943359375, 0.057891845703125, 0.08011627197265625, 0.1023406982421875, 0.12456512451171875, 0.14678955078125, 0.16901397705078125, 0.1912384033203125, 0.21346282958984375, 0.235687255859375, 0.25791168212890625, 0.2801361083984375, 0.30236053466796875, 0.3245849609375, 0.34680938720703125, 0.3690338134765625, 0.39125823974609375, 0.413482666015625, 0.43570709228515625, 0.4579315185546875, 0.48015594482421875, 0.50238037109375, 0.5246047973632812, 0.5468292236328125, 0.5690536499023438, 0.591278076171875, 0.6135025024414062, 0.6357269287109375, 0.6579513549804688, 0.68017578125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 6.0, 2.0, 2.0, 4.0, 4.0, 6.0, 14.0, 10.0, 15.0, 20.0, 19.0, 33.0, 32.0, 48.0, 56.0, 68.0, 61.0, 74.0, 57.0, 55.0, 70.0, 73.0, 51.0, 45.0, 43.0, 20.0, 29.0, 16.0, 14.0, 12.0, 7.0, 11.0, 6.0, 5.0, 3.0, 8.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.299072265625, -0.2907066345214844, -0.28234100341796875, -0.2739753723144531, -0.2656097412109375, -0.2572441101074219, -0.24887847900390625, -0.24051284790039062, -0.232147216796875, -0.22378158569335938, -0.21541595458984375, -0.20705032348632812, -0.1986846923828125, -0.19031906127929688, -0.18195343017578125, -0.17358779907226562, -0.16522216796875, -0.15685653686523438, -0.14849090576171875, -0.14012527465820312, -0.1317596435546875, -0.12339401245117188, -0.11502838134765625, -0.10666275024414062, -0.098297119140625, -0.08993148803710938, -0.08156585693359375, -0.07320022583007812, -0.0648345947265625, -0.056468963623046875, -0.04810333251953125, -0.039737701416015625, -0.0313720703125, -0.023006439208984375, -0.01464080810546875, -0.006275177001953125, 0.0020904541015625, 0.010456085205078125, 0.01882171630859375, 0.027187347412109375, 0.035552978515625, 0.043918609619140625, 0.05228424072265625, 0.060649871826171875, 0.0690155029296875, 0.07738113403320312, 0.08574676513671875, 0.09411239624023438, 0.10247802734375, 0.11084365844726562, 0.11920928955078125, 0.12757492065429688, 0.1359405517578125, 0.14430618286132812, 0.15267181396484375, 0.16103744506835938, 0.169403076171875, 0.17776870727539062, 0.18613433837890625, 0.19449996948242188, 0.2028656005859375, 0.21123123168945312, 0.21959686279296875, 0.22796249389648438, 0.236328125]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 5.0, 4.0, 5.0, 9.0, 12.0, 13.0, 13.0, 17.0, 14.0, 23.0, 21.0, 30.0, 32.0, 38.0, 41.0, 48.0, 45.0, 46.0, 59.0, 59.0, 49.0, 50.0, 51.0, 43.0, 35.0, 48.0, 32.0, 33.0, 27.0, 18.0, 22.0, 12.0, 20.0, 6.0, 5.0, 10.0, 5.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-60.030418395996094, -58.336402893066406, -56.64238739013672, -54.94837188720703, -53.254356384277344, -51.560340881347656, -49.86632537841797, -48.17230987548828, -46.478294372558594, -44.784278869628906, -43.09026336669922, -41.39624786376953, -39.702232360839844, -38.008216857910156, -36.31420135498047, -34.62018585205078, -32.92616653442383, -31.23215103149414, -29.538135528564453, -27.844120025634766, -26.150104522705078, -24.45608901977539, -22.76207160949707, -21.068056106567383, -19.374040603637695, -17.680025100708008, -15.98600959777832, -14.291993141174316, -12.597977638244629, -10.903962135314941, -9.209945678710938, -7.51593017578125, -5.821918487548828, -4.127902984619141, -2.433887004852295, -0.7398710250854492, 0.9541444778442383, 2.648159980773926, 4.34217643737793, 6.036191940307617, 7.730207443237305, 9.424222946166992, 11.11823844909668, 12.812254905700684, 14.506270408630371, 16.200286865234375, 17.894302368164062, 19.58831787109375, 21.282333374023438, 22.976348876953125, 24.670364379882812, 26.3643798828125, 28.058395385742188, 29.752410888671875, 31.446428298950195, 33.14044189453125, 34.83445739746094, 36.528472900390625, 38.22248840332031, 39.91650390625, 41.61051940917969, 43.304534912109375, 44.99855041503906, 46.69256591796875, 48.3865852355957]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 4.0, 5.0, 4.0, 7.0, 5.0, 8.0, 12.0, 6.0, 8.0, 17.0, 10.0, 8.0, 22.0, 28.0, 24.0, 24.0, 23.0, 25.0, 31.0, 47.0, 23.0, 34.0, 37.0, 37.0, 42.0, 47.0, 36.0, 36.0, 39.0, 32.0, 35.0, 42.0, 34.0, 24.0, 21.0, 23.0, 22.0, 21.0, 14.0, 15.0, 17.0, 12.0, 8.0, 7.0, 7.0, 7.0, 5.0, 8.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0], "bins": [-54.92332458496094, -53.31051254272461, -51.69770431518555, -50.08489227294922, -48.47208023071289, -46.85926818847656, -45.2464599609375, -43.63364791870117, -42.020835876464844, -40.408023834228516, -38.79521560668945, -37.182403564453125, -35.5695915222168, -33.95677947998047, -32.343971252441406, -30.731159210205078, -29.118350982666016, -27.50554084777832, -25.892728805541992, -24.279918670654297, -22.66710662841797, -21.054296493530273, -19.441486358642578, -17.82867431640625, -16.215864181518555, -14.603053092956543, -12.990242004394531, -11.377431869506836, -9.764620780944824, -8.151809692382812, -6.538999557495117, -4.9261884689331055, -3.313373565673828, -1.7005627155303955, -0.08775186538696289, 1.5250587463378906, 3.1378698348999023, 4.750680923461914, 6.363491058349609, 7.976302146911621, 9.589113235473633, 11.201924324035645, 12.814735412597656, 14.427545547485352, 16.040355682373047, 17.653167724609375, 19.26597785949707, 20.878787994384766, 22.491600036621094, 24.10441017150879, 25.717222213745117, 27.330032348632812, 28.94284439086914, 30.555654525756836, 32.16846466064453, 33.78127670288086, 35.39408874511719, 37.006900787353516, 38.61970901489258, 40.232521057128906, 41.845333099365234, 43.45814514160156, 45.070953369140625, 46.68376541137695, 48.296573638916016]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 8.0, 18.0, 17.0, 33.0, 48.0, 78.0, 94.0, 147.0, 240.0, 342.0, 545.0, 882.0, 1425.0, 2370.0, 3822.0, 6472.0, 10479.0, 17085.0, 27239.0, 41107.0, 59465.0, 81876.0, 102820.0, 118441.0, 123332.0, 115217.0, 99048.0, 77638.0, 55266.0, 38164.0, 24705.0, 15727.0, 9581.0, 5700.0, 3590.0, 2095.0, 1261.0, 804.0, 453.0, 328.0, 203.0, 139.0, 90.0, 62.0, 42.0, 22.0, 15.0, 11.0, 6.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.21875, -24.38916015625, -23.5595703125, -22.72998046875, -21.900390625, -21.07080078125, -20.2412109375, -19.41162109375, -18.58203125, -17.75244140625, -16.9228515625, -16.09326171875, -15.263671875, -14.43408203125, -13.6044921875, -12.77490234375, -11.9453125, -11.11572265625, -10.2861328125, -9.45654296875, -8.626953125, -7.79736328125, -6.9677734375, -6.13818359375, -5.30859375, -4.47900390625, -3.6494140625, -2.81982421875, -1.990234375, -1.16064453125, -0.3310546875, 0.49853515625, 1.328125, 2.15771484375, 2.9873046875, 3.81689453125, 4.646484375, 5.47607421875, 6.3056640625, 7.13525390625, 7.96484375, 8.79443359375, 9.6240234375, 10.45361328125, 11.283203125, 12.11279296875, 12.9423828125, 13.77197265625, 14.6015625, 15.43115234375, 16.2607421875, 17.09033203125, 17.919921875, 18.74951171875, 19.5791015625, 20.40869140625, 21.23828125, 22.06787109375, 22.8974609375, 23.72705078125, 24.556640625, 25.38623046875, 26.2158203125, 27.04541015625, 27.875]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 5.0, 5.0, 3.0, 7.0, 5.0, 8.0, 12.0, 7.0, 7.0, 17.0, 10.0, 9.0, 22.0, 29.0, 22.0, 24.0, 23.0, 26.0, 32.0, 46.0, 25.0, 32.0, 39.0, 36.0, 40.0, 48.0, 35.0, 36.0, 37.0, 34.0, 34.0, 44.0, 31.0, 29.0, 18.0, 24.0, 21.0, 21.0, 14.0, 16.0, 17.0, 11.0, 8.0, 7.0, 7.0, 7.0, 5.0, 7.0, 3.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0], "bins": [-55.1875, -53.5654296875, -51.943359375, -50.3212890625, -48.69921875, -47.0771484375, -45.455078125, -43.8330078125, -42.2109375, -40.5888671875, -38.966796875, -37.3447265625, -35.72265625, -34.1005859375, -32.478515625, -30.8564453125, -29.234375, -27.6123046875, -25.990234375, -24.3681640625, -22.74609375, -21.1240234375, -19.501953125, -17.8798828125, -16.2578125, -14.6357421875, -13.013671875, -11.3916015625, -9.76953125, -8.1474609375, -6.525390625, -4.9033203125, -3.28125, -1.6591796875, -0.037109375, 1.5849609375, 3.20703125, 4.8291015625, 6.451171875, 8.0732421875, 9.6953125, 11.3173828125, 12.939453125, 14.5615234375, 16.18359375, 17.8056640625, 19.427734375, 21.0498046875, 22.671875, 24.2939453125, 25.916015625, 27.5380859375, 29.16015625, 30.7822265625, 32.404296875, 34.0263671875, 35.6484375, 37.2705078125, 38.892578125, 40.5146484375, 42.13671875, 43.7587890625, 45.380859375, 47.0029296875, 48.625]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 8.0, 6.0, 9.0, 22.0, 29.0, 40.0, 84.0, 147.0, 208.0, 323.0, 611.0, 883.0, 1480.0, 2442.0, 4066.0, 6636.0, 11122.0, 18161.0, 30063.0, 47390.0, 70394.0, 98136.0, 123872.0, 138258.0, 134407.0, 113736.0, 86229.0, 59708.0, 38540.0, 24261.0, 14827.0, 8741.0, 5292.0, 3255.0, 1947.0, 1233.0, 767.0, 419.0, 298.0, 203.0, 113.0, 66.0, 39.0, 26.0, 25.0, 15.0, 9.0, 5.0, 8.0, 4.0, 0.0, 1.0, 0.0, 2.0], "bins": [-35.53125, -34.4794921875, -33.427734375, -32.3759765625, -31.32421875, -30.2724609375, -29.220703125, -28.1689453125, -27.1171875, -26.0654296875, -25.013671875, -23.9619140625, -22.91015625, -21.8583984375, -20.806640625, -19.7548828125, -18.703125, -17.6513671875, -16.599609375, -15.5478515625, -14.49609375, -13.4443359375, -12.392578125, -11.3408203125, -10.2890625, -9.2373046875, -8.185546875, -7.1337890625, -6.08203125, -5.0302734375, -3.978515625, -2.9267578125, -1.875, -0.8232421875, 0.228515625, 1.2802734375, 2.33203125, 3.3837890625, 4.435546875, 5.4873046875, 6.5390625, 7.5908203125, 8.642578125, 9.6943359375, 10.74609375, 11.7978515625, 12.849609375, 13.9013671875, 14.953125, 16.0048828125, 17.056640625, 18.1083984375, 19.16015625, 20.2119140625, 21.263671875, 22.3154296875, 23.3671875, 24.4189453125, 25.470703125, 26.5224609375, 27.57421875, 28.6259765625, 29.677734375, 30.7294921875, 31.78125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 2.0, 3.0, 4.0, 5.0, 8.0, 13.0, 12.0, 17.0, 13.0, 13.0, 18.0, 35.0, 20.0, 22.0, 26.0, 35.0, 45.0, 32.0, 39.0, 43.0, 30.0, 52.0, 43.0, 46.0, 46.0, 32.0, 43.0, 39.0, 35.0, 28.0, 30.0, 19.0, 23.0, 15.0, 23.0, 22.0, 18.0, 12.0, 12.0, 5.0, 6.0, 7.0, 3.0, 6.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-33.28125, -32.1279296875, -30.974609375, -29.8212890625, -28.66796875, -27.5146484375, -26.361328125, -25.2080078125, -24.0546875, -22.9013671875, -21.748046875, -20.5947265625, -19.44140625, -18.2880859375, -17.134765625, -15.9814453125, -14.828125, -13.6748046875, -12.521484375, -11.3681640625, -10.21484375, -9.0615234375, -7.908203125, -6.7548828125, -5.6015625, -4.4482421875, -3.294921875, -2.1416015625, -0.98828125, 0.1650390625, 1.318359375, 2.4716796875, 3.625, 4.7783203125, 5.931640625, 7.0849609375, 8.23828125, 9.3916015625, 10.544921875, 11.6982421875, 12.8515625, 14.0048828125, 15.158203125, 16.3115234375, 17.46484375, 18.6181640625, 19.771484375, 20.9248046875, 22.078125, 23.2314453125, 24.384765625, 25.5380859375, 26.69140625, 27.8447265625, 28.998046875, 30.1513671875, 31.3046875, 32.4580078125, 33.611328125, 34.7646484375, 35.91796875, 37.0712890625, 38.224609375, 39.3779296875, 40.53125]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 5.0, 2.0, 7.0, 9.0, 13.0, 11.0, 18.0, 17.0, 34.0, 41.0, 81.0, 118.0, 193.0, 294.0, 416.0, 704.0, 1167.0, 1893.0, 3096.0, 4998.0, 7834.0, 12532.0, 19330.0, 29050.0, 41355.0, 56362.0, 73002.0, 88237.0, 99971.0, 105580.0, 104196.0, 95370.0, 82048.0, 65676.0, 50184.0, 35811.0, 24654.0, 16214.0, 10624.0, 6739.0, 4013.0, 2549.0, 1545.0, 976.0, 573.0, 354.0, 248.0, 139.0, 95.0, 71.0, 36.0, 30.0, 17.0, 13.0, 12.0, 7.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.93359375, -7.67596435546875, -7.4183349609375, -7.16070556640625, -6.903076171875, -6.64544677734375, -6.3878173828125, -6.13018798828125, -5.87255859375, -5.61492919921875, -5.3572998046875, -5.09967041015625, -4.842041015625, -4.58441162109375, -4.3267822265625, -4.06915283203125, -3.8115234375, -3.55389404296875, -3.2962646484375, -3.03863525390625, -2.781005859375, -2.52337646484375, -2.2657470703125, -2.00811767578125, -1.75048828125, -1.49285888671875, -1.2352294921875, -0.97760009765625, -0.719970703125, -0.46234130859375, -0.2047119140625, 0.05291748046875, 0.310546875, 0.56817626953125, 0.8258056640625, 1.08343505859375, 1.341064453125, 1.59869384765625, 1.8563232421875, 2.11395263671875, 2.37158203125, 2.62921142578125, 2.8868408203125, 3.14447021484375, 3.402099609375, 3.65972900390625, 3.9173583984375, 4.17498779296875, 4.4326171875, 4.69024658203125, 4.9478759765625, 5.20550537109375, 5.463134765625, 5.72076416015625, 5.9783935546875, 6.23602294921875, 6.49365234375, 6.75128173828125, 7.0089111328125, 7.26654052734375, 7.524169921875, 7.78179931640625, 8.0394287109375, 8.29705810546875, 8.5546875]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 9.0, 5.0, 3.0, 4.0, 7.0, 8.0, 11.0, 13.0, 8.0, 18.0, 10.0, 22.0, 27.0, 35.0, 37.0, 37.0, 36.0, 48.0, 35.0, 35.0, 40.0, 44.0, 44.0, 46.0, 55.0, 37.0, 39.0, 27.0, 35.0, 41.0, 24.0, 22.0, 20.0, 19.0, 15.0, 22.0, 10.0, 14.0, 12.0, 6.0, 9.0, 9.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0010662078857421875, -0.0010330677032470703, -0.0009999275207519531, -0.0009667873382568359, -0.0009336471557617188, -0.0009005069732666016, -0.0008673667907714844, -0.0008342266082763672, -0.00080108642578125, -0.0007679462432861328, -0.0007348060607910156, -0.0007016658782958984, -0.0006685256958007812, -0.0006353855133056641, -0.0006022453308105469, -0.0005691051483154297, -0.0005359649658203125, -0.0005028247833251953, -0.0004696846008300781, -0.00043654441833496094, -0.00040340423583984375, -0.00037026405334472656, -0.0003371238708496094, -0.0003039836883544922, -0.000270843505859375, -0.0002377033233642578, -0.00020456314086914062, -0.00017142295837402344, -0.00013828277587890625, -0.00010514259338378906, -7.200241088867188e-05, -3.886222839355469e-05, -5.7220458984375e-06, 2.7418136596679688e-05, 6.0558319091796875e-05, 9.369850158691406e-05, 0.00012683868408203125, 0.00015997886657714844, 0.00019311904907226562, 0.0002262592315673828, 0.0002593994140625, 0.0002925395965576172, 0.0003256797790527344, 0.00035881996154785156, 0.00039196014404296875, 0.00042510032653808594, 0.0004582405090332031, 0.0004913806915283203, 0.0005245208740234375, 0.0005576610565185547, 0.0005908012390136719, 0.0006239414215087891, 0.0006570816040039062, 0.0006902217864990234, 0.0007233619689941406, 0.0007565021514892578, 0.000789642333984375, 0.0008227825164794922, 0.0008559226989746094, 0.0008890628814697266, 0.0009222030639648438, 0.0009553432464599609, 0.0009884834289550781, 0.0010216236114501953, 0.0010547637939453125]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 1.0, 5.0, 6.0, 7.0, 13.0, 16.0, 16.0, 29.0, 31.0, 54.0, 78.0, 103.0, 161.0, 275.0, 487.0, 832.0, 1300.0, 2357.0, 4333.0, 7744.0, 13740.0, 23801.0, 39035.0, 60527.0, 86556.0, 112537.0, 130810.0, 136114.0, 125261.0, 101764.0, 75170.0, 50247.0, 31565.0, 18776.0, 10727.0, 6029.0, 3380.0, 1933.0, 1109.0, 568.0, 366.0, 238.0, 156.0, 111.0, 59.0, 47.0, 31.0, 15.0, 11.0, 10.0, 2.0, 7.0, 5.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-10.9140625, -10.565185546875, -10.21630859375, -9.867431640625, -9.5185546875, -9.169677734375, -8.82080078125, -8.471923828125, -8.123046875, -7.774169921875, -7.42529296875, -7.076416015625, -6.7275390625, -6.378662109375, -6.02978515625, -5.680908203125, -5.33203125, -4.983154296875, -4.63427734375, -4.285400390625, -3.9365234375, -3.587646484375, -3.23876953125, -2.889892578125, -2.541015625, -2.192138671875, -1.84326171875, -1.494384765625, -1.1455078125, -0.796630859375, -0.44775390625, -0.098876953125, 0.25, 0.598876953125, 0.94775390625, 1.296630859375, 1.6455078125, 1.994384765625, 2.34326171875, 2.692138671875, 3.041015625, 3.389892578125, 3.73876953125, 4.087646484375, 4.4365234375, 4.785400390625, 5.13427734375, 5.483154296875, 5.83203125, 6.180908203125, 6.52978515625, 6.878662109375, 7.2275390625, 7.576416015625, 7.92529296875, 8.274169921875, 8.623046875, 8.971923828125, 9.32080078125, 9.669677734375, 10.0185546875, 10.367431640625, 10.71630859375, 11.065185546875, 11.4140625]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 6.0, 6.0, 3.0, 10.0, 13.0, 10.0, 12.0, 19.0, 18.0, 35.0, 41.0, 44.0, 52.0, 56.0, 72.0, 77.0, 62.0, 66.0, 77.0, 56.0, 54.0, 41.0, 33.0, 42.0, 25.0, 17.0, 13.0, 10.0, 5.0, 9.0, 7.0, 4.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.67578125, -7.46533203125, -7.2548828125, -7.04443359375, -6.833984375, -6.62353515625, -6.4130859375, -6.20263671875, -5.9921875, -5.78173828125, -5.5712890625, -5.36083984375, -5.150390625, -4.93994140625, -4.7294921875, -4.51904296875, -4.30859375, -4.09814453125, -3.8876953125, -3.67724609375, -3.466796875, -3.25634765625, -3.0458984375, -2.83544921875, -2.625, -2.41455078125, -2.2041015625, -1.99365234375, -1.783203125, -1.57275390625, -1.3623046875, -1.15185546875, -0.94140625, -0.73095703125, -0.5205078125, -0.31005859375, -0.099609375, 0.11083984375, 0.3212890625, 0.53173828125, 0.7421875, 0.95263671875, 1.1630859375, 1.37353515625, 1.583984375, 1.79443359375, 2.0048828125, 2.21533203125, 2.42578125, 2.63623046875, 2.8466796875, 3.05712890625, 3.267578125, 3.47802734375, 3.6884765625, 3.89892578125, 4.109375, 4.31982421875, 4.5302734375, 4.74072265625, 4.951171875, 5.16162109375, 5.3720703125, 5.58251953125, 5.79296875]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 7.0, 5.0, 3.0, 5.0, 13.0, 16.0, 11.0, 17.0, 23.0, 23.0, 22.0, 30.0, 36.0, 49.0, 44.0, 53.0, 54.0, 49.0, 64.0, 52.0, 52.0, 51.0, 54.0, 37.0, 39.0, 36.0, 30.0, 24.0, 31.0, 17.0, 14.0, 13.0, 11.0, 8.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-64.94465637207031, -63.11735534667969, -61.29005813598633, -59.4627571105957, -57.635459899902344, -55.80815887451172, -53.980857849121094, -52.153560638427734, -50.326263427734375, -48.49896240234375, -46.67166519165039, -44.844364166259766, -43.017066955566406, -41.18976593017578, -39.362464904785156, -37.5351676940918, -35.70786666870117, -33.88056564331055, -32.05326843261719, -30.225967407226562, -28.398670196533203, -26.571369171142578, -24.744070053100586, -22.916770935058594, -21.0894718170166, -19.26217269897461, -17.434873580932617, -15.607573509216309, -13.780274391174316, -11.952975273132324, -10.125675201416016, -8.298376083374023, -6.471073150634766, -4.643774032592773, -2.816474437713623, -0.9891748428344727, 0.8381242752075195, 2.6654233932495117, 4.49272346496582, 6.3200225830078125, 8.147321701049805, 9.974620819091797, 11.801919937133789, 13.629220008850098, 15.45651912689209, 17.283817291259766, 19.11111831665039, 20.938417434692383, 22.765716552734375, 24.593015670776367, 26.42031478881836, 28.247615814208984, 30.074913024902344, 31.90221405029297, 33.729515075683594, 35.55681228637695, 37.38410949707031, 39.21141052246094, 41.0387077331543, 42.86600875854492, 44.69330596923828, 46.520606994628906, 48.34790802001953, 50.17520523071289, 52.002506256103516]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 5.0, 3.0, 4.0, 9.0, 12.0, 10.0, 14.0, 14.0, 19.0, 17.0, 19.0, 26.0, 22.0, 23.0, 28.0, 34.0, 35.0, 35.0, 36.0, 33.0, 45.0, 39.0, 48.0, 36.0, 37.0, 45.0, 38.0, 30.0, 34.0, 28.0, 34.0, 30.0, 26.0, 22.0, 14.0, 13.0, 15.0, 16.0, 10.0, 7.0, 12.0, 4.0, 4.0, 6.0, 5.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.636932373046875, -61.700416564941406, -59.7639045715332, -57.827392578125, -55.89087677001953, -53.95436096191406, -52.01784896850586, -50.081336975097656, -48.14482116699219, -46.20830535888672, -44.271793365478516, -42.33528137207031, -40.398765563964844, -38.462249755859375, -36.52573776245117, -34.58922576904297, -32.6527099609375, -30.716196060180664, -28.779682159423828, -26.843168258666992, -24.906654357910156, -22.97014045715332, -21.033626556396484, -19.09711265563965, -17.160598754882812, -15.224084854125977, -13.28757095336914, -11.351057052612305, -9.414543151855469, -7.478029251098633, -5.541515350341797, -3.605001449584961, -1.6684837341308594, 0.26803016662597656, 2.2045440673828125, 4.141057968139648, 6.077571868896484, 8.01408576965332, 9.950599670410156, 11.887113571166992, 13.823627471923828, 15.760141372680664, 17.6966552734375, 19.633169174194336, 21.569683074951172, 23.506196975708008, 25.442710876464844, 27.37922477722168, 29.315738677978516, 31.25225257873535, 33.18876647949219, 35.125282287597656, 37.06179428100586, 38.99830627441406, 40.93482208251953, 42.871337890625, 44.8078498840332, 46.744361877441406, 48.680877685546875, 50.617393493652344, 52.55390548706055, 54.49041748046875, 56.42693328857422, 58.36344909667969, 60.29996109008789]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 6.0, 10.0, 17.0, 18.0, 26.0, 45.0, 40.0, 60.0, 97.0, 136.0, 196.0, 290.0, 341.0, 482.0, 653.0, 829.0, 1065.0, 1439.0, 1827.0, 2274.0, 2783.0, 3251.0, 3862.0, 4812.0, 1000721.0, 4991.0, 3987.0, 3386.0, 2793.0, 2300.0, 1888.0, 1480.0, 1182.0, 872.0, 653.0, 471.0, 383.0, 264.0, 185.0, 122.0, 102.0, 80.0, 56.0, 40.0, 18.0, 29.0, 20.0, 10.0, 4.0, 7.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-415.7452087402344, -402.57373046875, -389.40228271484375, -376.2308349609375, -363.0593566894531, -349.88787841796875, -336.7164306640625, -323.54498291015625, -310.3735046386719, -297.2020263671875, -284.03057861328125, -270.859130859375, -257.6876525878906, -244.5161895751953, -231.3447265625, -218.1732635498047, -205.00180053710938, -191.83033752441406, -178.65887451171875, -165.48741149902344, -152.31594848632812, -139.1444854736328, -125.9730224609375, -112.80155944824219, -99.63009643554688, -86.45863342285156, -73.28717041015625, -60.11570739746094, -46.944244384765625, -33.77278137207031, -20.601318359375, -7.4298553466796875, 5.741607666015625, 18.913070678710938, 32.08453369140625, 45.25599670410156, 58.427459716796875, 71.59892272949219, 84.7703857421875, 97.94184875488281, 111.11331176757812, 124.28477478027344, 137.45623779296875, 150.62770080566406, 163.79916381835938, 176.9706268310547, 190.14208984375, 203.3135528564453, 216.48501586914062, 229.65647888183594, 242.82794189453125, 255.99940490722656, 269.1708679199219, 282.34234619140625, 295.5137939453125, 308.68524169921875, 321.8567199707031, 335.0281982421875, 348.19964599609375, 361.37109375, 374.5425720214844, 387.71405029296875, 400.885498046875, 414.05694580078125, 427.2284240722656]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 8.0, 9.0, 14.0, 18.0, 24.0, 20.0, 30.0, 48.0, 70.0, 102.0, 190.0, 326.0, 623.0, 1038.0, 1880.0, 3605.0, 6820.0, 12820.0, 22376.0, 36227.0, 50954912.0, 349363.0, 33817.0, 20854.0, 11990.0, 6423.0, 3466.0, 1805.0, 1034.0, 594.0, 320.0, 167.0, 123.0, 84.0, 45.0, 32.0, 22.0, 19.0, 11.0, 11.0, 7.0, 10.0, 5.0, 3.0, 3.0, 2.0, 4.0, 3.0, 2.0, 4.0], "bins": [-839.9098510742188, -815.8770751953125, -791.8442993164062, -767.8115234375, -743.7787475585938, -719.7459716796875, -695.7131958007812, -671.680419921875, -647.6476440429688, -623.6148681640625, -599.5820922851562, -575.54931640625, -551.5165405273438, -527.4837646484375, -503.45098876953125, -479.418212890625, -455.38543701171875, -431.3526611328125, -407.31988525390625, -383.287109375, -359.25433349609375, -335.2215576171875, -311.18878173828125, -287.156005859375, -263.12322998046875, -239.0904541015625, -215.05767822265625, -191.02490234375, -166.99212646484375, -142.9593505859375, -118.92657470703125, -94.893798828125, -70.8609619140625, -46.82818603515625, -22.79541015625, 1.23736572265625, 25.2701416015625, 49.30291748046875, 73.335693359375, 97.36846923828125, 121.4012451171875, 145.43402099609375, 169.466796875, 193.49957275390625, 217.5323486328125, 241.56512451171875, 265.597900390625, 289.63067626953125, 313.6634521484375, 337.69622802734375, 361.72900390625, 385.76177978515625, 409.7945556640625, 433.82733154296875, 457.860107421875, 481.89288330078125, 505.9256591796875, 529.9584350585938, 553.9912109375, 578.0239868164062, 602.0567626953125, 626.0895385742188, 650.122314453125, 674.1550903320312, 698.1878662109375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 3.0, 6.0, 9.0, 14.0, 20.0, 33.0, 60.0, 95.0, 196.0, 236.0, 132.0, 72.0, 33.0, 36.0, 21.0, 10.0, 11.0, 5.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-382.77325439453125, -370.09393310546875, -357.4145812988281, -344.7352600097656, -332.0559387207031, -319.3766174316406, -306.697265625, -294.0179443359375, -281.338623046875, -268.6593017578125, -255.97996520996094, -243.30062866210938, -230.62130737304688, -217.9419708251953, -205.26263427734375, -192.58331298828125, -179.9039764404297, -167.22463989257812, -154.54531860351562, -141.86598205566406, -129.18666076660156, -116.50732421875, -103.82799530029297, -91.14866638183594, -78.4693374633789, -65.79000854492188, -53.110679626464844, -40.43134689331055, -27.752017974853516, -15.072689056396484, -2.3933563232421875, 10.285972595214844, 22.965301513671875, 35.644630432128906, 48.32395935058594, 61.003292083740234, 73.6826171875, 86.36195373535156, 99.0412826538086, 111.72061157226562, 124.39994049072266, 137.0792694091797, 149.75860595703125, 162.43792724609375, 175.1172637939453, 187.7965850830078, 200.47592163085938, 213.15524291992188, 225.83457946777344, 238.513916015625, 251.1932373046875, 263.87255859375, 276.5519104003906, 289.2312316894531, 301.9105529785156, 314.58990478515625, 327.26922607421875, 339.94854736328125, 352.6278991699219, 365.3072204589844, 377.9865417480469, 390.6658630371094, 403.34521484375, 416.0245361328125, 428.703857421875]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 3.0, 5.0, 9.0, 2.0, 3.0, 7.0, 5.0, 8.0, 12.0, 15.0, 23.0, 23.0, 36.0, 48.0, 78.0, 81.0, 118.0, 120.0, 113.0, 82.0, 53.0, 40.0, 27.0, 22.0, 15.0, 11.0, 6.0, 3.0, 7.0, 7.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-510.5907287597656, -494.71307373046875, -478.83538818359375, -462.9577331542969, -447.080078125, -431.202392578125, -415.3247375488281, -399.44708251953125, -383.56939697265625, -367.6917419433594, -351.8140563964844, -335.9364013671875, -320.0587158203125, -304.1810607910156, -288.30340576171875, -272.42572021484375, -256.5480651855469, -240.67039489746094, -224.792724609375, -208.91506958007812, -193.0373992919922, -177.15972900390625, -161.28207397460938, -145.40440368652344, -129.5267333984375, -113.64906311035156, -97.77140045166016, -81.89373779296875, -66.01606750488281, -50.138397216796875, -34.26073455810547, -18.383071899414062, -2.50543212890625, 13.372234344482422, 29.249900817871094, 45.127567291259766, 61.00523376464844, 76.88290405273438, 92.76056671142578, 108.63822937011719, 124.51589965820312, 140.39356994628906, 156.271240234375, 172.14889526367188, 188.0265655517578, 203.90423583984375, 219.78189086914062, 235.65956115722656, 251.5372314453125, 267.4148864746094, 283.2925720214844, 299.17022705078125, 315.04791259765625, 330.9255676269531, 346.80322265625, 362.680908203125, 378.5585632324219, 394.43621826171875, 410.31390380859375, 426.1915588378906, 442.0692138671875, 457.9468994140625, 473.8245544433594, 489.70220947265625, 505.57989501953125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 1.0, 4.0, 4.0, 5.0, 2.0, 11.0, 13.0, 13.0, 25.0, 18.0, 26.0, 25.0, 38.0, 33.0, 59.0, 56.0, 81.0, 101.0, 150.0, 200.0, 282.0, 420.0, 684.0, 1089.0, 1826.0, 3376.0, 6454.0, 14053.0, 36545.0, 191000.0, 3838169.0, 63262.0, 18190.0, 8004.0, 4273.0, 2337.0, 1405.0, 798.0, 450.0, 298.0, 174.0, 122.0, 80.0, 54.0, 28.0, 12.0, 16.0, 5.0, 9.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-25.625, -24.971923828125, -24.31884765625, -23.665771484375, -23.0126953125, -22.359619140625, -21.70654296875, -21.053466796875, -20.400390625, -19.747314453125, -19.09423828125, -18.441162109375, -17.7880859375, -17.135009765625, -16.48193359375, -15.828857421875, -15.17578125, -14.522705078125, -13.86962890625, -13.216552734375, -12.5634765625, -11.910400390625, -11.25732421875, -10.604248046875, -9.951171875, -9.298095703125, -8.64501953125, -7.991943359375, -7.3388671875, -6.685791015625, -6.03271484375, -5.379638671875, -4.7265625, -4.073486328125, -3.42041015625, -2.767333984375, -2.1142578125, -1.461181640625, -0.80810546875, -0.155029296875, 0.498046875, 1.151123046875, 1.80419921875, 2.457275390625, 3.1103515625, 3.763427734375, 4.41650390625, 5.069580078125, 5.72265625, 6.375732421875, 7.02880859375, 7.681884765625, 8.3349609375, 8.988037109375, 9.64111328125, 10.294189453125, 10.947265625, 11.600341796875, 12.25341796875, 12.906494140625, 13.5595703125, 14.212646484375, 14.86572265625, 15.518798828125, 16.171875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 2.0, 4.0, 3.0, 7.0, 1.0, 9.0, 10.0, 7.0, 21.0, 29.0, 79.0, 669.0, 75.0, 33.0, 15.0, 11.0, 6.0, 3.0, 7.0, 1.0, 3.0, 2.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.7890625, -2.72174072265625, -2.6544189453125, -2.58709716796875, -2.519775390625, -2.45245361328125, -2.3851318359375, -2.31781005859375, -2.25048828125, -2.18316650390625, -2.1158447265625, -2.04852294921875, -1.981201171875, -1.91387939453125, -1.8465576171875, -1.77923583984375, -1.7119140625, -1.64459228515625, -1.5772705078125, -1.50994873046875, -1.442626953125, -1.37530517578125, -1.3079833984375, -1.24066162109375, -1.17333984375, -1.10601806640625, -1.0386962890625, -0.97137451171875, -0.904052734375, -0.83673095703125, -0.7694091796875, -0.70208740234375, -0.634765625, -0.56744384765625, -0.5001220703125, -0.43280029296875, -0.365478515625, -0.29815673828125, -0.2308349609375, -0.16351318359375, -0.09619140625, -0.02886962890625, 0.0384521484375, 0.10577392578125, 0.173095703125, 0.24041748046875, 0.3077392578125, 0.37506103515625, 0.4423828125, 0.50970458984375, 0.5770263671875, 0.64434814453125, 0.711669921875, 0.77899169921875, 0.8463134765625, 0.91363525390625, 0.98095703125, 1.04827880859375, 1.1156005859375, 1.18292236328125, 1.250244140625, 1.31756591796875, 1.3848876953125, 1.45220947265625, 1.51953125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 6.0, 7.0, 7.0, 11.0, 19.0, 33.0, 41.0, 66.0, 101.0, 149.0, 331.0, 540.0, 1058.0, 2362.0, 5880.0, 16211.0, 56312.0, 299729.0, 3124039.0, 562236.0, 88230.0, 22946.0, 7888.0, 3083.0, 1415.0, 675.0, 372.0, 183.0, 125.0, 81.0, 45.0, 32.0, 17.0, 18.0, 12.0, 6.0, 7.0, 4.0, 3.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.8046875, -15.320556640625, -14.83642578125, -14.352294921875, -13.8681640625, -13.384033203125, -12.89990234375, -12.415771484375, -11.931640625, -11.447509765625, -10.96337890625, -10.479248046875, -9.9951171875, -9.510986328125, -9.02685546875, -8.542724609375, -8.05859375, -7.574462890625, -7.09033203125, -6.606201171875, -6.1220703125, -5.637939453125, -5.15380859375, -4.669677734375, -4.185546875, -3.701416015625, -3.21728515625, -2.733154296875, -2.2490234375, -1.764892578125, -1.28076171875, -0.796630859375, -0.3125, 0.171630859375, 0.65576171875, 1.139892578125, 1.6240234375, 2.108154296875, 2.59228515625, 3.076416015625, 3.560546875, 4.044677734375, 4.52880859375, 5.012939453125, 5.4970703125, 5.981201171875, 6.46533203125, 6.949462890625, 7.43359375, 7.917724609375, 8.40185546875, 8.885986328125, 9.3701171875, 9.854248046875, 10.33837890625, 10.822509765625, 11.306640625, 11.790771484375, 12.27490234375, 12.759033203125, 13.2431640625, 13.727294921875, 14.21142578125, 14.695556640625, 15.1796875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 3.0, 5.0, 9.0, 3.0, 13.0, 20.0, 26.0, 26.0, 29.0, 36.0, 49.0, 80.0, 102.0, 121.0, 164.0, 199.0, 311.0, 608.0, 974.0, 301.0, 241.0, 177.0, 136.0, 103.0, 100.0, 50.0, 48.0, 35.0, 21.0, 18.0, 11.0, 13.0, 10.0, 12.0, 7.0, 2.0, 4.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.53125, -3.40985107421875, -3.2884521484375, -3.16705322265625, -3.045654296875, -2.92425537109375, -2.8028564453125, -2.68145751953125, -2.56005859375, -2.43865966796875, -2.3172607421875, -2.19586181640625, -2.074462890625, -1.95306396484375, -1.8316650390625, -1.71026611328125, -1.5888671875, -1.46746826171875, -1.3460693359375, -1.22467041015625, -1.103271484375, -0.98187255859375, -0.8604736328125, -0.73907470703125, -0.61767578125, -0.49627685546875, -0.3748779296875, -0.25347900390625, -0.132080078125, -0.01068115234375, 0.1107177734375, 0.23211669921875, 0.353515625, 0.47491455078125, 0.5963134765625, 0.71771240234375, 0.839111328125, 0.96051025390625, 1.0819091796875, 1.20330810546875, 1.32470703125, 1.44610595703125, 1.5675048828125, 1.68890380859375, 1.810302734375, 1.93170166015625, 2.0531005859375, 2.17449951171875, 2.2958984375, 2.41729736328125, 2.5386962890625, 2.66009521484375, 2.781494140625, 2.90289306640625, 3.0242919921875, 3.14569091796875, 3.26708984375, 3.38848876953125, 3.5098876953125, 3.63128662109375, 3.752685546875, 3.87408447265625, 3.9954833984375, 4.11688232421875, 4.23828125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 8.0, 27.0, 52.0, 151.0, 266.0, 245.0, 133.0, 60.0, 34.0, 10.0, 14.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.225811004638672, -20.347461700439453, -18.469114303588867, -16.59076690673828, -14.712417602539062, -12.83406925201416, -10.955720901489258, -9.077372550964355, -7.199024200439453, -5.320675849914551, -3.4423274993896484, -1.563979148864746, 0.31436920166015625, 2.1927175521850586, 4.071065902709961, 5.949414253234863, 7.827762603759766, 9.706110954284668, 11.58445930480957, 13.462807655334473, 15.341156005859375, 17.219505310058594, 19.09785270690918, 20.976200103759766, 22.854549407958984, 24.732898712158203, 26.61124610900879, 28.489593505859375, 30.367942810058594, 32.24629211425781, 34.12464141845703, 36.002986907958984, 37.88133239746094, 39.759681701660156, 41.638031005859375, 43.51637649536133, 45.39472579956055, 47.273075103759766, 49.15142059326172, 51.02976989746094, 52.908119201660156, 54.786468505859375, 56.664817810058594, 58.54316329956055, 60.421512603759766, 62.299861907958984, 64.17820739746094, 66.05655670166016, 67.93490600585938, 69.8132553100586, 71.69160461425781, 73.56995391845703, 75.44830322265625, 77.32664489746094, 79.20499420166016, 81.08334350585938, 82.9616928100586, 84.84004211425781, 86.71839141845703, 88.59674072265625, 90.47508239746094, 92.35343170166016, 94.23178100585938, 96.1101303100586, 97.98847961425781]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 5.0, 5.0, 5.0, 8.0, 8.0, 9.0, 8.0, 11.0, 13.0, 17.0, 18.0, 19.0, 26.0, 27.0, 32.0, 24.0, 37.0, 35.0, 30.0, 48.0, 42.0, 35.0, 52.0, 41.0, 52.0, 44.0, 37.0, 32.0, 34.0, 28.0, 34.0, 26.0, 23.0, 36.0, 17.0, 14.0, 11.0, 11.0, 17.0, 8.0, 5.0, 3.0, 4.0, 7.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-19.559181213378906, -18.98025894165039, -18.401336669921875, -17.822412490844727, -17.24349021911621, -16.664567947387695, -16.08564567565918, -15.506723403930664, -14.927800178527832, -14.348877906799316, -13.769954681396484, -13.191032409667969, -12.612110137939453, -12.033186912536621, -11.454264640808105, -10.875341415405273, -10.296419143676758, -9.717496871948242, -9.13857364654541, -8.559651374816895, -7.980728626251221, -7.401805877685547, -6.822883605957031, -6.243960857391357, -5.665038108825684, -5.08611536026001, -4.507192611694336, -3.9282703399658203, -3.3493475914001465, -2.7704248428344727, -2.191502332687378, -1.6125798225402832, -1.0336589813232422, -0.4547363519668579, 0.12418627738952637, 0.7031089067459106, 1.282031536102295, 1.8609542846679688, 2.4398767948150635, 3.018799304962158, 3.597722053527832, 4.176644802093506, 4.75556755065918, 5.334489822387695, 5.913412570953369, 6.492335319519043, 7.071257591247559, 7.650180339813232, 8.229103088378906, 8.808025360107422, 9.386948585510254, 9.96587085723877, 10.544794082641602, 11.123716354370117, 11.702638626098633, 12.281560897827148, 12.86048412322998, 13.439406394958496, 14.018329620361328, 14.597251892089844, 15.17617416381836, 15.755097389221191, 16.334020614624023, 16.91294288635254, 17.491865158081055]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 8.0, 7.0, 4.0, 7.0, 9.0, 13.0, 34.0, 29.0, 45.0, 90.0, 134.0, 166.0, 324.0, 611.0, 1179.0, 2348.0, 5029.0, 14407.0, 87170.0, 820929.0, 91010.0, 14623.0, 5297.0, 2371.0, 1202.0, 613.0, 333.0, 201.0, 134.0, 86.0, 43.0, 26.0, 23.0, 19.0, 8.0, 8.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.515625, -15.023193359375, -14.53076171875, -14.038330078125, -13.5458984375, -13.053466796875, -12.56103515625, -12.068603515625, -11.576171875, -11.083740234375, -10.59130859375, -10.098876953125, -9.6064453125, -9.114013671875, -8.62158203125, -8.129150390625, -7.63671875, -7.144287109375, -6.65185546875, -6.159423828125, -5.6669921875, -5.174560546875, -4.68212890625, -4.189697265625, -3.697265625, -3.204833984375, -2.71240234375, -2.219970703125, -1.7275390625, -1.235107421875, -0.74267578125, -0.250244140625, 0.2421875, 0.734619140625, 1.22705078125, 1.719482421875, 2.2119140625, 2.704345703125, 3.19677734375, 3.689208984375, 4.181640625, 4.674072265625, 5.16650390625, 5.658935546875, 6.1513671875, 6.643798828125, 7.13623046875, 7.628662109375, 8.12109375, 8.613525390625, 9.10595703125, 9.598388671875, 10.0908203125, 10.583251953125, 11.07568359375, 11.568115234375, 12.060546875, 12.552978515625, 13.04541015625, 13.537841796875, 14.0302734375, 14.522705078125, 15.01513671875, 15.507568359375, 16.0]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 4.0, 2.0, 1.0, 5.0, 8.0, 11.0, 11.0, 37.0, 68.0, 135.0, 213.0, 207.0, 160.0, 63.0, 26.0, 15.0, 10.0, 4.0, 3.0, 1.0, 4.0, 1.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0], "bins": [-2.91796875, -2.844879150390625, -2.77178955078125, -2.698699951171875, -2.6256103515625, -2.552520751953125, -2.47943115234375, -2.406341552734375, -2.333251953125, -2.260162353515625, -2.18707275390625, -2.113983154296875, -2.0408935546875, -1.967803955078125, -1.89471435546875, -1.821624755859375, -1.74853515625, -1.675445556640625, -1.60235595703125, -1.529266357421875, -1.4561767578125, -1.383087158203125, -1.30999755859375, -1.236907958984375, -1.163818359375, -1.090728759765625, -1.01763916015625, -0.944549560546875, -0.8714599609375, -0.798370361328125, -0.72528076171875, -0.652191162109375, -0.5791015625, -0.506011962890625, -0.43292236328125, -0.359832763671875, -0.2867431640625, -0.213653564453125, -0.14056396484375, -0.067474365234375, 0.005615234375, 0.078704833984375, 0.15179443359375, 0.224884033203125, 0.2979736328125, 0.371063232421875, 0.44415283203125, 0.517242431640625, 0.59033203125, 0.663421630859375, 0.73651123046875, 0.809600830078125, 0.8826904296875, 0.955780029296875, 1.02886962890625, 1.101959228515625, 1.175048828125, 1.248138427734375, 1.32122802734375, 1.394317626953125, 1.4674072265625, 1.540496826171875, 1.61358642578125, 1.686676025390625, 1.759765625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 6.0, 4.0, 6.0, 10.0, 16.0, 10.0, 16.0, 28.0, 38.0, 66.0, 132.0, 224.0, 443.0, 1004.0, 2451.0, 7815.0, 31925.0, 193898.0, 641092.0, 134985.0, 24142.0, 6481.0, 2002.0, 835.0, 397.0, 191.0, 108.0, 72.0, 41.0, 27.0, 21.0, 14.0, 12.0, 8.0, 11.0, 4.0, 6.0, 1.0, 3.0, 3.0, 0.0, 3.0, 2.0, 0.0, 3.0], "bins": [-18.53125, -18.035888671875, -17.54052734375, -17.045166015625, -16.5498046875, -16.054443359375, -15.55908203125, -15.063720703125, -14.568359375, -14.072998046875, -13.57763671875, -13.082275390625, -12.5869140625, -12.091552734375, -11.59619140625, -11.100830078125, -10.60546875, -10.110107421875, -9.61474609375, -9.119384765625, -8.6240234375, -8.128662109375, -7.63330078125, -7.137939453125, -6.642578125, -6.147216796875, -5.65185546875, -5.156494140625, -4.6611328125, -4.165771484375, -3.67041015625, -3.175048828125, -2.6796875, -2.184326171875, -1.68896484375, -1.193603515625, -0.6982421875, -0.202880859375, 0.29248046875, 0.787841796875, 1.283203125, 1.778564453125, 2.27392578125, 2.769287109375, 3.2646484375, 3.760009765625, 4.25537109375, 4.750732421875, 5.24609375, 5.741455078125, 6.23681640625, 6.732177734375, 7.2275390625, 7.722900390625, 8.21826171875, 8.713623046875, 9.208984375, 9.704345703125, 10.19970703125, 10.695068359375, 11.1904296875, 11.685791015625, 12.18115234375, 12.676513671875, 13.171875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 8.0, 10.0, 12.0, 13.0, 13.0, 17.0, 17.0, 29.0, 24.0, 39.0, 20.0, 43.0, 42.0, 42.0, 38.0, 51.0, 49.0, 55.0, 58.0, 51.0, 62.0, 40.0, 35.0, 32.0, 28.0, 22.0, 22.0, 24.0, 20.0, 11.0, 12.0, 19.0, 10.0, 9.0, 6.0, 5.0, 2.0, 1.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-9.21875, -8.9222412109375, -8.625732421875, -8.3292236328125, -8.03271484375, -7.7362060546875, -7.439697265625, -7.1431884765625, -6.8466796875, -6.5501708984375, -6.253662109375, -5.9571533203125, -5.66064453125, -5.3641357421875, -5.067626953125, -4.7711181640625, -4.474609375, -4.1781005859375, -3.881591796875, -3.5850830078125, -3.28857421875, -2.9920654296875, -2.695556640625, -2.3990478515625, -2.1025390625, -1.8060302734375, -1.509521484375, -1.2130126953125, -0.91650390625, -0.6199951171875, -0.323486328125, -0.0269775390625, 0.26953125, 0.5660400390625, 0.862548828125, 1.1590576171875, 1.45556640625, 1.7520751953125, 2.048583984375, 2.3450927734375, 2.6416015625, 2.9381103515625, 3.234619140625, 3.5311279296875, 3.82763671875, 4.1241455078125, 4.420654296875, 4.7171630859375, 5.013671875, 5.3101806640625, 5.606689453125, 5.9031982421875, 6.19970703125, 6.4962158203125, 6.792724609375, 7.0892333984375, 7.3857421875, 7.6822509765625, 7.978759765625, 8.2752685546875, 8.57177734375, 8.8682861328125, 9.164794921875, 9.4613037109375, 9.7578125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 5.0, 5.0, 5.0, 11.0, 10.0, 12.0, 27.0, 31.0, 43.0, 54.0, 85.0, 113.0, 222.0, 442.0, 957.0, 2458.0, 9077.0, 100457.0, 898023.0, 28340.0, 5055.0, 1567.0, 626.0, 314.0, 234.0, 130.0, 86.0, 45.0, 36.0, 25.0, 24.0, 12.0, 9.0, 3.0, 7.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.375, -46.876953125, -45.37890625, -43.880859375, -42.3828125, -40.884765625, -39.38671875, -37.888671875, -36.390625, -34.892578125, -33.39453125, -31.896484375, -30.3984375, -28.900390625, -27.40234375, -25.904296875, -24.40625, -22.908203125, -21.41015625, -19.912109375, -18.4140625, -16.916015625, -15.41796875, -13.919921875, -12.421875, -10.923828125, -9.42578125, -7.927734375, -6.4296875, -4.931640625, -3.43359375, -1.935546875, -0.4375, 1.060546875, 2.55859375, 4.056640625, 5.5546875, 7.052734375, 8.55078125, 10.048828125, 11.546875, 13.044921875, 14.54296875, 16.041015625, 17.5390625, 19.037109375, 20.53515625, 22.033203125, 23.53125, 25.029296875, 26.52734375, 28.025390625, 29.5234375, 31.021484375, 32.51953125, 34.017578125, 35.515625, 37.013671875, 38.51171875, 40.009765625, 41.5078125, 43.005859375, 44.50390625, 46.001953125, 47.5]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 4.0, 4.0, 6.0, 10.0, 14.0, 21.0, 37.0, 61.0, 95.0, 182.0, 247.0, 124.0, 65.0, 51.0, 26.0, 20.0, 12.0, 11.0, 5.0, 2.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002010345458984375, -0.0019577443599700928, -0.0019051432609558105, -0.0018525421619415283, -0.001799941062927246, -0.0017473399639129639, -0.0016947388648986816, -0.0016421377658843994, -0.0015895366668701172, -0.001536935567855835, -0.0014843344688415527, -0.0014317333698272705, -0.0013791322708129883, -0.001326531171798706, -0.0012739300727844238, -0.0012213289737701416, -0.0011687278747558594, -0.0011161267757415771, -0.001063525676727295, -0.0010109245777130127, -0.0009583234786987305, -0.0009057223796844482, -0.000853121280670166, -0.0008005201816558838, -0.0007479190826416016, -0.0006953179836273193, -0.0006427168846130371, -0.0005901157855987549, -0.0005375146865844727, -0.00048491358757019043, -0.0004323124885559082, -0.000379711389541626, -0.00032711029052734375, -0.0002745091915130615, -0.0002219080924987793, -0.00016930699348449707, -0.00011670589447021484, -6.410479545593262e-05, -1.150369644165039e-05, 4.1097402572631836e-05, 9.369850158691406e-05, 0.0001462996006011963, 0.00019890069961547852, 0.00025150179862976074, 0.00030410289764404297, 0.0003567039966583252, 0.0004093050956726074, 0.00046190619468688965, 0.0005145072937011719, 0.0005671083927154541, 0.0006197094917297363, 0.0006723105907440186, 0.0007249116897583008, 0.000777512788772583, 0.0008301138877868652, 0.0008827149868011475, 0.0009353160858154297, 0.000987917184829712, 0.0010405182838439941, 0.0010931193828582764, 0.0011457204818725586, 0.0011983215808868408, 0.001250922679901123, 0.0013035237789154053, 0.0013561248779296875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 0.0, 8.0, 10.0, 4.0, 10.0, 12.0, 14.0, 14.0, 27.0, 25.0, 30.0, 55.0, 85.0, 117.0, 144.0, 247.0, 316.0, 461.0, 840.0, 1360.0, 2445.0, 4595.0, 10390.0, 29017.0, 127547.0, 673836.0, 143353.0, 31263.0, 11180.0, 4915.0, 2402.0, 1348.0, 837.0, 479.0, 328.0, 238.0, 166.0, 111.0, 84.0, 54.0, 49.0, 26.0, 28.0, 17.0, 12.0, 14.0, 12.0, 11.0, 4.0, 11.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0], "bins": [-14.890625, -14.446533203125, -14.00244140625, -13.558349609375, -13.1142578125, -12.670166015625, -12.22607421875, -11.781982421875, -11.337890625, -10.893798828125, -10.44970703125, -10.005615234375, -9.5615234375, -9.117431640625, -8.67333984375, -8.229248046875, -7.78515625, -7.341064453125, -6.89697265625, -6.452880859375, -6.0087890625, -5.564697265625, -5.12060546875, -4.676513671875, -4.232421875, -3.788330078125, -3.34423828125, -2.900146484375, -2.4560546875, -2.011962890625, -1.56787109375, -1.123779296875, -0.6796875, -0.235595703125, 0.20849609375, 0.652587890625, 1.0966796875, 1.540771484375, 1.98486328125, 2.428955078125, 2.873046875, 3.317138671875, 3.76123046875, 4.205322265625, 4.6494140625, 5.093505859375, 5.53759765625, 5.981689453125, 6.42578125, 6.869873046875, 7.31396484375, 7.758056640625, 8.2021484375, 8.646240234375, 9.09033203125, 9.534423828125, 9.978515625, 10.422607421875, 10.86669921875, 11.310791015625, 11.7548828125, 12.198974609375, 12.64306640625, 13.087158203125, 13.53125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 1.0, 10.0, 4.0, 11.0, 15.0, 15.0, 14.0, 39.0, 47.0, 66.0, 109.0, 150.0, 144.0, 117.0, 82.0, 34.0, 45.0, 29.0, 14.0, 14.0, 10.0, 4.0, 7.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.15625, -14.7005615234375, -14.244873046875, -13.7891845703125, -13.33349609375, -12.8778076171875, -12.422119140625, -11.9664306640625, -11.5107421875, -11.0550537109375, -10.599365234375, -10.1436767578125, -9.68798828125, -9.2322998046875, -8.776611328125, -8.3209228515625, -7.865234375, -7.4095458984375, -6.953857421875, -6.4981689453125, -6.04248046875, -5.5867919921875, -5.131103515625, -4.6754150390625, -4.2197265625, -3.7640380859375, -3.308349609375, -2.8526611328125, -2.39697265625, -1.9412841796875, -1.485595703125, -1.0299072265625, -0.57421875, -0.1185302734375, 0.337158203125, 0.7928466796875, 1.24853515625, 1.7042236328125, 2.159912109375, 2.6156005859375, 3.0712890625, 3.5269775390625, 3.982666015625, 4.4383544921875, 4.89404296875, 5.3497314453125, 5.805419921875, 6.2611083984375, 6.716796875, 7.1724853515625, 7.628173828125, 8.0838623046875, 8.53955078125, 8.9952392578125, 9.450927734375, 9.9066162109375, 10.3623046875, 10.8179931640625, 11.273681640625, 11.7293701171875, 12.18505859375, 12.6407470703125, 13.096435546875, 13.5521240234375, 14.0078125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 6.0, 1.0, 15.0, 29.0, 74.0, 276.0, 309.0, 182.0, 67.0, 23.0, 12.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-141.2783660888672, -133.49208068847656, -125.70580291748047, -117.91952514648438, -110.13323974609375, -102.34696197509766, -94.56068420410156, -86.77439880371094, -78.98812103271484, -71.20184326171875, -63.415557861328125, -55.62928009033203, -47.84299850463867, -40.05671691894531, -32.27043914794922, -24.48415756225586, -16.6978759765625, -8.911595344543457, -1.125314712524414, 6.6609649658203125, 14.447246551513672, 22.23352813720703, 30.019805908203125, 37.806087493896484, 45.592369079589844, 53.3786506652832, 61.16493225097656, 68.95121002197266, 76.73748779296875, 84.52377319335938, 92.31005096435547, 100.09632873535156, 107.88259887695312, 115.66887664794922, 123.45516204833984, 131.24143981933594, 139.02772521972656, 146.81399536132812, 154.60028076171875, 162.38656616210938, 170.1728515625, 177.95913696289062, 185.7454071044922, 193.5316925048828, 201.31797790527344, 209.104248046875, 216.89053344726562, 224.67681884765625, 232.4630889892578, 240.24937438964844, 248.03564453125, 255.82192993164062, 263.60821533203125, 271.3945007324219, 279.1807861328125, 286.967041015625, 294.7533264160156, 302.53961181640625, 310.3258972167969, 318.1121826171875, 325.8984375, 333.6847229003906, 341.47100830078125, 349.2572937011719, 357.0435791015625]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 7.0, 5.0, 3.0, 5.0, 6.0, 12.0, 16.0, 16.0, 32.0, 62.0, 100.0, 122.0, 152.0, 139.0, 104.0, 74.0, 50.0, 31.0, 14.0, 13.0, 5.0, 5.0, 4.0, 8.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-193.31544494628906, -187.5831298828125, -181.85081481933594, -176.11849975585938, -170.3861846923828, -164.65386962890625, -158.9215545654297, -153.18923950195312, -147.45692443847656, -141.724609375, -135.99229431152344, -130.25997924804688, -124.52766418457031, -118.79534912109375, -113.06303405761719, -107.33071899414062, -101.5984115600586, -95.86609649658203, -90.13378143310547, -84.4014663696289, -78.66915130615234, -72.93683624267578, -67.20452880859375, -61.47220993041992, -55.73989486694336, -50.0075798034668, -44.275264739990234, -38.54295349121094, -32.810638427734375, -27.07832145690918, -21.34600830078125, -15.613693237304688, -9.881378173828125, -4.149063587188721, 1.5832509994506836, 7.31556510925293, 13.047880172729492, 18.780195236206055, 24.512508392333984, 30.244823455810547, 35.97713851928711, 41.70945358276367, 47.441768646240234, 53.17407989501953, 58.906394958496094, 64.63871002197266, 70.37102508544922, 76.10334014892578, 81.83565521240234, 87.5679702758789, 93.30028533935547, 99.03260040283203, 104.7649154663086, 110.49723052978516, 116.22953796386719, 121.96185302734375, 127.69416809082031, 133.42648315429688, 139.15879821777344, 144.89111328125, 150.62342834472656, 156.35574340820312, 162.0880584716797, 167.82037353515625, 173.5526885986328]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 2.0, 5.0, 5.0, 10.0, 8.0, 23.0, 24.0, 43.0, 51.0, 77.0, 90.0, 138.0, 214.0, 287.0, 405.0, 674.0, 1153.0, 2092.0, 4315.0, 10871.0, 49209.0, 3813570.0, 273850.0, 22491.0, 6944.0, 3147.0, 1764.0, 991.0, 665.0, 445.0, 262.0, 177.0, 103.0, 68.0, 36.0, 26.0, 17.0, 16.0, 6.0, 6.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.625, -54.07080078125, -52.5166015625, -50.96240234375, -49.408203125, -47.85400390625, -46.2998046875, -44.74560546875, -43.19140625, -41.63720703125, -40.0830078125, -38.52880859375, -36.974609375, -35.42041015625, -33.8662109375, -32.31201171875, -30.7578125, -29.20361328125, -27.6494140625, -26.09521484375, -24.541015625, -22.98681640625, -21.4326171875, -19.87841796875, -18.32421875, -16.77001953125, -15.2158203125, -13.66162109375, -12.107421875, -10.55322265625, -8.9990234375, -7.44482421875, -5.890625, -4.33642578125, -2.7822265625, -1.22802734375, 0.326171875, 1.88037109375, 3.4345703125, 4.98876953125, 6.54296875, 8.09716796875, 9.6513671875, 11.20556640625, 12.759765625, 14.31396484375, 15.8681640625, 17.42236328125, 18.9765625, 20.53076171875, 22.0849609375, 23.63916015625, 25.193359375, 26.74755859375, 28.3017578125, 29.85595703125, 31.41015625, 32.96435546875, 34.5185546875, 36.07275390625, 37.626953125, 39.18115234375, 40.7353515625, 42.28955078125, 43.84375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 6.0, 7.0, 9.0, 11.0, 7.0, 15.0, 20.0, 41.0, 68.0, 95.0, 144.0, 167.0, 110.0, 118.0, 65.0, 34.0, 21.0, 8.0, 13.0, 5.0, 10.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.349609375, -2.279296875, -2.208984375, -2.138671875, -2.068359375, -1.998046875, -1.927734375, -1.857421875, -1.787109375, -1.716796875, -1.646484375, -1.576171875, -1.505859375, -1.435546875, -1.365234375, -1.294921875, -1.224609375, -1.154296875, -1.083984375, -1.013671875, -0.943359375, -0.873046875, -0.802734375, -0.732421875, -0.662109375, -0.591796875, -0.521484375, -0.451171875, -0.380859375, -0.310546875, -0.240234375, -0.169921875, -0.099609375, -0.029296875, 0.041015625, 0.111328125, 0.181640625, 0.251953125, 0.322265625, 0.392578125, 0.462890625, 0.533203125, 0.603515625, 0.673828125, 0.744140625, 0.814453125, 0.884765625, 0.955078125, 1.025390625, 1.095703125, 1.166015625, 1.236328125, 1.306640625, 1.376953125, 1.447265625, 1.517578125, 1.587890625, 1.658203125, 1.728515625, 1.798828125, 1.869140625, 1.939453125, 2.009765625, 2.080078125, 2.150390625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 7.0, 4.0, 8.0, 11.0, 32.0, 44.0, 109.0, 232.0, 571.0, 1724.0, 6971.0, 49606.0, 3820317.0, 293224.0, 16379.0, 3415.0, 1026.0, 336.0, 129.0, 65.0, 32.0, 13.0, 12.0, 4.0, 6.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.90625, -49.00341796875, -47.1005859375, -45.19775390625, -43.294921875, -41.39208984375, -39.4892578125, -37.58642578125, -35.68359375, -33.78076171875, -31.8779296875, -29.97509765625, -28.072265625, -26.16943359375, -24.2666015625, -22.36376953125, -20.4609375, -18.55810546875, -16.6552734375, -14.75244140625, -12.849609375, -10.94677734375, -9.0439453125, -7.14111328125, -5.23828125, -3.33544921875, -1.4326171875, 0.47021484375, 2.373046875, 4.27587890625, 6.1787109375, 8.08154296875, 9.984375, 11.88720703125, 13.7900390625, 15.69287109375, 17.595703125, 19.49853515625, 21.4013671875, 23.30419921875, 25.20703125, 27.10986328125, 29.0126953125, 30.91552734375, 32.818359375, 34.72119140625, 36.6240234375, 38.52685546875, 40.4296875, 42.33251953125, 44.2353515625, 46.13818359375, 48.041015625, 49.94384765625, 51.8466796875, 53.74951171875, 55.65234375, 57.55517578125, 59.4580078125, 61.36083984375, 63.263671875, 65.16650390625, 67.0693359375, 68.97216796875, 70.875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 1.0, 3.0, 3.0, 3.0, 6.0, 3.0, 3.0, 9.0, 9.0, 12.0, 28.0, 40.0, 72.0, 150.0, 301.0, 907.0, 1817.0, 337.0, 145.0, 88.0, 49.0, 30.0, 17.0, 7.0, 7.0, 10.0, 7.0, 4.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.4609375, -6.265869140625, -6.07080078125, -5.875732421875, -5.6806640625, -5.485595703125, -5.29052734375, -5.095458984375, -4.900390625, -4.705322265625, -4.51025390625, -4.315185546875, -4.1201171875, -3.925048828125, -3.72998046875, -3.534912109375, -3.33984375, -3.144775390625, -2.94970703125, -2.754638671875, -2.5595703125, -2.364501953125, -2.16943359375, -1.974365234375, -1.779296875, -1.584228515625, -1.38916015625, -1.194091796875, -0.9990234375, -0.803955078125, -0.60888671875, -0.413818359375, -0.21875, -0.023681640625, 0.17138671875, 0.366455078125, 0.5615234375, 0.756591796875, 0.95166015625, 1.146728515625, 1.341796875, 1.536865234375, 1.73193359375, 1.927001953125, 2.1220703125, 2.317138671875, 2.51220703125, 2.707275390625, 2.90234375, 3.097412109375, 3.29248046875, 3.487548828125, 3.6826171875, 3.877685546875, 4.07275390625, 4.267822265625, 4.462890625, 4.657958984375, 4.85302734375, 5.048095703125, 5.2431640625, 5.438232421875, 5.63330078125, 5.828369140625, 6.0234375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 6.0, 4.0, 11.0, 19.0, 39.0, 84.0, 227.0, 296.0, 192.0, 71.0, 34.0, 11.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.59834289550781, -48.19864273071289, -46.79894256591797, -45.39923858642578, -43.99953842163086, -42.59983825683594, -41.200138092041016, -39.800437927246094, -38.400733947753906, -37.001033782958984, -35.60133361816406, -34.201629638671875, -32.80192947387695, -31.40222930908203, -30.00252914428711, -28.602828979492188, -27.203128814697266, -25.803428649902344, -24.40372657775879, -23.004026412963867, -21.604324340820312, -20.20462417602539, -18.80492401123047, -17.405223846435547, -16.005521774291992, -14.605820655822754, -13.206119537353516, -11.806419372558594, -10.406718254089355, -9.007017135620117, -7.607316970825195, -6.207615852355957, -4.807914733886719, -3.4082138538360596, -2.0085129737854004, -0.6088123321533203, 0.790888786315918, 2.1905899047851562, 3.590290069580078, 4.989991188049316, 6.389692306518555, 7.789393424987793, 9.189094543457031, 10.588794708251953, 11.988495826721191, 13.38819694519043, 14.787897109985352, 16.187599182128906, 17.587299346923828, 18.98699951171875, 20.386701583862305, 21.786401748657227, 23.18610382080078, 24.585803985595703, 25.985504150390625, 27.385204315185547, 28.7849063873291, 30.184606552124023, 31.584308624267578, 32.9840087890625, 34.38370895385742, 35.783409118652344, 37.18311309814453, 38.58281326293945, 39.982513427734375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 4.0, 4.0, 12.0, 8.0, 8.0, 21.0, 37.0, 77.0, 95.0, 132.0, 132.0, 123.0, 101.0, 74.0, 49.0, 36.0, 24.0, 16.0, 7.0, 7.0, 7.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-32.13850021362305, -31.123645782470703, -30.10879135131836, -29.093936920166016, -28.079082489013672, -27.064228057861328, -26.049375534057617, -25.034521102905273, -24.01966667175293, -23.004812240600586, -21.989957809448242, -20.9751033782959, -19.960250854492188, -18.945396423339844, -17.9305419921875, -16.915687561035156, -15.900833129882812, -14.885978698730469, -13.871124267578125, -12.856270790100098, -11.841416358947754, -10.82656192779541, -9.811708450317383, -8.796854019165039, -7.781999588012695, -6.767145156860352, -5.752291202545166, -4.7374372482299805, -3.7225828170776367, -2.707728385925293, -1.6928744316101074, -0.6780204772949219, 0.33683013916015625, 1.351684331893921, 2.3665385246276855, 3.38139271736145, 4.396246910095215, 5.411101341247559, 6.425955295562744, 7.44080924987793, 8.455663681030273, 9.470518112182617, 10.485372543334961, 11.500226020812988, 12.515080451965332, 13.529934883117676, 14.544788360595703, 15.559642791748047, 16.57449722290039, 17.589351654052734, 18.604206085205078, 19.619060516357422, 20.633914947509766, 21.64876937866211, 22.66362190246582, 23.678476333618164, 24.693330764770508, 25.70818519592285, 26.723039627075195, 27.73789405822754, 28.75274658203125, 29.767601013183594, 30.782455444335938, 31.79730987548828, 32.812164306640625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 5.0, 3.0, 6.0, 13.0, 17.0, 23.0, 25.0, 69.0, 118.0, 204.0, 399.0, 1044.0, 2622.0, 8569.0, 35778.0, 293685.0, 615805.0, 69854.0, 13682.0, 4033.0, 1448.0, 565.0, 266.0, 135.0, 61.0, 48.0, 39.0, 11.0, 8.0, 7.0, 7.0, 2.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.046875, -21.36181640625, -20.6767578125, -19.99169921875, -19.306640625, -18.62158203125, -17.9365234375, -17.25146484375, -16.56640625, -15.88134765625, -15.1962890625, -14.51123046875, -13.826171875, -13.14111328125, -12.4560546875, -11.77099609375, -11.0859375, -10.40087890625, -9.7158203125, -9.03076171875, -8.345703125, -7.66064453125, -6.9755859375, -6.29052734375, -5.60546875, -4.92041015625, -4.2353515625, -3.55029296875, -2.865234375, -2.18017578125, -1.4951171875, -0.81005859375, -0.125, 0.56005859375, 1.2451171875, 1.93017578125, 2.615234375, 3.30029296875, 3.9853515625, 4.67041015625, 5.35546875, 6.04052734375, 6.7255859375, 7.41064453125, 8.095703125, 8.78076171875, 9.4658203125, 10.15087890625, 10.8359375, 11.52099609375, 12.2060546875, 12.89111328125, 13.576171875, 14.26123046875, 14.9462890625, 15.63134765625, 16.31640625, 17.00146484375, 17.6865234375, 18.37158203125, 19.056640625, 19.74169921875, 20.4267578125, 21.11181640625, 21.796875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 3.0, 2.0, 5.0, 6.0, 14.0, 13.0, 11.0, 26.0, 32.0, 41.0, 61.0, 82.0, 92.0, 106.0, 92.0, 103.0, 90.0, 48.0, 39.0, 52.0, 19.0, 17.0, 12.0, 9.0, 5.0, 3.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.41015625, -1.363037109375, -1.31591796875, -1.268798828125, -1.2216796875, -1.174560546875, -1.12744140625, -1.080322265625, -1.033203125, -0.986083984375, -0.93896484375, -0.891845703125, -0.8447265625, -0.797607421875, -0.75048828125, -0.703369140625, -0.65625, -0.609130859375, -0.56201171875, -0.514892578125, -0.4677734375, -0.420654296875, -0.37353515625, -0.326416015625, -0.279296875, -0.232177734375, -0.18505859375, -0.137939453125, -0.0908203125, -0.043701171875, 0.00341796875, 0.050537109375, 0.09765625, 0.144775390625, 0.19189453125, 0.239013671875, 0.2861328125, 0.333251953125, 0.38037109375, 0.427490234375, 0.474609375, 0.521728515625, 0.56884765625, 0.615966796875, 0.6630859375, 0.710205078125, 0.75732421875, 0.804443359375, 0.8515625, 0.898681640625, 0.94580078125, 0.992919921875, 1.0400390625, 1.087158203125, 1.13427734375, 1.181396484375, 1.228515625, 1.275634765625, 1.32275390625, 1.369873046875, 1.4169921875, 1.464111328125, 1.51123046875, 1.558349609375, 1.60546875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 10.0, 5.0, 9.0, 15.0, 21.0, 34.0, 85.0, 147.0, 363.0, 994.0, 3098.0, 13004.0, 73424.0, 485265.0, 399307.0, 58023.0, 10556.0, 2663.0, 894.0, 316.0, 144.0, 74.0, 43.0, 22.0, 11.0, 9.0, 3.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.65625, -20.06494140625, -19.4736328125, -18.88232421875, -18.291015625, -17.69970703125, -17.1083984375, -16.51708984375, -15.92578125, -15.33447265625, -14.7431640625, -14.15185546875, -13.560546875, -12.96923828125, -12.3779296875, -11.78662109375, -11.1953125, -10.60400390625, -10.0126953125, -9.42138671875, -8.830078125, -8.23876953125, -7.6474609375, -7.05615234375, -6.46484375, -5.87353515625, -5.2822265625, -4.69091796875, -4.099609375, -3.50830078125, -2.9169921875, -2.32568359375, -1.734375, -1.14306640625, -0.5517578125, 0.03955078125, 0.630859375, 1.22216796875, 1.8134765625, 2.40478515625, 2.99609375, 3.58740234375, 4.1787109375, 4.77001953125, 5.361328125, 5.95263671875, 6.5439453125, 7.13525390625, 7.7265625, 8.31787109375, 8.9091796875, 9.50048828125, 10.091796875, 10.68310546875, 11.2744140625, 11.86572265625, 12.45703125, 13.04833984375, 13.6396484375, 14.23095703125, 14.822265625, 15.41357421875, 16.0048828125, 16.59619140625, 17.1875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 4.0, 7.0, 6.0, 9.0, 9.0, 9.0, 7.0, 7.0, 18.0, 17.0, 19.0, 30.0, 22.0, 37.0, 36.0, 42.0, 43.0, 45.0, 45.0, 42.0, 43.0, 46.0, 40.0, 52.0, 50.0, 43.0, 46.0, 32.0, 34.0, 34.0, 22.0, 12.0, 24.0, 19.0, 17.0, 3.0, 12.0, 4.0, 6.0, 3.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.109375, -5.90924072265625, -5.7091064453125, -5.50897216796875, -5.308837890625, -5.10870361328125, -4.9085693359375, -4.70843505859375, -4.50830078125, -4.30816650390625, -4.1080322265625, -3.90789794921875, -3.707763671875, -3.50762939453125, -3.3074951171875, -3.10736083984375, -2.9072265625, -2.70709228515625, -2.5069580078125, -2.30682373046875, -2.106689453125, -1.90655517578125, -1.7064208984375, -1.50628662109375, -1.30615234375, -1.10601806640625, -0.9058837890625, -0.70574951171875, -0.505615234375, -0.30548095703125, -0.1053466796875, 0.09478759765625, 0.294921875, 0.49505615234375, 0.6951904296875, 0.89532470703125, 1.095458984375, 1.29559326171875, 1.4957275390625, 1.69586181640625, 1.89599609375, 2.09613037109375, 2.2962646484375, 2.49639892578125, 2.696533203125, 2.89666748046875, 3.0968017578125, 3.29693603515625, 3.4970703125, 3.69720458984375, 3.8973388671875, 4.09747314453125, 4.297607421875, 4.49774169921875, 4.6978759765625, 4.89801025390625, 5.09814453125, 5.29827880859375, 5.4984130859375, 5.69854736328125, 5.898681640625, 6.09881591796875, 6.2989501953125, 6.49908447265625, 6.69921875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 10.0, 19.0, 25.0, 57.0, 125.0, 392.0, 1279.0, 6843.0, 116248.0, 896812.0, 22805.0, 2825.0, 686.0, 225.0, 90.0, 42.0, 22.0, 16.0, 10.0, 5.0, 2.0, 3.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-90.5, -88.19482421875, -85.8896484375, -83.58447265625, -81.279296875, -78.97412109375, -76.6689453125, -74.36376953125, -72.05859375, -69.75341796875, -67.4482421875, -65.14306640625, -62.837890625, -60.53271484375, -58.2275390625, -55.92236328125, -53.6171875, -51.31201171875, -49.0068359375, -46.70166015625, -44.396484375, -42.09130859375, -39.7861328125, -37.48095703125, -35.17578125, -32.87060546875, -30.5654296875, -28.26025390625, -25.955078125, -23.64990234375, -21.3447265625, -19.03955078125, -16.734375, -14.42919921875, -12.1240234375, -9.81884765625, -7.513671875, -5.20849609375, -2.9033203125, -0.59814453125, 1.70703125, 4.01220703125, 6.3173828125, 8.62255859375, 10.927734375, 13.23291015625, 15.5380859375, 17.84326171875, 20.1484375, 22.45361328125, 24.7587890625, 27.06396484375, 29.369140625, 31.67431640625, 33.9794921875, 36.28466796875, 38.58984375, 40.89501953125, 43.2001953125, 45.50537109375, 47.810546875, 50.11572265625, 52.4208984375, 54.72607421875, 57.03125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 10.0, 9.0, 12.0, 16.0, 18.0, 21.0, 51.0, 72.0, 104.0, 170.0, 199.0, 101.0, 57.0, 43.0, 30.0, 21.0, 15.0, 15.0, 5.0, 7.0, 3.0, 5.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0021953582763671875, -0.002141699194908142, -0.0020880401134490967, -0.0020343810319900513, -0.001980721950531006, -0.0019270628690719604, -0.001873403787612915, -0.0018197447061538696, -0.0017660856246948242, -0.0017124265432357788, -0.0016587674617767334, -0.001605108380317688, -0.0015514492988586426, -0.0014977902173995972, -0.0014441311359405518, -0.0013904720544815063, -0.001336812973022461, -0.0012831538915634155, -0.0012294948101043701, -0.0011758357286453247, -0.0011221766471862793, -0.0010685175657272339, -0.0010148584842681885, -0.0009611994028091431, -0.0009075403213500977, -0.0008538812398910522, -0.0008002221584320068, -0.0007465630769729614, -0.000692903995513916, -0.0006392449140548706, -0.0005855858325958252, -0.0005319267511367798, -0.0004782676696777344, -0.00042460858821868896, -0.00037094950675964355, -0.00031729042530059814, -0.00026363134384155273, -0.00020997226238250732, -0.00015631318092346191, -0.0001026540994644165, -4.8995018005371094e-05, 4.664063453674316e-06, 5.8323144912719727e-05, 0.00011198222637176514, 0.00016564130783081055, 0.00021930038928985596, 0.00027295947074890137, 0.0003266185522079468, 0.0003802776336669922, 0.0004339367151260376, 0.000487595796585083, 0.0005412548780441284, 0.0005949139595031738, 0.0006485730409622192, 0.0007022321224212646, 0.0007558912038803101, 0.0008095502853393555, 0.0008632093667984009, 0.0009168684482574463, 0.0009705275297164917, 0.0010241866111755371, 0.0010778456926345825, 0.001131504774093628, 0.0011851638555526733, 0.0012388229370117188]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 6.0, 9.0, 6.0, 18.0, 26.0, 24.0, 69.0, 104.0, 156.0, 266.0, 517.0, 1010.0, 2031.0, 4708.0, 12191.0, 38937.0, 205876.0, 631321.0, 108874.0, 25771.0, 9062.0, 3724.0, 1809.0, 862.0, 467.0, 288.0, 171.0, 94.0, 55.0, 30.0, 28.0, 17.0, 14.0, 8.0, 3.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.234375, -23.48486328125, -22.7353515625, -21.98583984375, -21.236328125, -20.48681640625, -19.7373046875, -18.98779296875, -18.23828125, -17.48876953125, -16.7392578125, -15.98974609375, -15.240234375, -14.49072265625, -13.7412109375, -12.99169921875, -12.2421875, -11.49267578125, -10.7431640625, -9.99365234375, -9.244140625, -8.49462890625, -7.7451171875, -6.99560546875, -6.24609375, -5.49658203125, -4.7470703125, -3.99755859375, -3.248046875, -2.49853515625, -1.7490234375, -0.99951171875, -0.25, 0.49951171875, 1.2490234375, 1.99853515625, 2.748046875, 3.49755859375, 4.2470703125, 4.99658203125, 5.74609375, 6.49560546875, 7.2451171875, 7.99462890625, 8.744140625, 9.49365234375, 10.2431640625, 10.99267578125, 11.7421875, 12.49169921875, 13.2412109375, 13.99072265625, 14.740234375, 15.48974609375, 16.2392578125, 16.98876953125, 17.73828125, 18.48779296875, 19.2373046875, 19.98681640625, 20.736328125, 21.48583984375, 22.2353515625, 22.98486328125, 23.734375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 6.0, 3.0, 6.0, 7.0, 14.0, 15.0, 21.0, 29.0, 41.0, 72.0, 107.0, 133.0, 152.0, 132.0, 85.0, 57.0, 29.0, 31.0, 15.0, 10.0, 9.0, 7.0, 8.0, 6.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.65625, -17.07177734375, -16.4873046875, -15.90283203125, -15.318359375, -14.73388671875, -14.1494140625, -13.56494140625, -12.98046875, -12.39599609375, -11.8115234375, -11.22705078125, -10.642578125, -10.05810546875, -9.4736328125, -8.88916015625, -8.3046875, -7.72021484375, -7.1357421875, -6.55126953125, -5.966796875, -5.38232421875, -4.7978515625, -4.21337890625, -3.62890625, -3.04443359375, -2.4599609375, -1.87548828125, -1.291015625, -0.70654296875, -0.1220703125, 0.46240234375, 1.046875, 1.63134765625, 2.2158203125, 2.80029296875, 3.384765625, 3.96923828125, 4.5537109375, 5.13818359375, 5.72265625, 6.30712890625, 6.8916015625, 7.47607421875, 8.060546875, 8.64501953125, 9.2294921875, 9.81396484375, 10.3984375, 10.98291015625, 11.5673828125, 12.15185546875, 12.736328125, 13.32080078125, 13.9052734375, 14.48974609375, 15.07421875, 15.65869140625, 16.2431640625, 16.82763671875, 17.412109375, 17.99658203125, 18.5810546875, 19.16552734375, 19.75]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 4.0, 5.0, 8.0, 20.0, 51.0, 84.0, 123.0, 190.0, 222.0, 131.0, 68.0, 48.0, 23.0, 8.0, 4.0, 5.0, 3.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-115.49908447265625, -111.6568374633789, -107.81459045410156, -103.97234344482422, -100.13009643554688, -96.28784942626953, -92.44560241699219, -88.60335540771484, -84.7611083984375, -80.91886138916016, -77.07661437988281, -73.23436737060547, -69.39212036132812, -65.54987335205078, -61.70762634277344, -57.865379333496094, -54.023136138916016, -50.18088912963867, -46.33864212036133, -42.496395111083984, -38.65414810180664, -34.81190490722656, -30.969655990600586, -27.127408981323242, -23.2851619720459, -19.442914962768555, -15.600667953491211, -11.758421897888184, -7.91617488861084, -4.0739288330078125, -0.23168182373046875, 3.610565185546875, 7.452812194824219, 11.295059204101562, 15.137306213378906, 18.97955322265625, 22.821800231933594, 26.664045333862305, 30.50629234313965, 34.348541259765625, 38.19078826904297, 42.03303527832031, 45.875282287597656, 49.717529296875, 53.559776306152344, 57.40202331542969, 61.24427032470703, 65.08651733398438, 68.92875671386719, 72.77100372314453, 76.61325073242188, 80.45549774169922, 84.29774475097656, 88.1399917602539, 91.98223876953125, 95.8244857788086, 99.66673278808594, 103.50897979736328, 107.35122680664062, 111.19347381591797, 115.03572082519531, 118.87796783447266, 122.72021484375, 126.56246185302734, 130.4047088623047]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 4.0, 8.0, 4.0, 10.0, 9.0, 10.0, 17.0, 32.0, 26.0, 46.0, 66.0, 66.0, 61.0, 90.0, 92.0, 98.0, 97.0, 64.0, 55.0, 45.0, 21.0, 19.0, 14.0, 10.0, 8.0, 3.0, 6.0, 3.0, 1.0, 3.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-96.20040893554688, -93.76436614990234, -91.32832336425781, -88.89227294921875, -86.45623016357422, -84.02018737792969, -81.58414459228516, -79.14810180664062, -76.71205139160156, -74.27600860595703, -71.8399658203125, -69.40391540527344, -66.9678726196289, -64.53182983398438, -62.095787048339844, -59.65974426269531, -57.22370147705078, -54.78765869140625, -52.35161209106445, -49.91556930541992, -47.479522705078125, -45.043479919433594, -42.60743713378906, -40.17139434814453, -37.735347747802734, -35.2993049621582, -32.863258361816406, -30.427215576171875, -27.99117088317871, -25.555126190185547, -23.119083404541016, -20.68303871154785, -18.246986389160156, -15.810941696166992, -13.374897956848145, -10.938854217529297, -8.502809524536133, -6.066764831542969, -3.630721092224121, -1.1946773529052734, 1.2413673400878906, 3.6774115562438965, 6.113455772399902, 8.54949951171875, 10.985544204711914, 13.421588897705078, 15.857632637023926, 18.293676376342773, 20.729721069335938, 23.1657657623291, 25.601810455322266, 28.037853240966797, 30.47389793395996, 32.909942626953125, 35.345985412597656, 37.78202819824219, 40.218074798583984, 42.654117584228516, 45.09016418457031, 47.526206970214844, 49.962249755859375, 52.39829635620117, 54.8343391418457, 57.2703857421875, 59.70642852783203]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 6.0, 9.0, 11.0, 19.0, 23.0, 42.0, 84.0, 195.0, 457.0, 1403.0, 5682.0, 46001.0, 3981663.0, 146000.0, 9454.0, 1978.0, 594.0, 243.0, 135.0, 77.0, 54.0, 33.0, 27.0, 21.0, 17.0, 9.0, 10.0, 12.0, 8.0, 6.0, 2.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.875, -50.9638671875, -49.052734375, -47.1416015625, -45.23046875, -43.3193359375, -41.408203125, -39.4970703125, -37.5859375, -35.6748046875, -33.763671875, -31.8525390625, -29.94140625, -28.0302734375, -26.119140625, -24.2080078125, -22.296875, -20.3857421875, -18.474609375, -16.5634765625, -14.65234375, -12.7412109375, -10.830078125, -8.9189453125, -7.0078125, -5.0966796875, -3.185546875, -1.2744140625, 0.63671875, 2.5478515625, 4.458984375, 6.3701171875, 8.28125, 10.1923828125, 12.103515625, 14.0146484375, 15.92578125, 17.8369140625, 19.748046875, 21.6591796875, 23.5703125, 25.4814453125, 27.392578125, 29.3037109375, 31.21484375, 33.1259765625, 35.037109375, 36.9482421875, 38.859375, 40.7705078125, 42.681640625, 44.5927734375, 46.50390625, 48.4150390625, 50.326171875, 52.2373046875, 54.1484375, 56.0595703125, 57.970703125, 59.8818359375, 61.79296875, 63.7041015625, 65.615234375, 67.5263671875, 69.4375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 7.0, 8.0, 6.0, 16.0, 14.0, 15.0, 24.0, 33.0, 39.0, 43.0, 52.0, 80.0, 83.0, 79.0, 71.0, 92.0, 78.0, 56.0, 37.0, 38.0, 31.0, 25.0, 19.0, 13.0, 10.0, 6.0, 9.0, 4.0, 5.0, 1.0, 8.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0390625, -0.9990081787109375, -0.958953857421875, -0.9188995361328125, -0.87884521484375, -0.8387908935546875, -0.798736572265625, -0.7586822509765625, -0.7186279296875, -0.6785736083984375, -0.638519287109375, -0.5984649658203125, -0.55841064453125, -0.5183563232421875, -0.478302001953125, -0.4382476806640625, -0.398193359375, -0.3581390380859375, -0.318084716796875, -0.2780303955078125, -0.23797607421875, -0.1979217529296875, -0.157867431640625, -0.1178131103515625, -0.0777587890625, -0.0377044677734375, 0.002349853515625, 0.0424041748046875, 0.08245849609375, 0.1225128173828125, 0.162567138671875, 0.2026214599609375, 0.24267578125, 0.2827301025390625, 0.322784423828125, 0.3628387451171875, 0.40289306640625, 0.4429473876953125, 0.483001708984375, 0.5230560302734375, 0.5631103515625, 0.6031646728515625, 0.643218994140625, 0.6832733154296875, 0.72332763671875, 0.7633819580078125, 0.803436279296875, 0.8434906005859375, 0.883544921875, 0.9235992431640625, 0.963653564453125, 1.0037078857421875, 1.04376220703125, 1.0838165283203125, 1.123870849609375, 1.1639251708984375, 1.2039794921875, 1.2440338134765625, 1.284088134765625, 1.3241424560546875, 1.36419677734375, 1.4042510986328125, 1.444305419921875, 1.4843597412109375, 1.5244140625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 9.0, 12.0, 12.0, 19.0, 23.0, 37.0, 63.0, 111.0, 233.0, 821.0, 5080.0, 110572.0, 4019472.0, 53174.0, 3485.0, 657.0, 186.0, 106.0, 62.0, 40.0, 25.0, 24.0, 15.0, 9.0, 6.0, 3.0, 4.0, 7.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-63.46875, -61.31103515625, -59.1533203125, -56.99560546875, -54.837890625, -52.68017578125, -50.5224609375, -48.36474609375, -46.20703125, -44.04931640625, -41.8916015625, -39.73388671875, -37.576171875, -35.41845703125, -33.2607421875, -31.10302734375, -28.9453125, -26.78759765625, -24.6298828125, -22.47216796875, -20.314453125, -18.15673828125, -15.9990234375, -13.84130859375, -11.68359375, -9.52587890625, -7.3681640625, -5.21044921875, -3.052734375, -0.89501953125, 1.2626953125, 3.42041015625, 5.578125, 7.73583984375, 9.8935546875, 12.05126953125, 14.208984375, 16.36669921875, 18.5244140625, 20.68212890625, 22.83984375, 24.99755859375, 27.1552734375, 29.31298828125, 31.470703125, 33.62841796875, 35.7861328125, 37.94384765625, 40.1015625, 42.25927734375, 44.4169921875, 46.57470703125, 48.732421875, 50.89013671875, 53.0478515625, 55.20556640625, 57.36328125, 59.52099609375, 61.6787109375, 63.83642578125, 65.994140625, 68.15185546875, 70.3095703125, 72.46728515625, 74.625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 6.0, 4.0, 4.0, 9.0, 14.0, 22.0, 38.0, 43.0, 40.0, 76.0, 108.0, 167.0, 262.0, 476.0, 1354.0, 605.0, 282.0, 175.0, 105.0, 86.0, 58.0, 38.0, 29.0, 19.0, 9.0, 10.0, 12.0, 7.0, 6.0, 2.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.5234375, -3.427337646484375, -3.33123779296875, -3.235137939453125, -3.1390380859375, -3.042938232421875, -2.94683837890625, -2.850738525390625, -2.754638671875, -2.658538818359375, -2.56243896484375, -2.466339111328125, -2.3702392578125, -2.274139404296875, -2.17803955078125, -2.081939697265625, -1.98583984375, -1.889739990234375, -1.79364013671875, -1.697540283203125, -1.6014404296875, -1.505340576171875, -1.40924072265625, -1.313140869140625, -1.217041015625, -1.120941162109375, -1.02484130859375, -0.928741455078125, -0.8326416015625, -0.736541748046875, -0.64044189453125, -0.544342041015625, -0.4482421875, -0.352142333984375, -0.25604248046875, -0.159942626953125, -0.0638427734375, 0.032257080078125, 0.12835693359375, 0.224456787109375, 0.320556640625, 0.416656494140625, 0.51275634765625, 0.608856201171875, 0.7049560546875, 0.801055908203125, 0.89715576171875, 0.993255615234375, 1.08935546875, 1.185455322265625, 1.28155517578125, 1.377655029296875, 1.4737548828125, 1.569854736328125, 1.66595458984375, 1.762054443359375, 1.858154296875, 1.954254150390625, 2.05035400390625, 2.146453857421875, 2.2425537109375, 2.338653564453125, 2.43475341796875, 2.530853271484375, 2.626953125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 4.0, 14.0, 28.0, 61.0, 126.0, 194.0, 240.0, 158.0, 90.0, 31.0, 28.0, 16.0, 12.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-55.17634201049805, -53.933753967285156, -52.691162109375, -51.44857406616211, -50.20598602294922, -48.96339797973633, -47.72080993652344, -46.47821807861328, -45.23563003540039, -43.9930419921875, -42.750450134277344, -41.50786209106445, -40.26527404785156, -39.02268600463867, -37.78009796142578, -36.537506103515625, -35.294918060302734, -34.052330017089844, -32.80973815917969, -31.567150115966797, -30.324562072753906, -29.081974029541016, -27.839384078979492, -26.59679412841797, -25.354206085205078, -24.111618041992188, -22.869028091430664, -21.62643814086914, -20.38385009765625, -19.14126205444336, -17.898672103881836, -16.656082153320312, -15.413497924804688, -14.17090892791748, -12.928319931030273, -11.685730934143066, -10.44314193725586, -9.200552940368652, -7.957963943481445, -6.715374946594238, -5.472785949707031, -4.230196952819824, -2.987607955932617, -1.7450189590454102, -0.5024299621582031, 0.7401590347290039, 1.982748031616211, 3.225337028503418, 4.467926025390625, 5.710515022277832, 6.953104019165039, 8.195693016052246, 9.438282012939453, 10.68087100982666, 11.923460006713867, 13.166049003601074, 14.408638000488281, 15.651226997375488, 16.893815994262695, 18.13640594482422, 19.37899398803711, 20.62158203125, 21.864171981811523, 23.106761932373047, 24.349349975585938]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 4.0, 5.0, 9.0, 9.0, 13.0, 12.0, 11.0, 16.0, 21.0, 28.0, 25.0, 37.0, 36.0, 37.0, 43.0, 46.0, 51.0, 41.0, 65.0, 53.0, 41.0, 56.0, 45.0, 40.0, 22.0, 32.0, 28.0, 36.0, 22.0, 27.0, 21.0, 17.0, 12.0, 8.0, 5.0, 8.0, 4.0, 3.0, 4.0, 4.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-13.40318489074707, -13.015726089477539, -12.628267288208008, -12.24080753326416, -11.853348731994629, -11.465889930725098, -11.078431129455566, -10.690971374511719, -10.303512573242188, -9.916053771972656, -9.528594970703125, -9.141135215759277, -8.753676414489746, -8.366217613220215, -7.978758811950684, -7.591299533843994, -7.203840732574463, -6.816381931304932, -6.428922653198242, -6.041463851928711, -5.6540045738220215, -5.26654577255249, -4.879086494445801, -4.4916276931762695, -4.104168891906738, -3.716709852218628, -3.3292508125305176, -2.9417920112609863, -2.554332733154297, -2.1668739318847656, -1.7794148921966553, -1.391955852508545, -1.0044965744018555, -0.6170375347137451, -0.22957855463027954, 0.15788042545318604, 0.5453394651412964, 0.9327985048294067, 1.3202574253082275, 1.707716464996338, 2.0951755046844482, 2.4826345443725586, 2.870093584060669, 3.2575526237487793, 3.6450114250183105, 4.032470703125, 4.419929504394531, 4.8073883056640625, 5.194847583770752, 5.582306385040283, 5.969765663146973, 6.357224464416504, 6.744683742523193, 7.132142543792725, 7.519601821899414, 7.907060623168945, 8.294519424438477, 8.681978225708008, 9.069437026977539, 9.456896781921387, 9.844355583190918, 10.23181438446045, 10.61927318572998, 11.006732940673828, 11.39419174194336]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 1.0, 9.0, 10.0, 19.0, 21.0, 48.0, 61.0, 102.0, 144.0, 275.0, 400.0, 792.0, 1402.0, 2609.0, 5354.0, 11173.0, 24762.0, 55403.0, 127565.0, 264028.0, 287747.0, 148353.0, 64238.0, 28093.0, 12961.0, 6160.0, 3102.0, 1605.0, 856.0, 497.0, 288.0, 167.0, 109.0, 75.0, 44.0, 30.0, 17.0, 15.0, 4.0, 3.0, 8.0, 2.0, 6.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0234375, -7.7880859375, -7.552734375, -7.3173828125, -7.08203125, -6.8466796875, -6.611328125, -6.3759765625, -6.140625, -5.9052734375, -5.669921875, -5.4345703125, -5.19921875, -4.9638671875, -4.728515625, -4.4931640625, -4.2578125, -4.0224609375, -3.787109375, -3.5517578125, -3.31640625, -3.0810546875, -2.845703125, -2.6103515625, -2.375, -2.1396484375, -1.904296875, -1.6689453125, -1.43359375, -1.1982421875, -0.962890625, -0.7275390625, -0.4921875, -0.2568359375, -0.021484375, 0.2138671875, 0.44921875, 0.6845703125, 0.919921875, 1.1552734375, 1.390625, 1.6259765625, 1.861328125, 2.0966796875, 2.33203125, 2.5673828125, 2.802734375, 3.0380859375, 3.2734375, 3.5087890625, 3.744140625, 3.9794921875, 4.21484375, 4.4501953125, 4.685546875, 4.9208984375, 5.15625, 5.3916015625, 5.626953125, 5.8623046875, 6.09765625, 6.3330078125, 6.568359375, 6.8037109375, 7.0390625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 4.0, 6.0, 11.0, 10.0, 12.0, 10.0, 22.0, 22.0, 27.0, 32.0, 56.0, 43.0, 42.0, 56.0, 55.0, 64.0, 54.0, 56.0, 54.0, 63.0, 43.0, 45.0, 43.0, 34.0, 29.0, 30.0, 16.0, 27.0, 12.0, 5.0, 4.0, 4.0, 5.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2275390625, -1.1947708129882812, -1.1620025634765625, -1.1292343139648438, -1.096466064453125, -1.0636978149414062, -1.0309295654296875, -0.9981613159179688, -0.96539306640625, -0.9326248168945312, -0.8998565673828125, -0.8670883178710938, -0.834320068359375, -0.8015518188476562, -0.7687835693359375, -0.7360153198242188, -0.7032470703125, -0.6704788208007812, -0.6377105712890625, -0.6049423217773438, -0.572174072265625, -0.5394058227539062, -0.5066375732421875, -0.47386932373046875, -0.44110107421875, -0.40833282470703125, -0.3755645751953125, -0.34279632568359375, -0.310028076171875, -0.27725982666015625, -0.2444915771484375, -0.21172332763671875, -0.178955078125, -0.14618682861328125, -0.1134185791015625, -0.08065032958984375, -0.047882080078125, -0.01511383056640625, 0.0176544189453125, 0.05042266845703125, 0.08319091796875, 0.11595916748046875, 0.1487274169921875, 0.18149566650390625, 0.214263916015625, 0.24703216552734375, 0.2798004150390625, 0.31256866455078125, 0.3453369140625, 0.37810516357421875, 0.4108734130859375, 0.44364166259765625, 0.476409912109375, 0.5091781616210938, 0.5419464111328125, 0.5747146606445312, 0.60748291015625, 0.6402511596679688, 0.6730194091796875, 0.7057876586914062, 0.738555908203125, 0.7713241577148438, 0.8040924072265625, 0.8368606567382812, 0.86962890625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 3.0, 10.0, 12.0, 10.0, 20.0, 33.0, 30.0, 43.0, 51.0, 79.0, 104.0, 176.0, 242.0, 396.0, 693.0, 1263.0, 2470.0, 5356.0, 12041.0, 29496.0, 74690.0, 199959.0, 360484.0, 221684.0, 83586.0, 31759.0, 12708.0, 5379.0, 2592.0, 1270.0, 683.0, 406.0, 265.0, 168.0, 118.0, 80.0, 54.0, 29.0, 35.0, 20.0, 22.0, 10.0, 8.0, 6.0, 5.0, 6.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8125, -8.5240478515625, -8.235595703125, -7.9471435546875, -7.65869140625, -7.3702392578125, -7.081787109375, -6.7933349609375, -6.5048828125, -6.2164306640625, -5.927978515625, -5.6395263671875, -5.35107421875, -5.0626220703125, -4.774169921875, -4.4857177734375, -4.197265625, -3.9088134765625, -3.620361328125, -3.3319091796875, -3.04345703125, -2.7550048828125, -2.466552734375, -2.1781005859375, -1.8896484375, -1.6011962890625, -1.312744140625, -1.0242919921875, -0.73583984375, -0.4473876953125, -0.158935546875, 0.1295166015625, 0.41796875, 0.7064208984375, 0.994873046875, 1.2833251953125, 1.57177734375, 1.8602294921875, 2.148681640625, 2.4371337890625, 2.7255859375, 3.0140380859375, 3.302490234375, 3.5909423828125, 3.87939453125, 4.1678466796875, 4.456298828125, 4.7447509765625, 5.033203125, 5.3216552734375, 5.610107421875, 5.8985595703125, 6.18701171875, 6.4754638671875, 6.763916015625, 7.0523681640625, 7.3408203125, 7.6292724609375, 7.917724609375, 8.2061767578125, 8.49462890625, 8.7830810546875, 9.071533203125, 9.3599853515625, 9.6484375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 7.0, 6.0, 7.0, 17.0, 13.0, 15.0, 14.0, 13.0, 22.0, 26.0, 13.0, 29.0, 27.0, 26.0, 41.0, 35.0, 40.0, 35.0, 45.0, 35.0, 40.0, 53.0, 44.0, 44.0, 47.0, 44.0, 48.0, 36.0, 28.0, 26.0, 21.0, 28.0, 13.0, 8.0, 15.0, 10.0, 5.0, 8.0, 2.0, 2.0, 5.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.81640625, -4.64593505859375, -4.4754638671875, -4.30499267578125, -4.134521484375, -3.96405029296875, -3.7935791015625, -3.62310791015625, -3.45263671875, -3.28216552734375, -3.1116943359375, -2.94122314453125, -2.770751953125, -2.60028076171875, -2.4298095703125, -2.25933837890625, -2.0888671875, -1.91839599609375, -1.7479248046875, -1.57745361328125, -1.406982421875, -1.23651123046875, -1.0660400390625, -0.89556884765625, -0.72509765625, -0.55462646484375, -0.3841552734375, -0.21368408203125, -0.043212890625, 0.12725830078125, 0.2977294921875, 0.46820068359375, 0.638671875, 0.80914306640625, 0.9796142578125, 1.15008544921875, 1.320556640625, 1.49102783203125, 1.6614990234375, 1.83197021484375, 2.00244140625, 2.17291259765625, 2.3433837890625, 2.51385498046875, 2.684326171875, 2.85479736328125, 3.0252685546875, 3.19573974609375, 3.3662109375, 3.53668212890625, 3.7071533203125, 3.87762451171875, 4.048095703125, 4.21856689453125, 4.3890380859375, 4.55950927734375, 4.72998046875, 4.90045166015625, 5.0709228515625, 5.24139404296875, 5.411865234375, 5.58233642578125, 5.7528076171875, 5.92327880859375, 6.09375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 7.0, 8.0, 18.0, 21.0, 38.0, 71.0, 129.0, 238.0, 606.0, 1499.0, 4706.0, 18811.0, 131661.0, 721342.0, 142138.0, 19765.0, 4777.0, 1536.0, 615.0, 280.0, 112.0, 67.0, 36.0, 20.0, 18.0, 15.0, 6.0, 2.0, 0.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.703125, -19.09716796875, -18.4912109375, -17.88525390625, -17.279296875, -16.67333984375, -16.0673828125, -15.46142578125, -14.85546875, -14.24951171875, -13.6435546875, -13.03759765625, -12.431640625, -11.82568359375, -11.2197265625, -10.61376953125, -10.0078125, -9.40185546875, -8.7958984375, -8.18994140625, -7.583984375, -6.97802734375, -6.3720703125, -5.76611328125, -5.16015625, -4.55419921875, -3.9482421875, -3.34228515625, -2.736328125, -2.13037109375, -1.5244140625, -0.91845703125, -0.3125, 0.29345703125, 0.8994140625, 1.50537109375, 2.111328125, 2.71728515625, 3.3232421875, 3.92919921875, 4.53515625, 5.14111328125, 5.7470703125, 6.35302734375, 6.958984375, 7.56494140625, 8.1708984375, 8.77685546875, 9.3828125, 9.98876953125, 10.5947265625, 11.20068359375, 11.806640625, 12.41259765625, 13.0185546875, 13.62451171875, 14.23046875, 14.83642578125, 15.4423828125, 16.04833984375, 16.654296875, 17.26025390625, 17.8662109375, 18.47216796875, 19.078125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 10.0, 3.0, 5.0, 18.0, 13.0, 15.0, 31.0, 48.0, 59.0, 104.0, 154.0, 150.0, 118.0, 79.0, 57.0, 34.0, 24.0, 14.0, 16.0, 10.0, 7.0, 8.0, 9.0, 5.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009107589721679688, -0.0008714497089385986, -0.0008321404457092285, -0.0007928311824798584, -0.0007535219192504883, -0.0007142126560211182, -0.000674903392791748, -0.0006355941295623779, -0.0005962848663330078, -0.0005569756031036377, -0.0005176663398742676, -0.00047835707664489746, -0.00043904781341552734, -0.0003997385501861572, -0.0003604292869567871, -0.000321120023727417, -0.0002818107604980469, -0.00024250149726867676, -0.00020319223403930664, -0.00016388297080993652, -0.0001245737075805664, -8.526444435119629e-05, -4.595518112182617e-05, -6.645917892456055e-06, 3.266334533691406e-05, 7.197260856628418e-05, 0.0001112818717956543, 0.00015059113502502441, 0.00018990039825439453, 0.00022920966148376465, 0.00026851892471313477, 0.0003078281879425049, 0.000347137451171875, 0.0003864467144012451, 0.00042575597763061523, 0.00046506524085998535, 0.0005043745040893555, 0.0005436837673187256, 0.0005829930305480957, 0.0006223022937774658, 0.0006616115570068359, 0.0007009208202362061, 0.0007402300834655762, 0.0007795393466949463, 0.0008188486099243164, 0.0008581578731536865, 0.0008974671363830566, 0.0009367763996124268, 0.0009760856628417969, 0.001015394926071167, 0.0010547041893005371, 0.0010940134525299072, 0.0011333227157592773, 0.0011726319789886475, 0.0012119412422180176, 0.0012512505054473877, 0.0012905597686767578, 0.001329869031906128, 0.001369178295135498, 0.0014084875583648682, 0.0014477968215942383, 0.0014871060848236084, 0.0015264153480529785, 0.0015657246112823486, 0.0016050338745117188]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 1.0, 8.0, 16.0, 18.0, 29.0, 40.0, 67.0, 126.0, 230.0, 438.0, 1082.0, 3525.0, 15216.0, 125239.0, 743171.0, 137808.0, 15834.0, 3553.0, 1147.0, 484.0, 225.0, 132.0, 60.0, 34.0, 25.0, 16.0, 15.0, 11.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-25.96875, -25.276611328125, -24.58447265625, -23.892333984375, -23.2001953125, -22.508056640625, -21.81591796875, -21.123779296875, -20.431640625, -19.739501953125, -19.04736328125, -18.355224609375, -17.6630859375, -16.970947265625, -16.27880859375, -15.586669921875, -14.89453125, -14.202392578125, -13.51025390625, -12.818115234375, -12.1259765625, -11.433837890625, -10.74169921875, -10.049560546875, -9.357421875, -8.665283203125, -7.97314453125, -7.281005859375, -6.5888671875, -5.896728515625, -5.20458984375, -4.512451171875, -3.8203125, -3.128173828125, -2.43603515625, -1.743896484375, -1.0517578125, -0.359619140625, 0.33251953125, 1.024658203125, 1.716796875, 2.408935546875, 3.10107421875, 3.793212890625, 4.4853515625, 5.177490234375, 5.86962890625, 6.561767578125, 7.25390625, 7.946044921875, 8.63818359375, 9.330322265625, 10.0224609375, 10.714599609375, 11.40673828125, 12.098876953125, 12.791015625, 13.483154296875, 14.17529296875, 14.867431640625, 15.5595703125, 16.251708984375, 16.94384765625, 17.635986328125, 18.328125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 10.0, 10.0, 15.0, 19.0, 30.0, 53.0, 59.0, 106.0, 118.0, 134.0, 135.0, 106.0, 65.0, 55.0, 35.0, 19.0, 7.0, 10.0, 6.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.4921875, -10.1700439453125, -9.847900390625, -9.5257568359375, -9.20361328125, -8.8814697265625, -8.559326171875, -8.2371826171875, -7.9150390625, -7.5928955078125, -7.270751953125, -6.9486083984375, -6.62646484375, -6.3043212890625, -5.982177734375, -5.6600341796875, -5.337890625, -5.0157470703125, -4.693603515625, -4.3714599609375, -4.04931640625, -3.7271728515625, -3.405029296875, -3.0828857421875, -2.7607421875, -2.4385986328125, -2.116455078125, -1.7943115234375, -1.47216796875, -1.1500244140625, -0.827880859375, -0.5057373046875, -0.18359375, 0.1385498046875, 0.460693359375, 0.7828369140625, 1.10498046875, 1.4271240234375, 1.749267578125, 2.0714111328125, 2.3935546875, 2.7156982421875, 3.037841796875, 3.3599853515625, 3.68212890625, 4.0042724609375, 4.326416015625, 4.6485595703125, 4.970703125, 5.2928466796875, 5.614990234375, 5.9371337890625, 6.25927734375, 6.5814208984375, 6.903564453125, 7.2257080078125, 7.5478515625, 7.8699951171875, 8.192138671875, 8.5142822265625, 8.83642578125, 9.1585693359375, 9.480712890625, 9.8028564453125, 10.125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 37.0, 149.0, 443.0, 288.0, 65.0, 10.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-405.0683288574219, -397.0955505371094, -389.1227722167969, -381.14996337890625, -373.17718505859375, -365.20440673828125, -357.23162841796875, -349.25885009765625, -341.2860412597656, -333.3132629394531, -325.3404846191406, -317.36767578125, -309.3948974609375, -301.422119140625, -293.4493408203125, -285.4765625, -277.5037841796875, -269.531005859375, -261.5582275390625, -253.58543395996094, -245.61264038085938, -237.63986206054688, -229.66708374023438, -221.6942901611328, -213.72149658203125, -205.74871826171875, -197.7759246826172, -189.8031463623047, -181.83035278320312, -173.85757446289062, -165.88479614257812, -157.91200256347656, -149.939208984375, -141.9664306640625, -133.99363708496094, -126.02085876464844, -118.04806518554688, -110.07528686523438, -102.10250091552734, -94.12971496582031, -86.15692901611328, -78.18414306640625, -70.21135711669922, -62.23857498168945, -54.26578903198242, -46.29300308227539, -38.320220947265625, -30.347434997558594, -22.374649047851562, -14.401864051818848, -6.429079055786133, 1.5437049865722656, 9.516490936279297, 17.489276885986328, 25.462059020996094, 33.434844970703125, 41.407630920410156, 49.38041687011719, 57.35320281982422, 65.32598876953125, 73.29876708984375, 81.27156066894531, 89.24433898925781, 97.21712493896484, 105.18991088867188]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 5.0, 15.0, 4.0, 7.0, 11.0, 8.0, 24.0, 15.0, 23.0, 30.0, 34.0, 28.0, 34.0, 49.0, 48.0, 53.0, 56.0, 57.0, 54.0, 48.0, 49.0, 54.0, 44.0, 44.0, 41.0, 32.0, 35.0, 20.0, 14.0, 21.0, 13.0, 12.0, 11.0, 6.0, 6.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-47.20537567138672, -45.7359733581543, -44.26656723022461, -42.79716491699219, -41.3277587890625, -39.85835647583008, -38.388954162597656, -36.91954803466797, -35.45014190673828, -33.98073959350586, -32.51133346557617, -31.04193115234375, -29.572525024414062, -28.10312271118164, -26.633718490600586, -25.16431427001953, -23.69491195678711, -22.225507736206055, -20.756103515625, -19.286701202392578, -17.81729507446289, -16.34789276123047, -14.878488540649414, -13.40908432006836, -11.939680099487305, -10.47027587890625, -9.000871658325195, -7.531468391418457, -6.062064170837402, -4.592659950256348, -3.1232566833496094, -1.6538524627685547, -0.1844482421875, 1.2849557399749756, 2.754359722137451, 4.223763465881348, 5.693167686462402, 7.162571907043457, 8.631975173950195, 10.10137939453125, 11.570783615112305, 13.04018783569336, 14.509592056274414, 15.978995323181152, 17.44839859008789, 18.917804718017578, 20.38720703125, 21.856611251831055, 23.32601547241211, 24.795419692993164, 26.26482391357422, 27.73422622680664, 29.203632354736328, 30.67303466796875, 32.14244079589844, 33.61184310913086, 35.08124542236328, 36.5506477355957, 38.02005386352539, 39.48945617675781, 40.9588623046875, 42.42826461791992, 43.897666931152344, 45.36707305908203, 46.83647918701172]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 7.0, 11.0, 15.0, 19.0, 27.0, 37.0, 63.0, 110.0, 309.0, 1279.0, 13210.0, 3783521.0, 387043.0, 7278.0, 922.0, 196.0, 81.0, 44.0, 40.0, 20.0, 17.0, 13.0, 11.0, 4.0, 1.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-83.6875, -81.47900390625, -79.2705078125, -77.06201171875, -74.853515625, -72.64501953125, -70.4365234375, -68.22802734375, -66.01953125, -63.81103515625, -61.6025390625, -59.39404296875, -57.185546875, -54.97705078125, -52.7685546875, -50.56005859375, -48.3515625, -46.14306640625, -43.9345703125, -41.72607421875, -39.517578125, -37.30908203125, -35.1005859375, -32.89208984375, -30.68359375, -28.47509765625, -26.2666015625, -24.05810546875, -21.849609375, -19.64111328125, -17.4326171875, -15.22412109375, -13.015625, -10.80712890625, -8.5986328125, -6.39013671875, -4.181640625, -1.97314453125, 0.2353515625, 2.44384765625, 4.65234375, 6.86083984375, 9.0693359375, 11.27783203125, 13.486328125, 15.69482421875, 17.9033203125, 20.11181640625, 22.3203125, 24.52880859375, 26.7373046875, 28.94580078125, 31.154296875, 33.36279296875, 35.5712890625, 37.77978515625, 39.98828125, 42.19677734375, 44.4052734375, 46.61376953125, 48.822265625, 51.03076171875, 53.2392578125, 55.44775390625, 57.65625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 1.0, 6.0, 9.0, 13.0, 22.0, 27.0, 25.0, 42.0, 50.0, 78.0, 68.0, 78.0, 88.0, 82.0, 85.0, 70.0, 59.0, 47.0, 44.0, 28.0, 26.0, 16.0, 12.0, 14.0, 6.0, 2.0, 0.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.236328125, -2.17742919921875, -2.1185302734375, -2.05963134765625, -2.000732421875, -1.94183349609375, -1.8829345703125, -1.82403564453125, -1.76513671875, -1.70623779296875, -1.6473388671875, -1.58843994140625, -1.529541015625, -1.47064208984375, -1.4117431640625, -1.35284423828125, -1.2939453125, -1.23504638671875, -1.1761474609375, -1.11724853515625, -1.058349609375, -0.99945068359375, -0.9405517578125, -0.88165283203125, -0.82275390625, -0.76385498046875, -0.7049560546875, -0.64605712890625, -0.587158203125, -0.52825927734375, -0.4693603515625, -0.41046142578125, -0.3515625, -0.29266357421875, -0.2337646484375, -0.17486572265625, -0.115966796875, -0.05706787109375, 0.0018310546875, 0.06072998046875, 0.11962890625, 0.17852783203125, 0.2374267578125, 0.29632568359375, 0.355224609375, 0.41412353515625, 0.4730224609375, 0.53192138671875, 0.5908203125, 0.64971923828125, 0.7086181640625, 0.76751708984375, 0.826416015625, 0.88531494140625, 0.9442138671875, 1.00311279296875, 1.06201171875, 1.12091064453125, 1.1798095703125, 1.23870849609375, 1.297607421875, 1.35650634765625, 1.4154052734375, 1.47430419921875, 1.533203125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 3.0, 8.0, 8.0, 8.0, 8.0, 15.0, 10.0, 14.0, 26.0, 28.0, 29.0, 42.0, 63.0, 121.0, 188.0, 418.0, 968.0, 2468.0, 7870.0, 32411.0, 251042.0, 3614067.0, 241246.0, 31737.0, 7365.0, 2305.0, 872.0, 380.0, 171.0, 96.0, 71.0, 54.0, 27.0, 20.0, 24.0, 20.0, 13.0, 14.0, 9.0, 11.0, 10.0, 5.0, 4.0, 3.0, 3.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-24.140625, -23.348876953125, -22.55712890625, -21.765380859375, -20.9736328125, -20.181884765625, -19.39013671875, -18.598388671875, -17.806640625, -17.014892578125, -16.22314453125, -15.431396484375, -14.6396484375, -13.847900390625, -13.05615234375, -12.264404296875, -11.47265625, -10.680908203125, -9.88916015625, -9.097412109375, -8.3056640625, -7.513916015625, -6.72216796875, -5.930419921875, -5.138671875, -4.346923828125, -3.55517578125, -2.763427734375, -1.9716796875, -1.179931640625, -0.38818359375, 0.403564453125, 1.1953125, 1.987060546875, 2.77880859375, 3.570556640625, 4.3623046875, 5.154052734375, 5.94580078125, 6.737548828125, 7.529296875, 8.321044921875, 9.11279296875, 9.904541015625, 10.6962890625, 11.488037109375, 12.27978515625, 13.071533203125, 13.86328125, 14.655029296875, 15.44677734375, 16.238525390625, 17.0302734375, 17.822021484375, 18.61376953125, 19.405517578125, 20.197265625, 20.989013671875, 21.78076171875, 22.572509765625, 23.3642578125, 24.156005859375, 24.94775390625, 25.739501953125, 26.53125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 7.0, 9.0, 14.0, 16.0, 24.0, 35.0, 43.0, 79.0, 149.0, 265.0, 786.0, 1753.0, 397.0, 186.0, 111.0, 76.0, 36.0, 22.0, 27.0, 8.0, 8.0, 7.0, 4.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5390625, -3.39276123046875, -3.2464599609375, -3.10015869140625, -2.953857421875, -2.80755615234375, -2.6612548828125, -2.51495361328125, -2.36865234375, -2.22235107421875, -2.0760498046875, -1.92974853515625, -1.783447265625, -1.63714599609375, -1.4908447265625, -1.34454345703125, -1.1982421875, -1.05194091796875, -0.9056396484375, -0.75933837890625, -0.613037109375, -0.46673583984375, -0.3204345703125, -0.17413330078125, -0.02783203125, 0.11846923828125, 0.2647705078125, 0.41107177734375, 0.557373046875, 0.70367431640625, 0.8499755859375, 0.99627685546875, 1.142578125, 1.28887939453125, 1.4351806640625, 1.58148193359375, 1.727783203125, 1.87408447265625, 2.0203857421875, 2.16668701171875, 2.31298828125, 2.45928955078125, 2.6055908203125, 2.75189208984375, 2.898193359375, 3.04449462890625, 3.1907958984375, 3.33709716796875, 3.4833984375, 3.62969970703125, 3.7760009765625, 3.92230224609375, 4.068603515625, 4.21490478515625, 4.3612060546875, 4.50750732421875, 4.65380859375, 4.80010986328125, 4.9464111328125, 5.09271240234375, 5.239013671875, 5.38531494140625, 5.5316162109375, 5.67791748046875, 5.82421875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 14.0, 22.0, 124.0, 313.0, 333.0, 143.0, 44.0, 13.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.48643493652344, -80.31743621826172, -78.1484375, -75.97943878173828, -73.81044006347656, -71.64144897460938, -69.47245025634766, -67.30345153808594, -65.13445281982422, -62.9654541015625, -60.79645538330078, -58.62746047973633, -56.45846176147461, -54.28946304321289, -52.12046813964844, -49.95146942138672, -47.782470703125, -45.61347198486328, -43.44447326660156, -41.27547836303711, -39.10647964477539, -36.93748092651367, -34.76848602294922, -32.5994873046875, -30.43048858642578, -28.261489868164062, -26.092493057250977, -23.92349624633789, -21.754497528076172, -19.585498809814453, -17.416501998901367, -15.247504234313965, -13.078506469726562, -10.90950870513916, -8.740510940551758, -6.5715131759643555, -4.402515411376953, -2.233517646789551, -0.06451988220214844, 2.104477882385254, 4.273475646972656, 6.442473411560059, 8.611471176147461, 10.780468940734863, 12.949466705322266, 15.118464469909668, 17.28746223449707, 19.456459045410156, 21.625457763671875, 23.794456481933594, 25.96345329284668, 28.132450103759766, 30.301448822021484, 32.4704475402832, 34.639442443847656, 36.808441162109375, 38.977439880371094, 41.14643859863281, 43.31543731689453, 45.484432220458984, 47.6534309387207, 49.82242965698242, 51.991424560546875, 54.160423278808594, 56.32942199707031]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 0.0, 6.0, 9.0, 9.0, 12.0, 11.0, 18.0, 18.0, 19.0, 25.0, 25.0, 32.0, 29.0, 37.0, 42.0, 51.0, 52.0, 48.0, 44.0, 54.0, 58.0, 50.0, 40.0, 42.0, 44.0, 34.0, 34.0, 29.0, 27.0, 17.0, 13.0, 18.0, 12.0, 15.0, 8.0, 6.0, 3.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-14.838549613952637, -14.399466514587402, -13.960384368896484, -13.52130126953125, -13.082218170166016, -12.643136024475098, -12.204052925109863, -11.764970779418945, -11.325887680053711, -10.886804580688477, -10.447722434997559, -10.008639335632324, -9.569557189941406, -9.130474090576172, -8.691390991210938, -8.252307891845703, -7.813225746154785, -7.374143123626709, -6.935060501098633, -6.495977401733398, -6.056894779205322, -5.617812156677246, -5.178729057312012, -4.7396464347839355, -4.300563812255859, -3.861481189727783, -3.422398328781128, -2.9833154678344727, -2.5442328453063965, -2.1051502227783203, -1.666067361831665, -1.2269845008850098, -0.7879009246826172, -0.34881818294525146, 0.09026455879211426, 0.52934730052948, 0.9684300422668457, 1.4075126647949219, 1.8465955257415771, 2.2856783866882324, 2.7247610092163086, 3.1638436317443848, 3.60292649269104, 4.042009353637695, 4.4810919761657715, 4.920174598693848, 5.359257698059082, 5.798340320587158, 6.237422943115234, 6.6765055656433105, 7.115588188171387, 7.554671287536621, 7.993753910064697, 8.432836532592773, 8.871919631958008, 9.311002731323242, 9.75008487701416, 10.189167976379395, 10.628250122070312, 11.067333221435547, 11.506416320800781, 11.9454984664917, 12.384581565856934, 12.823663711547852, 13.262746810913086]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 13.0, 10.0, 8.0, 16.0, 28.0, 27.0, 37.0, 65.0, 97.0, 150.0, 240.0, 354.0, 603.0, 1110.0, 2068.0, 4039.0, 8391.0, 19474.0, 47657.0, 123991.0, 293112.0, 315428.0, 138347.0, 53523.0, 21260.0, 9248.0, 4220.0, 2106.0, 1177.0, 639.0, 401.0, 241.0, 152.0, 108.0, 75.0, 44.0, 27.0, 26.0, 15.0, 9.0, 5.0, 8.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.2109375, -6.9627685546875, -6.714599609375, -6.4664306640625, -6.21826171875, -5.9700927734375, -5.721923828125, -5.4737548828125, -5.2255859375, -4.9774169921875, -4.729248046875, -4.4810791015625, -4.23291015625, -3.9847412109375, -3.736572265625, -3.4884033203125, -3.240234375, -2.9920654296875, -2.743896484375, -2.4957275390625, -2.24755859375, -1.9993896484375, -1.751220703125, -1.5030517578125, -1.2548828125, -1.0067138671875, -0.758544921875, -0.5103759765625, -0.26220703125, -0.0140380859375, 0.234130859375, 0.4822998046875, 0.73046875, 0.9786376953125, 1.226806640625, 1.4749755859375, 1.72314453125, 1.9713134765625, 2.219482421875, 2.4676513671875, 2.7158203125, 2.9639892578125, 3.212158203125, 3.4603271484375, 3.70849609375, 3.9566650390625, 4.204833984375, 4.4530029296875, 4.701171875, 4.9493408203125, 5.197509765625, 5.4456787109375, 5.69384765625, 5.9420166015625, 6.190185546875, 6.4383544921875, 6.6865234375, 6.9346923828125, 7.182861328125, 7.4310302734375, 7.67919921875, 7.9273681640625, 8.175537109375, 8.4237060546875, 8.671875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 6.0, 2.0, 7.0, 5.0, 8.0, 19.0, 16.0, 31.0, 33.0, 41.0, 52.0, 71.0, 67.0, 74.0, 65.0, 92.0, 67.0, 52.0, 51.0, 46.0, 40.0, 34.0, 30.0, 34.0, 17.0, 18.0, 10.0, 5.0, 5.0, 5.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-1.8369140625, -1.7901611328125, -1.743408203125, -1.6966552734375, -1.64990234375, -1.6031494140625, -1.556396484375, -1.5096435546875, -1.462890625, -1.4161376953125, -1.369384765625, -1.3226318359375, -1.27587890625, -1.2291259765625, -1.182373046875, -1.1356201171875, -1.0888671875, -1.0421142578125, -0.995361328125, -0.9486083984375, -0.90185546875, -0.8551025390625, -0.808349609375, -0.7615966796875, -0.71484375, -0.6680908203125, -0.621337890625, -0.5745849609375, -0.52783203125, -0.4810791015625, -0.434326171875, -0.3875732421875, -0.3408203125, -0.2940673828125, -0.247314453125, -0.2005615234375, -0.15380859375, -0.1070556640625, -0.060302734375, -0.0135498046875, 0.033203125, 0.0799560546875, 0.126708984375, 0.1734619140625, 0.22021484375, 0.2669677734375, 0.313720703125, 0.3604736328125, 0.4072265625, 0.4539794921875, 0.500732421875, 0.5474853515625, 0.59423828125, 0.6409912109375, 0.687744140625, 0.7344970703125, 0.78125, 0.8280029296875, 0.874755859375, 0.9215087890625, 0.96826171875, 1.0150146484375, 1.061767578125, 1.1085205078125, 1.1552734375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 8.0, 11.0, 8.0, 15.0, 23.0, 26.0, 45.0, 52.0, 78.0, 114.0, 178.0, 357.0, 715.0, 1731.0, 4830.0, 16347.0, 69247.0, 334094.0, 475902.0, 109498.0, 24346.0, 6702.0, 2285.0, 893.0, 370.0, 226.0, 146.0, 87.0, 64.0, 48.0, 25.0, 29.0, 18.0, 9.0, 7.0, 6.0, 3.0, 3.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.7734375, -12.3880615234375, -12.002685546875, -11.6173095703125, -11.23193359375, -10.8465576171875, -10.461181640625, -10.0758056640625, -9.6904296875, -9.3050537109375, -8.919677734375, -8.5343017578125, -8.14892578125, -7.7635498046875, -7.378173828125, -6.9927978515625, -6.607421875, -6.2220458984375, -5.836669921875, -5.4512939453125, -5.06591796875, -4.6805419921875, -4.295166015625, -3.9097900390625, -3.5244140625, -3.1390380859375, -2.753662109375, -2.3682861328125, -1.98291015625, -1.5975341796875, -1.212158203125, -0.8267822265625, -0.44140625, -0.0560302734375, 0.329345703125, 0.7147216796875, 1.10009765625, 1.4854736328125, 1.870849609375, 2.2562255859375, 2.6416015625, 3.0269775390625, 3.412353515625, 3.7977294921875, 4.18310546875, 4.5684814453125, 4.953857421875, 5.3392333984375, 5.724609375, 6.1099853515625, 6.495361328125, 6.8807373046875, 7.26611328125, 7.6514892578125, 8.036865234375, 8.4222412109375, 8.8076171875, 9.1929931640625, 9.578369140625, 9.9637451171875, 10.34912109375, 10.7344970703125, 11.119873046875, 11.5052490234375, 11.890625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 4.0, 7.0, 3.0, 9.0, 10.0, 10.0, 7.0, 12.0, 27.0, 17.0, 25.0, 26.0, 44.0, 27.0, 34.0, 37.0, 48.0, 38.0, 52.0, 44.0, 45.0, 40.0, 43.0, 35.0, 34.0, 54.0, 31.0, 25.0, 35.0, 24.0, 34.0, 23.0, 17.0, 18.0, 8.0, 9.0, 9.0, 8.0, 6.0, 6.0, 5.0, 7.0, 6.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.18359375, -6.01007080078125, -5.8365478515625, -5.66302490234375, -5.489501953125, -5.31597900390625, -5.1424560546875, -4.96893310546875, -4.79541015625, -4.62188720703125, -4.4483642578125, -4.27484130859375, -4.101318359375, -3.92779541015625, -3.7542724609375, -3.58074951171875, -3.4072265625, -3.23370361328125, -3.0601806640625, -2.88665771484375, -2.713134765625, -2.53961181640625, -2.3660888671875, -2.19256591796875, -2.01904296875, -1.84552001953125, -1.6719970703125, -1.49847412109375, -1.324951171875, -1.15142822265625, -0.9779052734375, -0.80438232421875, -0.630859375, -0.45733642578125, -0.2838134765625, -0.11029052734375, 0.063232421875, 0.23675537109375, 0.4102783203125, 0.58380126953125, 0.75732421875, 0.93084716796875, 1.1043701171875, 1.27789306640625, 1.451416015625, 1.62493896484375, 1.7984619140625, 1.97198486328125, 2.1455078125, 2.31903076171875, 2.4925537109375, 2.66607666015625, 2.839599609375, 3.01312255859375, 3.1866455078125, 3.36016845703125, 3.53369140625, 3.70721435546875, 3.8807373046875, 4.05426025390625, 4.227783203125, 4.40130615234375, 4.5748291015625, 4.74835205078125, 4.921875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 4.0, 7.0, 18.0, 18.0, 25.0, 45.0, 67.0, 118.0, 240.0, 471.0, 1183.0, 3201.0, 10603.0, 54579.0, 792138.0, 157575.0, 19964.0, 5110.0, 1692.0, 745.0, 325.0, 198.0, 74.0, 57.0, 24.0, 22.0, 18.0, 6.0, 7.0, 8.0, 5.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.359375, -23.61474609375, -22.8701171875, -22.12548828125, -21.380859375, -20.63623046875, -19.8916015625, -19.14697265625, -18.40234375, -17.65771484375, -16.9130859375, -16.16845703125, -15.423828125, -14.67919921875, -13.9345703125, -13.18994140625, -12.4453125, -11.70068359375, -10.9560546875, -10.21142578125, -9.466796875, -8.72216796875, -7.9775390625, -7.23291015625, -6.48828125, -5.74365234375, -4.9990234375, -4.25439453125, -3.509765625, -2.76513671875, -2.0205078125, -1.27587890625, -0.53125, 0.21337890625, 0.9580078125, 1.70263671875, 2.447265625, 3.19189453125, 3.9365234375, 4.68115234375, 5.42578125, 6.17041015625, 6.9150390625, 7.65966796875, 8.404296875, 9.14892578125, 9.8935546875, 10.63818359375, 11.3828125, 12.12744140625, 12.8720703125, 13.61669921875, 14.361328125, 15.10595703125, 15.8505859375, 16.59521484375, 17.33984375, 18.08447265625, 18.8291015625, 19.57373046875, 20.318359375, 21.06298828125, 21.8076171875, 22.55224609375, 23.296875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 6.0, 6.0, 7.0, 6.0, 18.0, 22.0, 26.0, 34.0, 52.0, 57.0, 101.0, 139.0, 139.0, 114.0, 88.0, 55.0, 36.0, 24.0, 27.0, 10.0, 14.0, 9.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014429092407226562, -0.001405179500579834, -0.0013674497604370117, -0.0013297200202941895, -0.0012919902801513672, -0.001254260540008545, -0.0012165307998657227, -0.0011788010597229004, -0.0011410713195800781, -0.0011033415794372559, -0.0010656118392944336, -0.0010278820991516113, -0.000990152359008789, -0.0009524226188659668, -0.0009146928787231445, -0.0008769631385803223, -0.0008392333984375, -0.0008015036582946777, -0.0007637739181518555, -0.0007260441780090332, -0.0006883144378662109, -0.0006505846977233887, -0.0006128549575805664, -0.0005751252174377441, -0.0005373954772949219, -0.0004996657371520996, -0.00046193599700927734, -0.0004242062568664551, -0.0003864765167236328, -0.00034874677658081055, -0.0003110170364379883, -0.000273287296295166, -0.00023555755615234375, -0.00019782781600952148, -0.00016009807586669922, -0.00012236833572387695, -8.463859558105469e-05, -4.690885543823242e-05, -9.179115295410156e-06, 2.855062484741211e-05, 6.628036499023438e-05, 0.00010401010513305664, 0.0001417398452758789, 0.00017946958541870117, 0.00021719932556152344, 0.0002549290657043457, 0.00029265880584716797, 0.00033038854598999023, 0.0003681182861328125, 0.00040584802627563477, 0.00044357776641845703, 0.0004813075065612793, 0.0005190372467041016, 0.0005567669868469238, 0.0005944967269897461, 0.0006322264671325684, 0.0006699562072753906, 0.0007076859474182129, 0.0007454156875610352, 0.0007831454277038574, 0.0008208751678466797, 0.000858604907989502, 0.0008963346481323242, 0.0009340643882751465, 0.0009717941284179688]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 4.0, 5.0, 6.0, 10.0, 20.0, 36.0, 40.0, 85.0, 111.0, 196.0, 363.0, 654.0, 1572.0, 5465.0, 31704.0, 805584.0, 183580.0, 14164.0, 2944.0, 954.0, 433.0, 246.0, 147.0, 92.0, 50.0, 33.0, 24.0, 12.0, 5.0, 10.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-34.25, -33.1728515625, -32.095703125, -31.0185546875, -29.94140625, -28.8642578125, -27.787109375, -26.7099609375, -25.6328125, -24.5556640625, -23.478515625, -22.4013671875, -21.32421875, -20.2470703125, -19.169921875, -18.0927734375, -17.015625, -15.9384765625, -14.861328125, -13.7841796875, -12.70703125, -11.6298828125, -10.552734375, -9.4755859375, -8.3984375, -7.3212890625, -6.244140625, -5.1669921875, -4.08984375, -3.0126953125, -1.935546875, -0.8583984375, 0.21875, 1.2958984375, 2.373046875, 3.4501953125, 4.52734375, 5.6044921875, 6.681640625, 7.7587890625, 8.8359375, 9.9130859375, 10.990234375, 12.0673828125, 13.14453125, 14.2216796875, 15.298828125, 16.3759765625, 17.453125, 18.5302734375, 19.607421875, 20.6845703125, 21.76171875, 22.8388671875, 23.916015625, 24.9931640625, 26.0703125, 27.1474609375, 28.224609375, 29.3017578125, 30.37890625, 31.4560546875, 32.533203125, 33.6103515625, 34.6875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 8.0, 6.0, 11.0, 14.0, 25.0, 33.0, 35.0, 74.0, 211.0, 306.0, 151.0, 42.0, 32.0, 13.0, 11.0, 8.0, 15.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.90625, -22.29052734375, -21.6748046875, -21.05908203125, -20.443359375, -19.82763671875, -19.2119140625, -18.59619140625, -17.98046875, -17.36474609375, -16.7490234375, -16.13330078125, -15.517578125, -14.90185546875, -14.2861328125, -13.67041015625, -13.0546875, -12.43896484375, -11.8232421875, -11.20751953125, -10.591796875, -9.97607421875, -9.3603515625, -8.74462890625, -8.12890625, -7.51318359375, -6.8974609375, -6.28173828125, -5.666015625, -5.05029296875, -4.4345703125, -3.81884765625, -3.203125, -2.58740234375, -1.9716796875, -1.35595703125, -0.740234375, -0.12451171875, 0.4912109375, 1.10693359375, 1.72265625, 2.33837890625, 2.9541015625, 3.56982421875, 4.185546875, 4.80126953125, 5.4169921875, 6.03271484375, 6.6484375, 7.26416015625, 7.8798828125, 8.49560546875, 9.111328125, 9.72705078125, 10.3427734375, 10.95849609375, 11.57421875, 12.18994140625, 12.8056640625, 13.42138671875, 14.037109375, 14.65283203125, 15.2685546875, 15.88427734375, 16.5]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 11.0, 15.0, 31.0, 87.0, 132.0, 249.0, 234.0, 144.0, 54.0, 22.0, 13.0, 7.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-217.14044189453125, -212.7032012939453, -208.26596069335938, -203.8287353515625, -199.39149475097656, -194.95425415039062, -190.5170135498047, -186.07977294921875, -181.64254760742188, -177.20530700683594, -172.76806640625, -168.33084106445312, -163.8936004638672, -159.45635986328125, -155.0191192626953, -150.58187866210938, -146.1446533203125, -141.70741271972656, -137.27017211914062, -132.83294677734375, -128.3957061767578, -123.95846557617188, -119.52122497558594, -115.08399200439453, -110.64674377441406, -106.20950317382812, -101.77227020263672, -97.33502960205078, -92.89779663085938, -88.46055603027344, -84.0233154296875, -79.5860824584961, -75.14885711669922, -70.71161651611328, -66.27438354492188, -61.83714294433594, -57.39990997314453, -52.962669372558594, -48.52543258666992, -44.08819580078125, -39.65095901489258, -35.213722229003906, -30.776485443115234, -26.33924674987793, -21.902009963989258, -17.464773178100586, -13.027534484863281, -8.59029769897461, -4.1530609130859375, 0.2841763496398926, 4.721413612365723, 9.158651351928711, 13.595888137817383, 18.033124923706055, 22.47036361694336, 26.90760040283203, 31.344837188720703, 35.782073974609375, 40.21931076049805, 44.65654754638672, 49.093788146972656, 53.53102111816406, 57.96826171875, 62.40549850463867, 66.84273529052734]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 6.0, 8.0, 19.0, 12.0, 32.0, 29.0, 32.0, 30.0, 40.0, 45.0, 65.0, 55.0, 53.0, 57.0, 56.0, 55.0, 51.0, 47.0, 58.0, 43.0, 37.0, 38.0, 35.0, 17.0, 18.0, 22.0, 15.0, 9.0, 8.0, 5.0, 5.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.30374145507812, -74.46532440185547, -72.62690734863281, -70.78848266601562, -68.95006561279297, -67.11164855957031, -65.27323150634766, -63.434810638427734, -61.59638977050781, -59.757972717285156, -57.919551849365234, -56.08113479614258, -54.242713928222656, -52.404296875, -50.565879821777344, -48.72745895385742, -46.889041900634766, -45.05062484741211, -43.21220397949219, -41.37378692626953, -39.53536605834961, -37.69694900512695, -35.85852813720703, -34.020111083984375, -32.18169403076172, -30.34327507019043, -28.50485610961914, -26.666439056396484, -24.828018188476562, -22.989601135253906, -21.151182174682617, -19.312763214111328, -17.474342346191406, -15.635923385620117, -13.797504425048828, -11.959086418151855, -10.120667457580566, -8.282248497009277, -6.443830490112305, -4.605411529541016, -2.7669925689697266, -0.9285738468170166, 0.9098448753356934, 2.748263359069824, 4.586682319641113, 6.425101280212402, 8.263519287109375, 10.101938247680664, 11.940357208251953, 13.778776168823242, 15.617195129394531, 17.455612182617188, 19.29403305053711, 21.132450103759766, 22.970869064331055, 24.809288024902344, 26.647706985473633, 28.486125946044922, 30.32454490661621, 32.1629638671875, 34.001380920410156, 35.83980178833008, 37.678218841552734, 39.516639709472656, 41.35505676269531]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 6.0, 3.0, 11.0, 13.0, 12.0, 17.0, 37.0, 48.0, 70.0, 146.0, 262.0, 621.0, 1756.0, 7074.0, 46766.0, 3500342.0, 602009.0, 28282.0, 4717.0, 1251.0, 417.0, 183.0, 85.0, 49.0, 38.0, 18.0, 18.0, 15.0, 7.0, 8.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.46875, -34.507080078125, -33.54541015625, -32.583740234375, -31.6220703125, -30.660400390625, -29.69873046875, -28.737060546875, -27.775390625, -26.813720703125, -25.85205078125, -24.890380859375, -23.9287109375, -22.967041015625, -22.00537109375, -21.043701171875, -20.08203125, -19.120361328125, -18.15869140625, -17.197021484375, -16.2353515625, -15.273681640625, -14.31201171875, -13.350341796875, -12.388671875, -11.427001953125, -10.46533203125, -9.503662109375, -8.5419921875, -7.580322265625, -6.61865234375, -5.656982421875, -4.6953125, -3.733642578125, -2.77197265625, -1.810302734375, -0.8486328125, 0.113037109375, 1.07470703125, 2.036376953125, 2.998046875, 3.959716796875, 4.92138671875, 5.883056640625, 6.8447265625, 7.806396484375, 8.76806640625, 9.729736328125, 10.69140625, 11.653076171875, 12.61474609375, 13.576416015625, 14.5380859375, 15.499755859375, 16.46142578125, 17.423095703125, 18.384765625, 19.346435546875, 20.30810546875, 21.269775390625, 22.2314453125, 23.193115234375, 24.15478515625, 25.116455078125, 26.078125]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 7.0, 3.0, 3.0, 7.0, 10.0, 13.0, 19.0, 26.0, 32.0, 35.0, 47.0, 58.0, 71.0, 67.0, 89.0, 59.0, 54.0, 75.0, 65.0, 56.0, 36.0, 34.0, 39.0, 31.0, 16.0, 27.0, 7.0, 8.0, 3.0, 6.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.337890625, -2.2816009521484375, -2.225311279296875, -2.1690216064453125, -2.11273193359375, -2.0564422607421875, -2.000152587890625, -1.9438629150390625, -1.8875732421875, -1.8312835693359375, -1.774993896484375, -1.7187042236328125, -1.66241455078125, -1.6061248779296875, -1.549835205078125, -1.4935455322265625, -1.437255859375, -1.3809661865234375, -1.324676513671875, -1.2683868408203125, -1.21209716796875, -1.1558074951171875, -1.099517822265625, -1.0432281494140625, -0.9869384765625, -0.9306488037109375, -0.874359130859375, -0.8180694580078125, -0.76177978515625, -0.7054901123046875, -0.649200439453125, -0.5929107666015625, -0.53662109375, -0.4803314208984375, -0.424041748046875, -0.3677520751953125, -0.31146240234375, -0.2551727294921875, -0.198883056640625, -0.1425933837890625, -0.0863037109375, -0.0300140380859375, 0.026275634765625, 0.0825653076171875, 0.13885498046875, 0.1951446533203125, 0.251434326171875, 0.3077239990234375, 0.364013671875, 0.4203033447265625, 0.476593017578125, 0.5328826904296875, 0.58917236328125, 0.6454620361328125, 0.701751708984375, 0.7580413818359375, 0.8143310546875, 0.8706207275390625, 0.926910400390625, 0.9832000732421875, 1.03948974609375, 1.0957794189453125, 1.152069091796875, 1.2083587646484375, 1.2646484375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 0.0, 2.0, 4.0, 10.0, 4.0, 14.0, 28.0, 37.0, 63.0, 84.0, 163.0, 311.0, 623.0, 1605.0, 4608.0, 17137.0, 92248.0, 2657959.0, 1320609.0, 76030.0, 15334.0, 4347.0, 1541.0, 689.0, 344.0, 172.0, 109.0, 73.0, 41.0, 26.0, 21.0, 15.0, 9.0, 10.0, 5.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.234375, -21.66357421875, -21.0927734375, -20.52197265625, -19.951171875, -19.38037109375, -18.8095703125, -18.23876953125, -17.66796875, -17.09716796875, -16.5263671875, -15.95556640625, -15.384765625, -14.81396484375, -14.2431640625, -13.67236328125, -13.1015625, -12.53076171875, -11.9599609375, -11.38916015625, -10.818359375, -10.24755859375, -9.6767578125, -9.10595703125, -8.53515625, -7.96435546875, -7.3935546875, -6.82275390625, -6.251953125, -5.68115234375, -5.1103515625, -4.53955078125, -3.96875, -3.39794921875, -2.8271484375, -2.25634765625, -1.685546875, -1.11474609375, -0.5439453125, 0.02685546875, 0.59765625, 1.16845703125, 1.7392578125, 2.31005859375, 2.880859375, 3.45166015625, 4.0224609375, 4.59326171875, 5.1640625, 5.73486328125, 6.3056640625, 6.87646484375, 7.447265625, 8.01806640625, 8.5888671875, 9.15966796875, 9.73046875, 10.30126953125, 10.8720703125, 11.44287109375, 12.013671875, 12.58447265625, 13.1552734375, 13.72607421875, 14.296875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 5.0, 5.0, 10.0, 9.0, 11.0, 10.0, 19.0, 33.0, 52.0, 69.0, 124.0, 200.0, 397.0, 1372.0, 961.0, 329.0, 171.0, 89.0, 67.0, 36.0, 24.0, 19.0, 18.0, 11.0, 14.0, 6.0, 5.0, 6.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.564453125, -2.447540283203125, -2.33062744140625, -2.213714599609375, -2.0968017578125, -1.979888916015625, -1.86297607421875, -1.746063232421875, -1.629150390625, -1.512237548828125, -1.39532470703125, -1.278411865234375, -1.1614990234375, -1.044586181640625, -0.92767333984375, -0.810760498046875, -0.69384765625, -0.576934814453125, -0.46002197265625, -0.343109130859375, -0.2261962890625, -0.109283447265625, 0.00762939453125, 0.124542236328125, 0.241455078125, 0.358367919921875, 0.47528076171875, 0.592193603515625, 0.7091064453125, 0.826019287109375, 0.94293212890625, 1.059844970703125, 1.1767578125, 1.293670654296875, 1.41058349609375, 1.527496337890625, 1.6444091796875, 1.761322021484375, 1.87823486328125, 1.995147705078125, 2.112060546875, 2.228973388671875, 2.34588623046875, 2.462799072265625, 2.5797119140625, 2.696624755859375, 2.81353759765625, 2.930450439453125, 3.04736328125, 3.164276123046875, 3.28118896484375, 3.398101806640625, 3.5150146484375, 3.631927490234375, 3.74884033203125, 3.865753173828125, 3.982666015625, 4.099578857421875, 4.21649169921875, 4.333404541015625, 4.4503173828125, 4.567230224609375, 4.68414306640625, 4.801055908203125, 4.91796875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 6.0, 9.0, 24.0, 31.0, 39.0, 67.0, 122.0, 149.0, 157.0, 137.0, 97.0, 64.0, 41.0, 19.0, 13.0, 11.0, 9.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.037200927734375, -23.248794555664062, -22.460390090942383, -21.67198371887207, -20.883577346801758, -20.095172882080078, -19.306766510009766, -18.518360137939453, -17.729955673217773, -16.94154930114746, -16.15314483642578, -15.364738464355469, -14.576333045959473, -13.787927627563477, -12.999521255493164, -12.211115837097168, -11.422709465026855, -10.63430404663086, -9.845897674560547, -9.05749225616455, -8.269086837768555, -7.4806809425354, -6.692275047302246, -5.90386962890625, -5.115463733673096, -4.327057838439941, -3.5386524200439453, -2.750246524810791, -1.9618408679962158, -1.1734352111816406, -0.38502931594848633, 0.40337610244750977, 1.191781997680664, 1.9801876544952393, 2.7685933113098145, 3.5569992065429688, 4.345404624938965, 5.133810520172119, 5.922216415405273, 6.7106218338012695, 7.499027729034424, 8.287433624267578, 9.075839042663574, 9.86424446105957, 10.652650833129883, 11.441056251525879, 12.229461669921875, 13.017868041992188, 13.806273460388184, 14.59467887878418, 15.383085250854492, 16.171489715576172, 16.959896087646484, 17.748302459716797, 18.53670883178711, 19.32511329650879, 20.1135196685791, 20.901926040649414, 21.690330505371094, 22.478736877441406, 23.26714324951172, 24.0555477142334, 24.84395408630371, 25.63235855102539, 26.420764923095703]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 3.0, 5.0, 4.0, 11.0, 14.0, 16.0, 20.0, 17.0, 34.0, 33.0, 24.0, 49.0, 34.0, 50.0, 50.0, 54.0, 53.0, 75.0, 54.0, 54.0, 56.0, 39.0, 52.0, 39.0, 41.0, 33.0, 20.0, 17.0, 11.0, 12.0, 11.0, 7.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.036450386047363, -14.542889595031738, -14.049328804016113, -13.555768013000488, -13.062207221984863, -12.568646430969238, -12.075085639953613, -11.581524848937988, -11.087964057922363, -10.594403266906738, -10.100842475891113, -9.607281684875488, -9.113720893859863, -8.620160102844238, -8.126599311828613, -7.633038520812988, -7.139477729797363, -6.645916938781738, -6.152356147766113, -5.658795356750488, -5.165234565734863, -4.671673774719238, -4.178112983703613, -3.6845521926879883, -3.1909914016723633, -2.6974306106567383, -2.2038698196411133, -1.7103090286254883, -1.2167482376098633, -0.7231874465942383, -0.22962665557861328, 0.2639341354370117, 0.7574958801269531, 1.2510566711425781, 1.7446174621582031, 2.238178253173828, 2.731739044189453, 3.225299835205078, 3.718860626220703, 4.212421417236328, 4.705982208251953, 5.199542999267578, 5.693103790283203, 6.186664581298828, 6.680225372314453, 7.173786163330078, 7.667346954345703, 8.160907745361328, 8.654468536376953, 9.148029327392578, 9.641590118408203, 10.135150909423828, 10.628711700439453, 11.122272491455078, 11.615833282470703, 12.109394073486328, 12.602954864501953, 13.096515655517578, 13.590076446533203, 14.083637237548828, 14.577198028564453, 15.070758819580078, 15.564319610595703, 16.057880401611328, 16.551441192626953]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 4.0, 14.0, 9.0, 7.0, 20.0, 28.0, 37.0, 46.0, 63.0, 83.0, 124.0, 174.0, 268.0, 438.0, 651.0, 1100.0, 1920.0, 3522.0, 6791.0, 13852.0, 28443.0, 60027.0, 128543.0, 237589.0, 263539.0, 156215.0, 74721.0, 34880.0, 16915.0, 8360.0, 4334.0, 2306.0, 1300.0, 753.0, 475.0, 282.0, 203.0, 132.0, 115.0, 81.0, 62.0, 42.0, 26.0, 19.0, 13.0, 7.0, 8.0, 4.0, 5.0, 5.0, 2.0, 2.0, 2.0], "bins": [-5.984375, -5.8140869140625, -5.643798828125, -5.4735107421875, -5.30322265625, -5.1329345703125, -4.962646484375, -4.7923583984375, -4.6220703125, -4.4517822265625, -4.281494140625, -4.1112060546875, -3.94091796875, -3.7706298828125, -3.600341796875, -3.4300537109375, -3.259765625, -3.0894775390625, -2.919189453125, -2.7489013671875, -2.57861328125, -2.4083251953125, -2.238037109375, -2.0677490234375, -1.8974609375, -1.7271728515625, -1.556884765625, -1.3865966796875, -1.21630859375, -1.0460205078125, -0.875732421875, -0.7054443359375, -0.53515625, -0.3648681640625, -0.194580078125, -0.0242919921875, 0.14599609375, 0.3162841796875, 0.486572265625, 0.6568603515625, 0.8271484375, 0.9974365234375, 1.167724609375, 1.3380126953125, 1.50830078125, 1.6785888671875, 1.848876953125, 2.0191650390625, 2.189453125, 2.3597412109375, 2.530029296875, 2.7003173828125, 2.87060546875, 3.0408935546875, 3.211181640625, 3.3814697265625, 3.5517578125, 3.7220458984375, 3.892333984375, 4.0626220703125, 4.23291015625, 4.4031982421875, 4.573486328125, 4.7437744140625, 4.9140625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 6.0, 6.0, 8.0, 13.0, 17.0, 30.0, 31.0, 25.0, 42.0, 50.0, 62.0, 69.0, 67.0, 87.0, 71.0, 55.0, 79.0, 54.0, 46.0, 35.0, 39.0, 32.0, 23.0, 19.0, 13.0, 9.0, 4.0, 2.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.7724609375, -1.7201080322265625, -1.667755126953125, -1.6154022216796875, -1.56304931640625, -1.5106964111328125, -1.458343505859375, -1.4059906005859375, -1.3536376953125, -1.3012847900390625, -1.248931884765625, -1.1965789794921875, -1.14422607421875, -1.0918731689453125, -1.039520263671875, -0.9871673583984375, -0.934814453125, -0.8824615478515625, -0.830108642578125, -0.7777557373046875, -0.72540283203125, -0.6730499267578125, -0.620697021484375, -0.5683441162109375, -0.5159912109375, -0.4636383056640625, -0.411285400390625, -0.3589324951171875, -0.30657958984375, -0.2542266845703125, -0.201873779296875, -0.1495208740234375, -0.09716796875, -0.0448150634765625, 0.007537841796875, 0.0598907470703125, 0.11224365234375, 0.1645965576171875, 0.216949462890625, 0.2693023681640625, 0.3216552734375, 0.3740081787109375, 0.426361083984375, 0.4787139892578125, 0.53106689453125, 0.5834197998046875, 0.635772705078125, 0.6881256103515625, 0.740478515625, 0.7928314208984375, 0.845184326171875, 0.8975372314453125, 0.94989013671875, 1.0022430419921875, 1.054595947265625, 1.1069488525390625, 1.1593017578125, 1.2116546630859375, 1.264007568359375, 1.3163604736328125, 1.36871337890625, 1.4210662841796875, 1.473419189453125, 1.5257720947265625, 1.578125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 4.0, 2.0, 3.0, 8.0, 6.0, 5.0, 8.0, 11.0, 25.0, 33.0, 45.0, 72.0, 86.0, 145.0, 279.0, 484.0, 953.0, 2024.0, 4623.0, 12161.0, 33956.0, 103682.0, 297502.0, 366970.0, 148491.0, 48605.0, 16665.0, 6403.0, 2639.0, 1190.0, 597.0, 317.0, 187.0, 125.0, 78.0, 57.0, 33.0, 28.0, 18.0, 16.0, 10.0, 10.0, 2.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.84765625, -7.6036376953125, -7.359619140625, -7.1156005859375, -6.87158203125, -6.6275634765625, -6.383544921875, -6.1395263671875, -5.8955078125, -5.6514892578125, -5.407470703125, -5.1634521484375, -4.91943359375, -4.6754150390625, -4.431396484375, -4.1873779296875, -3.943359375, -3.6993408203125, -3.455322265625, -3.2113037109375, -2.96728515625, -2.7232666015625, -2.479248046875, -2.2352294921875, -1.9912109375, -1.7471923828125, -1.503173828125, -1.2591552734375, -1.01513671875, -0.7711181640625, -0.527099609375, -0.2830810546875, -0.0390625, 0.2049560546875, 0.448974609375, 0.6929931640625, 0.93701171875, 1.1810302734375, 1.425048828125, 1.6690673828125, 1.9130859375, 2.1571044921875, 2.401123046875, 2.6451416015625, 2.88916015625, 3.1331787109375, 3.377197265625, 3.6212158203125, 3.865234375, 4.1092529296875, 4.353271484375, 4.5972900390625, 4.84130859375, 5.0853271484375, 5.329345703125, 5.5733642578125, 5.8173828125, 6.0614013671875, 6.305419921875, 6.5494384765625, 6.79345703125, 7.0374755859375, 7.281494140625, 7.5255126953125, 7.76953125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 4.0, 6.0, 11.0, 9.0, 10.0, 16.0, 17.0, 17.0, 25.0, 22.0, 20.0, 34.0, 22.0, 34.0, 31.0, 36.0, 28.0, 38.0, 52.0, 41.0, 46.0, 51.0, 43.0, 33.0, 46.0, 29.0, 38.0, 28.0, 23.0, 24.0, 23.0, 34.0, 16.0, 17.0, 12.0, 16.0, 9.0, 19.0, 4.0, 3.0, 5.0, 5.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0625, -4.88604736328125, -4.7095947265625, -4.53314208984375, -4.356689453125, -4.18023681640625, -4.0037841796875, -3.82733154296875, -3.65087890625, -3.47442626953125, -3.2979736328125, -3.12152099609375, -2.945068359375, -2.76861572265625, -2.5921630859375, -2.41571044921875, -2.2392578125, -2.06280517578125, -1.8863525390625, -1.70989990234375, -1.533447265625, -1.35699462890625, -1.1805419921875, -1.00408935546875, -0.82763671875, -0.65118408203125, -0.4747314453125, -0.29827880859375, -0.121826171875, 0.05462646484375, 0.2310791015625, 0.40753173828125, 0.583984375, 0.76043701171875, 0.9368896484375, 1.11334228515625, 1.289794921875, 1.46624755859375, 1.6427001953125, 1.81915283203125, 1.99560546875, 2.17205810546875, 2.3485107421875, 2.52496337890625, 2.701416015625, 2.87786865234375, 3.0543212890625, 3.23077392578125, 3.4072265625, 3.58367919921875, 3.7601318359375, 3.93658447265625, 4.113037109375, 4.28948974609375, 4.4659423828125, 4.64239501953125, 4.81884765625, 4.99530029296875, 5.1717529296875, 5.34820556640625, 5.524658203125, 5.70111083984375, 5.8775634765625, 6.05401611328125, 6.23046875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 1.0, 5.0, 8.0, 9.0, 17.0, 17.0, 20.0, 24.0, 51.0, 69.0, 84.0, 149.0, 214.0, 320.0, 628.0, 961.0, 1816.0, 3312.0, 6775.0, 15809.0, 43010.0, 144743.0, 419356.0, 283148.0, 80759.0, 26343.0, 10348.0, 4739.0, 2465.0, 1301.0, 770.0, 431.0, 277.0, 179.0, 122.0, 87.0, 58.0, 37.0, 33.0, 23.0, 11.0, 15.0, 6.0, 4.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.703125, -4.5638427734375, -4.424560546875, -4.2852783203125, -4.14599609375, -4.0067138671875, -3.867431640625, -3.7281494140625, -3.5888671875, -3.4495849609375, -3.310302734375, -3.1710205078125, -3.03173828125, -2.8924560546875, -2.753173828125, -2.6138916015625, -2.474609375, -2.3353271484375, -2.196044921875, -2.0567626953125, -1.91748046875, -1.7781982421875, -1.638916015625, -1.4996337890625, -1.3603515625, -1.2210693359375, -1.081787109375, -0.9425048828125, -0.80322265625, -0.6639404296875, -0.524658203125, -0.3853759765625, -0.24609375, -0.1068115234375, 0.032470703125, 0.1717529296875, 0.31103515625, 0.4503173828125, 0.589599609375, 0.7288818359375, 0.8681640625, 1.0074462890625, 1.146728515625, 1.2860107421875, 1.42529296875, 1.5645751953125, 1.703857421875, 1.8431396484375, 1.982421875, 2.1217041015625, 2.260986328125, 2.4002685546875, 2.53955078125, 2.6788330078125, 2.818115234375, 2.9573974609375, 3.0966796875, 3.2359619140625, 3.375244140625, 3.5145263671875, 3.65380859375, 3.7930908203125, 3.932373046875, 4.0716552734375, 4.2109375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 15.0, 7.0, 7.0, 16.0, 21.0, 18.0, 21.0, 30.0, 35.0, 48.0, 76.0, 95.0, 111.0, 108.0, 78.0, 80.0, 47.0, 48.0, 23.0, 24.0, 22.0, 16.0, 12.0, 14.0, 6.0, 1.0, 2.0, 3.0, 3.0, 6.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0005121231079101562, -0.0004955306649208069, -0.0004789382219314575, -0.00046234577894210815, -0.0004457533359527588, -0.0004291608929634094, -0.00041256844997406006, -0.0003959760069847107, -0.00037938356399536133, -0.00036279112100601196, -0.0003461986780166626, -0.00032960623502731323, -0.00031301379203796387, -0.0002964213490486145, -0.00027982890605926514, -0.00026323646306991577, -0.0002466440200805664, -0.00023005157709121704, -0.00021345913410186768, -0.0001968666911125183, -0.00018027424812316895, -0.00016368180513381958, -0.00014708936214447021, -0.00013049691915512085, -0.00011390447616577148, -9.731203317642212e-05, -8.071959018707275e-05, -6.412714719772339e-05, -4.7534704208374023e-05, -3.094226121902466e-05, -1.4349818229675293e-05, 2.2426247596740723e-06, 1.8835067749023438e-05, 3.54275107383728e-05, 5.201995372772217e-05, 6.861239671707153e-05, 8.52048397064209e-05, 0.00010179728269577026, 0.00011838972568511963, 0.000134982168674469, 0.00015157461166381836, 0.00016816705465316772, 0.0001847594976425171, 0.00020135194063186646, 0.00021794438362121582, 0.00023453682661056519, 0.00025112926959991455, 0.0002677217125892639, 0.0002843141555786133, 0.00030090659856796265, 0.000317499041557312, 0.0003340914845466614, 0.00035068392753601074, 0.0003672763705253601, 0.00038386881351470947, 0.00040046125650405884, 0.0004170536994934082, 0.00043364614248275757, 0.00045023858547210693, 0.0004668310284614563, 0.00048342347145080566, 0.000500015914440155, 0.0005166083574295044, 0.0005332008004188538, 0.0005497932434082031]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 1.0, 0.0, 9.0, 8.0, 18.0, 23.0, 37.0, 44.0, 82.0, 116.0, 204.0, 382.0, 768.0, 1564.0, 3563.0, 10037.0, 33869.0, 143382.0, 521515.0, 253566.0, 54849.0, 15184.0, 5213.0, 2071.0, 940.0, 470.0, 240.0, 163.0, 106.0, 46.0, 29.0, 19.0, 10.0, 9.0, 7.0, 3.0, 4.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.4453125, -5.2412109375, -5.037109375, -4.8330078125, -4.62890625, -4.4248046875, -4.220703125, -4.0166015625, -3.8125, -3.6083984375, -3.404296875, -3.2001953125, -2.99609375, -2.7919921875, -2.587890625, -2.3837890625, -2.1796875, -1.9755859375, -1.771484375, -1.5673828125, -1.36328125, -1.1591796875, -0.955078125, -0.7509765625, -0.546875, -0.3427734375, -0.138671875, 0.0654296875, 0.26953125, 0.4736328125, 0.677734375, 0.8818359375, 1.0859375, 1.2900390625, 1.494140625, 1.6982421875, 1.90234375, 2.1064453125, 2.310546875, 2.5146484375, 2.71875, 2.9228515625, 3.126953125, 3.3310546875, 3.53515625, 3.7392578125, 3.943359375, 4.1474609375, 4.3515625, 4.5556640625, 4.759765625, 4.9638671875, 5.16796875, 5.3720703125, 5.576171875, 5.7802734375, 5.984375, 6.1884765625, 6.392578125, 6.5966796875, 6.80078125, 7.0048828125, 7.208984375, 7.4130859375, 7.6171875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 1.0, 6.0, 5.0, 8.0, 12.0, 14.0, 23.0, 25.0, 33.0, 32.0, 52.0, 63.0, 68.0, 113.0, 99.0, 104.0, 75.0, 56.0, 53.0, 27.0, 25.0, 25.0, 18.0, 12.0, 9.0, 10.0, 8.0, 3.0, 6.0, 6.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.9609375, -5.81011962890625, -5.6593017578125, -5.50848388671875, -5.357666015625, -5.20684814453125, -5.0560302734375, -4.90521240234375, -4.75439453125, -4.60357666015625, -4.4527587890625, -4.30194091796875, -4.151123046875, -4.00030517578125, -3.8494873046875, -3.69866943359375, -3.5478515625, -3.39703369140625, -3.2462158203125, -3.09539794921875, -2.944580078125, -2.79376220703125, -2.6429443359375, -2.49212646484375, -2.34130859375, -2.19049072265625, -2.0396728515625, -1.88885498046875, -1.738037109375, -1.58721923828125, -1.4364013671875, -1.28558349609375, -1.134765625, -0.98394775390625, -0.8331298828125, -0.68231201171875, -0.531494140625, -0.38067626953125, -0.2298583984375, -0.07904052734375, 0.07177734375, 0.22259521484375, 0.3734130859375, 0.52423095703125, 0.675048828125, 0.82586669921875, 0.9766845703125, 1.12750244140625, 1.2783203125, 1.42913818359375, 1.5799560546875, 1.73077392578125, 1.881591796875, 2.03240966796875, 2.1832275390625, 2.33404541015625, 2.48486328125, 2.63568115234375, 2.7864990234375, 2.93731689453125, 3.088134765625, 3.23895263671875, 3.3897705078125, 3.54058837890625, 3.69140625]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 17.0, 24.0, 40.0, 66.0, 107.0, 173.0, 192.0, 156.0, 88.0, 57.0, 26.0, 16.0, 15.0, 8.0, 7.0, 3.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.10985565185547, -72.7837905883789, -70.45772552490234, -68.13165283203125, -65.80558776855469, -63.479522705078125, -61.15345764160156, -58.827392578125, -56.50132369995117, -54.17525863647461, -51.84918975830078, -49.52312469482422, -47.197059631347656, -44.87099075317383, -42.544925689697266, -40.21885681152344, -37.892791748046875, -35.56672668457031, -33.240657806396484, -30.914592742919922, -28.588525772094727, -26.26245880126953, -23.93639373779297, -21.610326766967773, -19.284259796142578, -16.958192825317383, -14.632126808166504, -12.306060791015625, -9.97999382019043, -7.653926849365234, -5.3278608322143555, -3.0017948150634766, -0.67572021484375, 1.650346279144287, 3.976412773132324, 6.302479267120361, 8.628545761108398, 10.954612731933594, 13.280678749084473, 15.606744766235352, 17.932811737060547, 20.258878707885742, 22.584945678710938, 24.9110107421875, 27.237077713012695, 29.56314468383789, 31.889209747314453, 34.21527862548828, 36.541343688964844, 38.867408752441406, 41.193477630615234, 43.5195426940918, 45.845611572265625, 48.17167663574219, 50.49774169921875, 52.82380676269531, 55.14987564086914, 57.4759407043457, 59.80200958251953, 62.128074645996094, 64.45413970947266, 66.78021240234375, 69.10627746582031, 71.43234252929688, 73.75840759277344]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 7.0, 3.0, 5.0, 9.0, 15.0, 10.0, 15.0, 10.0, 21.0, 23.0, 40.0, 30.0, 29.0, 52.0, 42.0, 50.0, 49.0, 45.0, 60.0, 47.0, 59.0, 48.0, 41.0, 31.0, 47.0, 47.0, 35.0, 19.0, 16.0, 19.0, 20.0, 13.0, 8.0, 12.0, 4.0, 7.0, 3.0, 3.0, 0.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.40959930419922, -39.10161590576172, -37.793636322021484, -36.48565673828125, -35.17767333984375, -33.86968994140625, -32.561710357666016, -31.25372886657715, -29.94574737548828, -28.637765884399414, -27.329784393310547, -26.02180290222168, -24.713821411132812, -23.405839920043945, -22.097858428955078, -20.78987693786621, -19.481895446777344, -18.173913955688477, -16.86593246459961, -15.557950973510742, -14.249969482421875, -12.941987991333008, -11.63400650024414, -10.326025009155273, -9.018043518066406, -7.710062026977539, -6.402080535888672, -5.094099044799805, -3.7861175537109375, -2.4781360626220703, -1.1701545715332031, 0.13782691955566406, 1.4458084106445312, 2.7537899017333984, 4.061771392822266, 5.369752883911133, 6.677734375, 7.985715866088867, 9.293697357177734, 10.601678848266602, 11.909660339355469, 13.217641830444336, 14.525623321533203, 15.83360481262207, 17.141586303710938, 18.449567794799805, 19.757549285888672, 21.06553077697754, 22.373512268066406, 23.681493759155273, 24.98947525024414, 26.297456741333008, 27.605438232421875, 28.913419723510742, 30.22140121459961, 31.529382705688477, 32.837364196777344, 34.145347595214844, 35.45332717895508, 36.76130676269531, 38.06929016113281, 39.37727355957031, 40.68525314331055, 41.99323272705078, 43.30121612548828]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 8.0, 1.0, 0.0, 3.0, 7.0, 8.0, 4.0, 10.0, 13.0, 15.0, 27.0, 29.0, 40.0, 51.0, 120.0, 157.0, 213.0, 394.0, 637.0, 1120.0, 2201.0, 4779.0, 12988.0, 48797.0, 469079.0, 3513989.0, 105337.0, 21384.0, 6831.0, 2856.0, 1331.0, 777.0, 402.0, 238.0, 157.0, 103.0, 64.0, 35.0, 30.0, 12.0, 9.0, 11.0, 5.0, 5.0, 3.0, 5.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.421875, -12.0362548828125, -11.650634765625, -11.2650146484375, -10.87939453125, -10.4937744140625, -10.108154296875, -9.7225341796875, -9.3369140625, -8.9512939453125, -8.565673828125, -8.1800537109375, -7.79443359375, -7.4088134765625, -7.023193359375, -6.6375732421875, -6.251953125, -5.8663330078125, -5.480712890625, -5.0950927734375, -4.70947265625, -4.3238525390625, -3.938232421875, -3.5526123046875, -3.1669921875, -2.7813720703125, -2.395751953125, -2.0101318359375, -1.62451171875, -1.2388916015625, -0.853271484375, -0.4676513671875, -0.08203125, 0.3035888671875, 0.689208984375, 1.0748291015625, 1.46044921875, 1.8460693359375, 2.231689453125, 2.6173095703125, 3.0029296875, 3.3885498046875, 3.774169921875, 4.1597900390625, 4.54541015625, 4.9310302734375, 5.316650390625, 5.7022705078125, 6.087890625, 6.4735107421875, 6.859130859375, 7.2447509765625, 7.63037109375, 8.0159912109375, 8.401611328125, 8.7872314453125, 9.1728515625, 9.5584716796875, 9.944091796875, 10.3297119140625, 10.71533203125, 11.1009521484375, 11.486572265625, 11.8721923828125, 12.2578125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 2.0, 3.0, 6.0, 7.0, 17.0, 16.0, 21.0, 25.0, 30.0, 36.0, 49.0, 52.0, 67.0, 73.0, 61.0, 89.0, 81.0, 59.0, 69.0, 46.0, 34.0, 40.0, 27.0, 25.0, 13.0, 18.0, 14.0, 9.0, 6.0, 3.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.99609375, -1.9411163330078125, -1.886138916015625, -1.8311614990234375, -1.77618408203125, -1.7212066650390625, -1.666229248046875, -1.6112518310546875, -1.5562744140625, -1.5012969970703125, -1.446319580078125, -1.3913421630859375, -1.33636474609375, -1.2813873291015625, -1.226409912109375, -1.1714324951171875, -1.116455078125, -1.0614776611328125, -1.006500244140625, -0.9515228271484375, -0.89654541015625, -0.8415679931640625, -0.786590576171875, -0.7316131591796875, -0.6766357421875, -0.6216583251953125, -0.566680908203125, -0.5117034912109375, -0.45672607421875, -0.4017486572265625, -0.346771240234375, -0.2917938232421875, -0.23681640625, -0.1818389892578125, -0.126861572265625, -0.0718841552734375, -0.01690673828125, 0.0380706787109375, 0.093048095703125, 0.1480255126953125, 0.2030029296875, 0.2579803466796875, 0.312957763671875, 0.3679351806640625, 0.42291259765625, 0.4778900146484375, 0.532867431640625, 0.5878448486328125, 0.642822265625, 0.6977996826171875, 0.752777099609375, 0.8077545166015625, 0.86273193359375, 0.9177093505859375, 0.972686767578125, 1.0276641845703125, 1.0826416015625, 1.1376190185546875, 1.192596435546875, 1.2475738525390625, 1.30255126953125, 1.3575286865234375, 1.412506103515625, 1.4674835205078125, 1.5224609375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 7.0, 6.0, 6.0, 3.0, 9.0, 5.0, 8.0, 7.0, 15.0, 21.0, 22.0, 24.0, 26.0, 38.0, 56.0, 76.0, 80.0, 139.0, 304.0, 568.0, 1288.0, 3806.0, 18718.0, 316491.0, 3765987.0, 73071.0, 8927.0, 2434.0, 970.0, 468.0, 240.0, 151.0, 84.0, 66.0, 31.0, 39.0, 24.0, 22.0, 15.0, 3.0, 8.0, 6.0, 4.0, 7.0, 2.0, 1.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.671875, -16.08251953125, -15.4931640625, -14.90380859375, -14.314453125, -13.72509765625, -13.1357421875, -12.54638671875, -11.95703125, -11.36767578125, -10.7783203125, -10.18896484375, -9.599609375, -9.01025390625, -8.4208984375, -7.83154296875, -7.2421875, -6.65283203125, -6.0634765625, -5.47412109375, -4.884765625, -4.29541015625, -3.7060546875, -3.11669921875, -2.52734375, -1.93798828125, -1.3486328125, -0.75927734375, -0.169921875, 0.41943359375, 1.0087890625, 1.59814453125, 2.1875, 2.77685546875, 3.3662109375, 3.95556640625, 4.544921875, 5.13427734375, 5.7236328125, 6.31298828125, 6.90234375, 7.49169921875, 8.0810546875, 8.67041015625, 9.259765625, 9.84912109375, 10.4384765625, 11.02783203125, 11.6171875, 12.20654296875, 12.7958984375, 13.38525390625, 13.974609375, 14.56396484375, 15.1533203125, 15.74267578125, 16.33203125, 16.92138671875, 17.5107421875, 18.10009765625, 18.689453125, 19.27880859375, 19.8681640625, 20.45751953125, 21.046875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 12.0, 19.0, 62.0, 155.0, 523.0, 2550.0, 510.0, 138.0, 49.0, 26.0, 14.0, 9.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.7265625, -7.52581787109375, -7.3250732421875, -7.12432861328125, -6.923583984375, -6.72283935546875, -6.5220947265625, -6.32135009765625, -6.12060546875, -5.91986083984375, -5.7191162109375, -5.51837158203125, -5.317626953125, -5.11688232421875, -4.9161376953125, -4.71539306640625, -4.5146484375, -4.31390380859375, -4.1131591796875, -3.91241455078125, -3.711669921875, -3.51092529296875, -3.3101806640625, -3.10943603515625, -2.90869140625, -2.70794677734375, -2.5072021484375, -2.30645751953125, -2.105712890625, -1.90496826171875, -1.7042236328125, -1.50347900390625, -1.302734375, -1.10198974609375, -0.9012451171875, -0.70050048828125, -0.499755859375, -0.29901123046875, -0.0982666015625, 0.10247802734375, 0.30322265625, 0.50396728515625, 0.7047119140625, 0.90545654296875, 1.106201171875, 1.30694580078125, 1.5076904296875, 1.70843505859375, 1.9091796875, 2.10992431640625, 2.3106689453125, 2.51141357421875, 2.712158203125, 2.91290283203125, 3.1136474609375, 3.31439208984375, 3.51513671875, 3.71588134765625, 3.9166259765625, 4.11737060546875, 4.318115234375, 4.51885986328125, 4.7196044921875, 4.92034912109375, 5.12109375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 2.0, 12.0, 25.0, 35.0, 71.0, 122.0, 192.0, 202.0, 162.0, 96.0, 53.0, 18.0, 5.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.397815704345703, -22.56698226928711, -21.73615074157715, -20.905317306518555, -20.074485778808594, -19.24365234375, -18.412818908691406, -17.581985473632812, -16.75115394592285, -15.920321464538574, -15.089488983154297, -14.258655548095703, -13.427823066711426, -12.596990585327148, -11.766157150268555, -10.935324668884277, -10.1044921875, -9.273659706115723, -8.442827224731445, -7.611993789672852, -6.781161308288574, -5.950328826904297, -5.119495868682861, -4.288662910461426, -3.4578304290771484, -2.626997709274292, -1.7961649894714355, -0.9653322696685791, -0.13449954986572266, 0.6963329315185547, 1.5271658897399902, 2.357998847961426, 3.188833236694336, 4.019665718078613, 4.850498676300049, 5.681331634521484, 6.512164115905762, 7.342996597290039, 8.173830032348633, 9.00466251373291, 9.835494995117188, 10.666327476501465, 11.497159957885742, 12.327993392944336, 13.158825874328613, 13.98965835571289, 14.820491790771484, 15.651324272155762, 16.48215675354004, 17.312990188598633, 18.143821716308594, 18.974655151367188, 19.80548858642578, 20.636320114135742, 21.467153549194336, 22.297985076904297, 23.12881851196289, 23.959651947021484, 24.790483474731445, 25.62131690979004, 26.4521484375, 27.282981872558594, 28.113815307617188, 28.94464874267578, 29.775480270385742]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 6.0, 6.0, 5.0, 4.0, 8.0, 10.0, 13.0, 12.0, 22.0, 28.0, 33.0, 49.0, 52.0, 50.0, 55.0, 54.0, 67.0, 75.0, 62.0, 57.0, 54.0, 55.0, 54.0, 24.0, 30.0, 26.0, 33.0, 16.0, 19.0, 8.0, 6.0, 7.0, 5.0, 6.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.823177337646484, -11.440985679626465, -11.058794021606445, -10.676602363586426, -10.294410705566406, -9.91221809387207, -9.53002643585205, -9.147834777832031, -8.765643119812012, -8.383451461791992, -8.001259803771973, -7.619067668914795, -7.236876010894775, -6.854684352874756, -6.472492218017578, -6.090300559997559, -5.708108901977539, -5.3259172439575195, -4.9437255859375, -4.561533451080322, -4.179341793060303, -3.797150135040283, -3.4149582386016846, -3.032766342163086, -2.6505746841430664, -2.268383026123047, -1.8861911296844482, -1.5039993524551392, -1.12180757522583, -0.739615797996521, -0.3574240207672119, 0.02476787567138672, 0.40696048736572266, 0.7891522645950317, 1.1713440418243408, 1.55353581905365, 1.935727596282959, 2.3179192543029785, 2.700111150741577, 3.082303047180176, 3.4644947052001953, 3.846686363220215, 4.228878021240234, 4.611070156097412, 4.993261814117432, 5.375453472137451, 5.757645606994629, 6.139837265014648, 6.522028923034668, 6.9042205810546875, 7.286412239074707, 7.668604373931885, 8.050796508789062, 8.432988166809082, 8.815179824829102, 9.197371482849121, 9.57956314086914, 9.96175479888916, 10.34394645690918, 10.7261381149292, 11.108329772949219, 11.490522384643555, 11.872714042663574, 12.254905700683594, 12.637097358703613]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 5.0, 5.0, 3.0, 7.0, 10.0, 20.0, 25.0, 32.0, 59.0, 69.0, 87.0, 129.0, 175.0, 298.0, 447.0, 661.0, 1133.0, 1803.0, 3160.0, 5441.0, 10106.0, 19318.0, 39859.0, 85461.0, 173332.0, 259963.0, 217737.0, 117903.0, 54952.0, 26080.0, 13160.0, 6979.0, 3963.0, 2355.0, 1337.0, 825.0, 541.0, 337.0, 242.0, 152.0, 96.0, 81.0, 45.0, 33.0, 34.0, 25.0, 17.0, 14.0, 8.0, 9.0, 14.0, 2.0, 4.0, 3.0, 1.0, 1.0, 5.0], "bins": [-4.83984375, -4.69189453125, -4.5439453125, -4.39599609375, -4.248046875, -4.10009765625, -3.9521484375, -3.80419921875, -3.65625, -3.50830078125, -3.3603515625, -3.21240234375, -3.064453125, -2.91650390625, -2.7685546875, -2.62060546875, -2.47265625, -2.32470703125, -2.1767578125, -2.02880859375, -1.880859375, -1.73291015625, -1.5849609375, -1.43701171875, -1.2890625, -1.14111328125, -0.9931640625, -0.84521484375, -0.697265625, -0.54931640625, -0.4013671875, -0.25341796875, -0.10546875, 0.04248046875, 0.1904296875, 0.33837890625, 0.486328125, 0.63427734375, 0.7822265625, 0.93017578125, 1.078125, 1.22607421875, 1.3740234375, 1.52197265625, 1.669921875, 1.81787109375, 1.9658203125, 2.11376953125, 2.26171875, 2.40966796875, 2.5576171875, 2.70556640625, 2.853515625, 3.00146484375, 3.1494140625, 3.29736328125, 3.4453125, 3.59326171875, 3.7412109375, 3.88916015625, 4.037109375, 4.18505859375, 4.3330078125, 4.48095703125, 4.62890625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 4.0, 1.0, 3.0, 7.0, 7.0, 5.0, 15.0, 18.0, 18.0, 28.0, 33.0, 46.0, 64.0, 42.0, 58.0, 56.0, 73.0, 71.0, 72.0, 72.0, 60.0, 56.0, 34.0, 37.0, 24.0, 27.0, 24.0, 15.0, 15.0, 10.0, 3.0, 1.0, 1.0, 7.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.861328125, -1.8084564208984375, -1.755584716796875, -1.7027130126953125, -1.64984130859375, -1.5969696044921875, -1.544097900390625, -1.4912261962890625, -1.4383544921875, -1.3854827880859375, -1.332611083984375, -1.2797393798828125, -1.22686767578125, -1.1739959716796875, -1.121124267578125, -1.0682525634765625, -1.015380859375, -0.9625091552734375, -0.909637451171875, -0.8567657470703125, -0.80389404296875, -0.7510223388671875, -0.698150634765625, -0.6452789306640625, -0.5924072265625, -0.5395355224609375, -0.486663818359375, -0.4337921142578125, -0.38092041015625, -0.3280487060546875, -0.275177001953125, -0.2223052978515625, -0.16943359375, -0.1165618896484375, -0.063690185546875, -0.0108184814453125, 0.04205322265625, 0.0949249267578125, 0.147796630859375, 0.2006683349609375, 0.2535400390625, 0.3064117431640625, 0.359283447265625, 0.4121551513671875, 0.46502685546875, 0.5178985595703125, 0.570770263671875, 0.6236419677734375, 0.676513671875, 0.7293853759765625, 0.782257080078125, 0.8351287841796875, 0.88800048828125, 0.9408721923828125, 0.993743896484375, 1.0466156005859375, 1.0994873046875, 1.1523590087890625, 1.205230712890625, 1.2581024169921875, 1.31097412109375, 1.3638458251953125, 1.416717529296875, 1.4695892333984375, 1.5224609375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 10.0, 6.0, 13.0, 26.0, 24.0, 40.0, 53.0, 95.0, 164.0, 212.0, 468.0, 783.0, 1443.0, 3182.0, 7363.0, 19574.0, 55449.0, 166590.0, 363975.0, 274831.0, 98971.0, 33161.0, 12220.0, 5100.0, 2224.0, 1125.0, 583.0, 331.0, 167.0, 131.0, 85.0, 37.0, 45.0, 24.0, 10.0, 14.0, 6.0, 5.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.78125, -5.572998046875, -5.36474609375, -5.156494140625, -4.9482421875, -4.739990234375, -4.53173828125, -4.323486328125, -4.115234375, -3.906982421875, -3.69873046875, -3.490478515625, -3.2822265625, -3.073974609375, -2.86572265625, -2.657470703125, -2.44921875, -2.240966796875, -2.03271484375, -1.824462890625, -1.6162109375, -1.407958984375, -1.19970703125, -0.991455078125, -0.783203125, -0.574951171875, -0.36669921875, -0.158447265625, 0.0498046875, 0.258056640625, 0.46630859375, 0.674560546875, 0.8828125, 1.091064453125, 1.29931640625, 1.507568359375, 1.7158203125, 1.924072265625, 2.13232421875, 2.340576171875, 2.548828125, 2.757080078125, 2.96533203125, 3.173583984375, 3.3818359375, 3.590087890625, 3.79833984375, 4.006591796875, 4.21484375, 4.423095703125, 4.63134765625, 4.839599609375, 5.0478515625, 5.256103515625, 5.46435546875, 5.672607421875, 5.880859375, 6.089111328125, 6.29736328125, 6.505615234375, 6.7138671875, 6.922119140625, 7.13037109375, 7.338623046875, 7.546875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 1.0, 3.0, 4.0, 7.0, 4.0, 7.0, 14.0, 14.0, 21.0, 22.0, 19.0, 33.0, 35.0, 43.0, 42.0, 35.0, 44.0, 45.0, 54.0, 50.0, 52.0, 63.0, 57.0, 66.0, 32.0, 24.0, 33.0, 36.0, 24.0, 23.0, 18.0, 18.0, 18.0, 12.0, 6.0, 4.0, 5.0, 7.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.05078125, -5.84576416015625, -5.6407470703125, -5.43572998046875, -5.230712890625, -5.02569580078125, -4.8206787109375, -4.61566162109375, -4.41064453125, -4.20562744140625, -4.0006103515625, -3.79559326171875, -3.590576171875, -3.38555908203125, -3.1805419921875, -2.97552490234375, -2.7705078125, -2.56549072265625, -2.3604736328125, -2.15545654296875, -1.950439453125, -1.74542236328125, -1.5404052734375, -1.33538818359375, -1.13037109375, -0.92535400390625, -0.7203369140625, -0.51531982421875, -0.310302734375, -0.10528564453125, 0.0997314453125, 0.30474853515625, 0.509765625, 0.71478271484375, 0.9197998046875, 1.12481689453125, 1.329833984375, 1.53485107421875, 1.7398681640625, 1.94488525390625, 2.14990234375, 2.35491943359375, 2.5599365234375, 2.76495361328125, 2.969970703125, 3.17498779296875, 3.3800048828125, 3.58502197265625, 3.7900390625, 3.99505615234375, 4.2000732421875, 4.40509033203125, 4.610107421875, 4.81512451171875, 5.0201416015625, 5.22515869140625, 5.43017578125, 5.63519287109375, 5.8402099609375, 6.04522705078125, 6.250244140625, 6.45526123046875, 6.6602783203125, 6.86529541015625, 7.0703125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 4.0, 8.0, 9.0, 14.0, 11.0, 20.0, 31.0, 31.0, 43.0, 68.0, 87.0, 145.0, 212.0, 260.0, 333.0, 568.0, 875.0, 1580.0, 3242.0, 8778.0, 39081.0, 280957.0, 573798.0, 109394.0, 17998.0, 5304.0, 2225.0, 1239.0, 686.0, 419.0, 293.0, 247.0, 161.0, 124.0, 80.0, 66.0, 43.0, 23.0, 28.0, 16.0, 12.0, 11.0, 8.0, 8.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.80859375, -4.64971923828125, -4.4908447265625, -4.33197021484375, -4.173095703125, -4.01422119140625, -3.8553466796875, -3.69647216796875, -3.53759765625, -3.37872314453125, -3.2198486328125, -3.06097412109375, -2.902099609375, -2.74322509765625, -2.5843505859375, -2.42547607421875, -2.2666015625, -2.10772705078125, -1.9488525390625, -1.78997802734375, -1.631103515625, -1.47222900390625, -1.3133544921875, -1.15447998046875, -0.99560546875, -0.83673095703125, -0.6778564453125, -0.51898193359375, -0.360107421875, -0.20123291015625, -0.0423583984375, 0.11651611328125, 0.275390625, 0.43426513671875, 0.5931396484375, 0.75201416015625, 0.910888671875, 1.06976318359375, 1.2286376953125, 1.38751220703125, 1.54638671875, 1.70526123046875, 1.8641357421875, 2.02301025390625, 2.181884765625, 2.34075927734375, 2.4996337890625, 2.65850830078125, 2.8173828125, 2.97625732421875, 3.1351318359375, 3.29400634765625, 3.452880859375, 3.61175537109375, 3.7706298828125, 3.92950439453125, 4.08837890625, 4.24725341796875, 4.4061279296875, 4.56500244140625, 4.723876953125, 4.88275146484375, 5.0416259765625, 5.20050048828125, 5.359375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 6.0, 3.0, 5.0, 2.0, 11.0, 10.0, 24.0, 22.0, 28.0, 61.0, 64.0, 86.0, 104.0, 100.0, 113.0, 112.0, 69.0, 58.0, 43.0, 26.0, 15.0, 7.0, 7.0, 8.0, 6.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0007376670837402344, -0.0007187053561210632, -0.0006997436285018921, -0.000680781900882721, -0.0006618201732635498, -0.0006428584456443787, -0.0006238967180252075, -0.0006049349904060364, -0.0005859732627868652, -0.0005670115351676941, -0.000548049807548523, -0.0005290880799293518, -0.0005101263523101807, -0.0004911646246910095, -0.0004722028970718384, -0.00045324116945266724, -0.0004342794418334961, -0.00041531771421432495, -0.0003963559865951538, -0.00037739425897598267, -0.0003584325313568115, -0.0003394708037376404, -0.00032050907611846924, -0.0003015473484992981, -0.00028258562088012695, -0.0002636238932609558, -0.00024466216564178467, -0.00022570043802261353, -0.00020673871040344238, -0.00018777698278427124, -0.0001688152551651001, -0.00014985352754592896, -0.0001308917999267578, -0.00011193007230758667, -9.296834468841553e-05, -7.400661706924438e-05, -5.504488945007324e-05, -3.60831618309021e-05, -1.7121434211730957e-05, 1.8402934074401855e-06, 2.0802021026611328e-05, 3.976374864578247e-05, 5.872547626495361e-05, 7.768720388412476e-05, 9.66489315032959e-05, 0.00011561065912246704, 0.00013457238674163818, 0.00015353411436080933, 0.00017249584197998047, 0.0001914575695991516, 0.00021041929721832275, 0.0002293810248374939, 0.00024834275245666504, 0.0002673044800758362, 0.0002862662076950073, 0.00030522793531417847, 0.0003241896629333496, 0.00034315139055252075, 0.0003621131181716919, 0.00038107484579086304, 0.0004000365734100342, 0.0004189983010292053, 0.00043796002864837646, 0.0004569217562675476, 0.00047588348388671875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 7.0, 4.0, 2.0, 6.0, 15.0, 19.0, 33.0, 23.0, 55.0, 88.0, 142.0, 185.0, 381.0, 658.0, 1218.0, 2290.0, 5374.0, 15299.0, 64912.0, 364213.0, 467650.0, 93598.0, 20120.0, 6447.0, 2687.0, 1342.0, 716.0, 407.0, 232.0, 144.0, 97.0, 64.0, 46.0, 27.0, 15.0, 9.0, 12.0, 11.0, 4.0, 4.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.75, -4.60205078125, -4.4541015625, -4.30615234375, -4.158203125, -4.01025390625, -3.8623046875, -3.71435546875, -3.56640625, -3.41845703125, -3.2705078125, -3.12255859375, -2.974609375, -2.82666015625, -2.6787109375, -2.53076171875, -2.3828125, -2.23486328125, -2.0869140625, -1.93896484375, -1.791015625, -1.64306640625, -1.4951171875, -1.34716796875, -1.19921875, -1.05126953125, -0.9033203125, -0.75537109375, -0.607421875, -0.45947265625, -0.3115234375, -0.16357421875, -0.015625, 0.13232421875, 0.2802734375, 0.42822265625, 0.576171875, 0.72412109375, 0.8720703125, 1.02001953125, 1.16796875, 1.31591796875, 1.4638671875, 1.61181640625, 1.759765625, 1.90771484375, 2.0556640625, 2.20361328125, 2.3515625, 2.49951171875, 2.6474609375, 2.79541015625, 2.943359375, 3.09130859375, 3.2392578125, 3.38720703125, 3.53515625, 3.68310546875, 3.8310546875, 3.97900390625, 4.126953125, 4.27490234375, 4.4228515625, 4.57080078125, 4.71875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 4.0, 3.0, 7.0, 6.0, 6.0, 12.0, 12.0, 34.0, 34.0, 69.0, 102.0, 157.0, 170.0, 126.0, 103.0, 64.0, 34.0, 23.0, 12.0, 9.0, 5.0, 4.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-6.48828125, -6.319091796875, -6.14990234375, -5.980712890625, -5.8115234375, -5.642333984375, -5.47314453125, -5.303955078125, -5.134765625, -4.965576171875, -4.79638671875, -4.627197265625, -4.4580078125, -4.288818359375, -4.11962890625, -3.950439453125, -3.78125, -3.612060546875, -3.44287109375, -3.273681640625, -3.1044921875, -2.935302734375, -2.76611328125, -2.596923828125, -2.427734375, -2.258544921875, -2.08935546875, -1.920166015625, -1.7509765625, -1.581787109375, -1.41259765625, -1.243408203125, -1.07421875, -0.905029296875, -0.73583984375, -0.566650390625, -0.3974609375, -0.228271484375, -0.05908203125, 0.110107421875, 0.279296875, 0.448486328125, 0.61767578125, 0.786865234375, 0.9560546875, 1.125244140625, 1.29443359375, 1.463623046875, 1.6328125, 1.802001953125, 1.97119140625, 2.140380859375, 2.3095703125, 2.478759765625, 2.64794921875, 2.817138671875, 2.986328125, 3.155517578125, 3.32470703125, 3.493896484375, 3.6630859375, 3.832275390625, 4.00146484375, 4.170654296875, 4.33984375]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 5.0, 2.0, 2.0, 4.0, 7.0, 18.0, 36.0, 35.0, 77.0, 121.0, 155.0, 175.0, 131.0, 122.0, 54.0, 26.0, 16.0, 12.0, 5.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-79.0996322631836, -77.0844497680664, -75.06926727294922, -73.05408477783203, -71.03890228271484, -69.02371978759766, -67.00853729248047, -64.99336242675781, -62.97817611694336, -60.96299362182617, -58.947811126708984, -56.9326286315918, -54.917449951171875, -52.90226745605469, -50.8870849609375, -48.87190246582031, -46.856719970703125, -44.84153747558594, -42.82635498046875, -40.81117248535156, -38.795989990234375, -36.78080749511719, -34.765628814697266, -32.75044631958008, -30.73526382446289, -28.720081329345703, -26.704898834228516, -24.68971824645996, -22.674535751342773, -20.659353256225586, -18.64417266845703, -16.628990173339844, -14.613815307617188, -12.5986328125, -10.583451271057129, -8.568269729614258, -6.55308723449707, -4.537904739379883, -2.5227231979370117, -0.5075416564941406, 1.5076408386230469, 3.522822856903076, 5.5380048751831055, 7.553186893463135, 9.568368911743164, 11.583551406860352, 13.598732948303223, 15.613914489746094, 17.62909698486328, 19.64427947998047, 21.659461975097656, 23.67464256286621, 25.6898250579834, 27.705007553100586, 29.72018814086914, 31.735370635986328, 33.750553131103516, 35.7657356262207, 37.78091812133789, 39.79610061645508, 41.811279296875, 43.82646179199219, 45.841644287109375, 47.85682678222656, 49.87200927734375]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 6.0, 5.0, 10.0, 16.0, 15.0, 14.0, 16.0, 25.0, 26.0, 27.0, 35.0, 37.0, 40.0, 49.0, 37.0, 48.0, 46.0, 65.0, 35.0, 49.0, 56.0, 65.0, 44.0, 34.0, 33.0, 31.0, 23.0, 26.0, 14.0, 15.0, 13.0, 12.0, 9.0, 5.0, 3.0, 6.0, 3.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.208011627197266, -31.07988739013672, -29.951763153076172, -28.823637008666992, -27.695512771606445, -26.5673885345459, -25.43926239013672, -24.311138153076172, -23.183013916015625, -22.054889678955078, -20.92676544189453, -19.79863929748535, -18.670515060424805, -17.542390823364258, -16.414264678955078, -15.286140441894531, -14.158016204833984, -13.029891967773438, -11.901766777038574, -10.773641586303711, -9.645517349243164, -8.517393112182617, -7.389267921447754, -6.261143207550049, -5.133018493652344, -4.004893779754639, -2.8767690658569336, -1.7486443519592285, -0.6205196380615234, 0.5076050758361816, 1.6357297897338867, 2.763854503631592, 3.8919830322265625, 5.020107746124268, 6.148232460021973, 7.276357173919678, 8.404481887817383, 9.53260612487793, 10.660731315612793, 11.788856506347656, 12.916980743408203, 14.04510498046875, 15.173230171203613, 16.301355361938477, 17.429479598999023, 18.55760383605957, 19.68572998046875, 20.813854217529297, 21.941978454589844, 23.07010269165039, 24.198226928710938, 25.326353073120117, 26.454477310180664, 27.58260154724121, 28.71072769165039, 29.838851928710938, 30.966976165771484, 32.09510040283203, 33.22322463989258, 34.351348876953125, 35.47947692871094, 36.607601165771484, 37.73572540283203, 38.86384963989258, 39.991973876953125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 4.0, 1.0, 4.0, 6.0, 4.0, 7.0, 5.0, 3.0, 10.0, 10.0, 22.0, 31.0, 50.0, 56.0, 96.0, 104.0, 177.0, 290.0, 506.0, 803.0, 1356.0, 2573.0, 5312.0, 13283.0, 41253.0, 208564.0, 3474906.0, 359398.0, 56366.0, 16606.0, 6248.0, 2802.0, 1430.0, 798.0, 457.0, 274.0, 143.0, 108.0, 80.0, 60.0, 25.0, 20.0, 11.0, 8.0, 7.0, 5.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-12.2265625, -11.9014892578125, -11.576416015625, -11.2513427734375, -10.92626953125, -10.6011962890625, -10.276123046875, -9.9510498046875, -9.6259765625, -9.3009033203125, -8.975830078125, -8.6507568359375, -8.32568359375, -8.0006103515625, -7.675537109375, -7.3504638671875, -7.025390625, -6.7003173828125, -6.375244140625, -6.0501708984375, -5.72509765625, -5.4000244140625, -5.074951171875, -4.7498779296875, -4.4248046875, -4.0997314453125, -3.774658203125, -3.4495849609375, -3.12451171875, -2.7994384765625, -2.474365234375, -2.1492919921875, -1.82421875, -1.4991455078125, -1.174072265625, -0.8489990234375, -0.52392578125, -0.1988525390625, 0.126220703125, 0.4512939453125, 0.7763671875, 1.1014404296875, 1.426513671875, 1.7515869140625, 2.07666015625, 2.4017333984375, 2.726806640625, 3.0518798828125, 3.376953125, 3.7020263671875, 4.027099609375, 4.3521728515625, 4.67724609375, 5.0023193359375, 5.327392578125, 5.6524658203125, 5.9775390625, 6.3026123046875, 6.627685546875, 6.9527587890625, 7.27783203125, 7.6029052734375, 7.927978515625, 8.2530517578125, 8.578125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 3.0, 3.0, 3.0, 9.0, 13.0, 15.0, 18.0, 25.0, 29.0, 30.0, 43.0, 53.0, 65.0, 57.0, 64.0, 77.0, 78.0, 74.0, 56.0, 51.0, 58.0, 39.0, 24.0, 25.0, 22.0, 24.0, 10.0, 10.0, 9.0, 7.0, 4.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-2.138671875, -2.0849609375, -2.03125, -1.9775390625, -1.923828125, -1.8701171875, -1.81640625, -1.7626953125, -1.708984375, -1.6552734375, -1.6015625, -1.5478515625, -1.494140625, -1.4404296875, -1.38671875, -1.3330078125, -1.279296875, -1.2255859375, -1.171875, -1.1181640625, -1.064453125, -1.0107421875, -0.95703125, -0.9033203125, -0.849609375, -0.7958984375, -0.7421875, -0.6884765625, -0.634765625, -0.5810546875, -0.52734375, -0.4736328125, -0.419921875, -0.3662109375, -0.3125, -0.2587890625, -0.205078125, -0.1513671875, -0.09765625, -0.0439453125, 0.009765625, 0.0634765625, 0.1171875, 0.1708984375, 0.224609375, 0.2783203125, 0.33203125, 0.3857421875, 0.439453125, 0.4931640625, 0.546875, 0.6005859375, 0.654296875, 0.7080078125, 0.76171875, 0.8154296875, 0.869140625, 0.9228515625, 0.9765625, 1.0302734375, 1.083984375, 1.1376953125, 1.19140625, 1.2451171875, 1.298828125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 6.0, 10.0, 13.0, 14.0, 23.0, 22.0, 37.0, 56.0, 99.0, 167.0, 377.0, 858.0, 2298.0, 7555.0, 41425.0, 1158725.0, 2910726.0, 58424.0, 9206.0, 2609.0, 883.0, 358.0, 148.0, 92.0, 54.0, 25.0, 27.0, 12.0, 9.0, 11.0, 7.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.921875, -16.41015625, -15.8984375, -15.38671875, -14.875, -14.36328125, -13.8515625, -13.33984375, -12.828125, -12.31640625, -11.8046875, -11.29296875, -10.78125, -10.26953125, -9.7578125, -9.24609375, -8.734375, -8.22265625, -7.7109375, -7.19921875, -6.6875, -6.17578125, -5.6640625, -5.15234375, -4.640625, -4.12890625, -3.6171875, -3.10546875, -2.59375, -2.08203125, -1.5703125, -1.05859375, -0.546875, -0.03515625, 0.4765625, 0.98828125, 1.5, 2.01171875, 2.5234375, 3.03515625, 3.546875, 4.05859375, 4.5703125, 5.08203125, 5.59375, 6.10546875, 6.6171875, 7.12890625, 7.640625, 8.15234375, 8.6640625, 9.17578125, 9.6875, 10.19921875, 10.7109375, 11.22265625, 11.734375, 12.24609375, 12.7578125, 13.26953125, 13.78125, 14.29296875, 14.8046875, 15.31640625, 15.828125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 5.0, 6.0, 6.0, 13.0, 28.0, 43.0, 52.0, 81.0, 169.0, 297.0, 715.0, 1430.0, 575.0, 269.0, 143.0, 64.0, 56.0, 28.0, 27.0, 22.0, 13.0, 8.0, 7.0, 7.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.7734375, -4.64910888671875, -4.5247802734375, -4.40045166015625, -4.276123046875, -4.15179443359375, -4.0274658203125, -3.90313720703125, -3.77880859375, -3.65447998046875, -3.5301513671875, -3.40582275390625, -3.281494140625, -3.15716552734375, -3.0328369140625, -2.90850830078125, -2.7841796875, -2.65985107421875, -2.5355224609375, -2.41119384765625, -2.286865234375, -2.16253662109375, -2.0382080078125, -1.91387939453125, -1.78955078125, -1.66522216796875, -1.5408935546875, -1.41656494140625, -1.292236328125, -1.16790771484375, -1.0435791015625, -0.91925048828125, -0.794921875, -0.67059326171875, -0.5462646484375, -0.42193603515625, -0.297607421875, -0.17327880859375, -0.0489501953125, 0.07537841796875, 0.19970703125, 0.32403564453125, 0.4483642578125, 0.57269287109375, 0.697021484375, 0.82135009765625, 0.9456787109375, 1.07000732421875, 1.1943359375, 1.31866455078125, 1.4429931640625, 1.56732177734375, 1.691650390625, 1.81597900390625, 1.9403076171875, 2.06463623046875, 2.18896484375, 2.31329345703125, 2.4376220703125, 2.56195068359375, 2.686279296875, 2.81060791015625, 2.9349365234375, 3.05926513671875, 3.18359375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 12.0, 11.0, 19.0, 35.0, 59.0, 62.0, 76.0, 130.0, 123.0, 116.0, 105.0, 82.0, 63.0, 41.0, 17.0, 16.0, 9.0, 9.0, 1.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.54871940612793, -26.7474422454834, -25.946165084838867, -25.144886016845703, -24.343608856201172, -23.54233169555664, -22.74105453491211, -21.939777374267578, -21.138500213623047, -20.337223052978516, -19.535945892333984, -18.734668731689453, -17.93338966369629, -17.132112503051758, -16.330835342407227, -15.529558181762695, -14.728279113769531, -13.927001953125, -13.125723838806152, -12.324446678161621, -11.523168563842773, -10.721891403198242, -9.920614242553711, -9.11933708190918, -8.318058967590332, -7.516781330108643, -6.715503692626953, -5.914226531982422, -5.112948894500732, -4.311671257019043, -3.5103940963745117, -2.7091164588928223, -1.9078388214111328, -1.106561303138733, -0.305283784866333, 0.49599361419677734, 1.2972712516784668, 2.0985488891601562, 2.8998260498046875, 3.701103687286377, 4.502381324768066, 5.303658962249756, 6.104936599731445, 6.906213760375977, 7.707491397857666, 8.508769035339355, 9.310046195983887, 10.111324310302734, 10.912601470947266, 11.713878631591797, 12.515156745910645, 13.316433906555176, 14.117712020874023, 14.918989181518555, 15.720266342163086, 16.521543502807617, 17.32282257080078, 18.124099731445312, 18.925376892089844, 19.726654052734375, 20.52793312072754, 21.32921028137207, 22.1304874420166, 22.931764602661133, 23.733041763305664]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 4.0, 6.0, 7.0, 10.0, 13.0, 15.0, 23.0, 29.0, 27.0, 36.0, 36.0, 56.0, 49.0, 52.0, 55.0, 73.0, 49.0, 67.0, 51.0, 53.0, 57.0, 53.0, 34.0, 37.0, 31.0, 24.0, 18.0, 11.0, 7.0, 7.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-17.782346725463867, -17.284421920776367, -16.7864990234375, -16.28857421875, -15.7906494140625, -15.292725563049316, -14.794801712036133, -14.296876907348633, -13.79895305633545, -13.301029205322266, -12.803104400634766, -12.305180549621582, -11.807255744934082, -11.309331893920898, -10.811407089233398, -10.313483238220215, -9.815559387207031, -9.317635536193848, -8.819710731506348, -8.321786880493164, -7.823862552642822, -7.3259382247924805, -6.828013896942139, -6.330089569091797, -5.832164764404297, -5.334240436553955, -4.836316108703613, -4.33839225769043, -3.840467929840088, -3.342543601989746, -2.8446192741394043, -2.3466951847076416, -1.848771095275879, -1.3508468866348267, -0.8529226183891296, -0.3549983501434326, 0.14292585849761963, 0.6408500671386719, 1.1387743949890137, 1.6366984844207764, 2.134622812271118, 2.63254714012146, 3.1304712295532227, 3.6283955574035645, 4.126319885253906, 4.62424373626709, 5.12216854095459, 5.620092391967773, 6.118016719818115, 6.615941047668457, 7.113865375518799, 7.611789703369141, 8.109713554382324, 8.607637405395508, 9.105562210083008, 9.603486061096191, 10.101410865783691, 10.599334716796875, 11.097259521484375, 11.595183372497559, 12.093108177185059, 12.591032028198242, 13.088956832885742, 13.586880683898926, 14.08480453491211]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 6.0, 6.0, 8.0, 10.0, 22.0, 17.0, 45.0, 59.0, 97.0, 150.0, 212.0, 384.0, 709.0, 1278.0, 2642.0, 6922.0, 20253.0, 73088.0, 298000.0, 456866.0, 135066.0, 34147.0, 10744.0, 3994.0, 1779.0, 831.0, 470.0, 277.0, 157.0, 103.0, 81.0, 36.0, 37.0, 22.0, 11.0, 8.0, 9.0, 1.0, 5.0, 5.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.7890625, -10.4642333984375, -10.139404296875, -9.8145751953125, -9.48974609375, -9.1649169921875, -8.840087890625, -8.5152587890625, -8.1904296875, -7.8656005859375, -7.540771484375, -7.2159423828125, -6.89111328125, -6.5662841796875, -6.241455078125, -5.9166259765625, -5.591796875, -5.2669677734375, -4.942138671875, -4.6173095703125, -4.29248046875, -3.9676513671875, -3.642822265625, -3.3179931640625, -2.9931640625, -2.6683349609375, -2.343505859375, -2.0186767578125, -1.69384765625, -1.3690185546875, -1.044189453125, -0.7193603515625, -0.39453125, -0.0697021484375, 0.255126953125, 0.5799560546875, 0.90478515625, 1.2296142578125, 1.554443359375, 1.8792724609375, 2.2041015625, 2.5289306640625, 2.853759765625, 3.1785888671875, 3.50341796875, 3.8282470703125, 4.153076171875, 4.4779052734375, 4.802734375, 5.1275634765625, 5.452392578125, 5.7772216796875, 6.10205078125, 6.4268798828125, 6.751708984375, 7.0765380859375, 7.4013671875, 7.7261962890625, 8.051025390625, 8.3758544921875, 8.70068359375, 9.0255126953125, 9.350341796875, 9.6751708984375, 10.0]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 5.0, 2.0, 4.0, 5.0, 14.0, 22.0, 14.0, 27.0, 34.0, 37.0, 45.0, 60.0, 73.0, 83.0, 78.0, 97.0, 75.0, 72.0, 56.0, 52.0, 34.0, 33.0, 29.0, 14.0, 17.0, 6.0, 9.0, 4.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.177734375, -2.1169891357421875, -2.056243896484375, -1.9954986572265625, -1.93475341796875, -1.8740081787109375, -1.813262939453125, -1.7525177001953125, -1.6917724609375, -1.6310272216796875, -1.570281982421875, -1.5095367431640625, -1.44879150390625, -1.3880462646484375, -1.327301025390625, -1.2665557861328125, -1.205810546875, -1.1450653076171875, -1.084320068359375, -1.0235748291015625, -0.96282958984375, -0.9020843505859375, -0.841339111328125, -0.7805938720703125, -0.7198486328125, -0.6591033935546875, -0.598358154296875, -0.5376129150390625, -0.47686767578125, -0.4161224365234375, -0.355377197265625, -0.2946319580078125, -0.23388671875, -0.1731414794921875, -0.112396240234375, -0.0516510009765625, 0.00909423828125, 0.0698394775390625, 0.130584716796875, 0.1913299560546875, 0.2520751953125, 0.3128204345703125, 0.373565673828125, 0.4343109130859375, 0.49505615234375, 0.5558013916015625, 0.616546630859375, 0.6772918701171875, 0.738037109375, 0.7987823486328125, 0.859527587890625, 0.9202728271484375, 0.98101806640625, 1.0417633056640625, 1.102508544921875, 1.1632537841796875, 1.2239990234375, 1.2847442626953125, 1.345489501953125, 1.4062347412109375, 1.46697998046875, 1.5277252197265625, 1.588470458984375, 1.6492156982421875, 1.7099609375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 5.0, 3.0, 9.0, 4.0, 13.0, 24.0, 23.0, 45.0, 63.0, 81.0, 152.0, 261.0, 477.0, 864.0, 1652.0, 3514.0, 7370.0, 15957.0, 37534.0, 96157.0, 236723.0, 337700.0, 184607.0, 72217.0, 28951.0, 12646.0, 5734.0, 2693.0, 1321.0, 759.0, 425.0, 222.0, 116.0, 90.0, 46.0, 29.0, 17.0, 15.0, 9.0, 10.0, 5.0, 5.0, 3.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.74609375, -4.57257080078125, -4.3990478515625, -4.22552490234375, -4.052001953125, -3.87847900390625, -3.7049560546875, -3.53143310546875, -3.35791015625, -3.18438720703125, -3.0108642578125, -2.83734130859375, -2.663818359375, -2.49029541015625, -2.3167724609375, -2.14324951171875, -1.9697265625, -1.79620361328125, -1.6226806640625, -1.44915771484375, -1.275634765625, -1.10211181640625, -0.9285888671875, -0.75506591796875, -0.58154296875, -0.40802001953125, -0.2344970703125, -0.06097412109375, 0.112548828125, 0.28607177734375, 0.4595947265625, 0.63311767578125, 0.806640625, 0.98016357421875, 1.1536865234375, 1.32720947265625, 1.500732421875, 1.67425537109375, 1.8477783203125, 2.02130126953125, 2.19482421875, 2.36834716796875, 2.5418701171875, 2.71539306640625, 2.888916015625, 3.06243896484375, 3.2359619140625, 3.40948486328125, 3.5830078125, 3.75653076171875, 3.9300537109375, 4.10357666015625, 4.277099609375, 4.45062255859375, 4.6241455078125, 4.79766845703125, 4.97119140625, 5.14471435546875, 5.3182373046875, 5.49176025390625, 5.665283203125, 5.83880615234375, 6.0123291015625, 6.18585205078125, 6.359375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 5.0, 6.0, 6.0, 9.0, 8.0, 8.0, 8.0, 19.0, 18.0, 17.0, 20.0, 26.0, 24.0, 30.0, 42.0, 36.0, 52.0, 46.0, 43.0, 35.0, 47.0, 40.0, 55.0, 45.0, 39.0, 26.0, 54.0, 31.0, 31.0, 28.0, 18.0, 30.0, 22.0, 11.0, 14.0, 13.0, 11.0, 9.0, 5.0, 5.0, 6.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.20703125, -6.03607177734375, -5.8651123046875, -5.69415283203125, -5.523193359375, -5.35223388671875, -5.1812744140625, -5.01031494140625, -4.83935546875, -4.66839599609375, -4.4974365234375, -4.32647705078125, -4.155517578125, -3.98455810546875, -3.8135986328125, -3.64263916015625, -3.4716796875, -3.30072021484375, -3.1297607421875, -2.95880126953125, -2.787841796875, -2.61688232421875, -2.4459228515625, -2.27496337890625, -2.10400390625, -1.93304443359375, -1.7620849609375, -1.59112548828125, -1.420166015625, -1.24920654296875, -1.0782470703125, -0.90728759765625, -0.736328125, -0.56536865234375, -0.3944091796875, -0.22344970703125, -0.052490234375, 0.11846923828125, 0.2894287109375, 0.46038818359375, 0.63134765625, 0.80230712890625, 0.9732666015625, 1.14422607421875, 1.315185546875, 1.48614501953125, 1.6571044921875, 1.82806396484375, 1.9990234375, 2.16998291015625, 2.3409423828125, 2.51190185546875, 2.682861328125, 2.85382080078125, 3.0247802734375, 3.19573974609375, 3.36669921875, 3.53765869140625, 3.7086181640625, 3.87957763671875, 4.050537109375, 4.22149658203125, 4.3924560546875, 4.56341552734375, 4.734375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 6.0, 16.0, 12.0, 17.0, 34.0, 41.0, 83.0, 120.0, 267.0, 553.0, 1127.0, 2921.0, 8230.0, 26459.0, 101527.0, 346812.0, 389186.0, 123286.0, 32340.0, 9581.0, 3307.0, 1315.0, 586.0, 325.0, 161.0, 85.0, 64.0, 33.0, 18.0, 13.0, 15.0, 4.0, 3.0, 1.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.6328125, -3.5321044921875, -3.431396484375, -3.3306884765625, -3.22998046875, -3.1292724609375, -3.028564453125, -2.9278564453125, -2.8271484375, -2.7264404296875, -2.625732421875, -2.5250244140625, -2.42431640625, -2.3236083984375, -2.222900390625, -2.1221923828125, -2.021484375, -1.9207763671875, -1.820068359375, -1.7193603515625, -1.61865234375, -1.5179443359375, -1.417236328125, -1.3165283203125, -1.2158203125, -1.1151123046875, -1.014404296875, -0.9136962890625, -0.81298828125, -0.7122802734375, -0.611572265625, -0.5108642578125, -0.41015625, -0.3094482421875, -0.208740234375, -0.1080322265625, -0.00732421875, 0.0933837890625, 0.194091796875, 0.2947998046875, 0.3955078125, 0.4962158203125, 0.596923828125, 0.6976318359375, 0.79833984375, 0.8990478515625, 0.999755859375, 1.1004638671875, 1.201171875, 1.3018798828125, 1.402587890625, 1.5032958984375, 1.60400390625, 1.7047119140625, 1.805419921875, 1.9061279296875, 2.0068359375, 2.1075439453125, 2.208251953125, 2.3089599609375, 2.40966796875, 2.5103759765625, 2.611083984375, 2.7117919921875, 2.8125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 5.0, 8.0, 19.0, 19.0, 27.0, 37.0, 54.0, 75.0, 95.0, 107.0, 127.0, 104.0, 94.0, 69.0, 47.0, 37.0, 24.0, 20.0, 13.0, 3.0, 4.0, 5.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003800392150878906, -0.00036448240280151367, -0.0003489255905151367, -0.00033336877822875977, -0.0003178119659423828, -0.00030225515365600586, -0.0002866983413696289, -0.00027114152908325195, -0.000255584716796875, -0.00024002790451049805, -0.0002244710922241211, -0.00020891427993774414, -0.0001933574676513672, -0.00017780065536499023, -0.00016224384307861328, -0.00014668703079223633, -0.00013113021850585938, -0.00011557340621948242, -0.00010001659393310547, -8.445978164672852e-05, -6.890296936035156e-05, -5.334615707397461e-05, -3.7789344787597656e-05, -2.2232532501220703e-05, -6.67572021484375e-06, 8.881092071533203e-06, 2.4437904357910156e-05, 3.999471664428711e-05, 5.555152893066406e-05, 7.110834121704102e-05, 8.666515350341797e-05, 0.00010222196578979492, 0.00011777877807617188, 0.00013333559036254883, 0.00014889240264892578, 0.00016444921493530273, 0.0001800060272216797, 0.00019556283950805664, 0.0002111196517944336, 0.00022667646408081055, 0.0002422332763671875, 0.00025779008865356445, 0.0002733469009399414, 0.00028890371322631836, 0.0003044605255126953, 0.00032001733779907227, 0.0003355741500854492, 0.00035113096237182617, 0.0003666877746582031, 0.0003822445869445801, 0.00039780139923095703, 0.000413358211517334, 0.00042891502380371094, 0.0004444718360900879, 0.00046002864837646484, 0.0004755854606628418, 0.0004911422729492188, 0.0005066990852355957, 0.0005222558975219727, 0.0005378127098083496, 0.0005533695220947266, 0.0005689263343811035, 0.0005844831466674805, 0.0006000399589538574, 0.0006155967712402344]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 8.0, 6.0, 7.0, 15.0, 16.0, 21.0, 24.0, 33.0, 64.0, 97.0, 153.0, 275.0, 415.0, 801.0, 1522.0, 3049.0, 6768.0, 16977.0, 46761.0, 152095.0, 400812.0, 282232.0, 87465.0, 28590.0, 10751.0, 4684.0, 2310.0, 1147.0, 576.0, 323.0, 206.0, 121.0, 85.0, 52.0, 35.0, 21.0, 11.0, 9.0, 9.0, 7.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.41015625, -3.3148193359375, -3.219482421875, -3.1241455078125, -3.02880859375, -2.9334716796875, -2.838134765625, -2.7427978515625, -2.6474609375, -2.5521240234375, -2.456787109375, -2.3614501953125, -2.26611328125, -2.1707763671875, -2.075439453125, -1.9801025390625, -1.884765625, -1.7894287109375, -1.694091796875, -1.5987548828125, -1.50341796875, -1.4080810546875, -1.312744140625, -1.2174072265625, -1.1220703125, -1.0267333984375, -0.931396484375, -0.8360595703125, -0.74072265625, -0.6453857421875, -0.550048828125, -0.4547119140625, -0.359375, -0.2640380859375, -0.168701171875, -0.0733642578125, 0.02197265625, 0.1173095703125, 0.212646484375, 0.3079833984375, 0.4033203125, 0.4986572265625, 0.593994140625, 0.6893310546875, 0.78466796875, 0.8800048828125, 0.975341796875, 1.0706787109375, 1.166015625, 1.2613525390625, 1.356689453125, 1.4520263671875, 1.54736328125, 1.6427001953125, 1.738037109375, 1.8333740234375, 1.9287109375, 2.0240478515625, 2.119384765625, 2.2147216796875, 2.31005859375, 2.4053955078125, 2.500732421875, 2.5960693359375, 2.69140625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 6.0, 4.0, 2.0, 12.0, 13.0, 23.0, 23.0, 38.0, 49.0, 55.0, 88.0, 85.0, 95.0, 101.0, 104.0, 88.0, 56.0, 45.0, 28.0, 22.0, 18.0, 13.0, 7.0, 6.0, 5.0, 6.0, 5.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.001953125, -2.902435302734375, -2.80291748046875, -2.703399658203125, -2.6038818359375, -2.504364013671875, -2.40484619140625, -2.305328369140625, -2.205810546875, -2.106292724609375, -2.00677490234375, -1.907257080078125, -1.8077392578125, -1.708221435546875, -1.60870361328125, -1.509185791015625, -1.40966796875, -1.310150146484375, -1.21063232421875, -1.111114501953125, -1.0115966796875, -0.912078857421875, -0.81256103515625, -0.713043212890625, -0.613525390625, -0.514007568359375, -0.41448974609375, -0.314971923828125, -0.2154541015625, -0.115936279296875, -0.01641845703125, 0.083099365234375, 0.1826171875, 0.282135009765625, 0.38165283203125, 0.481170654296875, 0.5806884765625, 0.680206298828125, 0.77972412109375, 0.879241943359375, 0.978759765625, 1.078277587890625, 1.17779541015625, 1.277313232421875, 1.3768310546875, 1.476348876953125, 1.57586669921875, 1.675384521484375, 1.77490234375, 1.874420166015625, 1.97393798828125, 2.073455810546875, 2.1729736328125, 2.272491455078125, 2.37200927734375, 2.471527099609375, 2.571044921875, 2.670562744140625, 2.77008056640625, 2.869598388671875, 2.9691162109375, 3.068634033203125, 3.16815185546875, 3.267669677734375, 3.3671875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 11.0, 5.0, 8.0, 7.0, 13.0, 24.0, 36.0, 48.0, 86.0, 120.0, 140.0, 134.0, 106.0, 93.0, 70.0, 41.0, 19.0, 17.0, 10.0, 8.0, 6.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.18482208251953, -34.691253662109375, -33.19768142700195, -31.704113006591797, -30.21054458618164, -28.71697425842285, -27.223403930664062, -25.729835510253906, -24.23626708984375, -22.74269676208496, -21.249128341674805, -19.755558013916016, -18.26198959350586, -16.76841926574707, -15.274849891662598, -13.781280517578125, -12.287710189819336, -10.794140815734863, -9.30057144165039, -7.80700159072876, -6.313432216644287, -4.8198628425598145, -3.3262929916381836, -1.832723617553711, -0.3391542434692383, 1.154415249824524, 2.647984743118286, 4.141554355621338, 5.6351237297058105, 7.128693103790283, 8.622262954711914, 10.115832328796387, 11.60940170288086, 13.102971076965332, 14.596540451049805, 16.090110778808594, 17.58367919921875, 19.07724952697754, 20.570819854736328, 22.064388275146484, 23.55795669555664, 25.05152702331543, 26.545095443725586, 28.038665771484375, 29.53223419189453, 31.02580451965332, 32.51937484741211, 34.012943267822266, 35.50651550292969, 37.000083923339844, 38.493656158447266, 39.98722457885742, 41.48079299926758, 42.974361419677734, 44.467933654785156, 45.96150207519531, 47.45507049560547, 48.948638916015625, 50.44221115112305, 51.9357795715332, 53.42934799194336, 54.922916412353516, 56.41648864746094, 57.910057067871094, 59.40362548828125]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0, 5.0, 6.0, 9.0, 9.0, 11.0, 16.0, 13.0, 18.0, 20.0, 30.0, 37.0, 38.0, 42.0, 40.0, 43.0, 47.0, 50.0, 53.0, 60.0, 64.0, 47.0, 46.0, 46.0, 34.0, 41.0, 31.0, 36.0, 23.0, 19.0, 20.0, 11.0, 9.0, 9.0, 4.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.04861068725586, -30.934507369995117, -29.820402145385742, -28.706298828125, -27.592193603515625, -26.478090286254883, -25.36398696899414, -24.249881744384766, -23.135778427124023, -22.02167510986328, -20.907569885253906, -19.793466567993164, -18.679363250732422, -17.565258026123047, -16.451154708862305, -15.337050437927246, -14.222946166992188, -13.108841896057129, -11.99473762512207, -10.880634307861328, -9.76653003692627, -8.652425765991211, -7.5383219718933105, -6.42421817779541, -5.310113906860352, -4.196009635925293, -3.0819058418273926, -1.967801809310913, -0.8536977767944336, 0.260406494140625, 1.3745102882385254, 2.488614082336426, 3.60272216796875, 4.716826438903809, 5.830930233001709, 6.945034027099609, 8.059138298034668, 9.173242568969727, 10.287345886230469, 11.401450157165527, 12.515554428100586, 13.629658699035645, 14.743762969970703, 15.857866287231445, 16.971969604492188, 18.086074829101562, 19.200178146362305, 20.314281463623047, 21.428386688232422, 22.542490005493164, 23.65659523010254, 24.77069854736328, 25.884803771972656, 26.9989070892334, 28.11301040649414, 29.227115631103516, 30.341218948364258, 31.455322265625, 32.569427490234375, 33.68353271484375, 34.79763412475586, 35.911739349365234, 37.02584457397461, 38.13994598388672, 39.254051208496094]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 8.0, 7.0, 8.0, 13.0, 12.0, 19.0, 43.0, 50.0, 64.0, 118.0, 209.0, 339.0, 653.0, 1179.0, 2893.0, 9518.0, 52903.0, 3615858.0, 469979.0, 30128.0, 6405.0, 2005.0, 871.0, 430.0, 263.0, 116.0, 73.0, 55.0, 25.0, 13.0, 10.0, 10.0, 4.0, 5.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.40625, -14.9642333984375, -14.522216796875, -14.0802001953125, -13.63818359375, -13.1961669921875, -12.754150390625, -12.3121337890625, -11.8701171875, -11.4281005859375, -10.986083984375, -10.5440673828125, -10.10205078125, -9.6600341796875, -9.218017578125, -8.7760009765625, -8.333984375, -7.8919677734375, -7.449951171875, -7.0079345703125, -6.56591796875, -6.1239013671875, -5.681884765625, -5.2398681640625, -4.7978515625, -4.3558349609375, -3.913818359375, -3.4718017578125, -3.02978515625, -2.5877685546875, -2.145751953125, -1.7037353515625, -1.26171875, -0.8197021484375, -0.377685546875, 0.0643310546875, 0.50634765625, 0.9483642578125, 1.390380859375, 1.8323974609375, 2.2744140625, 2.7164306640625, 3.158447265625, 3.6004638671875, 4.04248046875, 4.4844970703125, 4.926513671875, 5.3685302734375, 5.810546875, 6.2525634765625, 6.694580078125, 7.1365966796875, 7.57861328125, 8.0206298828125, 8.462646484375, 8.9046630859375, 9.3466796875, 9.7886962890625, 10.230712890625, 10.6727294921875, 11.11474609375, 11.5567626953125, 11.998779296875, 12.4407958984375, 12.8828125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 11.0, 10.0, 16.0, 23.0, 39.0, 42.0, 54.0, 60.0, 50.0, 76.0, 81.0, 74.0, 86.0, 60.0, 69.0, 63.0, 35.0, 35.0, 28.0, 29.0, 14.0, 15.0, 10.0, 6.0, 2.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.373046875, -2.3111724853515625, -2.249298095703125, -2.1874237060546875, -2.12554931640625, -2.0636749267578125, -2.001800537109375, -1.9399261474609375, -1.8780517578125, -1.8161773681640625, -1.754302978515625, -1.6924285888671875, -1.63055419921875, -1.5686798095703125, -1.506805419921875, -1.4449310302734375, -1.383056640625, -1.3211822509765625, -1.259307861328125, -1.1974334716796875, -1.13555908203125, -1.0736846923828125, -1.011810302734375, -0.9499359130859375, -0.8880615234375, -0.8261871337890625, -0.764312744140625, -0.7024383544921875, -0.64056396484375, -0.5786895751953125, -0.516815185546875, -0.4549407958984375, -0.39306640625, -0.3311920166015625, -0.269317626953125, -0.2074432373046875, -0.14556884765625, -0.0836944580078125, -0.021820068359375, 0.0400543212890625, 0.1019287109375, 0.1638031005859375, 0.225677490234375, 0.2875518798828125, 0.34942626953125, 0.4113006591796875, 0.473175048828125, 0.5350494384765625, 0.596923828125, 0.6587982177734375, 0.720672607421875, 0.7825469970703125, 0.84442138671875, 0.9062957763671875, 0.968170166015625, 1.0300445556640625, 1.0919189453125, 1.1537933349609375, 1.215667724609375, 1.2775421142578125, 1.33941650390625, 1.4012908935546875, 1.463165283203125, 1.5250396728515625, 1.5869140625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 4.0, 3.0, 3.0, 4.0, 12.0, 4.0, 7.0, 13.0, 14.0, 12.0, 11.0, 27.0, 43.0, 33.0, 41.0, 62.0, 78.0, 80.0, 144.0, 198.0, 383.0, 993.0, 3804.0, 25538.0, 619286.0, 3485350.0, 49393.0, 6123.0, 1331.0, 468.0, 230.0, 139.0, 97.0, 76.0, 52.0, 43.0, 33.0, 29.0, 21.0, 22.0, 19.0, 19.0, 11.0, 10.0, 6.0, 7.0, 3.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-15.25, -14.80322265625, -14.3564453125, -13.90966796875, -13.462890625, -13.01611328125, -12.5693359375, -12.12255859375, -11.67578125, -11.22900390625, -10.7822265625, -10.33544921875, -9.888671875, -9.44189453125, -8.9951171875, -8.54833984375, -8.1015625, -7.65478515625, -7.2080078125, -6.76123046875, -6.314453125, -5.86767578125, -5.4208984375, -4.97412109375, -4.52734375, -4.08056640625, -3.6337890625, -3.18701171875, -2.740234375, -2.29345703125, -1.8466796875, -1.39990234375, -0.953125, -0.50634765625, -0.0595703125, 0.38720703125, 0.833984375, 1.28076171875, 1.7275390625, 2.17431640625, 2.62109375, 3.06787109375, 3.5146484375, 3.96142578125, 4.408203125, 4.85498046875, 5.3017578125, 5.74853515625, 6.1953125, 6.64208984375, 7.0888671875, 7.53564453125, 7.982421875, 8.42919921875, 8.8759765625, 9.32275390625, 9.76953125, 10.21630859375, 10.6630859375, 11.10986328125, 11.556640625, 12.00341796875, 12.4501953125, 12.89697265625, 13.34375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 7.0, 8.0, 20.0, 37.0, 99.0, 303.0, 2505.0, 791.0, 183.0, 73.0, 30.0, 16.0, 12.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0078125, -8.8109130859375, -8.614013671875, -8.4171142578125, -8.22021484375, -8.0233154296875, -7.826416015625, -7.6295166015625, -7.4326171875, -7.2357177734375, -7.038818359375, -6.8419189453125, -6.64501953125, -6.4481201171875, -6.251220703125, -6.0543212890625, -5.857421875, -5.6605224609375, -5.463623046875, -5.2667236328125, -5.06982421875, -4.8729248046875, -4.676025390625, -4.4791259765625, -4.2822265625, -4.0853271484375, -3.888427734375, -3.6915283203125, -3.49462890625, -3.2977294921875, -3.100830078125, -2.9039306640625, -2.70703125, -2.5101318359375, -2.313232421875, -2.1163330078125, -1.91943359375, -1.7225341796875, -1.525634765625, -1.3287353515625, -1.1318359375, -0.9349365234375, -0.738037109375, -0.5411376953125, -0.34423828125, -0.1473388671875, 0.049560546875, 0.2464599609375, 0.443359375, 0.6402587890625, 0.837158203125, 1.0340576171875, 1.23095703125, 1.4278564453125, 1.624755859375, 1.8216552734375, 2.0185546875, 2.2154541015625, 2.412353515625, 2.6092529296875, 2.80615234375, 3.0030517578125, 3.199951171875, 3.3968505859375, 3.59375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 10.0, 23.0, 56.0, 115.0, 172.0, 238.0, 194.0, 112.0, 50.0, 16.0, 8.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.31610107421875, -25.355833053588867, -24.395566940307617, -23.435298919677734, -22.47503089904785, -21.5147647857666, -20.55449676513672, -19.59423065185547, -18.633962631225586, -17.673694610595703, -16.713428497314453, -15.75316047668457, -14.792893409729004, -13.832626342773438, -12.872358322143555, -11.912091255187988, -10.951823234558105, -9.991556167602539, -9.031288146972656, -8.07102108001709, -7.110754013061523, -6.150486469268799, -5.190218925476074, -4.229951858520508, -3.269684314727783, -2.3094170093536377, -1.3491495847702026, -0.3888821601867676, 0.5713851451873779, 1.5316524505615234, 2.491919994354248, 3.4521870613098145, 4.412454605102539, 5.372722148895264, 6.33298921585083, 7.293256759643555, 8.253523826599121, 9.213790893554688, 10.17405891418457, 11.134325981140137, 12.094593048095703, 13.05486011505127, 14.015128135681152, 14.975395202636719, 15.935662269592285, 16.89592933654785, 17.856197357177734, 18.816463470458984, 19.7767333984375, 20.737001419067383, 21.697267532348633, 22.657535552978516, 23.6178035736084, 24.57806968688965, 25.53833770751953, 26.49860382080078, 27.458871841430664, 28.419139862060547, 29.379405975341797, 30.33967399597168, 31.299942016601562, 32.26020812988281, 33.22047424316406, 34.18074417114258, 35.14101028442383]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 6.0, 7.0, 17.0, 20.0, 36.0, 52.0, 49.0, 72.0, 95.0, 89.0, 80.0, 93.0, 88.0, 87.0, 67.0, 40.0, 33.0, 23.0, 16.0, 16.0, 10.0, 3.0, 8.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.136943817138672, -15.646822929382324, -15.15670108795166, -14.666580200195312, -14.176458358764648, -13.6863374710083, -13.196216583251953, -12.706094741821289, -12.215973854064941, -11.725852966308594, -11.23573112487793, -10.745610237121582, -10.255489349365234, -9.76536750793457, -9.275246620178223, -8.785125732421875, -8.295003890991211, -7.804882526397705, -7.314761161804199, -6.824640274047852, -6.334518909454346, -5.84439754486084, -5.354276657104492, -4.864155292510986, -4.3740339279174805, -3.8839125633239746, -3.393791437149048, -2.903670310974121, -2.4135489463806152, -1.9234275817871094, -1.4333064556121826, -0.9431853294372559, -0.45306396484375, 0.03705728054046631, 0.5271785259246826, 1.017299771308899, 1.5074210166931152, 1.997542381286621, 2.487663507461548, 2.9777846336364746, 3.4679059982299805, 3.9580273628234863, 4.448148727416992, 4.93826961517334, 5.428390979766846, 5.918512344360352, 6.408633232116699, 6.898754596710205, 7.388875961303711, 7.878997325897217, 8.369118690490723, 8.85923957824707, 9.349361419677734, 9.839482307434082, 10.32960319519043, 10.819725036621094, 11.309845924377441, 11.799966812133789, 12.290088653564453, 12.7802095413208, 13.270330429077148, 13.760452270507812, 14.25057315826416, 14.740694046020508, 15.230815887451172]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 4.0, 9.0, 13.0, 29.0, 22.0, 37.0, 27.0, 65.0, 80.0, 139.0, 238.0, 343.0, 577.0, 1018.0, 1914.0, 3991.0, 9940.0, 26863.0, 86163.0, 281883.0, 404019.0, 156344.0, 46867.0, 15618.0, 6073.0, 2790.0, 1338.0, 789.0, 507.0, 277.0, 176.0, 118.0, 70.0, 67.0, 47.0, 30.0, 18.0, 14.0, 10.0, 7.0, 2.0, 3.0, 8.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.140625, -7.8714599609375, -7.602294921875, -7.3331298828125, -7.06396484375, -6.7947998046875, -6.525634765625, -6.2564697265625, -5.9873046875, -5.7181396484375, -5.448974609375, -5.1798095703125, -4.91064453125, -4.6414794921875, -4.372314453125, -4.1031494140625, -3.833984375, -3.5648193359375, -3.295654296875, -3.0264892578125, -2.75732421875, -2.4881591796875, -2.218994140625, -1.9498291015625, -1.6806640625, -1.4114990234375, -1.142333984375, -0.8731689453125, -0.60400390625, -0.3348388671875, -0.065673828125, 0.2034912109375, 0.47265625, 0.7418212890625, 1.010986328125, 1.2801513671875, 1.54931640625, 1.8184814453125, 2.087646484375, 2.3568115234375, 2.6259765625, 2.8951416015625, 3.164306640625, 3.4334716796875, 3.70263671875, 3.9718017578125, 4.240966796875, 4.5101318359375, 4.779296875, 5.0484619140625, 5.317626953125, 5.5867919921875, 5.85595703125, 6.1251220703125, 6.394287109375, 6.6634521484375, 6.9326171875, 7.2017822265625, 7.470947265625, 7.7401123046875, 8.00927734375, 8.2784423828125, 8.547607421875, 8.8167724609375, 9.0859375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 0.0, 3.0, 7.0, 17.0, 13.0, 16.0, 44.0, 39.0, 37.0, 49.0, 59.0, 66.0, 94.0, 78.0, 76.0, 80.0, 60.0, 65.0, 58.0, 42.0, 17.0, 24.0, 16.0, 16.0, 11.0, 8.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.404296875, -2.342071533203125, -2.27984619140625, -2.217620849609375, -2.1553955078125, -2.093170166015625, -2.03094482421875, -1.968719482421875, -1.906494140625, -1.844268798828125, -1.78204345703125, -1.719818115234375, -1.6575927734375, -1.595367431640625, -1.53314208984375, -1.470916748046875, -1.40869140625, -1.346466064453125, -1.28424072265625, -1.222015380859375, -1.1597900390625, -1.097564697265625, -1.03533935546875, -0.973114013671875, -0.910888671875, -0.848663330078125, -0.78643798828125, -0.724212646484375, -0.6619873046875, -0.599761962890625, -0.53753662109375, -0.475311279296875, -0.4130859375, -0.350860595703125, -0.28863525390625, -0.226409912109375, -0.1641845703125, -0.101959228515625, -0.03973388671875, 0.022491455078125, 0.084716796875, 0.146942138671875, 0.20916748046875, 0.271392822265625, 0.3336181640625, 0.395843505859375, 0.45806884765625, 0.520294189453125, 0.58251953125, 0.644744873046875, 0.70697021484375, 0.769195556640625, 0.8314208984375, 0.893646240234375, 0.95587158203125, 1.018096923828125, 1.080322265625, 1.142547607421875, 1.20477294921875, 1.266998291015625, 1.3292236328125, 1.391448974609375, 1.45367431640625, 1.515899658203125, 1.578125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 3.0, 3.0, 8.0, 14.0, 14.0, 29.0, 32.0, 53.0, 79.0, 106.0, 162.0, 351.0, 591.0, 1139.0, 2347.0, 5060.0, 12117.0, 30993.0, 84232.0, 221596.0, 362188.0, 202662.0, 76085.0, 28342.0, 11177.0, 4723.0, 2061.0, 1065.0, 532.0, 298.0, 177.0, 100.0, 64.0, 37.0, 31.0, 25.0, 18.0, 12.0, 9.0, 7.0, 7.0, 3.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.2578125, -5.08514404296875, -4.9124755859375, -4.73980712890625, -4.567138671875, -4.39447021484375, -4.2218017578125, -4.04913330078125, -3.87646484375, -3.70379638671875, -3.5311279296875, -3.35845947265625, -3.185791015625, -3.01312255859375, -2.8404541015625, -2.66778564453125, -2.4951171875, -2.32244873046875, -2.1497802734375, -1.97711181640625, -1.804443359375, -1.63177490234375, -1.4591064453125, -1.28643798828125, -1.11376953125, -0.94110107421875, -0.7684326171875, -0.59576416015625, -0.423095703125, -0.25042724609375, -0.0777587890625, 0.09490966796875, 0.267578125, 0.44024658203125, 0.6129150390625, 0.78558349609375, 0.958251953125, 1.13092041015625, 1.3035888671875, 1.47625732421875, 1.64892578125, 1.82159423828125, 1.9942626953125, 2.16693115234375, 2.339599609375, 2.51226806640625, 2.6849365234375, 2.85760498046875, 3.0302734375, 3.20294189453125, 3.3756103515625, 3.54827880859375, 3.720947265625, 3.89361572265625, 4.0662841796875, 4.23895263671875, 4.41162109375, 4.58428955078125, 4.7569580078125, 4.92962646484375, 5.102294921875, 5.27496337890625, 5.4476318359375, 5.62030029296875, 5.79296875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 8.0, 5.0, 9.0, 13.0, 12.0, 12.0, 10.0, 9.0, 24.0, 19.0, 33.0, 32.0, 31.0, 38.0, 38.0, 41.0, 47.0, 28.0, 38.0, 43.0, 41.0, 41.0, 41.0, 50.0, 43.0, 34.0, 34.0, 39.0, 26.0, 35.0, 28.0, 20.0, 13.0, 14.0, 10.0, 8.0, 13.0, 7.0, 1.0, 3.0, 3.0, 5.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.546875, -5.38446044921875, -5.2220458984375, -5.05963134765625, -4.897216796875, -4.73480224609375, -4.5723876953125, -4.40997314453125, -4.24755859375, -4.08514404296875, -3.9227294921875, -3.76031494140625, -3.597900390625, -3.43548583984375, -3.2730712890625, -3.11065673828125, -2.9482421875, -2.78582763671875, -2.6234130859375, -2.46099853515625, -2.298583984375, -2.13616943359375, -1.9737548828125, -1.81134033203125, -1.64892578125, -1.48651123046875, -1.3240966796875, -1.16168212890625, -0.999267578125, -0.83685302734375, -0.6744384765625, -0.51202392578125, -0.349609375, -0.18719482421875, -0.0247802734375, 0.13763427734375, 0.300048828125, 0.46246337890625, 0.6248779296875, 0.78729248046875, 0.94970703125, 1.11212158203125, 1.2745361328125, 1.43695068359375, 1.599365234375, 1.76177978515625, 1.9241943359375, 2.08660888671875, 2.2490234375, 2.41143798828125, 2.5738525390625, 2.73626708984375, 2.898681640625, 3.06109619140625, 3.2235107421875, 3.38592529296875, 3.54833984375, 3.71075439453125, 3.8731689453125, 4.03558349609375, 4.197998046875, 4.36041259765625, 4.5228271484375, 4.68524169921875, 4.84765625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 5.0, 4.0, 3.0, 2.0, 4.0, 9.0, 10.0, 17.0, 27.0, 43.0, 30.0, 64.0, 105.0, 154.0, 217.0, 344.0, 549.0, 883.0, 1529.0, 2630.0, 4894.0, 9711.0, 20241.0, 46365.0, 110511.0, 235371.0, 296431.0, 178212.0, 76763.0, 32373.0, 14733.0, 7247.0, 3709.0, 2020.0, 1210.0, 762.0, 442.0, 322.0, 195.0, 121.0, 83.0, 65.0, 46.0, 40.0, 15.0, 16.0, 13.0, 13.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.060546875, -1.992523193359375, -1.92449951171875, -1.856475830078125, -1.7884521484375, -1.720428466796875, -1.65240478515625, -1.584381103515625, -1.516357421875, -1.448333740234375, -1.38031005859375, -1.312286376953125, -1.2442626953125, -1.176239013671875, -1.10821533203125, -1.040191650390625, -0.97216796875, -0.904144287109375, -0.83612060546875, -0.768096923828125, -0.7000732421875, -0.632049560546875, -0.56402587890625, -0.496002197265625, -0.427978515625, -0.359954833984375, -0.29193115234375, -0.223907470703125, -0.1558837890625, -0.087860107421875, -0.01983642578125, 0.048187255859375, 0.1162109375, 0.184234619140625, 0.25225830078125, 0.320281982421875, 0.3883056640625, 0.456329345703125, 0.52435302734375, 0.592376708984375, 0.660400390625, 0.728424072265625, 0.79644775390625, 0.864471435546875, 0.9324951171875, 1.000518798828125, 1.06854248046875, 1.136566162109375, 1.20458984375, 1.272613525390625, 1.34063720703125, 1.408660888671875, 1.4766845703125, 1.544708251953125, 1.61273193359375, 1.680755615234375, 1.748779296875, 1.816802978515625, 1.88482666015625, 1.952850341796875, 2.0208740234375, 2.088897705078125, 2.15692138671875, 2.224945068359375, 2.29296875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 4.0, 7.0, 2.0, 7.0, 13.0, 6.0, 5.0, 13.0, 15.0, 19.0, 16.0, 29.0, 33.0, 43.0, 44.0, 56.0, 77.0, 88.0, 89.0, 100.0, 82.0, 64.0, 33.0, 37.0, 28.0, 21.0, 11.0, 14.0, 10.0, 14.0, 7.0, 5.0, 7.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004601478576660156, -0.0004458874464035034, -0.0004316270351409912, -0.000417366623878479, -0.0004031062126159668, -0.0003888458013534546, -0.0003745853900909424, -0.0003603249788284302, -0.00034606456756591797, -0.00033180415630340576, -0.00031754374504089355, -0.00030328333377838135, -0.00028902292251586914, -0.00027476251125335693, -0.0002605020999908447, -0.0002462416887283325, -0.0002319812774658203, -0.0002177208662033081, -0.0002034604549407959, -0.0001892000436782837, -0.00017493963241577148, -0.00016067922115325928, -0.00014641880989074707, -0.00013215839862823486, -0.00011789798736572266, -0.00010363757610321045, -8.937716484069824e-05, -7.511675357818604e-05, -6.085634231567383e-05, -4.659593105316162e-05, -3.2335519790649414e-05, -1.8075108528137207e-05, -3.814697265625e-06, 1.0445713996887207e-05, 2.4706125259399414e-05, 3.896653652191162e-05, 5.322694778442383e-05, 6.748735904693604e-05, 8.174777030944824e-05, 9.600818157196045e-05, 0.00011026859283447266, 0.00012452900409698486, 0.00013878941535949707, 0.00015304982662200928, 0.00016731023788452148, 0.0001815706491470337, 0.0001958310604095459, 0.0002100914716720581, 0.0002243518829345703, 0.00023861229419708252, 0.0002528727054595947, 0.00026713311672210693, 0.00028139352798461914, 0.00029565393924713135, 0.00030991435050964355, 0.00032417476177215576, 0.00033843517303466797, 0.0003526955842971802, 0.0003669559955596924, 0.0003812164068222046, 0.0003954768180847168, 0.000409737229347229, 0.0004239976406097412, 0.0004382580518722534, 0.0004525184631347656]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 8.0, 3.0, 12.0, 16.0, 18.0, 23.0, 41.0, 62.0, 75.0, 166.0, 299.0, 562.0, 1184.0, 2374.0, 5044.0, 12420.0, 33241.0, 101561.0, 303060.0, 372474.0, 141627.0, 45496.0, 16393.0, 6591.0, 2858.0, 1380.0, 705.0, 359.0, 179.0, 145.0, 69.0, 31.0, 23.0, 18.0, 19.0, 4.0, 7.0, 2.0, 5.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.052734375, -2.957763671875, -2.86279296875, -2.767822265625, -2.6728515625, -2.577880859375, -2.48291015625, -2.387939453125, -2.29296875, -2.197998046875, -2.10302734375, -2.008056640625, -1.9130859375, -1.818115234375, -1.72314453125, -1.628173828125, -1.533203125, -1.438232421875, -1.34326171875, -1.248291015625, -1.1533203125, -1.058349609375, -0.96337890625, -0.868408203125, -0.7734375, -0.678466796875, -0.58349609375, -0.488525390625, -0.3935546875, -0.298583984375, -0.20361328125, -0.108642578125, -0.013671875, 0.081298828125, 0.17626953125, 0.271240234375, 0.3662109375, 0.461181640625, 0.55615234375, 0.651123046875, 0.74609375, 0.841064453125, 0.93603515625, 1.031005859375, 1.1259765625, 1.220947265625, 1.31591796875, 1.410888671875, 1.505859375, 1.600830078125, 1.69580078125, 1.790771484375, 1.8857421875, 1.980712890625, 2.07568359375, 2.170654296875, 2.265625, 2.360595703125, 2.45556640625, 2.550537109375, 2.6455078125, 2.740478515625, 2.83544921875, 2.930419921875, 3.025390625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 4.0, 0.0, 3.0, 2.0, 4.0, 7.0, 3.0, 6.0, 7.0, 8.0, 10.0, 13.0, 15.0, 14.0, 20.0, 18.0, 29.0, 33.0, 43.0, 48.0, 55.0, 66.0, 67.0, 58.0, 59.0, 73.0, 47.0, 46.0, 48.0, 27.0, 26.0, 28.0, 25.0, 15.0, 7.0, 16.0, 11.0, 9.0, 5.0, 10.0, 5.0, 8.0, 3.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.8916015625, -1.8235321044921875, -1.755462646484375, -1.6873931884765625, -1.61932373046875, -1.5512542724609375, -1.483184814453125, -1.4151153564453125, -1.3470458984375, -1.2789764404296875, -1.210906982421875, -1.1428375244140625, -1.07476806640625, -1.0066986083984375, -0.938629150390625, -0.8705596923828125, -0.802490234375, -0.7344207763671875, -0.666351318359375, -0.5982818603515625, -0.53021240234375, -0.4621429443359375, -0.394073486328125, -0.3260040283203125, -0.2579345703125, -0.1898651123046875, -0.121795654296875, -0.0537261962890625, 0.01434326171875, 0.0824127197265625, 0.150482177734375, 0.2185516357421875, 0.28662109375, 0.3546905517578125, 0.422760009765625, 0.4908294677734375, 0.55889892578125, 0.6269683837890625, 0.695037841796875, 0.7631072998046875, 0.8311767578125, 0.8992462158203125, 0.967315673828125, 1.0353851318359375, 1.10345458984375, 1.1715240478515625, 1.239593505859375, 1.3076629638671875, 1.375732421875, 1.4438018798828125, 1.511871337890625, 1.5799407958984375, 1.64801025390625, 1.7160797119140625, 1.784149169921875, 1.8522186279296875, 1.9202880859375, 1.9883575439453125, 2.056427001953125, 2.1244964599609375, 2.19256591796875, 2.2606353759765625, 2.328704833984375, 2.3967742919921875, 2.46484375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 5.0, 9.0, 21.0, 35.0, 73.0, 124.0, 200.0, 223.0, 161.0, 90.0, 33.0, 19.0, 11.0, 6.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-132.5499267578125, -129.96517944335938, -127.38043212890625, -124.7956771850586, -122.21092987060547, -119.62618255615234, -117.04143524169922, -114.45668029785156, -111.87193298339844, -109.28718566894531, -106.70243835449219, -104.11768341064453, -101.5329360961914, -98.94818878173828, -96.36344146728516, -93.7786865234375, -91.19393920898438, -88.60919189453125, -86.02444458007812, -83.43968963623047, -80.85494232177734, -78.27019500732422, -75.6854476928711, -73.10069274902344, -70.51595306396484, -67.93120574951172, -65.3464584350586, -62.7617073059082, -60.17695617675781, -57.59220886230469, -55.00746154785156, -52.42271041870117, -49.837955474853516, -47.25320816040039, -44.66845703125, -42.083709716796875, -39.498958587646484, -36.91421127319336, -34.32946014404297, -31.744712829589844, -29.159963607788086, -26.575214385986328, -23.99046516418457, -21.405715942382812, -18.820968627929688, -16.236217498779297, -13.651470184326172, -11.066720962524414, -8.481971740722656, -5.897222518920898, -3.312473773956299, -0.7277250289916992, 1.8570241928100586, 4.441773414611816, 7.026521682739258, 9.611270904541016, 12.196020126342773, 14.780769348144531, 17.36551856994629, 19.950267791748047, 22.535015106201172, 25.119766235351562, 27.704513549804688, 30.289262771606445, 32.8740119934082]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 3.0, 4.0, 5.0, 2.0, 2.0, 3.0, 5.0, 15.0, 10.0, 9.0, 29.0, 15.0, 17.0, 21.0, 28.0, 26.0, 29.0, 37.0, 39.0, 39.0, 37.0, 34.0, 42.0, 61.0, 40.0, 42.0, 40.0, 50.0, 42.0, 34.0, 22.0, 37.0, 33.0, 25.0, 19.0, 22.0, 14.0, 17.0, 10.0, 8.0, 11.0, 7.0, 8.0, 4.0, 6.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.514022827148438, -24.56805419921875, -23.622087478637695, -22.676118850708008, -21.730152130126953, -20.784183502197266, -19.838214874267578, -18.89224624633789, -17.946279525756836, -17.00031089782715, -16.054344177246094, -15.108375549316406, -14.162407875061035, -13.216440200805664, -12.270471572875977, -11.324503898620605, -10.378536224365234, -9.432568550109863, -8.486600875854492, -7.540632247924805, -6.594664573669434, -5.6486968994140625, -4.702728748321533, -3.756760597229004, -2.810792922973633, -1.8648250102996826, -0.9188570976257324, 0.027110815048217773, 0.973078727722168, 1.919046401977539, 2.8650145530700684, 3.8109827041625977, 4.756950378417969, 5.70291805267334, 6.648886203765869, 7.594854354858398, 8.54082202911377, 9.48678970336914, 10.432758331298828, 11.3787260055542, 12.32469367980957, 13.270661354064941, 14.216629028320312, 15.16259765625, 16.108566284179688, 17.054533004760742, 18.00050163269043, 18.946468353271484, 19.892436981201172, 20.83840560913086, 21.784372329711914, 22.7303409576416, 23.676307678222656, 24.622276306152344, 25.56824493408203, 26.51421356201172, 27.460180282592773, 28.40614891052246, 29.352115631103516, 30.298084259033203, 31.24405288696289, 32.19001770019531, 33.135986328125, 34.08195495605469, 35.027923583984375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 4.0, 5.0, 5.0, 3.0, 5.0, 8.0, 15.0, 21.0, 23.0, 32.0, 42.0, 64.0, 110.0, 154.0, 240.0, 403.0, 667.0, 1185.0, 2388.0, 5531.0, 16298.0, 75065.0, 3294131.0, 724757.0, 51602.0, 12931.0, 4542.0, 1879.0, 939.0, 505.0, 280.0, 174.0, 98.0, 53.0, 44.0, 21.0, 19.0, 11.0, 6.0, 10.0, 4.0, 9.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.3984375, -14.9920654296875, -14.585693359375, -14.1793212890625, -13.77294921875, -13.3665771484375, -12.960205078125, -12.5538330078125, -12.1474609375, -11.7410888671875, -11.334716796875, -10.9283447265625, -10.52197265625, -10.1156005859375, -9.709228515625, -9.3028564453125, -8.896484375, -8.4901123046875, -8.083740234375, -7.6773681640625, -7.27099609375, -6.8646240234375, -6.458251953125, -6.0518798828125, -5.6455078125, -5.2391357421875, -4.832763671875, -4.4263916015625, -4.02001953125, -3.6136474609375, -3.207275390625, -2.8009033203125, -2.39453125, -1.9881591796875, -1.581787109375, -1.1754150390625, -0.76904296875, -0.3626708984375, 0.043701171875, 0.4500732421875, 0.8564453125, 1.2628173828125, 1.669189453125, 2.0755615234375, 2.48193359375, 2.8883056640625, 3.294677734375, 3.7010498046875, 4.107421875, 4.5137939453125, 4.920166015625, 5.3265380859375, 5.73291015625, 6.1392822265625, 6.545654296875, 6.9520263671875, 7.3583984375, 7.7647705078125, 8.171142578125, 8.5775146484375, 8.98388671875, 9.3902587890625, 9.796630859375, 10.2030029296875, 10.609375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 9.0, 5.0, 12.0, 21.0, 20.0, 35.0, 31.0, 57.0, 59.0, 54.0, 74.0, 70.0, 78.0, 81.0, 81.0, 51.0, 58.0, 50.0, 32.0, 38.0, 23.0, 17.0, 14.0, 8.0, 5.0, 4.0, 6.0, 2.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.494140625, -2.429351806640625, -2.36456298828125, -2.299774169921875, -2.2349853515625, -2.170196533203125, -2.10540771484375, -2.040618896484375, -1.975830078125, -1.911041259765625, -1.84625244140625, -1.781463623046875, -1.7166748046875, -1.651885986328125, -1.58709716796875, -1.522308349609375, -1.45751953125, -1.392730712890625, -1.32794189453125, -1.263153076171875, -1.1983642578125, -1.133575439453125, -1.06878662109375, -1.003997802734375, -0.939208984375, -0.874420166015625, -0.80963134765625, -0.744842529296875, -0.6800537109375, -0.615264892578125, -0.55047607421875, -0.485687255859375, -0.4208984375, -0.356109619140625, -0.29132080078125, -0.226531982421875, -0.1617431640625, -0.096954345703125, -0.03216552734375, 0.032623291015625, 0.097412109375, 0.162200927734375, 0.22698974609375, 0.291778564453125, 0.3565673828125, 0.421356201171875, 0.48614501953125, 0.550933837890625, 0.61572265625, 0.680511474609375, 0.74530029296875, 0.810089111328125, 0.8748779296875, 0.939666748046875, 1.00445556640625, 1.069244384765625, 1.134033203125, 1.198822021484375, 1.26361083984375, 1.328399658203125, 1.3931884765625, 1.457977294921875, 1.52276611328125, 1.587554931640625, 1.65234375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 4.0, 5.0, 7.0, 16.0, 15.0, 18.0, 25.0, 28.0, 40.0, 28.0, 66.0, 79.0, 137.0, 260.0, 502.0, 1036.0, 2696.0, 9167.0, 55347.0, 2976978.0, 1095280.0, 40797.0, 7506.0, 2255.0, 886.0, 448.0, 219.0, 133.0, 71.0, 67.0, 39.0, 30.0, 20.0, 7.0, 12.0, 16.0, 5.0, 12.0, 10.0, 5.0, 4.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.9609375, -12.5550537109375, -12.149169921875, -11.7432861328125, -11.33740234375, -10.9315185546875, -10.525634765625, -10.1197509765625, -9.7138671875, -9.3079833984375, -8.902099609375, -8.4962158203125, -8.09033203125, -7.6844482421875, -7.278564453125, -6.8726806640625, -6.466796875, -6.0609130859375, -5.655029296875, -5.2491455078125, -4.84326171875, -4.4373779296875, -4.031494140625, -3.6256103515625, -3.2197265625, -2.8138427734375, -2.407958984375, -2.0020751953125, -1.59619140625, -1.1903076171875, -0.784423828125, -0.3785400390625, 0.02734375, 0.4332275390625, 0.839111328125, 1.2449951171875, 1.65087890625, 2.0567626953125, 2.462646484375, 2.8685302734375, 3.2744140625, 3.6802978515625, 4.086181640625, 4.4920654296875, 4.89794921875, 5.3038330078125, 5.709716796875, 6.1156005859375, 6.521484375, 6.9273681640625, 7.333251953125, 7.7391357421875, 8.14501953125, 8.5509033203125, 8.956787109375, 9.3626708984375, 9.7685546875, 10.1744384765625, 10.580322265625, 10.9862060546875, 11.39208984375, 11.7979736328125, 12.203857421875, 12.6097412109375, 13.015625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 16.0, 13.0, 20.0, 35.0, 76.0, 158.0, 451.0, 2053.0, 808.0, 214.0, 108.0, 49.0, 24.0, 17.0, 11.0, 5.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.94921875, -6.782745361328125, -6.61627197265625, -6.449798583984375, -6.2833251953125, -6.116851806640625, -5.95037841796875, -5.783905029296875, -5.617431640625, -5.450958251953125, -5.28448486328125, -5.118011474609375, -4.9515380859375, -4.785064697265625, -4.61859130859375, -4.452117919921875, -4.28564453125, -4.119171142578125, -3.95269775390625, -3.786224365234375, -3.6197509765625, -3.453277587890625, -3.28680419921875, -3.120330810546875, -2.953857421875, -2.787384033203125, -2.62091064453125, -2.454437255859375, -2.2879638671875, -2.121490478515625, -1.95501708984375, -1.788543701171875, -1.6220703125, -1.455596923828125, -1.28912353515625, -1.122650146484375, -0.9561767578125, -0.789703369140625, -0.62322998046875, -0.456756591796875, -0.290283203125, -0.123809814453125, 0.04266357421875, 0.209136962890625, 0.3756103515625, 0.542083740234375, 0.70855712890625, 0.875030517578125, 1.04150390625, 1.207977294921875, 1.37445068359375, 1.540924072265625, 1.7073974609375, 1.873870849609375, 2.04034423828125, 2.206817626953125, 2.373291015625, 2.539764404296875, 2.70623779296875, 2.872711181640625, 3.0391845703125, 3.205657958984375, 3.37213134765625, 3.538604736328125, 3.705078125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 4.0, 3.0, 10.0, 9.0, 27.0, 39.0, 80.0, 95.0, 148.0, 184.0, 160.0, 112.0, 74.0, 23.0, 21.0, 9.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.971343994140625, -42.02943420410156, -41.087528228759766, -40.1456184387207, -39.20370864868164, -38.261802673339844, -37.31989288330078, -36.37798309326172, -35.43607711791992, -34.49416732788086, -33.55226135253906, -32.6103515625, -31.66844367980957, -30.72653579711914, -29.784626007080078, -28.84271812438965, -27.90081024169922, -26.95890235900879, -26.016992568969727, -25.075084686279297, -24.133176803588867, -23.191268920898438, -22.249359130859375, -21.307451248168945, -20.365541458129883, -19.423633575439453, -18.48172378540039, -17.53981590270996, -16.59790802001953, -15.655999183654785, -14.714090347290039, -13.77218246459961, -12.83027458190918, -11.888365745544434, -10.946457862854004, -10.004549026489258, -9.062641143798828, -8.120732307434082, -7.178823947906494, -6.236915588378906, -5.295007228851318, -4.3530988693237305, -3.4111905097961426, -2.4692819118499756, -1.5273735523223877, -0.5854649543762207, 0.3564434051513672, 1.298351764678955, 2.240260124206543, 3.182168483734131, 4.124076843261719, 5.065985679626465, 6.0078935623168945, 6.949802398681641, 7.8917107582092285, 8.833619117736816, 9.775527954101562, 10.717436790466309, 11.659344673156738, 12.601253509521484, 13.543161392211914, 14.48507022857666, 15.426979064941406, 16.368886947631836, 17.310794830322266]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 1.0, 3.0, 8.0, 10.0, 7.0, 15.0, 12.0, 11.0, 15.0, 21.0, 17.0, 23.0, 38.0, 38.0, 45.0, 41.0, 30.0, 50.0, 53.0, 55.0, 57.0, 61.0, 46.0, 49.0, 40.0, 36.0, 29.0, 39.0, 15.0, 26.0, 22.0, 14.0, 16.0, 13.0, 19.0, 6.0, 11.0, 7.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.383825302124023, -8.018355369567871, -7.652885437011719, -7.287415504455566, -6.921945571899414, -6.556475639343262, -6.191005706787109, -5.825535774230957, -5.460065841674805, -5.094595909118652, -4.7291259765625, -4.363656044006348, -3.9981861114501953, -3.632716178894043, -3.2672460079193115, -2.901776075363159, -2.5363059043884277, -2.1708359718322754, -1.805366039276123, -1.4398959875106812, -1.0744260549545288, -0.7089561223983765, -0.34348607063293457, 0.021983861923217773, 0.3874537944793701, 0.7529237270355225, 1.1183936595916748, 1.4838637113571167, 1.849333643913269, 2.214803695678711, 2.5802736282348633, 2.9457435607910156, 3.311213493347168, 3.6766834259033203, 4.042153358459473, 4.407623291015625, 4.773093223571777, 5.13856315612793, 5.504033088684082, 5.869503021240234, 6.234972953796387, 6.600442886352539, 6.965912818908691, 7.331382751464844, 7.696852684020996, 8.062322616577148, 8.4277925491333, 8.793262481689453, 9.158733367919922, 9.524203300476074, 9.889673233032227, 10.255143165588379, 10.620613098144531, 10.986083030700684, 11.351552963256836, 11.717022895812988, 12.08249282836914, 12.447962760925293, 12.813432693481445, 13.178902626037598, 13.54437255859375, 13.909842491149902, 14.275312423706055, 14.640782356262207, 15.00625228881836]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 5.0, 3.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 7.0, 13.0, 13.0, 19.0, 30.0, 37.0, 40.0, 75.0, 102.0, 158.0, 208.0, 339.0, 596.0, 1146.0, 2209.0, 4891.0, 11815.0, 34762.0, 136663.0, 546375.0, 227756.0, 52466.0, 16273.0, 6355.0, 2837.0, 1376.0, 756.0, 441.0, 254.0, 179.0, 126.0, 61.0, 48.0, 41.0, 31.0, 13.0, 16.0, 5.0, 3.0, 6.0, 5.0, 5.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0859375, -8.7689208984375, -8.451904296875, -8.1348876953125, -7.81787109375, -7.5008544921875, -7.183837890625, -6.8668212890625, -6.5498046875, -6.2327880859375, -5.915771484375, -5.5987548828125, -5.28173828125, -4.9647216796875, -4.647705078125, -4.3306884765625, -4.013671875, -3.6966552734375, -3.379638671875, -3.0626220703125, -2.74560546875, -2.4285888671875, -2.111572265625, -1.7945556640625, -1.4775390625, -1.1605224609375, -0.843505859375, -0.5264892578125, -0.20947265625, 0.1075439453125, 0.424560546875, 0.7415771484375, 1.05859375, 1.3756103515625, 1.692626953125, 2.0096435546875, 2.32666015625, 2.6436767578125, 2.960693359375, 3.2777099609375, 3.5947265625, 3.9117431640625, 4.228759765625, 4.5457763671875, 4.86279296875, 5.1798095703125, 5.496826171875, 5.8138427734375, 6.130859375, 6.4478759765625, 6.764892578125, 7.0819091796875, 7.39892578125, 7.7159423828125, 8.032958984375, 8.3499755859375, 8.6669921875, 8.9840087890625, 9.301025390625, 9.6180419921875, 9.93505859375, 10.2520751953125, 10.569091796875, 10.8861083984375, 11.203125]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 12.0, 14.0, 14.0, 18.0, 41.0, 44.0, 56.0, 45.0, 61.0, 73.0, 65.0, 87.0, 86.0, 74.0, 62.0, 49.0, 52.0, 37.0, 23.0, 27.0, 15.0, 12.0, 4.0, 8.0, 7.0, 1.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.615234375, -2.548736572265625, -2.48223876953125, -2.415740966796875, -2.3492431640625, -2.282745361328125, -2.21624755859375, -2.149749755859375, -2.083251953125, -2.016754150390625, -1.95025634765625, -1.883758544921875, -1.8172607421875, -1.750762939453125, -1.68426513671875, -1.617767333984375, -1.55126953125, -1.484771728515625, -1.41827392578125, -1.351776123046875, -1.2852783203125, -1.218780517578125, -1.15228271484375, -1.085784912109375, -1.019287109375, -0.952789306640625, -0.88629150390625, -0.819793701171875, -0.7532958984375, -0.686798095703125, -0.62030029296875, -0.553802490234375, -0.4873046875, -0.420806884765625, -0.35430908203125, -0.287811279296875, -0.2213134765625, -0.154815673828125, -0.08831787109375, -0.021820068359375, 0.044677734375, 0.111175537109375, 0.17767333984375, 0.244171142578125, 0.3106689453125, 0.377166748046875, 0.44366455078125, 0.510162353515625, 0.57666015625, 0.643157958984375, 0.70965576171875, 0.776153564453125, 0.8426513671875, 0.909149169921875, 0.97564697265625, 1.042144775390625, 1.108642578125, 1.175140380859375, 1.24163818359375, 1.308135986328125, 1.3746337890625, 1.441131591796875, 1.50762939453125, 1.574127197265625, 1.640625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 5.0, 9.0, 8.0, 15.0, 22.0, 24.0, 41.0, 52.0, 72.0, 100.0, 177.0, 312.0, 515.0, 875.0, 1504.0, 2748.0, 5427.0, 10779.0, 22836.0, 51641.0, 119593.0, 291379.0, 308656.0, 127526.0, 55260.0, 24620.0, 11743.0, 5786.0, 2920.0, 1587.0, 865.0, 524.0, 323.0, 187.0, 130.0, 105.0, 55.0, 41.0, 26.0, 16.0, 17.0, 8.0, 6.0, 5.0, 3.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.484375, -4.33990478515625, -4.1954345703125, -4.05096435546875, -3.906494140625, -3.76202392578125, -3.6175537109375, -3.47308349609375, -3.32861328125, -3.18414306640625, -3.0396728515625, -2.89520263671875, -2.750732421875, -2.60626220703125, -2.4617919921875, -2.31732177734375, -2.1728515625, -2.02838134765625, -1.8839111328125, -1.73944091796875, -1.594970703125, -1.45050048828125, -1.3060302734375, -1.16156005859375, -1.01708984375, -0.87261962890625, -0.7281494140625, -0.58367919921875, -0.439208984375, -0.29473876953125, -0.1502685546875, -0.00579833984375, 0.138671875, 0.28314208984375, 0.4276123046875, 0.57208251953125, 0.716552734375, 0.86102294921875, 1.0054931640625, 1.14996337890625, 1.29443359375, 1.43890380859375, 1.5833740234375, 1.72784423828125, 1.872314453125, 2.01678466796875, 2.1612548828125, 2.30572509765625, 2.4501953125, 2.59466552734375, 2.7391357421875, 2.88360595703125, 3.028076171875, 3.17254638671875, 3.3170166015625, 3.46148681640625, 3.60595703125, 3.75042724609375, 3.8948974609375, 4.03936767578125, 4.183837890625, 4.32830810546875, 4.4727783203125, 4.61724853515625, 4.76171875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 3.0, 4.0, 3.0, 5.0, 8.0, 9.0, 8.0, 9.0, 20.0, 18.0, 18.0, 29.0, 28.0, 32.0, 29.0, 31.0, 48.0, 47.0, 43.0, 51.0, 42.0, 49.0, 48.0, 42.0, 38.0, 36.0, 51.0, 37.0, 32.0, 35.0, 25.0, 24.0, 15.0, 23.0, 14.0, 11.0, 9.0, 7.0, 10.0, 6.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.42578125, -5.25274658203125, -5.0797119140625, -4.90667724609375, -4.733642578125, -4.56060791015625, -4.3875732421875, -4.21453857421875, -4.04150390625, -3.86846923828125, -3.6954345703125, -3.52239990234375, -3.349365234375, -3.17633056640625, -3.0032958984375, -2.83026123046875, -2.6572265625, -2.48419189453125, -2.3111572265625, -2.13812255859375, -1.965087890625, -1.79205322265625, -1.6190185546875, -1.44598388671875, -1.27294921875, -1.09991455078125, -0.9268798828125, -0.75384521484375, -0.580810546875, -0.40777587890625, -0.2347412109375, -0.06170654296875, 0.111328125, 0.28436279296875, 0.4573974609375, 0.63043212890625, 0.803466796875, 0.97650146484375, 1.1495361328125, 1.32257080078125, 1.49560546875, 1.66864013671875, 1.8416748046875, 2.01470947265625, 2.187744140625, 2.36077880859375, 2.5338134765625, 2.70684814453125, 2.8798828125, 3.05291748046875, 3.2259521484375, 3.39898681640625, 3.572021484375, 3.74505615234375, 3.9180908203125, 4.09112548828125, 4.26416015625, 4.43719482421875, 4.6102294921875, 4.78326416015625, 4.956298828125, 5.12933349609375, 5.3023681640625, 5.47540283203125, 5.6484375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 14.0, 22.0, 26.0, 45.0, 88.0, 172.0, 361.0, 796.0, 2132.0, 7171.0, 29462.0, 158157.0, 606336.0, 196025.0, 35220.0, 8322.0, 2531.0, 879.0, 378.0, 184.0, 107.0, 50.0, 33.0, 14.0, 9.0, 10.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2734375, -3.1588134765625, -3.044189453125, -2.9295654296875, -2.81494140625, -2.7003173828125, -2.585693359375, -2.4710693359375, -2.3564453125, -2.2418212890625, -2.127197265625, -2.0125732421875, -1.89794921875, -1.7833251953125, -1.668701171875, -1.5540771484375, -1.439453125, -1.3248291015625, -1.210205078125, -1.0955810546875, -0.98095703125, -0.8663330078125, -0.751708984375, -0.6370849609375, -0.5224609375, -0.4078369140625, -0.293212890625, -0.1785888671875, -0.06396484375, 0.0506591796875, 0.165283203125, 0.2799072265625, 0.39453125, 0.5091552734375, 0.623779296875, 0.7384033203125, 0.85302734375, 0.9676513671875, 1.082275390625, 1.1968994140625, 1.3115234375, 1.4261474609375, 1.540771484375, 1.6553955078125, 1.77001953125, 1.8846435546875, 1.999267578125, 2.1138916015625, 2.228515625, 2.3431396484375, 2.457763671875, 2.5723876953125, 2.68701171875, 2.8016357421875, 2.916259765625, 3.0308837890625, 3.1455078125, 3.2601318359375, 3.374755859375, 3.4893798828125, 3.60400390625, 3.7186279296875, 3.833251953125, 3.9478759765625, 4.0625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 2.0, 9.0, 12.0, 9.0, 10.0, 10.0, 12.0, 25.0, 21.0, 39.0, 51.0, 101.0, 173.0, 174.0, 128.0, 87.0, 50.0, 28.0, 19.0, 10.0, 9.0, 7.0, 6.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004940032958984375, -0.0004758089780807495, -0.0004576146602630615, -0.00043942034244537354, -0.00042122602462768555, -0.00040303170680999756, -0.00038483738899230957, -0.0003666430711746216, -0.0003484487533569336, -0.0003302544355392456, -0.0003120601177215576, -0.00029386579990386963, -0.00027567148208618164, -0.00025747716426849365, -0.00023928284645080566, -0.00022108852863311768, -0.0002028942108154297, -0.0001846998929977417, -0.0001665055751800537, -0.00014831125736236572, -0.00013011693954467773, -0.00011192262172698975, -9.372830390930176e-05, -7.553398609161377e-05, -5.733966827392578e-05, -3.914535045623779e-05, -2.0951032638549805e-05, -2.7567148208618164e-06, 1.5437602996826172e-05, 3.363192081451416e-05, 5.182623863220215e-05, 7.002055644989014e-05, 8.821487426757812e-05, 0.00010640919208526611, 0.0001246035099029541, 0.0001427978277206421, 0.00016099214553833008, 0.00017918646335601807, 0.00019738078117370605, 0.00021557509899139404, 0.00023376941680908203, 0.00025196373462677, 0.000270158052444458, 0.000288352370262146, 0.000306546688079834, 0.00032474100589752197, 0.00034293532371520996, 0.00036112964153289795, 0.00037932395935058594, 0.0003975182771682739, 0.0004157125949859619, 0.0004339069128036499, 0.0004521012306213379, 0.0004702955484390259, 0.0004884898662567139, 0.0005066841840744019, 0.0005248785018920898, 0.0005430728197097778, 0.0005612671375274658, 0.0005794614553451538, 0.0005976557731628418, 0.0006158500909805298, 0.0006340444087982178, 0.0006522387266159058, 0.0006704330444335938]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0, 4.0, 6.0, 8.0, 14.0, 13.0, 25.0, 30.0, 48.0, 78.0, 143.0, 245.0, 486.0, 1023.0, 2342.0, 6093.0, 17654.0, 55378.0, 205834.0, 536014.0, 155870.0, 43993.0, 14414.0, 5082.0, 1943.0, 821.0, 393.0, 235.0, 142.0, 75.0, 47.0, 37.0, 22.0, 23.0, 6.0, 5.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.359375, -2.27001953125, -2.1806640625, -2.09130859375, -2.001953125, -1.91259765625, -1.8232421875, -1.73388671875, -1.64453125, -1.55517578125, -1.4658203125, -1.37646484375, -1.287109375, -1.19775390625, -1.1083984375, -1.01904296875, -0.9296875, -0.84033203125, -0.7509765625, -0.66162109375, -0.572265625, -0.48291015625, -0.3935546875, -0.30419921875, -0.21484375, -0.12548828125, -0.0361328125, 0.05322265625, 0.142578125, 0.23193359375, 0.3212890625, 0.41064453125, 0.5, 0.58935546875, 0.6787109375, 0.76806640625, 0.857421875, 0.94677734375, 1.0361328125, 1.12548828125, 1.21484375, 1.30419921875, 1.3935546875, 1.48291015625, 1.572265625, 1.66162109375, 1.7509765625, 1.84033203125, 1.9296875, 2.01904296875, 2.1083984375, 2.19775390625, 2.287109375, 2.37646484375, 2.4658203125, 2.55517578125, 2.64453125, 2.73388671875, 2.8232421875, 2.91259765625, 3.001953125, 3.09130859375, 3.1806640625, 3.27001953125, 3.359375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 0.0, 6.0, 7.0, 10.0, 7.0, 6.0, 13.0, 10.0, 27.0, 39.0, 25.0, 34.0, 29.0, 63.0, 76.0, 110.0, 108.0, 97.0, 70.0, 64.0, 51.0, 34.0, 22.0, 30.0, 15.0, 21.0, 9.0, 9.0, 6.0, 4.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.54296875, -1.463165283203125, -1.38336181640625, -1.303558349609375, -1.2237548828125, -1.143951416015625, -1.06414794921875, -0.984344482421875, -0.904541015625, -0.824737548828125, -0.74493408203125, -0.665130615234375, -0.5853271484375, -0.505523681640625, -0.42572021484375, -0.345916748046875, -0.26611328125, -0.186309814453125, -0.10650634765625, -0.026702880859375, 0.0531005859375, 0.132904052734375, 0.21270751953125, 0.292510986328125, 0.372314453125, 0.452117919921875, 0.53192138671875, 0.611724853515625, 0.6915283203125, 0.771331787109375, 0.85113525390625, 0.930938720703125, 1.0107421875, 1.090545654296875, 1.17034912109375, 1.250152587890625, 1.3299560546875, 1.409759521484375, 1.48956298828125, 1.569366455078125, 1.649169921875, 1.728973388671875, 1.80877685546875, 1.888580322265625, 1.9683837890625, 2.048187255859375, 2.12799072265625, 2.207794189453125, 2.28759765625, 2.367401123046875, 2.44720458984375, 2.527008056640625, 2.6068115234375, 2.686614990234375, 2.76641845703125, 2.846221923828125, 2.926025390625, 3.005828857421875, 3.08563232421875, 3.165435791015625, 3.2452392578125, 3.325042724609375, 3.40484619140625, 3.484649658203125, 3.564453125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 15.0, 24.0, 71.0, 105.0, 198.0, 243.0, 180.0, 92.0, 43.0, 21.0, 7.0, 3.0, 8.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-103.800048828125, -101.2833023071289, -98.76655578613281, -96.24980926513672, -93.73306274414062, -91.21631622314453, -88.69956970214844, -86.18283081054688, -83.66607666015625, -81.14933013916016, -78.63258361816406, -76.11583709716797, -73.59909057617188, -71.08234405517578, -68.56559753417969, -66.04885864257812, -63.53211212158203, -61.01536560058594, -58.498619079589844, -55.98187255859375, -53.465126037597656, -50.94837951660156, -48.431636810302734, -45.91489028930664, -43.39814376831055, -40.88139724731445, -38.36465072631836, -35.847904205322266, -33.33116149902344, -30.81441307067871, -28.29766845703125, -25.780921936035156, -23.264175415039062, -20.74742889404297, -18.230682373046875, -15.713937759399414, -13.19719123840332, -10.680444717407227, -8.16369915008545, -5.646953582763672, -3.130207061767578, -0.6134610176086426, 1.903285026550293, 4.4200310707092285, 6.936777114868164, 9.453523635864258, 11.970269203186035, 14.487014770507812, 17.003761291503906, 19.5205078125, 22.037254333496094, 24.553998947143555, 27.07074546813965, 29.587491989135742, 32.1042366027832, 34.6209831237793, 37.13772964477539, 39.654476165771484, 42.17122268676758, 44.68796920776367, 47.2047119140625, 49.721458435058594, 52.23820495605469, 54.75495147705078, 57.271697998046875]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 4.0, 8.0, 12.0, 11.0, 12.0, 12.0, 14.0, 9.0, 15.0, 21.0, 19.0, 20.0, 23.0, 21.0, 26.0, 37.0, 46.0, 32.0, 41.0, 36.0, 40.0, 36.0, 38.0, 36.0, 32.0, 28.0, 37.0, 34.0, 32.0, 31.0, 35.0, 26.0, 25.0, 23.0, 24.0, 17.0, 19.0, 11.0, 16.0, 8.0, 5.0, 6.0, 6.0, 6.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 3.0], "bins": [-24.43062400817871, -23.727495193481445, -23.024368286132812, -22.321239471435547, -21.618112564086914, -20.91498374938965, -20.211856842041016, -19.50872802734375, -18.805599212646484, -18.10247039794922, -17.399343490600586, -16.69621467590332, -15.993087768554688, -15.289958953857422, -14.586831092834473, -13.883703231811523, -13.18057632446289, -12.477448463439941, -11.774320602416992, -11.071191787719727, -10.368064880371094, -9.664936065673828, -8.961808204650879, -8.25868034362793, -7.5555524826049805, -6.852424621582031, -6.149296760559082, -5.446168422698975, -4.743040561676025, -4.039912700653076, -3.3367843627929688, -2.6336565017700195, -1.9305305480957031, -1.2274025678634644, -0.5242745876312256, 0.17885351181030273, 0.881981372833252, 1.5851092338562012, 2.2882375717163086, 2.991365432739258, 3.694493293762207, 4.397621154785156, 5.1007490158081055, 5.803877353668213, 6.507005214691162, 7.210133075714111, 7.913261413574219, 8.616389274597168, 9.319517135620117, 10.022644996643066, 10.725772857666016, 11.428901672363281, 12.132028579711914, 12.83515739440918, 13.538285255432129, 14.241413116455078, 14.944540977478027, 15.647668838500977, 16.350797653198242, 17.053924560546875, 17.75705337524414, 18.460180282592773, 19.16330909729004, 19.866436004638672, 20.569564819335938]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 3.0, 8.0, 7.0, 7.0, 17.0, 24.0, 28.0, 58.0, 74.0, 156.0, 235.0, 454.0, 1177.0, 3687.0, 24276.0, 3540498.0, 601915.0, 17190.0, 2901.0, 844.0, 343.0, 147.0, 79.0, 51.0, 32.0, 28.0, 11.0, 13.0, 8.0, 6.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0], "bins": [-38.21875, -37.3486328125, -36.478515625, -35.6083984375, -34.73828125, -33.8681640625, -32.998046875, -32.1279296875, -31.2578125, -30.3876953125, -29.517578125, -28.6474609375, -27.77734375, -26.9072265625, -26.037109375, -25.1669921875, -24.296875, -23.4267578125, -22.556640625, -21.6865234375, -20.81640625, -19.9462890625, -19.076171875, -18.2060546875, -17.3359375, -16.4658203125, -15.595703125, -14.7255859375, -13.85546875, -12.9853515625, -12.115234375, -11.2451171875, -10.375, -9.5048828125, -8.634765625, -7.7646484375, -6.89453125, -6.0244140625, -5.154296875, -4.2841796875, -3.4140625, -2.5439453125, -1.673828125, -0.8037109375, 0.06640625, 0.9365234375, 1.806640625, 2.6767578125, 3.546875, 4.4169921875, 5.287109375, 6.1572265625, 7.02734375, 7.8974609375, 8.767578125, 9.6376953125, 10.5078125, 11.3779296875, 12.248046875, 13.1181640625, 13.98828125, 14.8583984375, 15.728515625, 16.5986328125, 17.46875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 5.0, 5.0, 12.0, 12.0, 17.0, 30.0, 31.0, 28.0, 56.0, 53.0, 78.0, 65.0, 83.0, 64.0, 76.0, 90.0, 47.0, 73.0, 40.0, 35.0, 27.0, 15.0, 19.0, 12.0, 9.0, 10.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-2.806640625, -2.7386016845703125, -2.670562744140625, -2.6025238037109375, -2.53448486328125, -2.4664459228515625, -2.398406982421875, -2.3303680419921875, -2.2623291015625, -2.1942901611328125, -2.126251220703125, -2.0582122802734375, -1.99017333984375, -1.9221343994140625, -1.854095458984375, -1.7860565185546875, -1.718017578125, -1.6499786376953125, -1.581939697265625, -1.5139007568359375, -1.44586181640625, -1.3778228759765625, -1.309783935546875, -1.2417449951171875, -1.1737060546875, -1.1056671142578125, -1.037628173828125, -0.9695892333984375, -0.90155029296875, -0.8335113525390625, -0.765472412109375, -0.6974334716796875, -0.62939453125, -0.5613555908203125, -0.493316650390625, -0.4252777099609375, -0.35723876953125, -0.2891998291015625, -0.221160888671875, -0.1531219482421875, -0.0850830078125, -0.0170440673828125, 0.050994873046875, 0.1190338134765625, 0.18707275390625, 0.2551116943359375, 0.323150634765625, 0.3911895751953125, 0.459228515625, 0.5272674560546875, 0.595306396484375, 0.6633453369140625, 0.73138427734375, 0.7994232177734375, 0.867462158203125, 0.9355010986328125, 1.0035400390625, 1.0715789794921875, 1.139617919921875, 1.2076568603515625, 1.27569580078125, 1.3437347412109375, 1.411773681640625, 1.4798126220703125, 1.5478515625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 7.0, 2.0, 10.0, 7.0, 5.0, 4.0, 11.0, 15.0, 13.0, 25.0, 21.0, 30.0, 41.0, 61.0, 86.0, 120.0, 219.0, 269.0, 493.0, 932.0, 2277.0, 7240.0, 34790.0, 498050.0, 3539924.0, 90202.0, 13089.0, 3312.0, 1292.0, 630.0, 331.0, 223.0, 168.0, 91.0, 77.0, 50.0, 51.0, 33.0, 27.0, 16.0, 13.0, 10.0, 7.0, 4.0, 7.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.0390625, -11.6766357421875, -11.314208984375, -10.9517822265625, -10.58935546875, -10.2269287109375, -9.864501953125, -9.5020751953125, -9.1396484375, -8.7772216796875, -8.414794921875, -8.0523681640625, -7.68994140625, -7.3275146484375, -6.965087890625, -6.6026611328125, -6.240234375, -5.8778076171875, -5.515380859375, -5.1529541015625, -4.79052734375, -4.4281005859375, -4.065673828125, -3.7032470703125, -3.3408203125, -2.9783935546875, -2.615966796875, -2.2535400390625, -1.89111328125, -1.5286865234375, -1.166259765625, -0.8038330078125, -0.44140625, -0.0789794921875, 0.283447265625, 0.6458740234375, 1.00830078125, 1.3707275390625, 1.733154296875, 2.0955810546875, 2.4580078125, 2.8204345703125, 3.182861328125, 3.5452880859375, 3.90771484375, 4.2701416015625, 4.632568359375, 4.9949951171875, 5.357421875, 5.7198486328125, 6.082275390625, 6.4447021484375, 6.80712890625, 7.1695556640625, 7.531982421875, 7.8944091796875, 8.2568359375, 8.6192626953125, 8.981689453125, 9.3441162109375, 9.70654296875, 10.0689697265625, 10.431396484375, 10.7938232421875, 11.15625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 1.0, 5.0, 10.0, 14.0, 21.0, 34.0, 53.0, 128.0, 313.0, 1663.0, 1309.0, 270.0, 129.0, 58.0, 36.0, 20.0, 5.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.83984375, -6.6910400390625, -6.542236328125, -6.3934326171875, -6.24462890625, -6.0958251953125, -5.947021484375, -5.7982177734375, -5.6494140625, -5.5006103515625, -5.351806640625, -5.2030029296875, -5.05419921875, -4.9053955078125, -4.756591796875, -4.6077880859375, -4.458984375, -4.3101806640625, -4.161376953125, -4.0125732421875, -3.86376953125, -3.7149658203125, -3.566162109375, -3.4173583984375, -3.2685546875, -3.1197509765625, -2.970947265625, -2.8221435546875, -2.67333984375, -2.5245361328125, -2.375732421875, -2.2269287109375, -2.078125, -1.9293212890625, -1.780517578125, -1.6317138671875, -1.48291015625, -1.3341064453125, -1.185302734375, -1.0364990234375, -0.8876953125, -0.7388916015625, -0.590087890625, -0.4412841796875, -0.29248046875, -0.1436767578125, 0.005126953125, 0.1539306640625, 0.302734375, 0.4515380859375, 0.600341796875, 0.7491455078125, 0.89794921875, 1.0467529296875, 1.195556640625, 1.3443603515625, 1.4931640625, 1.6419677734375, 1.790771484375, 1.9395751953125, 2.08837890625, 2.2371826171875, 2.385986328125, 2.5347900390625, 2.68359375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 7.0, 4.0, 8.0, 15.0, 22.0, 33.0, 60.0, 75.0, 121.0, 101.0, 126.0, 119.0, 83.0, 71.0, 57.0, 36.0, 20.0, 13.0, 11.0, 6.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.09473419189453, -17.541763305664062, -16.988794326782227, -16.435823440551758, -15.882853507995605, -15.329883575439453, -14.7769136428833, -14.223943710327148, -13.67097282409668, -13.118002891540527, -12.565032958984375, -12.012062072753906, -11.459092140197754, -10.906122207641602, -10.35315227508545, -9.800182342529297, -9.247212409973145, -8.694242477416992, -8.14127254486084, -7.588302135467529, -7.035331726074219, -6.482361793518066, -5.929391860961914, -5.376421928405762, -4.823451519012451, -4.270481586456299, -3.7175111770629883, -3.164541244506836, -2.6115710735321045, -2.058600902557373, -1.5056309700012207, -0.9526607990264893, -0.3996906280517578, 0.15327948331832886, 0.7062495946884155, 1.2592196464538574, 1.8121898174285889, 2.3651599884033203, 2.9181299209594727, 3.471100091934204, 4.0240702629089355, 4.577040195465088, 5.130010604858398, 5.682980537414551, 6.235950469970703, 6.788920879364014, 7.341890811920166, 7.894861221313477, 8.447831153869629, 9.000801086425781, 9.553771018981934, 10.106740951538086, 10.659711837768555, 11.212681770324707, 11.76565170288086, 12.318621635437012, 12.871591567993164, 13.424561500549316, 13.977531433105469, 14.530502319335938, 15.08347225189209, 15.636442184448242, 16.189411163330078, 16.742382049560547, 17.295352935791016]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 3.0, 2.0, 5.0, 7.0, 4.0, 2.0, 6.0, 8.0, 13.0, 8.0, 11.0, 16.0, 20.0, 18.0, 32.0, 19.0, 32.0, 32.0, 32.0, 40.0, 30.0, 53.0, 48.0, 57.0, 46.0, 35.0, 39.0, 44.0, 41.0, 37.0, 42.0, 33.0, 28.0, 34.0, 26.0, 20.0, 17.0, 11.0, 9.0, 10.0, 7.0, 3.0, 8.0, 6.0, 5.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.39480972290039, -8.118570327758789, -7.842330455780029, -7.5660905838012695, -7.289851188659668, -7.013611316680908, -6.737371444702148, -6.461132049560547, -6.184892654418945, -5.9086527824401855, -5.632413387298584, -5.356173515319824, -5.079934120178223, -4.803694248199463, -4.527454376220703, -4.251214981079102, -3.974975109100342, -3.698735475540161, -3.4224958419799805, -3.1462559700012207, -2.870016574859619, -2.5937767028808594, -2.3175370693206787, -2.041297435760498, -1.7650578022003174, -1.4888181686401367, -1.212578535079956, -0.9363387823104858, -0.6600991487503052, -0.3838595151901245, -0.1076197624206543, 0.16861987113952637, 0.44485950469970703, 0.7210991382598877, 0.9973388314247131, 1.2735785245895386, 1.5498181581497192, 1.8260577917099, 2.10229754447937, 2.378537178039551, 2.6547768115997314, 2.931016445159912, 3.2072560787200928, 3.4834957122802734, 3.759735584259033, 4.035974979400635, 4.3122148513793945, 4.588454246520996, 4.864694118499756, 5.140933990478516, 5.417173385620117, 5.693413257598877, 5.9696526527404785, 6.245892524719238, 6.52213191986084, 6.7983717918396, 7.074611663818359, 7.350851535797119, 7.627090930938721, 7.9033308029174805, 8.179570198059082, 8.455809593200684, 8.732049942016602, 9.008289337158203, 9.284528732299805]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 11.0, 12.0, 10.0, 19.0, 20.0, 37.0, 64.0, 103.0, 151.0, 251.0, 504.0, 930.0, 2007.0, 5323.0, 18215.0, 82022.0, 578219.0, 293490.0, 48561.0, 11587.0, 3781.0, 1506.0, 761.0, 375.0, 217.0, 139.0, 80.0, 52.0, 32.0, 26.0, 15.0, 15.0, 11.0, 3.0, 2.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.4453125, -15.0142822265625, -14.583251953125, -14.1522216796875, -13.72119140625, -13.2901611328125, -12.859130859375, -12.4281005859375, -11.9970703125, -11.5660400390625, -11.135009765625, -10.7039794921875, -10.27294921875, -9.8419189453125, -9.410888671875, -8.9798583984375, -8.548828125, -8.1177978515625, -7.686767578125, -7.2557373046875, -6.82470703125, -6.3936767578125, -5.962646484375, -5.5316162109375, -5.1005859375, -4.6695556640625, -4.238525390625, -3.8074951171875, -3.37646484375, -2.9454345703125, -2.514404296875, -2.0833740234375, -1.65234375, -1.2213134765625, -0.790283203125, -0.3592529296875, 0.07177734375, 0.5028076171875, 0.933837890625, 1.3648681640625, 1.7958984375, 2.2269287109375, 2.657958984375, 3.0889892578125, 3.52001953125, 3.9510498046875, 4.382080078125, 4.8131103515625, 5.244140625, 5.6751708984375, 6.106201171875, 6.5372314453125, 6.96826171875, 7.3992919921875, 7.830322265625, 8.2613525390625, 8.6923828125, 9.1234130859375, 9.554443359375, 9.9854736328125, 10.41650390625, 10.8475341796875, 11.278564453125, 11.7095947265625, 12.140625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 0.0, 4.0, 7.0, 5.0, 16.0, 12.0, 17.0, 33.0, 43.0, 40.0, 70.0, 73.0, 70.0, 69.0, 80.0, 89.0, 76.0, 63.0, 47.0, 50.0, 34.0, 32.0, 27.0, 12.0, 9.0, 12.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.888671875, -2.8170623779296875, -2.745452880859375, -2.6738433837890625, -2.60223388671875, -2.5306243896484375, -2.459014892578125, -2.3874053955078125, -2.3157958984375, -2.2441864013671875, -2.172576904296875, -2.1009674072265625, -2.02935791015625, -1.9577484130859375, -1.886138916015625, -1.8145294189453125, -1.742919921875, -1.6713104248046875, -1.599700927734375, -1.5280914306640625, -1.45648193359375, -1.3848724365234375, -1.313262939453125, -1.2416534423828125, -1.1700439453125, -1.0984344482421875, -1.026824951171875, -0.9552154541015625, -0.88360595703125, -0.8119964599609375, -0.740386962890625, -0.6687774658203125, -0.59716796875, -0.5255584716796875, -0.453948974609375, -0.3823394775390625, -0.31072998046875, -0.2391204833984375, -0.167510986328125, -0.0959014892578125, -0.0242919921875, 0.0473175048828125, 0.118927001953125, 0.1905364990234375, 0.26214599609375, 0.3337554931640625, 0.405364990234375, 0.4769744873046875, 0.548583984375, 0.6201934814453125, 0.691802978515625, 0.7634124755859375, 0.83502197265625, 0.9066314697265625, 0.978240966796875, 1.0498504638671875, 1.1214599609375, 1.1930694580078125, 1.264678955078125, 1.3362884521484375, 1.40789794921875, 1.4795074462890625, 1.551116943359375, 1.6227264404296875, 1.6943359375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 6.0, 8.0, 3.0, 10.0, 13.0, 17.0, 23.0, 36.0, 45.0, 73.0, 104.0, 134.0, 242.0, 456.0, 818.0, 1539.0, 3182.0, 6788.0, 15174.0, 35635.0, 88049.0, 250192.0, 398539.0, 147490.0, 56338.0, 23652.0, 10358.0, 4732.0, 2233.0, 1151.0, 629.0, 347.0, 183.0, 116.0, 76.0, 44.0, 31.0, 25.0, 18.0, 18.0, 8.0, 7.0, 3.0, 4.0, 4.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.62109375, -4.4683837890625, -4.315673828125, -4.1629638671875, -4.01025390625, -3.8575439453125, -3.704833984375, -3.5521240234375, -3.3994140625, -3.2467041015625, -3.093994140625, -2.9412841796875, -2.78857421875, -2.6358642578125, -2.483154296875, -2.3304443359375, -2.177734375, -2.0250244140625, -1.872314453125, -1.7196044921875, -1.56689453125, -1.4141845703125, -1.261474609375, -1.1087646484375, -0.9560546875, -0.8033447265625, -0.650634765625, -0.4979248046875, -0.34521484375, -0.1925048828125, -0.039794921875, 0.1129150390625, 0.265625, 0.4183349609375, 0.571044921875, 0.7237548828125, 0.87646484375, 1.0291748046875, 1.181884765625, 1.3345947265625, 1.4873046875, 1.6400146484375, 1.792724609375, 1.9454345703125, 2.09814453125, 2.2508544921875, 2.403564453125, 2.5562744140625, 2.708984375, 2.8616943359375, 3.014404296875, 3.1671142578125, 3.31982421875, 3.4725341796875, 3.625244140625, 3.7779541015625, 3.9306640625, 4.0833740234375, 4.236083984375, 4.3887939453125, 4.54150390625, 4.6942138671875, 4.846923828125, 4.9996337890625, 5.15234375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 7.0, 6.0, 7.0, 12.0, 13.0, 14.0, 8.0, 17.0, 18.0, 21.0, 18.0, 31.0, 37.0, 37.0, 33.0, 51.0, 42.0, 44.0, 42.0, 48.0, 47.0, 43.0, 43.0, 32.0, 27.0, 36.0, 29.0, 35.0, 29.0, 22.0, 30.0, 21.0, 16.0, 12.0, 13.0, 12.0, 11.0, 10.0, 5.0, 6.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-5.59765625, -5.4412841796875, -5.284912109375, -5.1285400390625, -4.97216796875, -4.8157958984375, -4.659423828125, -4.5030517578125, -4.3466796875, -4.1903076171875, -4.033935546875, -3.8775634765625, -3.72119140625, -3.5648193359375, -3.408447265625, -3.2520751953125, -3.095703125, -2.9393310546875, -2.782958984375, -2.6265869140625, -2.47021484375, -2.3138427734375, -2.157470703125, -2.0010986328125, -1.8447265625, -1.6883544921875, -1.531982421875, -1.3756103515625, -1.21923828125, -1.0628662109375, -0.906494140625, -0.7501220703125, -0.59375, -0.4373779296875, -0.281005859375, -0.1246337890625, 0.03173828125, 0.1881103515625, 0.344482421875, 0.5008544921875, 0.6572265625, 0.8135986328125, 0.969970703125, 1.1263427734375, 1.28271484375, 1.4390869140625, 1.595458984375, 1.7518310546875, 1.908203125, 2.0645751953125, 2.220947265625, 2.3773193359375, 2.53369140625, 2.6900634765625, 2.846435546875, 3.0028076171875, 3.1591796875, 3.3155517578125, 3.471923828125, 3.6282958984375, 3.78466796875, 3.9410400390625, 4.097412109375, 4.2537841796875, 4.41015625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 4.0, 1.0, 3.0, 8.0, 5.0, 7.0, 7.0, 16.0, 20.0, 33.0, 38.0, 45.0, 57.0, 86.0, 167.0, 191.0, 366.0, 699.0, 1405.0, 2978.0, 7169.0, 19374.0, 60546.0, 274749.0, 505403.0, 121845.0, 32669.0, 11730.0, 4624.0, 1963.0, 971.0, 507.0, 294.0, 180.0, 117.0, 75.0, 54.0, 34.0, 24.0, 25.0, 22.0, 10.0, 12.0, 8.0, 4.0, 3.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.470703125, -2.396392822265625, -2.32208251953125, -2.247772216796875, -2.1734619140625, -2.099151611328125, -2.02484130859375, -1.950531005859375, -1.876220703125, -1.801910400390625, -1.72760009765625, -1.653289794921875, -1.5789794921875, -1.504669189453125, -1.43035888671875, -1.356048583984375, -1.28173828125, -1.207427978515625, -1.13311767578125, -1.058807373046875, -0.9844970703125, -0.910186767578125, -0.83587646484375, -0.761566162109375, -0.687255859375, -0.612945556640625, -0.53863525390625, -0.464324951171875, -0.3900146484375, -0.315704345703125, -0.24139404296875, -0.167083740234375, -0.0927734375, -0.018463134765625, 0.05584716796875, 0.130157470703125, 0.2044677734375, 0.278778076171875, 0.35308837890625, 0.427398681640625, 0.501708984375, 0.576019287109375, 0.65032958984375, 0.724639892578125, 0.7989501953125, 0.873260498046875, 0.94757080078125, 1.021881103515625, 1.09619140625, 1.170501708984375, 1.24481201171875, 1.319122314453125, 1.3934326171875, 1.467742919921875, 1.54205322265625, 1.616363525390625, 1.690673828125, 1.764984130859375, 1.83929443359375, 1.913604736328125, 1.9879150390625, 2.062225341796875, 2.13653564453125, 2.210845947265625, 2.28515625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 3.0, 5.0, 4.0, 7.0, 11.0, 7.0, 17.0, 15.0, 29.0, 46.0, 92.0, 205.0, 263.0, 122.0, 65.0, 24.0, 22.0, 17.0, 9.0, 15.0, 5.0, 4.0, 3.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00052642822265625, -0.0005025863647460938, -0.0004787445068359375, -0.00045490264892578125, -0.000431060791015625, -0.00040721893310546875, -0.0003833770751953125, -0.00035953521728515625, -0.000335693359375, -0.00031185150146484375, -0.0002880096435546875, -0.00026416778564453125, -0.000240325927734375, -0.00021648406982421875, -0.0001926422119140625, -0.00016880035400390625, -0.00014495849609375, -0.00012111663818359375, -9.72747802734375e-05, -7.343292236328125e-05, -4.9591064453125e-05, -2.574920654296875e-05, -1.9073486328125e-06, 2.193450927734375e-05, 4.57763671875e-05, 6.961822509765625e-05, 9.34600830078125e-05, 0.00011730194091796875, 0.000141143798828125, 0.00016498565673828125, 0.0001888275146484375, 0.00021266937255859375, 0.00023651123046875, 0.00026035308837890625, 0.0002841949462890625, 0.00030803680419921875, 0.000331878662109375, 0.00035572052001953125, 0.0003795623779296875, 0.00040340423583984375, 0.00042724609375, 0.00045108795166015625, 0.0004749298095703125, 0.0004987716674804688, 0.000522613525390625, 0.0005464553833007812, 0.0005702972412109375, 0.0005941390991210938, 0.00061798095703125, 0.0006418228149414062, 0.0006656646728515625, 0.0006895065307617188, 0.000713348388671875, 0.0007371902465820312, 0.0007610321044921875, 0.0007848739624023438, 0.0008087158203125, 0.0008325576782226562, 0.0008563995361328125, 0.0008802413940429688, 0.000904083251953125, 0.0009279251098632812, 0.0009517669677734375, 0.0009756088256835938, 0.00099945068359375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 2.0, 5.0, 6.0, 12.0, 19.0, 18.0, 30.0, 35.0, 48.0, 97.0, 126.0, 205.0, 331.0, 512.0, 1125.0, 2591.0, 6642.0, 18620.0, 64991.0, 423369.0, 432428.0, 66533.0, 19076.0, 6571.0, 2575.0, 1164.0, 556.0, 313.0, 185.0, 114.0, 86.0, 47.0, 35.0, 21.0, 19.0, 11.0, 11.0, 11.0, 5.0, 2.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.71875, -2.628143310546875, -2.53753662109375, -2.446929931640625, -2.3563232421875, -2.265716552734375, -2.17510986328125, -2.084503173828125, -1.993896484375, -1.903289794921875, -1.81268310546875, -1.722076416015625, -1.6314697265625, -1.540863037109375, -1.45025634765625, -1.359649658203125, -1.26904296875, -1.178436279296875, -1.08782958984375, -0.997222900390625, -0.9066162109375, -0.816009521484375, -0.72540283203125, -0.634796142578125, -0.544189453125, -0.453582763671875, -0.36297607421875, -0.272369384765625, -0.1817626953125, -0.091156005859375, -0.00054931640625, 0.090057373046875, 0.1806640625, 0.271270751953125, 0.36187744140625, 0.452484130859375, 0.5430908203125, 0.633697509765625, 0.72430419921875, 0.814910888671875, 0.905517578125, 0.996124267578125, 1.08673095703125, 1.177337646484375, 1.2679443359375, 1.358551025390625, 1.44915771484375, 1.539764404296875, 1.63037109375, 1.720977783203125, 1.81158447265625, 1.902191162109375, 1.9927978515625, 2.083404541015625, 2.17401123046875, 2.264617919921875, 2.355224609375, 2.445831298828125, 2.53643798828125, 2.627044677734375, 2.7176513671875, 2.808258056640625, 2.89886474609375, 2.989471435546875, 3.080078125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 10.0, 9.0, 4.0, 12.0, 17.0, 24.0, 46.0, 90.0, 136.0, 166.0, 190.0, 105.0, 63.0, 43.0, 17.0, 23.0, 11.0, 9.0, 8.0, 5.0, 2.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.00390625, -3.895477294921875, -3.78704833984375, -3.678619384765625, -3.5701904296875, -3.461761474609375, -3.35333251953125, -3.244903564453125, -3.136474609375, -3.028045654296875, -2.91961669921875, -2.811187744140625, -2.7027587890625, -2.594329833984375, -2.48590087890625, -2.377471923828125, -2.26904296875, -2.160614013671875, -2.05218505859375, -1.943756103515625, -1.8353271484375, -1.726898193359375, -1.61846923828125, -1.510040283203125, -1.401611328125, -1.293182373046875, -1.18475341796875, -1.076324462890625, -0.9678955078125, -0.859466552734375, -0.75103759765625, -0.642608642578125, -0.5341796875, -0.425750732421875, -0.31732177734375, -0.208892822265625, -0.1004638671875, 0.007965087890625, 0.11639404296875, 0.224822998046875, 0.333251953125, 0.441680908203125, 0.55010986328125, 0.658538818359375, 0.7669677734375, 0.875396728515625, 0.98382568359375, 1.092254638671875, 1.20068359375, 1.309112548828125, 1.41754150390625, 1.525970458984375, 1.6343994140625, 1.742828369140625, 1.85125732421875, 1.959686279296875, 2.068115234375, 2.176544189453125, 2.28497314453125, 2.393402099609375, 2.5018310546875, 2.610260009765625, 2.71868896484375, 2.827117919921875, 2.935546875]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 3.0, 5.0, 2.0, 5.0, 8.0, 21.0, 24.0, 53.0, 41.0, 49.0, 78.0, 95.0, 89.0, 92.0, 89.0, 85.0, 69.0, 47.0, 39.0, 29.0, 23.0, 16.0, 13.0, 6.0, 6.0, 5.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.245548248291016, -28.248075485229492, -27.250600814819336, -26.253128051757812, -25.255653381347656, -24.258180618286133, -23.260705947875977, -22.263233184814453, -21.265758514404297, -20.268285751342773, -19.270811080932617, -18.273338317871094, -17.275863647460938, -16.278390884399414, -15.280916213989258, -14.283443450927734, -13.285969734191895, -12.288496017456055, -11.291022300720215, -10.293548583984375, -9.296074867248535, -8.298601150512695, -7.301127910614014, -6.303654193878174, -5.306180477142334, -4.308706760406494, -3.3112330436706543, -2.3137595653533936, -1.3162858486175537, -0.31881237030029297, 0.6786613464355469, 1.6761350631713867, 2.6736087799072266, 3.6710824966430664, 4.668556213378906, 5.666029930114746, 6.663503646850586, 7.660976886749268, 8.658451080322266, 9.655923843383789, 10.653398513793945, 11.650872230529785, 12.648345947265625, 13.645819664001465, 14.643293380737305, 15.640766143798828, 16.638240814208984, 17.635713577270508, 18.63318634033203, 19.630659103393555, 20.62813377380371, 21.625606536865234, 22.62308120727539, 23.620553970336914, 24.61802864074707, 25.615501403808594, 26.61297607421875, 27.610448837280273, 28.60792350769043, 29.605396270751953, 30.60287094116211, 31.600343704223633, 32.597816467285156, 33.59529113769531, 34.59276580810547]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 3.0, 2.0, 10.0, 2.0, 10.0, 18.0, 15.0, 21.0, 15.0, 28.0, 44.0, 43.0, 44.0, 40.0, 48.0, 51.0, 55.0, 57.0, 57.0, 57.0, 60.0, 56.0, 34.0, 32.0, 37.0, 35.0, 34.0, 17.0, 14.0, 17.0, 20.0, 11.0, 3.0, 7.0, 4.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.37845802307129, -28.3885555267334, -27.398653030395508, -26.40875244140625, -25.41884994506836, -24.42894744873047, -23.439044952392578, -22.449142456054688, -21.459239959716797, -20.469337463378906, -19.479434967041016, -18.489532470703125, -17.499631881713867, -16.509729385375977, -15.519826889038086, -14.529924392700195, -13.540023803710938, -12.550121307373047, -11.560219764709473, -10.570317268371582, -9.580415725708008, -8.590513229370117, -7.600610733032227, -6.610708713531494, -5.620806694030762, -4.630904674530029, -3.6410024166107178, -2.6511001586914062, -1.6611981391906738, -0.6712961196899414, 0.3186063766479492, 1.3085083961486816, 2.298412322998047, 3.2883143424987793, 4.278216361999512, 5.268118858337402, 6.258020877838135, 7.247922897338867, 8.237825393676758, 9.227727890014648, 10.217629432678223, 11.207531929016113, 12.197433471679688, 13.187335968017578, 14.177238464355469, 15.167140007019043, 16.15704345703125, 17.146944046020508, 18.1368465423584, 19.12674903869629, 20.11665153503418, 21.106552124023438, 22.096454620361328, 23.08635711669922, 24.07625961303711, 25.066162109375, 26.05606460571289, 27.04596710205078, 28.035869598388672, 29.025772094726562, 30.01567268371582, 31.00557518005371, 31.9954776763916, 32.98537826538086, 33.97528076171875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 8.0, 4.0, 11.0, 8.0, 9.0, 14.0, 8.0, 23.0, 30.0, 43.0, 73.0, 102.0, 150.0, 241.0, 381.0, 786.0, 1517.0, 3329.0, 8932.0, 35865.0, 500005.0, 3564446.0, 58587.0, 12171.0, 4096.0, 1609.0, 802.0, 406.0, 225.0, 152.0, 73.0, 58.0, 39.0, 30.0, 16.0, 12.0, 8.0, 4.0, 5.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-22.75, -22.18310546875, -21.6162109375, -21.04931640625, -20.482421875, -19.91552734375, -19.3486328125, -18.78173828125, -18.21484375, -17.64794921875, -17.0810546875, -16.51416015625, -15.947265625, -15.38037109375, -14.8134765625, -14.24658203125, -13.6796875, -13.11279296875, -12.5458984375, -11.97900390625, -11.412109375, -10.84521484375, -10.2783203125, -9.71142578125, -9.14453125, -8.57763671875, -8.0107421875, -7.44384765625, -6.876953125, -6.31005859375, -5.7431640625, -5.17626953125, -4.609375, -4.04248046875, -3.4755859375, -2.90869140625, -2.341796875, -1.77490234375, -1.2080078125, -0.64111328125, -0.07421875, 0.49267578125, 1.0595703125, 1.62646484375, 2.193359375, 2.76025390625, 3.3271484375, 3.89404296875, 4.4609375, 5.02783203125, 5.5947265625, 6.16162109375, 6.728515625, 7.29541015625, 7.8623046875, 8.42919921875, 8.99609375, 9.56298828125, 10.1298828125, 10.69677734375, 11.263671875, 11.83056640625, 12.3974609375, 12.96435546875, 13.53125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 6.0, 11.0, 19.0, 18.0, 21.0, 33.0, 39.0, 52.0, 56.0, 62.0, 72.0, 75.0, 70.0, 79.0, 68.0, 69.0, 53.0, 54.0, 32.0, 32.0, 26.0, 11.0, 5.0, 12.0, 8.0, 9.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.849609375, -2.778839111328125, -2.70806884765625, -2.637298583984375, -2.5665283203125, -2.495758056640625, -2.42498779296875, -2.354217529296875, -2.283447265625, -2.212677001953125, -2.14190673828125, -2.071136474609375, -2.0003662109375, -1.929595947265625, -1.85882568359375, -1.788055419921875, -1.71728515625, -1.646514892578125, -1.57574462890625, -1.504974365234375, -1.4342041015625, -1.363433837890625, -1.29266357421875, -1.221893310546875, -1.151123046875, -1.080352783203125, -1.00958251953125, -0.938812255859375, -0.8680419921875, -0.797271728515625, -0.72650146484375, -0.655731201171875, -0.5849609375, -0.514190673828125, -0.44342041015625, -0.372650146484375, -0.3018798828125, -0.231109619140625, -0.16033935546875, -0.089569091796875, -0.018798828125, 0.051971435546875, 0.12274169921875, 0.193511962890625, 0.2642822265625, 0.335052490234375, 0.40582275390625, 0.476593017578125, 0.54736328125, 0.618133544921875, 0.68890380859375, 0.759674072265625, 0.8304443359375, 0.901214599609375, 0.97198486328125, 1.042755126953125, 1.113525390625, 1.184295654296875, 1.25506591796875, 1.325836181640625, 1.3966064453125, 1.467376708984375, 1.53814697265625, 1.608917236328125, 1.6796875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 7.0, 5.0, 2.0, 7.0, 9.0, 9.0, 10.0, 11.0, 27.0, 31.0, 46.0, 72.0, 100.0, 174.0, 305.0, 586.0, 1195.0, 2914.0, 9276.0, 44776.0, 665968.0, 3372312.0, 76100.0, 13408.0, 3851.0, 1457.0, 668.0, 342.0, 220.0, 123.0, 81.0, 56.0, 39.0, 32.0, 19.0, 14.0, 11.0, 5.0, 8.0, 0.0, 7.0, 1.0, 4.0, 6.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.2109375, -10.8388671875, -10.466796875, -10.0947265625, -9.72265625, -9.3505859375, -8.978515625, -8.6064453125, -8.234375, -7.8623046875, -7.490234375, -7.1181640625, -6.74609375, -6.3740234375, -6.001953125, -5.6298828125, -5.2578125, -4.8857421875, -4.513671875, -4.1416015625, -3.76953125, -3.3974609375, -3.025390625, -2.6533203125, -2.28125, -1.9091796875, -1.537109375, -1.1650390625, -0.79296875, -0.4208984375, -0.048828125, 0.3232421875, 0.6953125, 1.0673828125, 1.439453125, 1.8115234375, 2.18359375, 2.5556640625, 2.927734375, 3.2998046875, 3.671875, 4.0439453125, 4.416015625, 4.7880859375, 5.16015625, 5.5322265625, 5.904296875, 6.2763671875, 6.6484375, 7.0205078125, 7.392578125, 7.7646484375, 8.13671875, 8.5087890625, 8.880859375, 9.2529296875, 9.625, 9.9970703125, 10.369140625, 10.7412109375, 11.11328125, 11.4853515625, 11.857421875, 12.2294921875, 12.6015625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 3.0, 5.0, 7.0, 6.0, 9.0, 16.0, 29.0, 36.0, 49.0, 87.0, 161.0, 461.0, 2110.0, 584.0, 193.0, 113.0, 63.0, 43.0, 35.0, 20.0, 10.0, 11.0, 7.0, 2.0, 4.0, 3.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.54296875, -2.435302734375, -2.32763671875, -2.219970703125, -2.1123046875, -2.004638671875, -1.89697265625, -1.789306640625, -1.681640625, -1.573974609375, -1.46630859375, -1.358642578125, -1.2509765625, -1.143310546875, -1.03564453125, -0.927978515625, -0.8203125, -0.712646484375, -0.60498046875, -0.497314453125, -0.3896484375, -0.281982421875, -0.17431640625, -0.066650390625, 0.041015625, 0.148681640625, 0.25634765625, 0.364013671875, 0.4716796875, 0.579345703125, 0.68701171875, 0.794677734375, 0.90234375, 1.010009765625, 1.11767578125, 1.225341796875, 1.3330078125, 1.440673828125, 1.54833984375, 1.656005859375, 1.763671875, 1.871337890625, 1.97900390625, 2.086669921875, 2.1943359375, 2.302001953125, 2.40966796875, 2.517333984375, 2.625, 2.732666015625, 2.84033203125, 2.947998046875, 3.0556640625, 3.163330078125, 3.27099609375, 3.378662109375, 3.486328125, 3.593994140625, 3.70166015625, 3.809326171875, 3.9169921875, 4.024658203125, 4.13232421875, 4.239990234375, 4.34765625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 8.0, 4.0, 10.0, 17.0, 40.0, 103.0, 167.0, 206.0, 189.0, 125.0, 57.0, 41.0, 14.0, 7.0, 7.0, 4.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.32994842529297, -21.462066650390625, -20.59418487548828, -19.726303100585938, -18.858421325683594, -17.99053955078125, -17.122657775878906, -16.254777908325195, -15.386896133422852, -14.519014358520508, -13.651132583618164, -12.78325080871582, -11.915369987487793, -11.04748821258545, -10.179606437683105, -9.311725616455078, -8.443842887878418, -7.575961112976074, -6.708079814910889, -5.840198040008545, -4.972316741943359, -4.104434967041016, -3.236553192138672, -2.3686718940734863, -1.5007901191711426, -0.6329085230827332, 0.23497307300567627, 1.1028547286987305, 1.9707362651824951, 2.8386178016662598, 3.7064995765686035, 4.574380874633789, 5.442262649536133, 6.310144424438477, 7.178025722503662, 8.045907974243164, 8.913788795471191, 9.781670570373535, 10.649552345275879, 11.517433166503906, 12.38531494140625, 13.253196716308594, 14.121078491210938, 14.988960266113281, 15.856841087341309, 16.72472381591797, 17.592605590820312, 18.460485458374023, 19.328369140625, 20.196250915527344, 21.064132690429688, 21.93201446533203, 22.799896240234375, 23.66777801513672, 24.535659790039062, 25.403539657592773, 26.271421432495117, 27.13930320739746, 28.007184982299805, 28.87506675720215, 29.742948532104492, 30.610828399658203, 31.478710174560547, 32.34659194946289, 33.214473724365234]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 11.0, 2.0, 7.0, 12.0, 5.0, 7.0, 12.0, 16.0, 18.0, 14.0, 20.0, 33.0, 18.0, 34.0, 30.0, 33.0, 39.0, 39.0, 35.0, 37.0, 39.0, 41.0, 45.0, 32.0, 60.0, 30.0, 42.0, 39.0, 37.0, 42.0, 16.0, 25.0, 20.0, 17.0, 13.0, 17.0, 10.0, 12.0, 12.0, 4.0, 10.0, 8.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 3.0], "bins": [-8.11983585357666, -7.871512413024902, -7.6231889724731445, -7.374865531921387, -7.126542091369629, -6.878218650817871, -6.629895210266113, -6.3815717697143555, -6.133248329162598, -5.88492488861084, -5.636601448059082, -5.388278007507324, -5.139954566955566, -4.891631126403809, -4.643307685852051, -4.394984245300293, -4.146660327911377, -3.898336887359619, -3.6500134468078613, -3.4016900062561035, -3.1533665657043457, -2.905043125152588, -2.656719446182251, -2.408396005630493, -2.1600725650787354, -1.9117491245269775, -1.6634256839752197, -1.4151021242141724, -1.1667786836624146, -0.9184552431106567, -0.6701316833496094, -0.42180824279785156, -0.17348527908325195, 0.07483819127082825, 0.32316166162490845, 0.571485161781311, 0.8198086023330688, 1.0681320428848267, 1.316455602645874, 1.5647790431976318, 1.8131024837493896, 2.0614259243011475, 2.3097493648529053, 2.558073043823242, 2.806396484375, 3.054719924926758, 3.3030433654785156, 3.5513668060302734, 3.7996902465820312, 4.048013687133789, 4.296337127685547, 4.544660568237305, 4.7929840087890625, 5.04130744934082, 5.289630889892578, 5.537954330444336, 5.786277770996094, 6.034601211547852, 6.282924652099609, 6.531248092651367, 6.779571533203125, 7.027894973754883, 7.276218414306641, 7.524541854858398, 7.7728657722473145]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 8.0, 7.0, 4.0, 8.0, 29.0, 32.0, 55.0, 85.0, 86.0, 160.0, 273.0, 484.0, 944.0, 1765.0, 3979.0, 10487.0, 35435.0, 143822.0, 482953.0, 271863.0, 66756.0, 17899.0, 6081.0, 2487.0, 1198.0, 630.0, 366.0, 242.0, 123.0, 81.0, 65.0, 43.0, 30.0, 21.0, 11.0, 7.0, 11.0, 12.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.5, -10.1583251953125, -9.816650390625, -9.4749755859375, -9.13330078125, -8.7916259765625, -8.449951171875, -8.1082763671875, -7.7666015625, -7.4249267578125, -7.083251953125, -6.7415771484375, -6.39990234375, -6.0582275390625, -5.716552734375, -5.3748779296875, -5.033203125, -4.6915283203125, -4.349853515625, -4.0081787109375, -3.66650390625, -3.3248291015625, -2.983154296875, -2.6414794921875, -2.2998046875, -1.9581298828125, -1.616455078125, -1.2747802734375, -0.93310546875, -0.5914306640625, -0.249755859375, 0.0919189453125, 0.43359375, 0.7752685546875, 1.116943359375, 1.4586181640625, 1.80029296875, 2.1419677734375, 2.483642578125, 2.8253173828125, 3.1669921875, 3.5086669921875, 3.850341796875, 4.1920166015625, 4.53369140625, 4.8753662109375, 5.217041015625, 5.5587158203125, 5.900390625, 6.2420654296875, 6.583740234375, 6.9254150390625, 7.26708984375, 7.6087646484375, 7.950439453125, 8.2921142578125, 8.6337890625, 8.9754638671875, 9.317138671875, 9.6588134765625, 10.00048828125, 10.3421630859375, 10.683837890625, 11.0255126953125, 11.3671875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 4.0, 7.0, 8.0, 9.0, 19.0, 21.0, 28.0, 41.0, 47.0, 67.0, 50.0, 74.0, 79.0, 73.0, 74.0, 73.0, 76.0, 50.0, 42.0, 43.0, 37.0, 22.0, 13.0, 20.0, 7.0, 7.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.990234375, -2.9163818359375, -2.842529296875, -2.7686767578125, -2.69482421875, -2.6209716796875, -2.547119140625, -2.4732666015625, -2.3994140625, -2.3255615234375, -2.251708984375, -2.1778564453125, -2.10400390625, -2.0301513671875, -1.956298828125, -1.8824462890625, -1.80859375, -1.7347412109375, -1.660888671875, -1.5870361328125, -1.51318359375, -1.4393310546875, -1.365478515625, -1.2916259765625, -1.2177734375, -1.1439208984375, -1.070068359375, -0.9962158203125, -0.92236328125, -0.8485107421875, -0.774658203125, -0.7008056640625, -0.626953125, -0.5531005859375, -0.479248046875, -0.4053955078125, -0.33154296875, -0.2576904296875, -0.183837890625, -0.1099853515625, -0.0361328125, 0.0377197265625, 0.111572265625, 0.1854248046875, 0.25927734375, 0.3331298828125, 0.406982421875, 0.4808349609375, 0.5546875, 0.6285400390625, 0.702392578125, 0.7762451171875, 0.85009765625, 0.9239501953125, 0.997802734375, 1.0716552734375, 1.1455078125, 1.2193603515625, 1.293212890625, 1.3670654296875, 1.44091796875, 1.5147705078125, 1.588623046875, 1.6624755859375, 1.736328125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 5.0, 8.0, 6.0, 12.0, 7.0, 12.0, 16.0, 20.0, 22.0, 44.0, 64.0, 103.0, 136.0, 248.0, 445.0, 880.0, 1666.0, 3990.0, 10416.0, 31562.0, 104323.0, 317841.0, 378091.0, 135559.0, 40813.0, 13310.0, 4853.0, 1944.0, 891.0, 501.0, 241.0, 195.0, 106.0, 72.0, 31.0, 33.0, 24.0, 12.0, 21.0, 10.0, 11.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-6.46875, -6.27337646484375, -6.0780029296875, -5.88262939453125, -5.687255859375, -5.49188232421875, -5.2965087890625, -5.10113525390625, -4.90576171875, -4.71038818359375, -4.5150146484375, -4.31964111328125, -4.124267578125, -3.92889404296875, -3.7335205078125, -3.53814697265625, -3.3427734375, -3.14739990234375, -2.9520263671875, -2.75665283203125, -2.561279296875, -2.36590576171875, -2.1705322265625, -1.97515869140625, -1.77978515625, -1.58441162109375, -1.3890380859375, -1.19366455078125, -0.998291015625, -0.80291748046875, -0.6075439453125, -0.41217041015625, -0.216796875, -0.02142333984375, 0.1739501953125, 0.36932373046875, 0.564697265625, 0.76007080078125, 0.9554443359375, 1.15081787109375, 1.34619140625, 1.54156494140625, 1.7369384765625, 1.93231201171875, 2.127685546875, 2.32305908203125, 2.5184326171875, 2.71380615234375, 2.9091796875, 3.10455322265625, 3.2999267578125, 3.49530029296875, 3.690673828125, 3.88604736328125, 4.0814208984375, 4.27679443359375, 4.47216796875, 4.66754150390625, 4.8629150390625, 5.05828857421875, 5.253662109375, 5.44903564453125, 5.6444091796875, 5.83978271484375, 6.03515625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 0.0, 2.0, 4.0, 4.0, 2.0, 5.0, 7.0, 6.0, 8.0, 16.0, 17.0, 34.0, 32.0, 35.0, 43.0, 39.0, 45.0, 44.0, 60.0, 76.0, 50.0, 66.0, 56.0, 48.0, 63.0, 49.0, 34.0, 30.0, 32.0, 25.0, 19.0, 17.0, 10.0, 8.0, 7.0, 6.0, 3.0, 5.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.77734375, -7.51470947265625, -7.2520751953125, -6.98944091796875, -6.726806640625, -6.46417236328125, -6.2015380859375, -5.93890380859375, -5.67626953125, -5.41363525390625, -5.1510009765625, -4.88836669921875, -4.625732421875, -4.36309814453125, -4.1004638671875, -3.83782958984375, -3.5751953125, -3.31256103515625, -3.0499267578125, -2.78729248046875, -2.524658203125, -2.26202392578125, -1.9993896484375, -1.73675537109375, -1.47412109375, -1.21148681640625, -0.9488525390625, -0.68621826171875, -0.423583984375, -0.16094970703125, 0.1016845703125, 0.36431884765625, 0.626953125, 0.88958740234375, 1.1522216796875, 1.41485595703125, 1.677490234375, 1.94012451171875, 2.2027587890625, 2.46539306640625, 2.72802734375, 2.99066162109375, 3.2532958984375, 3.51593017578125, 3.778564453125, 4.04119873046875, 4.3038330078125, 4.56646728515625, 4.8291015625, 5.09173583984375, 5.3543701171875, 5.61700439453125, 5.879638671875, 6.14227294921875, 6.4049072265625, 6.66754150390625, 6.93017578125, 7.19281005859375, 7.4554443359375, 7.71807861328125, 7.980712890625, 8.24334716796875, 8.5059814453125, 8.76861572265625, 9.03125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 5.0, 7.0, 7.0, 10.0, 14.0, 27.0, 36.0, 48.0, 87.0, 117.0, 221.0, 410.0, 805.0, 2052.0, 5766.0, 19707.0, 90137.0, 601287.0, 264555.0, 45427.0, 11436.0, 3709.0, 1371.0, 581.0, 301.0, 158.0, 96.0, 66.0, 36.0, 28.0, 16.0, 13.0, 9.0, 5.0, 4.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.234375, -4.0762939453125, -3.918212890625, -3.7601318359375, -3.60205078125, -3.4439697265625, -3.285888671875, -3.1278076171875, -2.9697265625, -2.8116455078125, -2.653564453125, -2.4954833984375, -2.33740234375, -2.1793212890625, -2.021240234375, -1.8631591796875, -1.705078125, -1.5469970703125, -1.388916015625, -1.2308349609375, -1.07275390625, -0.9146728515625, -0.756591796875, -0.5985107421875, -0.4404296875, -0.2823486328125, -0.124267578125, 0.0338134765625, 0.19189453125, 0.3499755859375, 0.508056640625, 0.6661376953125, 0.82421875, 0.9822998046875, 1.140380859375, 1.2984619140625, 1.45654296875, 1.6146240234375, 1.772705078125, 1.9307861328125, 2.0888671875, 2.2469482421875, 2.405029296875, 2.5631103515625, 2.72119140625, 2.8792724609375, 3.037353515625, 3.1954345703125, 3.353515625, 3.5115966796875, 3.669677734375, 3.8277587890625, 3.98583984375, 4.1439208984375, 4.302001953125, 4.4600830078125, 4.6181640625, 4.7762451171875, 4.934326171875, 5.0924072265625, 5.25048828125, 5.4085693359375, 5.566650390625, 5.7247314453125, 5.8828125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 10.0, 10.0, 6.0, 19.0, 32.0, 29.0, 40.0, 71.0, 98.0, 136.0, 206.0, 90.0, 70.0, 51.0, 48.0, 35.0, 23.0, 8.0, 11.0, 1.0, 6.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006742477416992188, -0.0006486028432846069, -0.0006229579448699951, -0.0005973130464553833, -0.0005716681480407715, -0.0005460232496261597, -0.0005203783512115479, -0.000494733452796936, -0.0004690885543823242, -0.0004434436559677124, -0.0004177987575531006, -0.00039215385913848877, -0.00036650896072387695, -0.00034086406230926514, -0.0003152191638946533, -0.0002895742654800415, -0.0002639293670654297, -0.00023828446865081787, -0.00021263957023620605, -0.00018699467182159424, -0.00016134977340698242, -0.0001357048749923706, -0.00011005997657775879, -8.441507816314697e-05, -5.8770179748535156e-05, -3.312528133392334e-05, -7.4803829193115234e-06, 1.8164515495300293e-05, 4.380941390991211e-05, 6.945431232452393e-05, 9.509921073913574e-05, 0.00012074410915374756, 0.00014638900756835938, 0.0001720339059829712, 0.000197678804397583, 0.00022332370281219482, 0.00024896860122680664, 0.00027461349964141846, 0.0003002583980560303, 0.0003259032964706421, 0.0003515481948852539, 0.0003771930932998657, 0.00040283799171447754, 0.00042848289012908936, 0.00045412778854370117, 0.000479772686958313, 0.0005054175853729248, 0.0005310624837875366, 0.0005567073822021484, 0.0005823522806167603, 0.0006079971790313721, 0.0006336420774459839, 0.0006592869758605957, 0.0006849318742752075, 0.0007105767726898193, 0.0007362216711044312, 0.000761866569519043, 0.0007875114679336548, 0.0008131563663482666, 0.0008388012647628784, 0.0008644461631774902, 0.000890091061592102, 0.0009157359600067139, 0.0009413808584213257, 0.0009670257568359375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 8.0, 6.0, 16.0, 27.0, 41.0, 70.0, 90.0, 165.0, 311.0, 577.0, 1205.0, 2887.0, 8812.0, 34078.0, 162460.0, 640773.0, 151291.0, 32005.0, 8457.0, 2801.0, 1155.0, 548.0, 307.0, 189.0, 84.0, 69.0, 40.0, 29.0, 19.0, 8.0, 4.0, 8.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.5234375, -5.35845947265625, -5.1934814453125, -5.02850341796875, -4.863525390625, -4.69854736328125, -4.5335693359375, -4.36859130859375, -4.20361328125, -4.03863525390625, -3.8736572265625, -3.70867919921875, -3.543701171875, -3.37872314453125, -3.2137451171875, -3.04876708984375, -2.8837890625, -2.71881103515625, -2.5538330078125, -2.38885498046875, -2.223876953125, -2.05889892578125, -1.8939208984375, -1.72894287109375, -1.56396484375, -1.39898681640625, -1.2340087890625, -1.06903076171875, -0.904052734375, -0.73907470703125, -0.5740966796875, -0.40911865234375, -0.244140625, -0.07916259765625, 0.0858154296875, 0.25079345703125, 0.415771484375, 0.58074951171875, 0.7457275390625, 0.91070556640625, 1.07568359375, 1.24066162109375, 1.4056396484375, 1.57061767578125, 1.735595703125, 1.90057373046875, 2.0655517578125, 2.23052978515625, 2.3955078125, 2.56048583984375, 2.7254638671875, 2.89044189453125, 3.055419921875, 3.22039794921875, 3.3853759765625, 3.55035400390625, 3.71533203125, 3.88031005859375, 4.0452880859375, 4.21026611328125, 4.375244140625, 4.54022216796875, 4.7052001953125, 4.87017822265625, 5.03515625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 7.0, 11.0, 10.0, 24.0, 19.0, 35.0, 45.0, 81.0, 110.0, 137.0, 161.0, 99.0, 68.0, 57.0, 43.0, 32.0, 19.0, 7.0, 13.0, 9.0, 3.0, 7.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.42578125, -7.24090576171875, -7.0560302734375, -6.87115478515625, -6.686279296875, -6.50140380859375, -6.3165283203125, -6.13165283203125, -5.94677734375, -5.76190185546875, -5.5770263671875, -5.39215087890625, -5.207275390625, -5.02239990234375, -4.8375244140625, -4.65264892578125, -4.4677734375, -4.28289794921875, -4.0980224609375, -3.91314697265625, -3.728271484375, -3.54339599609375, -3.3585205078125, -3.17364501953125, -2.98876953125, -2.80389404296875, -2.6190185546875, -2.43414306640625, -2.249267578125, -2.06439208984375, -1.8795166015625, -1.69464111328125, -1.509765625, -1.32489013671875, -1.1400146484375, -0.95513916015625, -0.770263671875, -0.58538818359375, -0.4005126953125, -0.21563720703125, -0.03076171875, 0.15411376953125, 0.3389892578125, 0.52386474609375, 0.708740234375, 0.89361572265625, 1.0784912109375, 1.26336669921875, 1.4482421875, 1.63311767578125, 1.8179931640625, 2.00286865234375, 2.187744140625, 2.37261962890625, 2.5574951171875, 2.74237060546875, 2.92724609375, 3.11212158203125, 3.2969970703125, 3.48187255859375, 3.666748046875, 3.85162353515625, 4.0364990234375, 4.22137451171875, 4.40625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 11.0, 10.0, 25.0, 58.0, 109.0, 181.0, 214.0, 171.0, 106.0, 69.0, 25.0, 12.0, 3.0, 8.0, 2.0, 1.0, 1.0], "bins": [-164.5408935546875, -161.4685821533203, -158.39627075195312, -155.323974609375, -152.2516632080078, -149.17935180664062, -146.10704040527344, -143.03472900390625, -139.96243286132812, -136.89012145996094, -133.81781005859375, -130.74551391601562, -127.67320251464844, -124.60089111328125, -121.52857971191406, -118.4562759399414, -115.38396453857422, -112.31165313720703, -109.23934936523438, -106.16703796386719, -103.09473419189453, -100.02242279052734, -96.95011901855469, -93.8778076171875, -90.80549621582031, -87.73318481445312, -84.66088104248047, -81.58856964111328, -78.51626586914062, -75.44395446777344, -72.37164306640625, -69.2993392944336, -66.22703552246094, -63.154727935791016, -60.082420349121094, -57.010108947753906, -53.93780517578125, -50.86549377441406, -47.79318618774414, -44.72087860107422, -41.6485710144043, -38.576263427734375, -35.50395584106445, -32.43164825439453, -29.359338760375977, -26.287031173706055, -23.2147216796875, -20.142414093017578, -17.070106506347656, -13.997798919677734, -10.925490379333496, -7.853181838989258, -4.780874252319336, -1.708566665649414, 1.3637428283691406, 4.4360504150390625, 7.508358001708984, 10.580665588378906, 13.652974128723145, 16.725282669067383, 19.797590255737305, 22.869897842407227, 25.94220733642578, 29.014514923095703, 32.086822509765625]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 6.0, 6.0, 10.0, 11.0, 14.0, 16.0, 27.0, 23.0, 23.0, 34.0, 28.0, 30.0, 52.0, 38.0, 34.0, 51.0, 40.0, 53.0, 38.0, 47.0, 40.0, 56.0, 59.0, 42.0, 40.0, 34.0, 34.0, 18.0, 7.0, 19.0, 17.0, 8.0, 6.0, 10.0, 7.0, 7.0, 7.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 3.0, 2.0], "bins": [-50.24095153808594, -48.8752555847168, -47.50956344604492, -46.14386749267578, -44.77817153930664, -43.4124755859375, -42.046783447265625, -40.681087493896484, -39.315391540527344, -37.9496955871582, -36.58400344848633, -35.21830749511719, -33.85261154174805, -32.486915588378906, -31.12122344970703, -29.75552749633789, -28.389833450317383, -27.024139404296875, -25.658443450927734, -24.292749404907227, -22.927053451538086, -21.561359405517578, -20.195663452148438, -18.82996940612793, -17.464275360107422, -16.098581314086914, -14.732885360717773, -13.367191314697266, -12.001495361328125, -10.635801315307617, -9.270106315612793, -7.904411315917969, -6.538715362548828, -5.173020362854004, -3.807325601577759, -2.4416308403015137, -1.0759358406066895, 0.28975915908813477, 1.6554536819458008, 3.021148681640625, 4.386843681335449, 5.752538681030273, 7.118233680725098, 8.483928680419922, 9.84962272644043, 11.21531867980957, 12.581012725830078, 13.946707725524902, 15.312402725219727, 16.678096771240234, 18.043792724609375, 19.409486770629883, 20.775182723999023, 22.14087677001953, 23.506572723388672, 24.87226676940918, 26.237960815429688, 27.603654861450195, 28.969350814819336, 30.335044860839844, 31.700740814208984, 33.066436767578125, 34.43212890625, 35.79782485961914, 37.16352081298828]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 1.0, 5.0, 5.0, 8.0, 8.0, 6.0, 11.0, 18.0, 23.0, 33.0, 50.0, 83.0, 131.0, 206.0, 396.0, 759.0, 1813.0, 4851.0, 17442.0, 114782.0, 3775065.0, 242739.0, 26028.0, 6174.0, 2000.0, 806.0, 364.0, 189.0, 118.0, 64.0, 38.0, 20.0, 15.0, 9.0, 7.0, 8.0, 4.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0], "bins": [-21.921875, -21.395263671875, -20.86865234375, -20.342041015625, -19.8154296875, -19.288818359375, -18.76220703125, -18.235595703125, -17.708984375, -17.182373046875, -16.65576171875, -16.129150390625, -15.6025390625, -15.075927734375, -14.54931640625, -14.022705078125, -13.49609375, -12.969482421875, -12.44287109375, -11.916259765625, -11.3896484375, -10.863037109375, -10.33642578125, -9.809814453125, -9.283203125, -8.756591796875, -8.22998046875, -7.703369140625, -7.1767578125, -6.650146484375, -6.12353515625, -5.596923828125, -5.0703125, -4.543701171875, -4.01708984375, -3.490478515625, -2.9638671875, -2.437255859375, -1.91064453125, -1.384033203125, -0.857421875, -0.330810546875, 0.19580078125, 0.722412109375, 1.2490234375, 1.775634765625, 2.30224609375, 2.828857421875, 3.35546875, 3.882080078125, 4.40869140625, 4.935302734375, 5.4619140625, 5.988525390625, 6.51513671875, 7.041748046875, 7.568359375, 8.094970703125, 8.62158203125, 9.148193359375, 9.6748046875, 10.201416015625, 10.72802734375, 11.254638671875, 11.78125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 7.0, 4.0, 6.0, 7.0, 14.0, 20.0, 17.0, 38.0, 28.0, 42.0, 53.0, 60.0, 70.0, 58.0, 65.0, 73.0, 48.0, 76.0, 58.0, 41.0, 49.0, 48.0, 30.0, 30.0, 23.0, 13.0, 8.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.0703125, -2.99163818359375, -2.9129638671875, -2.83428955078125, -2.755615234375, -2.67694091796875, -2.5982666015625, -2.51959228515625, -2.44091796875, -2.36224365234375, -2.2835693359375, -2.20489501953125, -2.126220703125, -2.04754638671875, -1.9688720703125, -1.89019775390625, -1.8115234375, -1.73284912109375, -1.6541748046875, -1.57550048828125, -1.496826171875, -1.41815185546875, -1.3394775390625, -1.26080322265625, -1.18212890625, -1.10345458984375, -1.0247802734375, -0.94610595703125, -0.867431640625, -0.78875732421875, -0.7100830078125, -0.63140869140625, -0.552734375, -0.47406005859375, -0.3953857421875, -0.31671142578125, -0.238037109375, -0.15936279296875, -0.0806884765625, -0.00201416015625, 0.07666015625, 0.15533447265625, 0.2340087890625, 0.31268310546875, 0.391357421875, 0.47003173828125, 0.5487060546875, 0.62738037109375, 0.7060546875, 0.78472900390625, 0.8634033203125, 0.94207763671875, 1.020751953125, 1.09942626953125, 1.1781005859375, 1.25677490234375, 1.33544921875, 1.41412353515625, 1.4927978515625, 1.57147216796875, 1.650146484375, 1.72882080078125, 1.8074951171875, 1.88616943359375, 1.96484375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 7.0, 13.0, 14.0, 14.0, 22.0, 43.0, 48.0, 72.0, 108.0, 139.0, 199.0, 295.0, 409.0, 605.0, 911.0, 1552.0, 2664.0, 4650.0, 9444.0, 22187.0, 60925.0, 226237.0, 2716708.0, 929987.0, 140108.0, 42968.0, 16675.0, 7426.0, 3857.0, 2117.0, 1304.0, 798.0, 541.0, 375.0, 283.0, 161.0, 139.0, 88.0, 66.0, 44.0, 28.0, 16.0, 17.0, 8.0, 6.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.26171875, -6.08197021484375, -5.9022216796875, -5.72247314453125, -5.542724609375, -5.36297607421875, -5.1832275390625, -5.00347900390625, -4.82373046875, -4.64398193359375, -4.4642333984375, -4.28448486328125, -4.104736328125, -3.92498779296875, -3.7452392578125, -3.56549072265625, -3.3857421875, -3.20599365234375, -3.0262451171875, -2.84649658203125, -2.666748046875, -2.48699951171875, -2.3072509765625, -2.12750244140625, -1.94775390625, -1.76800537109375, -1.5882568359375, -1.40850830078125, -1.228759765625, -1.04901123046875, -0.8692626953125, -0.68951416015625, -0.509765625, -0.33001708984375, -0.1502685546875, 0.02947998046875, 0.209228515625, 0.38897705078125, 0.5687255859375, 0.74847412109375, 0.92822265625, 1.10797119140625, 1.2877197265625, 1.46746826171875, 1.647216796875, 1.82696533203125, 2.0067138671875, 2.18646240234375, 2.3662109375, 2.54595947265625, 2.7257080078125, 2.90545654296875, 3.085205078125, 3.26495361328125, 3.4447021484375, 3.62445068359375, 3.80419921875, 3.98394775390625, 4.1636962890625, 4.34344482421875, 4.523193359375, 4.70294189453125, 4.8826904296875, 5.06243896484375, 5.2421875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 4.0, 6.0, 13.0, 3.0, 16.0, 20.0, 30.0, 40.0, 66.0, 76.0, 127.0, 259.0, 612.0, 1560.0, 582.0, 236.0, 127.0, 75.0, 63.0, 45.0, 30.0, 19.0, 15.0, 8.0, 10.0, 4.0, 7.0, 3.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.123046875, -3.009552001953125, -2.89605712890625, -2.782562255859375, -2.6690673828125, -2.555572509765625, -2.44207763671875, -2.328582763671875, -2.215087890625, -2.101593017578125, -1.98809814453125, -1.874603271484375, -1.7611083984375, -1.647613525390625, -1.53411865234375, -1.420623779296875, -1.30712890625, -1.193634033203125, -1.08013916015625, -0.966644287109375, -0.8531494140625, -0.739654541015625, -0.62615966796875, -0.512664794921875, -0.399169921875, -0.285675048828125, -0.17218017578125, -0.058685302734375, 0.0548095703125, 0.168304443359375, 0.28179931640625, 0.395294189453125, 0.5087890625, 0.622283935546875, 0.73577880859375, 0.849273681640625, 0.9627685546875, 1.076263427734375, 1.18975830078125, 1.303253173828125, 1.416748046875, 1.530242919921875, 1.64373779296875, 1.757232666015625, 1.8707275390625, 1.984222412109375, 2.09771728515625, 2.211212158203125, 2.32470703125, 2.438201904296875, 2.55169677734375, 2.665191650390625, 2.7786865234375, 2.892181396484375, 3.00567626953125, 3.119171142578125, 3.232666015625, 3.346160888671875, 3.45965576171875, 3.573150634765625, 3.6866455078125, 3.800140380859375, 3.91363525390625, 4.027130126953125, 4.140625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 6.0, 4.0, 12.0, 32.0, 55.0, 123.0, 160.0, 231.0, 164.0, 112.0, 52.0, 24.0, 14.0, 7.0, 5.0, 3.0, 1.0, 3.0, 1.0, 4.0, 1.0, 2.0], "bins": [-58.99922180175781, -57.81340026855469, -56.6275749206543, -55.44175338745117, -54.25593185424805, -53.070106506347656, -51.88428497314453, -50.698463439941406, -49.51264190673828, -48.326820373535156, -47.140995025634766, -45.95517349243164, -44.769351959228516, -43.583526611328125, -42.397705078125, -41.211883544921875, -40.026058197021484, -38.84023666381836, -37.65441131591797, -36.468589782714844, -35.28276824951172, -34.096946716308594, -32.9111213684082, -31.725299835205078, -30.53947639465332, -29.353652954101562, -28.167831420898438, -26.98200798034668, -25.796184539794922, -24.610363006591797, -23.42453956604004, -22.23871612548828, -21.052898406982422, -19.867074966430664, -18.68125343322754, -17.49542999267578, -16.309608459472656, -15.123785018920898, -13.93796157836914, -12.7521390914917, -11.566316604614258, -10.380494117736816, -9.194671630859375, -8.008848190307617, -6.823025703430176, -5.637203216552734, -4.451380252838135, -3.265557289123535, -2.0797348022460938, -0.8939120769500732, 0.29191064834594727, 1.4777333736419678, 2.6635560989379883, 3.8493785858154297, 5.035201549530029, 6.221024513244629, 7.40684700012207, 8.592669486999512, 9.778491973876953, 10.964315414428711, 12.150137901306152, 13.335960388183594, 14.521783828735352, 15.707606315612793, 16.893428802490234]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 7.0, 10.0, 7.0, 14.0, 24.0, 28.0, 40.0, 52.0, 63.0, 42.0, 64.0, 63.0, 74.0, 64.0, 68.0, 60.0, 71.0, 56.0, 39.0, 42.0, 31.0, 22.0, 16.0, 16.0, 7.0, 7.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.794025421142578, -17.22396469116211, -16.65390396118164, -16.083843231201172, -15.513782501220703, -14.943721771240234, -14.373661041259766, -13.803600311279297, -13.233539581298828, -12.66347885131836, -12.09341812133789, -11.523357391357422, -10.953296661376953, -10.383235931396484, -9.813175201416016, -9.243114471435547, -8.673053741455078, -8.10299301147461, -7.532932281494141, -6.962871551513672, -6.392810821533203, -5.822750091552734, -5.252689361572266, -4.682628631591797, -4.112567901611328, -3.5425071716308594, -2.9724464416503906, -2.402385711669922, -1.8323249816894531, -1.2622642517089844, -0.6922035217285156, -0.12214279174804688, 0.4479179382324219, 1.0179786682128906, 1.5880393981933594, 2.158100128173828, 2.728160858154297, 3.2982215881347656, 3.8682823181152344, 4.438343048095703, 5.008403778076172, 5.578464508056641, 6.148525238037109, 6.718585968017578, 7.288646697998047, 7.858707427978516, 8.428768157958984, 8.998828887939453, 9.568889617919922, 10.13895034790039, 10.70901107788086, 11.279071807861328, 11.849132537841797, 12.419193267822266, 12.989253997802734, 13.559314727783203, 14.129375457763672, 14.69943618774414, 15.26949691772461, 15.839557647705078, 16.409618377685547, 16.979679107666016, 17.549739837646484, 18.119800567626953, 18.689861297607422]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 3.0, 4.0, 7.0, 10.0, 12.0, 25.0, 32.0, 39.0, 49.0, 64.0, 128.0, 225.0, 314.0, 596.0, 967.0, 2001.0, 4517.0, 12302.0, 40104.0, 157050.0, 431576.0, 288535.0, 75824.0, 20760.0, 7257.0, 2991.0, 1343.0, 707.0, 426.0, 233.0, 153.0, 82.0, 64.0, 45.0, 31.0, 20.0, 17.0, 12.0, 7.0, 6.0, 6.0, 3.0, 2.0, 0.0, 5.0, 1.0, 1.0, 3.0, 1.0, 2.0], "bins": [-10.703125, -10.39501953125, -10.0869140625, -9.77880859375, -9.470703125, -9.16259765625, -8.8544921875, -8.54638671875, -8.23828125, -7.93017578125, -7.6220703125, -7.31396484375, -7.005859375, -6.69775390625, -6.3896484375, -6.08154296875, -5.7734375, -5.46533203125, -5.1572265625, -4.84912109375, -4.541015625, -4.23291015625, -3.9248046875, -3.61669921875, -3.30859375, -3.00048828125, -2.6923828125, -2.38427734375, -2.076171875, -1.76806640625, -1.4599609375, -1.15185546875, -0.84375, -0.53564453125, -0.2275390625, 0.08056640625, 0.388671875, 0.69677734375, 1.0048828125, 1.31298828125, 1.62109375, 1.92919921875, 2.2373046875, 2.54541015625, 2.853515625, 3.16162109375, 3.4697265625, 3.77783203125, 4.0859375, 4.39404296875, 4.7021484375, 5.01025390625, 5.318359375, 5.62646484375, 5.9345703125, 6.24267578125, 6.55078125, 6.85888671875, 7.1669921875, 7.47509765625, 7.783203125, 8.09130859375, 8.3994140625, 8.70751953125, 9.015625]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 4.0, 10.0, 2.0, 10.0, 14.0, 19.0, 21.0, 32.0, 43.0, 49.0, 53.0, 64.0, 58.0, 78.0, 84.0, 65.0, 62.0, 63.0, 54.0, 50.0, 37.0, 34.0, 34.0, 23.0, 12.0, 13.0, 4.0, 5.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.13671875, -3.055145263671875, -2.97357177734375, -2.891998291015625, -2.8104248046875, -2.728851318359375, -2.64727783203125, -2.565704345703125, -2.484130859375, -2.402557373046875, -2.32098388671875, -2.239410400390625, -2.1578369140625, -2.076263427734375, -1.99468994140625, -1.913116455078125, -1.83154296875, -1.749969482421875, -1.66839599609375, -1.586822509765625, -1.5052490234375, -1.423675537109375, -1.34210205078125, -1.260528564453125, -1.178955078125, -1.097381591796875, -1.01580810546875, -0.934234619140625, -0.8526611328125, -0.771087646484375, -0.68951416015625, -0.607940673828125, -0.5263671875, -0.444793701171875, -0.36322021484375, -0.281646728515625, -0.2000732421875, -0.118499755859375, -0.03692626953125, 0.044647216796875, 0.126220703125, 0.207794189453125, 0.28936767578125, 0.370941162109375, 0.4525146484375, 0.534088134765625, 0.61566162109375, 0.697235107421875, 0.77880859375, 0.860382080078125, 0.94195556640625, 1.023529052734375, 1.1051025390625, 1.186676025390625, 1.26824951171875, 1.349822998046875, 1.431396484375, 1.512969970703125, 1.59454345703125, 1.676116943359375, 1.7576904296875, 1.839263916015625, 1.92083740234375, 2.002410888671875, 2.083984375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 4.0, 6.0, 12.0, 5.0, 8.0, 18.0, 21.0, 30.0, 35.0, 55.0, 64.0, 119.0, 179.0, 230.0, 429.0, 668.0, 1192.0, 2218.0, 4582.0, 10050.0, 22234.0, 52911.0, 128971.0, 261908.0, 290692.0, 155535.0, 65398.0, 27324.0, 11773.0, 5641.0, 2685.0, 1457.0, 752.0, 469.0, 270.0, 185.0, 130.0, 82.0, 42.0, 40.0, 44.0, 24.0, 19.0, 16.0, 9.0, 5.0, 5.0, 2.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.91015625, -4.75726318359375, -4.6043701171875, -4.45147705078125, -4.298583984375, -4.14569091796875, -3.9927978515625, -3.83990478515625, -3.68701171875, -3.53411865234375, -3.3812255859375, -3.22833251953125, -3.075439453125, -2.92254638671875, -2.7696533203125, -2.61676025390625, -2.4638671875, -2.31097412109375, -2.1580810546875, -2.00518798828125, -1.852294921875, -1.69940185546875, -1.5465087890625, -1.39361572265625, -1.24072265625, -1.08782958984375, -0.9349365234375, -0.78204345703125, -0.629150390625, -0.47625732421875, -0.3233642578125, -0.17047119140625, -0.017578125, 0.13531494140625, 0.2882080078125, 0.44110107421875, 0.593994140625, 0.74688720703125, 0.8997802734375, 1.05267333984375, 1.20556640625, 1.35845947265625, 1.5113525390625, 1.66424560546875, 1.817138671875, 1.97003173828125, 2.1229248046875, 2.27581787109375, 2.4287109375, 2.58160400390625, 2.7344970703125, 2.88739013671875, 3.040283203125, 3.19317626953125, 3.3460693359375, 3.49896240234375, 3.65185546875, 3.80474853515625, 3.9576416015625, 4.11053466796875, 4.263427734375, 4.41632080078125, 4.5692138671875, 4.72210693359375, 4.875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 0.0, 2.0, 4.0, 1.0, 6.0, 8.0, 4.0, 11.0, 17.0, 16.0, 17.0, 33.0, 25.0, 28.0, 28.0, 26.0, 34.0, 39.0, 37.0, 32.0, 50.0, 45.0, 45.0, 49.0, 44.0, 40.0, 41.0, 37.0, 36.0, 37.0, 24.0, 23.0, 24.0, 21.0, 17.0, 20.0, 15.0, 13.0, 10.0, 10.0, 9.0, 4.0, 7.0, 4.0, 5.0, 1.0, 1.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.44921875, -7.2115478515625, -6.973876953125, -6.7362060546875, -6.49853515625, -6.2608642578125, -6.023193359375, -5.7855224609375, -5.5478515625, -5.3101806640625, -5.072509765625, -4.8348388671875, -4.59716796875, -4.3594970703125, -4.121826171875, -3.8841552734375, -3.646484375, -3.4088134765625, -3.171142578125, -2.9334716796875, -2.69580078125, -2.4581298828125, -2.220458984375, -1.9827880859375, -1.7451171875, -1.5074462890625, -1.269775390625, -1.0321044921875, -0.79443359375, -0.5567626953125, -0.319091796875, -0.0814208984375, 0.15625, 0.3939208984375, 0.631591796875, 0.8692626953125, 1.10693359375, 1.3446044921875, 1.582275390625, 1.8199462890625, 2.0576171875, 2.2952880859375, 2.532958984375, 2.7706298828125, 3.00830078125, 3.2459716796875, 3.483642578125, 3.7213134765625, 3.958984375, 4.1966552734375, 4.434326171875, 4.6719970703125, 4.90966796875, 5.1473388671875, 5.385009765625, 5.6226806640625, 5.8603515625, 6.0980224609375, 6.335693359375, 6.5733642578125, 6.81103515625, 7.0487060546875, 7.286376953125, 7.5240478515625, 7.76171875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 3.0, 4.0, 5.0, 11.0, 19.0, 29.0, 46.0, 65.0, 105.0, 169.0, 339.0, 677.0, 1380.0, 3230.0, 10239.0, 36759.0, 146470.0, 412874.0, 312321.0, 89871.0, 22529.0, 6772.0, 2408.0, 1006.0, 553.0, 271.0, 153.0, 103.0, 56.0, 33.0, 19.0, 15.0, 7.0, 5.0, 2.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.978515625, -2.867462158203125, -2.75640869140625, -2.645355224609375, -2.5343017578125, -2.423248291015625, -2.31219482421875, -2.201141357421875, -2.090087890625, -1.979034423828125, -1.86798095703125, -1.756927490234375, -1.6458740234375, -1.534820556640625, -1.42376708984375, -1.312713623046875, -1.20166015625, -1.090606689453125, -0.97955322265625, -0.868499755859375, -0.7574462890625, -0.646392822265625, -0.53533935546875, -0.424285888671875, -0.313232421875, -0.202178955078125, -0.09112548828125, 0.019927978515625, 0.1309814453125, 0.242034912109375, 0.35308837890625, 0.464141845703125, 0.5751953125, 0.686248779296875, 0.79730224609375, 0.908355712890625, 1.0194091796875, 1.130462646484375, 1.24151611328125, 1.352569580078125, 1.463623046875, 1.574676513671875, 1.68572998046875, 1.796783447265625, 1.9078369140625, 2.018890380859375, 2.12994384765625, 2.240997314453125, 2.35205078125, 2.463104248046875, 2.57415771484375, 2.685211181640625, 2.7962646484375, 2.907318115234375, 3.01837158203125, 3.129425048828125, 3.240478515625, 3.351531982421875, 3.46258544921875, 3.573638916015625, 3.6846923828125, 3.795745849609375, 3.90679931640625, 4.017852783203125, 4.12890625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 4.0, 1.0, 2.0, 2.0, 7.0, 12.0, 15.0, 19.0, 25.0, 29.0, 42.0, 52.0, 52.0, 64.0, 66.0, 76.0, 69.0, 58.0, 58.0, 66.0, 49.0, 38.0, 54.0, 31.0, 22.0, 19.0, 17.0, 12.0, 9.0, 6.0, 5.0, 3.0, 7.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003688335418701172, -0.00035498663783073425, -0.0003411397337913513, -0.0003272928297519684, -0.00031344592571258545, -0.0002995990216732025, -0.0002857521176338196, -0.00027190521359443665, -0.0002580583095550537, -0.0002442114055156708, -0.00023036450147628784, -0.0002165175974369049, -0.00020267069339752197, -0.00018882378935813904, -0.0001749768853187561, -0.00016112998127937317, -0.00014728307723999023, -0.0001334361732006073, -0.00011958926916122437, -0.00010574236512184143, -9.18954610824585e-05, -7.804855704307556e-05, -6.420165300369263e-05, -5.035474896430969e-05, -3.650784492492676e-05, -2.2660940885543823e-05, -8.814036846160889e-06, 5.032867193222046e-06, 1.887977123260498e-05, 3.2726675271987915e-05, 4.657357931137085e-05, 6.0420483350753784e-05, 7.426738739013672e-05, 8.811429142951965e-05, 0.00010196119546890259, 0.00011580809950828552, 0.00012965500354766846, 0.0001435019075870514, 0.00015734881162643433, 0.00017119571566581726, 0.0001850426197052002, 0.00019888952374458313, 0.00021273642778396606, 0.000226583331823349, 0.00024043023586273193, 0.00025427713990211487, 0.0002681240439414978, 0.00028197094798088074, 0.00029581785202026367, 0.0003096647560596466, 0.00032351166009902954, 0.0003373585641384125, 0.0003512054681777954, 0.00036505237221717834, 0.0003788992762565613, 0.0003927461802959442, 0.00040659308433532715, 0.0004204399883747101, 0.000434286892414093, 0.00044813379645347595, 0.0004619807004928589, 0.0004758276045322418, 0.0004896745085716248, 0.0005035214126110077, 0.0005173683166503906]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 7.0, 2.0, 7.0, 7.0, 8.0, 21.0, 27.0, 54.0, 79.0, 110.0, 162.0, 309.0, 508.0, 995.0, 2163.0, 5125.0, 13735.0, 41900.0, 129455.0, 319360.0, 329749.0, 135723.0, 44293.0, 14788.0, 5290.0, 2286.0, 1105.0, 548.0, 279.0, 174.0, 98.0, 58.0, 43.0, 35.0, 19.0, 18.0, 8.0, 6.0, 2.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.908203125, -2.81134033203125, -2.7144775390625, -2.61761474609375, -2.520751953125, -2.42388916015625, -2.3270263671875, -2.23016357421875, -2.13330078125, -2.03643798828125, -1.9395751953125, -1.84271240234375, -1.745849609375, -1.64898681640625, -1.5521240234375, -1.45526123046875, -1.3583984375, -1.26153564453125, -1.1646728515625, -1.06781005859375, -0.970947265625, -0.87408447265625, -0.7772216796875, -0.68035888671875, -0.58349609375, -0.48663330078125, -0.3897705078125, -0.29290771484375, -0.196044921875, -0.09918212890625, -0.0023193359375, 0.09454345703125, 0.19140625, 0.28826904296875, 0.3851318359375, 0.48199462890625, 0.578857421875, 0.67572021484375, 0.7725830078125, 0.86944580078125, 0.96630859375, 1.06317138671875, 1.1600341796875, 1.25689697265625, 1.353759765625, 1.45062255859375, 1.5474853515625, 1.64434814453125, 1.7412109375, 1.83807373046875, 1.9349365234375, 2.03179931640625, 2.128662109375, 2.22552490234375, 2.3223876953125, 2.41925048828125, 2.51611328125, 2.61297607421875, 2.7098388671875, 2.80670166015625, 2.903564453125, 3.00042724609375, 3.0972900390625, 3.19415283203125, 3.291015625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 7.0, 6.0, 9.0, 15.0, 26.0, 32.0, 41.0, 48.0, 60.0, 71.0, 85.0, 107.0, 77.0, 97.0, 77.0, 63.0, 52.0, 45.0, 23.0, 19.0, 15.0, 8.0, 8.0, 7.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2421875, -4.0947265625, -3.947265625, -3.7998046875, -3.65234375, -3.5048828125, -3.357421875, -3.2099609375, -3.0625, -2.9150390625, -2.767578125, -2.6201171875, -2.47265625, -2.3251953125, -2.177734375, -2.0302734375, -1.8828125, -1.7353515625, -1.587890625, -1.4404296875, -1.29296875, -1.1455078125, -0.998046875, -0.8505859375, -0.703125, -0.5556640625, -0.408203125, -0.2607421875, -0.11328125, 0.0341796875, 0.181640625, 0.3291015625, 0.4765625, 0.6240234375, 0.771484375, 0.9189453125, 1.06640625, 1.2138671875, 1.361328125, 1.5087890625, 1.65625, 1.8037109375, 1.951171875, 2.0986328125, 2.24609375, 2.3935546875, 2.541015625, 2.6884765625, 2.8359375, 2.9833984375, 3.130859375, 3.2783203125, 3.42578125, 3.5732421875, 3.720703125, 3.8681640625, 4.015625, 4.1630859375, 4.310546875, 4.4580078125, 4.60546875, 4.7529296875, 4.900390625, 5.0478515625, 5.1953125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 2.0, 12.0, 16.0, 91.0, 195.0, 302.0, 222.0, 109.0, 42.0, 12.0, 4.0, 3.0], "bins": [-266.62860107421875, -262.001708984375, -257.3748474121094, -252.7479705810547, -248.12109375, -243.4942169189453, -238.86734008789062, -234.24046325683594, -229.61358642578125, -224.98670959472656, -220.35983276367188, -215.7329559326172, -211.1060791015625, -206.4792022705078, -201.85232543945312, -197.22544860839844, -192.59857177734375, -187.97169494628906, -183.34481811523438, -178.7179412841797, -174.091064453125, -169.4641876220703, -164.83731079101562, -160.21043395996094, -155.5835418701172, -150.9566650390625, -146.3297882080078, -141.70291137695312, -137.07603454589844, -132.44915771484375, -127.82228088378906, -123.19540405273438, -118.56851959228516, -113.94164276123047, -109.31476593017578, -104.6878890991211, -100.0610122680664, -95.43413543701172, -90.8072509765625, -86.18037414550781, -81.55350494384766, -76.92662811279297, -72.29975128173828, -67.6728744506836, -63.045997619628906, -58.41912078857422, -53.792240142822266, -49.16536331176758, -44.538482666015625, -39.91160583496094, -35.28472900390625, -30.65785026550293, -26.030973434448242, -21.404096603393555, -16.777217864990234, -12.150341033935547, -7.523466110229492, -2.8965888023376465, 1.7302885055541992, 6.357166290283203, 10.98404312133789, 15.610919952392578, 20.2377986907959, 24.864675521850586, 29.491552352905273]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 5.0, 8.0, 8.0, 13.0, 12.0, 16.0, 10.0, 17.0, 23.0, 28.0, 20.0, 41.0, 39.0, 43.0, 51.0, 60.0, 40.0, 45.0, 47.0, 58.0, 47.0, 39.0, 40.0, 51.0, 39.0, 34.0, 33.0, 29.0, 19.0, 15.0, 17.0, 11.0, 13.0, 7.0, 10.0, 12.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-60.47257995605469, -58.9484748840332, -57.424373626708984, -55.9002685546875, -54.37616729736328, -52.8520622253418, -51.32795715332031, -49.803855895996094, -48.27975082397461, -46.755645751953125, -45.231544494628906, -43.70743942260742, -42.1833381652832, -40.65923309326172, -39.1351318359375, -37.611026763916016, -36.08692169189453, -34.56281661987305, -33.03871536254883, -31.514610290527344, -29.990507125854492, -28.46640396118164, -26.94230079650879, -25.418197631835938, -23.89409637451172, -22.369993209838867, -20.845890045166016, -19.32178497314453, -17.79768180847168, -16.273578643798828, -14.749475479125977, -13.225371360778809, -11.70126724243164, -10.177164077758789, -8.653059959411621, -7.1289567947387695, -5.60485315322876, -4.08074951171875, -2.5566463470458984, -1.0325422286987305, 0.4915609359741211, 2.015664577484131, 3.5397679805755615, 5.063871383666992, 6.587975025177002, 8.112078666687012, 9.636181831359863, 11.160285949707031, 12.684389114379883, 14.208492279052734, 15.732596397399902, 17.256698608398438, 18.780803680419922, 20.304906845092773, 21.829010009765625, 23.35311508178711, 24.877216339111328, 26.40131950378418, 27.92542266845703, 29.449527740478516, 30.973630905151367, 32.49773406982422, 34.02183532714844, 35.54594039916992, 37.070045471191406]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 6.0, 7.0, 9.0, 23.0, 34.0, 42.0, 59.0, 92.0, 168.0, 267.0, 541.0, 1465.0, 5276.0, 39468.0, 4083162.0, 54500.0, 6204.0, 1652.0, 606.0, 275.0, 142.0, 73.0, 57.0, 41.0, 39.0, 29.0, 14.0, 7.0, 11.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.21875, -29.4140625, -28.609375, -27.8046875, -27.0, -26.1953125, -25.390625, -24.5859375, -23.78125, -22.9765625, -22.171875, -21.3671875, -20.5625, -19.7578125, -18.953125, -18.1484375, -17.34375, -16.5390625, -15.734375, -14.9296875, -14.125, -13.3203125, -12.515625, -11.7109375, -10.90625, -10.1015625, -9.296875, -8.4921875, -7.6875, -6.8828125, -6.078125, -5.2734375, -4.46875, -3.6640625, -2.859375, -2.0546875, -1.25, -0.4453125, 0.359375, 1.1640625, 1.96875, 2.7734375, 3.578125, 4.3828125, 5.1875, 5.9921875, 6.796875, 7.6015625, 8.40625, 9.2109375, 10.015625, 10.8203125, 11.625, 12.4296875, 13.234375, 14.0390625, 14.84375, 15.6484375, 16.453125, 17.2578125, 18.0625, 18.8671875, 19.671875, 20.4765625, 21.28125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 6.0, 3.0, 14.0, 6.0, 19.0, 16.0, 15.0, 24.0, 46.0, 37.0, 51.0, 45.0, 62.0, 69.0, 60.0, 52.0, 51.0, 57.0, 59.0, 49.0, 50.0, 43.0, 36.0, 33.0, 25.0, 26.0, 18.0, 14.0, 3.0, 4.0, 2.0, 6.0, 2.0, 0.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.119140625, -3.03399658203125, -2.9488525390625, -2.86370849609375, -2.778564453125, -2.69342041015625, -2.6082763671875, -2.52313232421875, -2.43798828125, -2.35284423828125, -2.2677001953125, -2.18255615234375, -2.097412109375, -2.01226806640625, -1.9271240234375, -1.84197998046875, -1.7568359375, -1.67169189453125, -1.5865478515625, -1.50140380859375, -1.416259765625, -1.33111572265625, -1.2459716796875, -1.16082763671875, -1.07568359375, -0.99053955078125, -0.9053955078125, -0.82025146484375, -0.735107421875, -0.64996337890625, -0.5648193359375, -0.47967529296875, -0.39453125, -0.30938720703125, -0.2242431640625, -0.13909912109375, -0.053955078125, 0.03118896484375, 0.1163330078125, 0.20147705078125, 0.28662109375, 0.37176513671875, 0.4569091796875, 0.54205322265625, 0.627197265625, 0.71234130859375, 0.7974853515625, 0.88262939453125, 0.9677734375, 1.05291748046875, 1.1380615234375, 1.22320556640625, 1.308349609375, 1.39349365234375, 1.4786376953125, 1.56378173828125, 1.64892578125, 1.73406982421875, 1.8192138671875, 1.90435791015625, 1.989501953125, 2.07464599609375, 2.1597900390625, 2.24493408203125, 2.330078125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 3.0, 4.0, 5.0, 6.0, 15.0, 8.0, 22.0, 26.0, 34.0, 71.0, 70.0, 103.0, 120.0, 176.0, 247.0, 392.0, 526.0, 927.0, 1639.0, 3561.0, 9051.0, 28882.0, 200366.0, 3820927.0, 94085.0, 19765.0, 6741.0, 2768.0, 1423.0, 705.0, 445.0, 315.0, 239.0, 153.0, 99.0, 88.0, 66.0, 66.0, 33.0, 36.0, 22.0, 17.0, 13.0, 11.0, 5.0, 6.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3125, -8.03857421875, -7.7646484375, -7.49072265625, -7.216796875, -6.94287109375, -6.6689453125, -6.39501953125, -6.12109375, -5.84716796875, -5.5732421875, -5.29931640625, -5.025390625, -4.75146484375, -4.4775390625, -4.20361328125, -3.9296875, -3.65576171875, -3.3818359375, -3.10791015625, -2.833984375, -2.56005859375, -2.2861328125, -2.01220703125, -1.73828125, -1.46435546875, -1.1904296875, -0.91650390625, -0.642578125, -0.36865234375, -0.0947265625, 0.17919921875, 0.453125, 0.72705078125, 1.0009765625, 1.27490234375, 1.548828125, 1.82275390625, 2.0966796875, 2.37060546875, 2.64453125, 2.91845703125, 3.1923828125, 3.46630859375, 3.740234375, 4.01416015625, 4.2880859375, 4.56201171875, 4.8359375, 5.10986328125, 5.3837890625, 5.65771484375, 5.931640625, 6.20556640625, 6.4794921875, 6.75341796875, 7.02734375, 7.30126953125, 7.5751953125, 7.84912109375, 8.123046875, 8.39697265625, 8.6708984375, 8.94482421875, 9.21875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 3.0, 0.0, 4.0, 6.0, 6.0, 13.0, 11.0, 28.0, 70.0, 254.0, 3200.0, 295.0, 84.0, 51.0, 21.0, 18.0, 11.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.703125, -2.614532470703125, -2.52593994140625, -2.437347412109375, -2.3487548828125, -2.260162353515625, -2.17156982421875, -2.082977294921875, -1.994384765625, -1.905792236328125, -1.81719970703125, -1.728607177734375, -1.6400146484375, -1.551422119140625, -1.46282958984375, -1.374237060546875, -1.28564453125, -1.197052001953125, -1.10845947265625, -1.019866943359375, -0.9312744140625, -0.842681884765625, -0.75408935546875, -0.665496826171875, -0.576904296875, -0.488311767578125, -0.39971923828125, -0.311126708984375, -0.2225341796875, -0.133941650390625, -0.04534912109375, 0.043243408203125, 0.1318359375, 0.220428466796875, 0.30902099609375, 0.397613525390625, 0.4862060546875, 0.574798583984375, 0.66339111328125, 0.751983642578125, 0.840576171875, 0.929168701171875, 1.01776123046875, 1.106353759765625, 1.1949462890625, 1.283538818359375, 1.37213134765625, 1.460723876953125, 1.54931640625, 1.637908935546875, 1.72650146484375, 1.815093994140625, 1.9036865234375, 1.992279052734375, 2.08087158203125, 2.169464111328125, 2.258056640625, 2.346649169921875, 2.43524169921875, 2.523834228515625, 2.6124267578125, 2.701019287109375, 2.78961181640625, 2.878204345703125, 2.966796875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 3.0, 5.0, 12.0, 20.0, 31.0, 39.0, 69.0, 78.0, 107.0, 120.0, 108.0, 108.0, 89.0, 68.0, 43.0, 36.0, 18.0, 17.0, 11.0, 2.0, 7.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.088604927062988, -6.84934663772583, -6.610087871551514, -6.3708295822143555, -6.131570816040039, -5.892312526702881, -5.653054237365723, -5.413795471191406, -5.174537181854248, -4.93527889251709, -4.696020126342773, -4.456761837005615, -4.217503070831299, -3.9782447814941406, -3.7389862537384033, -3.499727725982666, -3.2604691982269287, -3.0212106704711914, -2.781952142715454, -2.542693614959717, -2.3034353256225586, -2.0641767978668213, -1.824918270111084, -1.5856598615646362, -1.346401333808899, -1.1071428060531616, -0.8678843975067139, -0.6286258697509766, -0.38936740159988403, -0.1501089334487915, 0.0891495943069458, 0.32840800285339355, 0.5676665306091309, 0.8069249987602234, 1.046183466911316, 1.2854419946670532, 1.524700403213501, 1.7639589309692383, 2.0032174587249756, 2.242475986480713, 2.481734275817871, 2.7209928035736084, 2.9602513313293457, 3.199509620666504, 3.438768148422241, 3.6780266761779785, 3.917285203933716, 4.156543731689453, 4.3958024978637695, 4.635060787200928, 4.874319553375244, 5.113577842712402, 5.352836608886719, 5.592094898223877, 5.831353187561035, 6.070611953735352, 6.30987024307251, 6.549128532409668, 6.788387298583984, 7.027645587921143, 7.266904354095459, 7.506162643432617, 7.745421409606934, 7.984679698944092, 8.22393798828125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 1.0, 7.0, 8.0, 13.0, 2.0, 11.0, 11.0, 13.0, 17.0, 23.0, 21.0, 23.0, 26.0, 36.0, 32.0, 31.0, 25.0, 24.0, 39.0, 31.0, 51.0, 46.0, 29.0, 36.0, 36.0, 36.0, 29.0, 33.0, 35.0, 34.0, 28.0, 33.0, 24.0, 17.0, 21.0, 12.0, 26.0, 13.0, 19.0, 15.0, 6.0, 11.0, 5.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.9463412761688232, -3.8280091285705566, -3.709676742553711, -3.5913445949554443, -3.4730124473571777, -3.354680061340332, -3.2363479137420654, -3.118015766143799, -2.999683380126953, -2.8813512325286865, -2.763018846511841, -2.644686698913574, -2.5263545513153076, -2.408022403717041, -2.2896900177001953, -2.1713578701019287, -2.053025722503662, -1.934693455696106, -1.8163613080978394, -1.6980290412902832, -1.5796968936920166, -1.4613646268844604, -1.3430323600769043, -1.2247002124786377, -1.1063679456710815, -0.9880357384681702, -0.8697035312652588, -0.7513712644577026, -0.6330390572547913, -0.5147068500518799, -0.39637458324432373, -0.27804237604141235, -0.15971040725708008, -0.04137818515300751, 0.07695403695106506, 0.19528627395629883, 0.3136184811592102, 0.4319506883621216, 0.5502829551696777, 0.6686151623725891, 0.7869473695755005, 0.9052795767784119, 1.0236117839813232, 1.1419440507888794, 1.2602763175964355, 1.3786084651947021, 1.4969407320022583, 1.6152729988098145, 1.733605146408081, 1.8519374132156372, 1.9702695608139038, 2.08860182762146, 2.2069339752197266, 2.3252663612365723, 2.443598508834839, 2.5619306564331055, 2.680263042449951, 2.7985951900482178, 2.9169275760650635, 3.03525972366333, 3.1535918712615967, 3.2719240188598633, 3.390256404876709, 3.5085885524749756, 3.626920700073242]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 7.0, 8.0, 11.0, 10.0, 11.0, 15.0, 24.0, 36.0, 80.0, 113.0, 169.0, 284.0, 519.0, 899.0, 1967.0, 4200.0, 9806.0, 25283.0, 71125.0, 190495.0, 344867.0, 244884.0, 96073.0, 34166.0, 12854.0, 5362.0, 2552.0, 1237.0, 648.0, 308.0, 205.0, 123.0, 74.0, 52.0, 26.0, 25.0, 8.0, 12.0, 5.0, 7.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.4453125, -7.202392578125, -6.95947265625, -6.716552734375, -6.4736328125, -6.230712890625, -5.98779296875, -5.744873046875, -5.501953125, -5.259033203125, -5.01611328125, -4.773193359375, -4.5302734375, -4.287353515625, -4.04443359375, -3.801513671875, -3.55859375, -3.315673828125, -3.07275390625, -2.829833984375, -2.5869140625, -2.343994140625, -2.10107421875, -1.858154296875, -1.615234375, -1.372314453125, -1.12939453125, -0.886474609375, -0.6435546875, -0.400634765625, -0.15771484375, 0.085205078125, 0.328125, 0.571044921875, 0.81396484375, 1.056884765625, 1.2998046875, 1.542724609375, 1.78564453125, 2.028564453125, 2.271484375, 2.514404296875, 2.75732421875, 3.000244140625, 3.2431640625, 3.486083984375, 3.72900390625, 3.971923828125, 4.21484375, 4.457763671875, 4.70068359375, 4.943603515625, 5.1865234375, 5.429443359375, 5.67236328125, 5.915283203125, 6.158203125, 6.401123046875, 6.64404296875, 6.886962890625, 7.1298828125, 7.372802734375, 7.61572265625, 7.858642578125, 8.1015625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 8.0, 11.0, 11.0, 11.0, 15.0, 21.0, 23.0, 40.0, 39.0, 51.0, 44.0, 40.0, 60.0, 56.0, 65.0, 52.0, 67.0, 50.0, 57.0, 48.0, 41.0, 36.0, 33.0, 27.0, 23.0, 21.0, 20.0, 7.0, 11.0, 3.0, 3.0, 5.0, 3.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.146484375, -3.06170654296875, -2.9769287109375, -2.89215087890625, -2.807373046875, -2.72259521484375, -2.6378173828125, -2.55303955078125, -2.46826171875, -2.38348388671875, -2.2987060546875, -2.21392822265625, -2.129150390625, -2.04437255859375, -1.9595947265625, -1.87481689453125, -1.7900390625, -1.70526123046875, -1.6204833984375, -1.53570556640625, -1.450927734375, -1.36614990234375, -1.2813720703125, -1.19659423828125, -1.11181640625, -1.02703857421875, -0.9422607421875, -0.85748291015625, -0.772705078125, -0.68792724609375, -0.6031494140625, -0.51837158203125, -0.43359375, -0.34881591796875, -0.2640380859375, -0.17926025390625, -0.094482421875, -0.00970458984375, 0.0750732421875, 0.15985107421875, 0.24462890625, 0.32940673828125, 0.4141845703125, 0.49896240234375, 0.583740234375, 0.66851806640625, 0.7532958984375, 0.83807373046875, 0.9228515625, 1.00762939453125, 1.0924072265625, 1.17718505859375, 1.261962890625, 1.34674072265625, 1.4315185546875, 1.51629638671875, 1.60107421875, 1.68585205078125, 1.7706298828125, 1.85540771484375, 1.940185546875, 2.02496337890625, 2.1097412109375, 2.19451904296875, 2.279296875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 5.0, 4.0, 13.0, 13.0, 18.0, 20.0, 30.0, 26.0, 60.0, 88.0, 147.0, 260.0, 425.0, 870.0, 2154.0, 5452.0, 16344.0, 57638.0, 221954.0, 481767.0, 189274.0, 49395.0, 14061.0, 4739.0, 1952.0, 777.0, 440.0, 201.0, 151.0, 79.0, 60.0, 34.0, 41.0, 14.0, 17.0, 8.0, 8.0, 7.0, 6.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.2109375, -7.979248046875, -7.74755859375, -7.515869140625, -7.2841796875, -7.052490234375, -6.82080078125, -6.589111328125, -6.357421875, -6.125732421875, -5.89404296875, -5.662353515625, -5.4306640625, -5.198974609375, -4.96728515625, -4.735595703125, -4.50390625, -4.272216796875, -4.04052734375, -3.808837890625, -3.5771484375, -3.345458984375, -3.11376953125, -2.882080078125, -2.650390625, -2.418701171875, -2.18701171875, -1.955322265625, -1.7236328125, -1.491943359375, -1.26025390625, -1.028564453125, -0.796875, -0.565185546875, -0.33349609375, -0.101806640625, 0.1298828125, 0.361572265625, 0.59326171875, 0.824951171875, 1.056640625, 1.288330078125, 1.52001953125, 1.751708984375, 1.9833984375, 2.215087890625, 2.44677734375, 2.678466796875, 2.91015625, 3.141845703125, 3.37353515625, 3.605224609375, 3.8369140625, 4.068603515625, 4.30029296875, 4.531982421875, 4.763671875, 4.995361328125, 5.22705078125, 5.458740234375, 5.6904296875, 5.922119140625, 6.15380859375, 6.385498046875, 6.6171875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 7.0, 6.0, 4.0, 9.0, 8.0, 14.0, 13.0, 13.0, 22.0, 12.0, 21.0, 24.0, 26.0, 44.0, 41.0, 33.0, 45.0, 43.0, 50.0, 60.0, 50.0, 35.0, 47.0, 34.0, 41.0, 43.0, 35.0, 29.0, 31.0, 30.0, 24.0, 26.0, 19.0, 16.0, 10.0, 7.0, 7.0, 6.0, 3.0, 6.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.15625, -8.8564453125, -8.556640625, -8.2568359375, -7.95703125, -7.6572265625, -7.357421875, -7.0576171875, -6.7578125, -6.4580078125, -6.158203125, -5.8583984375, -5.55859375, -5.2587890625, -4.958984375, -4.6591796875, -4.359375, -4.0595703125, -3.759765625, -3.4599609375, -3.16015625, -2.8603515625, -2.560546875, -2.2607421875, -1.9609375, -1.6611328125, -1.361328125, -1.0615234375, -0.76171875, -0.4619140625, -0.162109375, 0.1376953125, 0.4375, 0.7373046875, 1.037109375, 1.3369140625, 1.63671875, 1.9365234375, 2.236328125, 2.5361328125, 2.8359375, 3.1357421875, 3.435546875, 3.7353515625, 4.03515625, 4.3349609375, 4.634765625, 4.9345703125, 5.234375, 5.5341796875, 5.833984375, 6.1337890625, 6.43359375, 6.7333984375, 7.033203125, 7.3330078125, 7.6328125, 7.9326171875, 8.232421875, 8.5322265625, 8.83203125, 9.1318359375, 9.431640625, 9.7314453125, 10.03125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 5.0, 3.0, 6.0, 11.0, 21.0, 18.0, 37.0, 63.0, 99.0, 188.0, 344.0, 733.0, 1808.0, 5531.0, 23419.0, 139969.0, 612612.0, 217737.0, 34465.0, 7445.0, 2219.0, 878.0, 410.0, 212.0, 121.0, 72.0, 43.0, 32.0, 17.0, 24.0, 5.0, 3.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.970703125, -3.831939697265625, -3.69317626953125, -3.554412841796875, -3.4156494140625, -3.276885986328125, -3.13812255859375, -2.999359130859375, -2.860595703125, -2.721832275390625, -2.58306884765625, -2.444305419921875, -2.3055419921875, -2.166778564453125, -2.02801513671875, -1.889251708984375, -1.75048828125, -1.611724853515625, -1.47296142578125, -1.334197998046875, -1.1954345703125, -1.056671142578125, -0.91790771484375, -0.779144287109375, -0.640380859375, -0.501617431640625, -0.36285400390625, -0.224090576171875, -0.0853271484375, 0.053436279296875, 0.19219970703125, 0.330963134765625, 0.4697265625, 0.608489990234375, 0.74725341796875, 0.886016845703125, 1.0247802734375, 1.163543701171875, 1.30230712890625, 1.441070556640625, 1.579833984375, 1.718597412109375, 1.85736083984375, 1.996124267578125, 2.1348876953125, 2.273651123046875, 2.41241455078125, 2.551177978515625, 2.68994140625, 2.828704833984375, 2.96746826171875, 3.106231689453125, 3.2449951171875, 3.383758544921875, 3.52252197265625, 3.661285400390625, 3.800048828125, 3.938812255859375, 4.07757568359375, 4.216339111328125, 4.3551025390625, 4.493865966796875, 4.63262939453125, 4.771392822265625, 4.91015625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 5.0, 6.0, 9.0, 14.0, 17.0, 14.0, 28.0, 26.0, 36.0, 58.0, 65.0, 58.0, 80.0, 75.0, 62.0, 71.0, 74.0, 57.0, 55.0, 25.0, 28.0, 32.0, 27.0, 14.0, 12.0, 12.0, 7.0, 7.0, 7.0, 2.0, 4.0, 2.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004916191101074219, -0.0004779547452926636, -0.0004642903804779053, -0.00045062601566314697, -0.00043696165084838867, -0.00042329728603363037, -0.00040963292121887207, -0.00039596855640411377, -0.00038230419158935547, -0.00036863982677459717, -0.00035497546195983887, -0.00034131109714508057, -0.00032764673233032227, -0.00031398236751556396, -0.00030031800270080566, -0.00028665363788604736, -0.00027298927307128906, -0.00025932490825653076, -0.00024566054344177246, -0.00023199617862701416, -0.00021833181381225586, -0.00020466744899749756, -0.00019100308418273926, -0.00017733871936798096, -0.00016367435455322266, -0.00015000998973846436, -0.00013634562492370605, -0.00012268126010894775, -0.00010901689529418945, -9.535253047943115e-05, -8.168816566467285e-05, -6.802380084991455e-05, -5.435943603515625e-05, -4.069507122039795e-05, -2.703070640563965e-05, -1.3366341590881348e-05, 2.980232238769531e-07, 1.3962388038635254e-05, 2.7626752853393555e-05, 4.1291117668151855e-05, 5.4955482482910156e-05, 6.861984729766846e-05, 8.228421211242676e-05, 9.594857692718506e-05, 0.00010961294174194336, 0.00012327730655670166, 0.00013694167137145996, 0.00015060603618621826, 0.00016427040100097656, 0.00017793476581573486, 0.00019159913063049316, 0.00020526349544525146, 0.00021892786026000977, 0.00023259222507476807, 0.00024625658988952637, 0.00025992095470428467, 0.00027358531951904297, 0.00028724968433380127, 0.00030091404914855957, 0.00031457841396331787, 0.00032824277877807617, 0.00034190714359283447, 0.0003555715084075928, 0.0003692358732223511, 0.0003829002380371094]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 8.0, 10.0, 13.0, 30.0, 47.0, 51.0, 133.0, 216.0, 411.0, 777.0, 2054.0, 6430.0, 27937.0, 162764.0, 597947.0, 203664.0, 34393.0, 7495.0, 2354.0, 876.0, 430.0, 208.0, 134.0, 65.0, 42.0, 21.0, 19.0, 13.0, 10.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0234375, -3.882568359375, -3.74169921875, -3.600830078125, -3.4599609375, -3.319091796875, -3.17822265625, -3.037353515625, -2.896484375, -2.755615234375, -2.61474609375, -2.473876953125, -2.3330078125, -2.192138671875, -2.05126953125, -1.910400390625, -1.76953125, -1.628662109375, -1.48779296875, -1.346923828125, -1.2060546875, -1.065185546875, -0.92431640625, -0.783447265625, -0.642578125, -0.501708984375, -0.36083984375, -0.219970703125, -0.0791015625, 0.061767578125, 0.20263671875, 0.343505859375, 0.484375, 0.625244140625, 0.76611328125, 0.906982421875, 1.0478515625, 1.188720703125, 1.32958984375, 1.470458984375, 1.611328125, 1.752197265625, 1.89306640625, 2.033935546875, 2.1748046875, 2.315673828125, 2.45654296875, 2.597412109375, 2.73828125, 2.879150390625, 3.02001953125, 3.160888671875, 3.3017578125, 3.442626953125, 3.58349609375, 3.724365234375, 3.865234375, 4.006103515625, 4.14697265625, 4.287841796875, 4.4287109375, 4.569580078125, 4.71044921875, 4.851318359375, 4.9921875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 5.0, 6.0, 13.0, 15.0, 20.0, 29.0, 51.0, 50.0, 74.0, 97.0, 124.0, 136.0, 124.0, 81.0, 60.0, 36.0, 36.0, 13.0, 15.0, 9.0, 7.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.97265625, -6.7784423828125, -6.584228515625, -6.3900146484375, -6.19580078125, -6.0015869140625, -5.807373046875, -5.6131591796875, -5.4189453125, -5.2247314453125, -5.030517578125, -4.8363037109375, -4.64208984375, -4.4478759765625, -4.253662109375, -4.0594482421875, -3.865234375, -3.6710205078125, -3.476806640625, -3.2825927734375, -3.08837890625, -2.8941650390625, -2.699951171875, -2.5057373046875, -2.3115234375, -2.1173095703125, -1.923095703125, -1.7288818359375, -1.53466796875, -1.3404541015625, -1.146240234375, -0.9520263671875, -0.7578125, -0.5635986328125, -0.369384765625, -0.1751708984375, 0.01904296875, 0.2132568359375, 0.407470703125, 0.6016845703125, 0.7958984375, 0.9901123046875, 1.184326171875, 1.3785400390625, 1.57275390625, 1.7669677734375, 1.961181640625, 2.1553955078125, 2.349609375, 2.5438232421875, 2.738037109375, 2.9322509765625, 3.12646484375, 3.3206787109375, 3.514892578125, 3.7091064453125, 3.9033203125, 4.0975341796875, 4.291748046875, 4.4859619140625, 4.68017578125, 4.8743896484375, 5.068603515625, 5.2628173828125, 5.45703125]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 8.0, 8.0, 18.0, 74.0, 148.0, 233.0, 246.0, 148.0, 77.0, 27.0, 16.0, 7.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-148.45730590820312, -144.5316619873047, -140.6060333251953, -136.68038940429688, -132.75474548339844, -128.8291015625, -124.90347290039062, -120.97782897949219, -117.05219268798828, -113.12655639648438, -109.20091247558594, -105.27527618408203, -101.3496322631836, -97.42399597167969, -93.49835205078125, -89.57271575927734, -85.64707946777344, -81.72144317626953, -77.7957992553711, -73.87016296386719, -69.94451904296875, -66.01888275146484, -62.09324264526367, -58.1676025390625, -54.24195861816406, -50.31631851196289, -46.39067840576172, -42.46504211425781, -38.53940200805664, -34.61376190185547, -30.688121795654297, -26.762483596801758, -22.83684539794922, -18.911205291748047, -14.985567092895508, -11.059926986694336, -7.1342878341674805, -3.208648681640625, 0.7169914245605469, 4.642629623413086, 8.568269729614258, 12.493908882141113, 16.41954803466797, 20.34518814086914, 24.270828247070312, 28.19646644592285, 32.122108459472656, 36.04774475097656, 39.973384857177734, 43.899024963378906, 47.82466506958008, 51.75030517578125, 55.675941467285156, 59.60158157348633, 63.5272216796875, 67.4528579711914, 71.37850189208984, 75.30413818359375, 79.22978210449219, 83.1554183959961, 87.08106231689453, 91.00669860839844, 94.93234252929688, 98.85797882080078, 102.78361511230469]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 4.0, 2.0, 2.0, 6.0, 9.0, 9.0, 9.0, 6.0, 11.0, 10.0, 13.0, 19.0, 24.0, 18.0, 19.0, 22.0, 26.0, 19.0, 22.0, 36.0, 44.0, 43.0, 36.0, 45.0, 36.0, 39.0, 45.0, 45.0, 46.0, 38.0, 32.0, 34.0, 30.0, 14.0, 29.0, 25.0, 21.0, 22.0, 14.0, 16.0, 12.0, 15.0, 6.0, 10.0, 6.0, 4.0, 1.0, 4.0, 4.0, 1.0, 3.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 2.0], "bins": [-42.31019592285156, -40.9565544128418, -39.6029167175293, -38.24927520751953, -36.895633697509766, -35.5419921875, -34.1883544921875, -32.834712982177734, -31.4810733795166, -30.12743377685547, -28.773792266845703, -27.42015266418457, -26.066513061523438, -24.712871551513672, -23.35923194885254, -22.005592346191406, -20.65195083618164, -19.298311233520508, -17.944669723510742, -16.59103012084961, -15.23738956451416, -13.883749008178711, -12.530109405517578, -11.176468849182129, -9.82282829284668, -8.46918773651123, -7.1155476570129395, -5.761907577514648, -4.408267021179199, -3.05462646484375, -1.7009868621826172, -0.34734630584716797, 1.0062942504882812, 2.3599345684051514, 3.7135748863220215, 5.0672149658203125, 6.420855522155762, 7.774496078491211, 9.128135681152344, 10.481776237487793, 11.835416793823242, 13.189057350158691, 14.54269790649414, 15.896337509155273, 17.249977111816406, 18.603618621826172, 19.957258224487305, 21.310897827148438, 22.664539337158203, 24.018178939819336, 25.3718204498291, 26.725460052490234, 28.0791015625, 29.432741165161133, 30.786380767822266, 32.14002227783203, 33.49365997314453, 34.8473014831543, 36.2009391784668, 37.55458068847656, 38.90822219848633, 40.261863708496094, 41.615501403808594, 42.96914291381836, 44.322784423828125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 6.0, 0.0, 8.0, 8.0, 5.0, 6.0, 11.0, 24.0, 35.0, 52.0, 90.0, 155.0, 233.0, 447.0, 1013.0, 2596.0, 9282.0, 72375.0, 4016445.0, 77185.0, 9662.0, 2535.0, 1013.0, 494.0, 238.0, 135.0, 88.0, 51.0, 30.0, 21.0, 19.0, 9.0, 8.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.578125, -18.095703125, -17.61328125, -17.130859375, -16.6484375, -16.166015625, -15.68359375, -15.201171875, -14.71875, -14.236328125, -13.75390625, -13.271484375, -12.7890625, -12.306640625, -11.82421875, -11.341796875, -10.859375, -10.376953125, -9.89453125, -9.412109375, -8.9296875, -8.447265625, -7.96484375, -7.482421875, -7.0, -6.517578125, -6.03515625, -5.552734375, -5.0703125, -4.587890625, -4.10546875, -3.623046875, -3.140625, -2.658203125, -2.17578125, -1.693359375, -1.2109375, -0.728515625, -0.24609375, 0.236328125, 0.71875, 1.201171875, 1.68359375, 2.166015625, 2.6484375, 3.130859375, 3.61328125, 4.095703125, 4.578125, 5.060546875, 5.54296875, 6.025390625, 6.5078125, 6.990234375, 7.47265625, 7.955078125, 8.4375, 8.919921875, 9.40234375, 9.884765625, 10.3671875, 10.849609375, 11.33203125, 11.814453125, 12.296875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 5.0, 7.0, 8.0, 17.0, 9.0, 17.0, 19.0, 22.0, 38.0, 41.0, 38.0, 52.0, 58.0, 53.0, 80.0, 66.0, 51.0, 44.0, 69.0, 45.0, 40.0, 33.0, 44.0, 34.0, 20.0, 24.0, 13.0, 10.0, 9.0, 10.0, 6.0, 7.0, 4.0, 7.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.13671875, -3.04400634765625, -2.9512939453125, -2.85858154296875, -2.765869140625, -2.67315673828125, -2.5804443359375, -2.48773193359375, -2.39501953125, -2.30230712890625, -2.2095947265625, -2.11688232421875, -2.024169921875, -1.93145751953125, -1.8387451171875, -1.74603271484375, -1.6533203125, -1.56060791015625, -1.4678955078125, -1.37518310546875, -1.282470703125, -1.18975830078125, -1.0970458984375, -1.00433349609375, -0.91162109375, -0.81890869140625, -0.7261962890625, -0.63348388671875, -0.540771484375, -0.44805908203125, -0.3553466796875, -0.26263427734375, -0.169921875, -0.07720947265625, 0.0155029296875, 0.10821533203125, 0.200927734375, 0.29364013671875, 0.3863525390625, 0.47906494140625, 0.57177734375, 0.66448974609375, 0.7572021484375, 0.84991455078125, 0.942626953125, 1.03533935546875, 1.1280517578125, 1.22076416015625, 1.3134765625, 1.40618896484375, 1.4989013671875, 1.59161376953125, 1.684326171875, 1.77703857421875, 1.8697509765625, 1.96246337890625, 2.05517578125, 2.14788818359375, 2.2406005859375, 2.33331298828125, 2.426025390625, 2.51873779296875, 2.6114501953125, 2.70416259765625, 2.796875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 9.0, 2.0, 8.0, 9.0, 14.0, 11.0, 25.0, 27.0, 46.0, 58.0, 56.0, 105.0, 160.0, 284.0, 386.0, 608.0, 960.0, 1883.0, 3789.0, 9386.0, 28975.0, 147394.0, 3737330.0, 207134.0, 35545.0, 10656.0, 4269.0, 2056.0, 1110.0, 645.0, 430.0, 251.0, 203.0, 131.0, 100.0, 62.0, 49.0, 36.0, 21.0, 7.0, 14.0, 11.0, 7.0, 8.0, 4.0, 4.0, 4.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0], "bins": [-7.12890625, -6.91656494140625, -6.7042236328125, -6.49188232421875, -6.279541015625, -6.06719970703125, -5.8548583984375, -5.64251708984375, -5.43017578125, -5.21783447265625, -5.0054931640625, -4.79315185546875, -4.580810546875, -4.36846923828125, -4.1561279296875, -3.94378662109375, -3.7314453125, -3.51910400390625, -3.3067626953125, -3.09442138671875, -2.882080078125, -2.66973876953125, -2.4573974609375, -2.24505615234375, -2.03271484375, -1.82037353515625, -1.6080322265625, -1.39569091796875, -1.183349609375, -0.97100830078125, -0.7586669921875, -0.54632568359375, -0.333984375, -0.12164306640625, 0.0906982421875, 0.30303955078125, 0.515380859375, 0.72772216796875, 0.9400634765625, 1.15240478515625, 1.36474609375, 1.57708740234375, 1.7894287109375, 2.00177001953125, 2.214111328125, 2.42645263671875, 2.6387939453125, 2.85113525390625, 3.0634765625, 3.27581787109375, 3.4881591796875, 3.70050048828125, 3.912841796875, 4.12518310546875, 4.3375244140625, 4.54986572265625, 4.76220703125, 4.97454833984375, 5.1868896484375, 5.39923095703125, 5.611572265625, 5.82391357421875, 6.0362548828125, 6.24859619140625, 6.4609375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 1.0, 5.0, 1.0, 3.0, 10.0, 16.0, 35.0, 29.0, 73.0, 150.0, 547.0, 2706.0, 250.0, 105.0, 43.0, 30.0, 24.0, 16.0, 9.0, 6.0, 4.0, 4.0, 4.0, 0.0, 1.0, 2.0, 1.0, 3.0], "bins": [-3.1015625, -3.035888671875, -2.97021484375, -2.904541015625, -2.8388671875, -2.773193359375, -2.70751953125, -2.641845703125, -2.576171875, -2.510498046875, -2.44482421875, -2.379150390625, -2.3134765625, -2.247802734375, -2.18212890625, -2.116455078125, -2.05078125, -1.985107421875, -1.91943359375, -1.853759765625, -1.7880859375, -1.722412109375, -1.65673828125, -1.591064453125, -1.525390625, -1.459716796875, -1.39404296875, -1.328369140625, -1.2626953125, -1.197021484375, -1.13134765625, -1.065673828125, -1.0, -0.934326171875, -0.86865234375, -0.802978515625, -0.7373046875, -0.671630859375, -0.60595703125, -0.540283203125, -0.474609375, -0.408935546875, -0.34326171875, -0.277587890625, -0.2119140625, -0.146240234375, -0.08056640625, -0.014892578125, 0.05078125, 0.116455078125, 0.18212890625, 0.247802734375, 0.3134765625, 0.379150390625, 0.44482421875, 0.510498046875, 0.576171875, 0.641845703125, 0.70751953125, 0.773193359375, 0.8388671875, 0.904541015625, 0.97021484375, 1.035888671875, 1.1015625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 1.0, 19.0, 36.0, 97.0, 208.0, 248.0, 220.0, 111.0, 42.0, 20.0, 6.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-31.860515594482422, -31.24277687072754, -30.625038146972656, -30.007299423217773, -29.38956069946289, -28.771821975708008, -28.154083251953125, -27.536346435546875, -26.91860580444336, -26.300867080688477, -25.683128356933594, -25.06538963317871, -24.447650909423828, -23.829912185668945, -23.212173461914062, -22.594436645507812, -21.97669792175293, -21.358959197998047, -20.741220474243164, -20.12348175048828, -19.5057430267334, -18.888004302978516, -18.270265579223633, -17.65252685546875, -17.0347900390625, -16.417051315307617, -15.799312591552734, -15.181573867797852, -14.563835144042969, -13.946096420288086, -13.32835865020752, -12.710619926452637, -12.092878341674805, -11.475139617919922, -10.857400894165039, -10.239662170410156, -9.621923446655273, -9.00418472290039, -8.386446952819824, -7.768708229064941, -7.150969505310059, -6.533230781555176, -5.915492057800293, -5.297753810882568, -4.6800150871276855, -4.062276363372803, -3.444537878036499, -2.8267993927001953, -2.2090606689453125, -1.5913220643997192, -0.973583459854126, -0.3558448553085327, 0.26189374923706055, 0.8796324729919434, 1.497370958328247, 2.115109443664551, 2.7328481674194336, 3.3505868911743164, 3.96832537651062, 4.586063861846924, 5.203802585601807, 5.8215413093566895, 6.439279556274414, 7.057018280029297, 7.67475700378418]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 4.0, 10.0, 4.0, 11.0, 10.0, 16.0, 18.0, 27.0, 32.0, 29.0, 41.0, 43.0, 49.0, 43.0, 55.0, 50.0, 65.0, 70.0, 64.0, 45.0, 38.0, 37.0, 39.0, 38.0, 38.0, 25.0, 19.0, 25.0, 15.0, 14.0, 8.0, 5.0, 10.0, 1.0, 4.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.079209327697754, -6.895724296569824, -6.7122392654418945, -6.528754234313965, -6.345269203186035, -6.1617841720581055, -5.978299140930176, -5.794814109802246, -5.611329078674316, -5.427844047546387, -5.244359016418457, -5.060873985290527, -4.877388954162598, -4.693903923034668, -4.510418891906738, -4.326933860778809, -4.143448829650879, -3.959963798522949, -3.7764787673950195, -3.59299373626709, -3.40950870513916, -3.2260236740112305, -3.042538642883301, -2.859053611755371, -2.6755685806274414, -2.4920835494995117, -2.308598518371582, -2.1251134872436523, -1.9416284561157227, -1.758143424987793, -1.5746583938598633, -1.3911733627319336, -1.2076878547668457, -1.024202823638916, -0.8407177925109863, -0.6572327613830566, -0.47374773025512695, -0.29026269912719727, -0.10677766799926758, 0.07670736312866211, 0.2601923942565918, 0.4436774253845215, 0.6271624565124512, 0.8106474876403809, 0.9941325187683105, 1.1776175498962402, 1.36110258102417, 1.5445876121520996, 1.7280726432800293, 1.911557674407959, 2.0950427055358887, 2.2785277366638184, 2.462012767791748, 2.6454977989196777, 2.8289828300476074, 3.012467861175537, 3.195952892303467, 3.3794379234313965, 3.562922954559326, 3.746407985687256, 3.9298930168151855, 4.113378047943115, 4.296863079071045, 4.480348110198975, 4.663833141326904]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 6.0, 7.0, 10.0, 21.0, 28.0, 37.0, 75.0, 141.0, 331.0, 710.0, 1698.0, 5086.0, 18669.0, 89074.0, 413212.0, 406395.0, 86325.0, 18802.0, 4998.0, 1619.0, 683.0, 291.0, 141.0, 83.0, 53.0, 23.0, 21.0, 9.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.7265625, -11.4007568359375, -11.074951171875, -10.7491455078125, -10.42333984375, -10.0975341796875, -9.771728515625, -9.4459228515625, -9.1201171875, -8.7943115234375, -8.468505859375, -8.1427001953125, -7.81689453125, -7.4910888671875, -7.165283203125, -6.8394775390625, -6.513671875, -6.1878662109375, -5.862060546875, -5.5362548828125, -5.21044921875, -4.8846435546875, -4.558837890625, -4.2330322265625, -3.9072265625, -3.5814208984375, -3.255615234375, -2.9298095703125, -2.60400390625, -2.2781982421875, -1.952392578125, -1.6265869140625, -1.30078125, -0.9749755859375, -0.649169921875, -0.3233642578125, 0.00244140625, 0.3282470703125, 0.654052734375, 0.9798583984375, 1.3056640625, 1.6314697265625, 1.957275390625, 2.2830810546875, 2.60888671875, 2.9346923828125, 3.260498046875, 3.5863037109375, 3.912109375, 4.2379150390625, 4.563720703125, 4.8895263671875, 5.21533203125, 5.5411376953125, 5.866943359375, 6.1927490234375, 6.5185546875, 6.8443603515625, 7.170166015625, 7.4959716796875, 7.82177734375, 8.1475830078125, 8.473388671875, 8.7991943359375, 9.125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 2.0, 7.0, 4.0, 8.0, 5.0, 10.0, 14.0, 21.0, 19.0, 24.0, 30.0, 41.0, 58.0, 50.0, 46.0, 53.0, 54.0, 56.0, 63.0, 63.0, 58.0, 43.0, 39.0, 40.0, 41.0, 25.0, 26.0, 25.0, 10.0, 11.0, 11.0, 19.0, 4.0, 3.0, 6.0, 9.0, 7.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.177734375, -3.08697509765625, -2.9962158203125, -2.90545654296875, -2.814697265625, -2.72393798828125, -2.6331787109375, -2.54241943359375, -2.45166015625, -2.36090087890625, -2.2701416015625, -2.17938232421875, -2.088623046875, -1.99786376953125, -1.9071044921875, -1.81634521484375, -1.7255859375, -1.63482666015625, -1.5440673828125, -1.45330810546875, -1.362548828125, -1.27178955078125, -1.1810302734375, -1.09027099609375, -0.99951171875, -0.90875244140625, -0.8179931640625, -0.72723388671875, -0.636474609375, -0.54571533203125, -0.4549560546875, -0.36419677734375, -0.2734375, -0.18267822265625, -0.0919189453125, -0.00115966796875, 0.089599609375, 0.18035888671875, 0.2711181640625, 0.36187744140625, 0.45263671875, 0.54339599609375, 0.6341552734375, 0.72491455078125, 0.815673828125, 0.90643310546875, 0.9971923828125, 1.08795166015625, 1.1787109375, 1.26947021484375, 1.3602294921875, 1.45098876953125, 1.541748046875, 1.63250732421875, 1.7232666015625, 1.81402587890625, 1.90478515625, 1.99554443359375, 2.0863037109375, 2.17706298828125, 2.267822265625, 2.35858154296875, 2.4493408203125, 2.54010009765625, 2.630859375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 1.0, 7.0, 8.0, 7.0, 20.0, 23.0, 33.0, 31.0, 66.0, 111.0, 173.0, 275.0, 529.0, 850.0, 1624.0, 3412.0, 8156.0, 22351.0, 74040.0, 279778.0, 454871.0, 140191.0, 38751.0, 12966.0, 5175.0, 2343.0, 1179.0, 592.0, 337.0, 256.0, 116.0, 90.0, 57.0, 39.0, 23.0, 23.0, 22.0, 8.0, 3.0, 6.0, 4.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.09375, -6.8924560546875, -6.691162109375, -6.4898681640625, -6.28857421875, -6.0872802734375, -5.885986328125, -5.6846923828125, -5.4833984375, -5.2821044921875, -5.080810546875, -4.8795166015625, -4.67822265625, -4.4769287109375, -4.275634765625, -4.0743408203125, -3.873046875, -3.6717529296875, -3.470458984375, -3.2691650390625, -3.06787109375, -2.8665771484375, -2.665283203125, -2.4639892578125, -2.2626953125, -2.0614013671875, -1.860107421875, -1.6588134765625, -1.45751953125, -1.2562255859375, -1.054931640625, -0.8536376953125, -0.65234375, -0.4510498046875, -0.249755859375, -0.0484619140625, 0.15283203125, 0.3541259765625, 0.555419921875, 0.7567138671875, 0.9580078125, 1.1593017578125, 1.360595703125, 1.5618896484375, 1.76318359375, 1.9644775390625, 2.165771484375, 2.3670654296875, 2.568359375, 2.7696533203125, 2.970947265625, 3.1722412109375, 3.37353515625, 3.5748291015625, 3.776123046875, 3.9774169921875, 4.1787109375, 4.3800048828125, 4.581298828125, 4.7825927734375, 4.98388671875, 5.1851806640625, 5.386474609375, 5.5877685546875, 5.7890625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 6.0, 5.0, 5.0, 1.0, 2.0, 4.0, 11.0, 8.0, 7.0, 18.0, 40.0, 25.0, 25.0, 33.0, 35.0, 44.0, 45.0, 40.0, 53.0, 42.0, 62.0, 49.0, 55.0, 54.0, 42.0, 37.0, 40.0, 40.0, 34.0, 26.0, 32.0, 19.0, 13.0, 10.0, 8.0, 11.0, 9.0, 5.0, 1.0, 5.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.1484375, -11.76708984375, -11.3857421875, -11.00439453125, -10.623046875, -10.24169921875, -9.8603515625, -9.47900390625, -9.09765625, -8.71630859375, -8.3349609375, -7.95361328125, -7.572265625, -7.19091796875, -6.8095703125, -6.42822265625, -6.046875, -5.66552734375, -5.2841796875, -4.90283203125, -4.521484375, -4.14013671875, -3.7587890625, -3.37744140625, -2.99609375, -2.61474609375, -2.2333984375, -1.85205078125, -1.470703125, -1.08935546875, -0.7080078125, -0.32666015625, 0.0546875, 0.43603515625, 0.8173828125, 1.19873046875, 1.580078125, 1.96142578125, 2.3427734375, 2.72412109375, 3.10546875, 3.48681640625, 3.8681640625, 4.24951171875, 4.630859375, 5.01220703125, 5.3935546875, 5.77490234375, 6.15625, 6.53759765625, 6.9189453125, 7.30029296875, 7.681640625, 8.06298828125, 8.4443359375, 8.82568359375, 9.20703125, 9.58837890625, 9.9697265625, 10.35107421875, 10.732421875, 11.11376953125, 11.4951171875, 11.87646484375, 12.2578125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 9.0, 5.0, 13.0, 14.0, 20.0, 41.0, 66.0, 114.0, 249.0, 629.0, 2165.0, 12237.0, 149277.0, 793988.0, 79175.0, 7955.0, 1653.0, 474.0, 195.0, 100.0, 58.0, 35.0, 27.0, 16.0, 6.0, 12.0, 5.0, 4.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.578125, -8.35467529296875, -8.1312255859375, -7.90777587890625, -7.684326171875, -7.46087646484375, -7.2374267578125, -7.01397705078125, -6.79052734375, -6.56707763671875, -6.3436279296875, -6.12017822265625, -5.896728515625, -5.67327880859375, -5.4498291015625, -5.22637939453125, -5.0029296875, -4.77947998046875, -4.5560302734375, -4.33258056640625, -4.109130859375, -3.88568115234375, -3.6622314453125, -3.43878173828125, -3.21533203125, -2.99188232421875, -2.7684326171875, -2.54498291015625, -2.321533203125, -2.09808349609375, -1.8746337890625, -1.65118408203125, -1.427734375, -1.20428466796875, -0.9808349609375, -0.75738525390625, -0.533935546875, -0.31048583984375, -0.0870361328125, 0.13641357421875, 0.35986328125, 0.58331298828125, 0.8067626953125, 1.03021240234375, 1.253662109375, 1.47711181640625, 1.7005615234375, 1.92401123046875, 2.1474609375, 2.37091064453125, 2.5943603515625, 2.81781005859375, 3.041259765625, 3.26470947265625, 3.4881591796875, 3.71160888671875, 3.93505859375, 4.15850830078125, 4.3819580078125, 4.60540771484375, 4.828857421875, 5.05230712890625, 5.2757568359375, 5.49920654296875, 5.72265625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 10.0, 11.0, 11.0, 17.0, 18.0, 28.0, 45.0, 43.0, 74.0, 90.0, 104.0, 94.0, 120.0, 72.0, 67.0, 40.0, 57.0, 30.0, 12.0, 14.0, 12.0, 8.0, 9.0, 3.0, 1.0, 7.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.000652313232421875, -0.0006333962082862854, -0.0006144791841506958, -0.0005955621600151062, -0.0005766451358795166, -0.000557728111743927, -0.0005388110876083374, -0.0005198940634727478, -0.0005009770393371582, -0.0004820600152015686, -0.000463142991065979, -0.0004442259669303894, -0.0004253089427947998, -0.0004063919186592102, -0.0003874748945236206, -0.000368557870388031, -0.0003496408462524414, -0.0003307238221168518, -0.0003118067979812622, -0.0002928897738456726, -0.000273972749710083, -0.0002550557255744934, -0.0002361387014389038, -0.0002172216773033142, -0.0001983046531677246, -0.000179387629032135, -0.0001604706048965454, -0.0001415535807609558, -0.0001226365566253662, -0.00010371953248977661, -8.480250835418701e-05, -6.588548421859741e-05, -4.696846008300781e-05, -2.8051435947418213e-05, -9.134411811828613e-06, 9.782612323760986e-06, 2.8699636459350586e-05, 4.7616660594940186e-05, 6.653368473052979e-05, 8.545070886611938e-05, 0.00010436773300170898, 0.00012328475713729858, 0.00014220178127288818, 0.00016111880540847778, 0.00018003582954406738, 0.00019895285367965698, 0.00021786987781524658, 0.00023678690195083618, 0.0002557039260864258, 0.0002746209502220154, 0.000293537974357605, 0.0003124549984931946, 0.0003313720226287842, 0.0003502890467643738, 0.0003692060708999634, 0.000388123095035553, 0.0004070401191711426, 0.0004259571433067322, 0.0004448741674423218, 0.0004637911915779114, 0.000482708215713501, 0.0005016252398490906, 0.0005205422639846802, 0.0005394592881202698, 0.0005583763122558594]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 6.0, 7.0, 5.0, 17.0, 25.0, 20.0, 35.0, 48.0, 71.0, 118.0, 199.0, 356.0, 735.0, 1992.0, 7377.0, 49509.0, 560870.0, 385069.0, 33411.0, 5601.0, 1622.0, 684.0, 294.0, 177.0, 107.0, 60.0, 31.0, 30.0, 22.0, 14.0, 9.0, 5.0, 10.0, 4.0, 2.0, 3.0, 0.0, 1.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-6.2421875, -6.04656982421875, -5.8509521484375, -5.65533447265625, -5.459716796875, -5.26409912109375, -5.0684814453125, -4.87286376953125, -4.67724609375, -4.48162841796875, -4.2860107421875, -4.09039306640625, -3.894775390625, -3.69915771484375, -3.5035400390625, -3.30792236328125, -3.1123046875, -2.91668701171875, -2.7210693359375, -2.52545166015625, -2.329833984375, -2.13421630859375, -1.9385986328125, -1.74298095703125, -1.54736328125, -1.35174560546875, -1.1561279296875, -0.96051025390625, -0.764892578125, -0.56927490234375, -0.3736572265625, -0.17803955078125, 0.017578125, 0.21319580078125, 0.4088134765625, 0.60443115234375, 0.800048828125, 0.99566650390625, 1.1912841796875, 1.38690185546875, 1.58251953125, 1.77813720703125, 1.9737548828125, 2.16937255859375, 2.364990234375, 2.56060791015625, 2.7562255859375, 2.95184326171875, 3.1474609375, 3.34307861328125, 3.5386962890625, 3.73431396484375, 3.929931640625, 4.12554931640625, 4.3211669921875, 4.51678466796875, 4.71240234375, 4.90802001953125, 5.1036376953125, 5.29925537109375, 5.494873046875, 5.69049072265625, 5.8861083984375, 6.08172607421875, 6.27734375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 8.0, 7.0, 14.0, 18.0, 55.0, 95.0, 142.0, 179.0, 153.0, 127.0, 95.0, 58.0, 28.0, 15.0, 9.0, 7.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.140625, -8.8641357421875, -8.587646484375, -8.3111572265625, -8.03466796875, -7.7581787109375, -7.481689453125, -7.2052001953125, -6.9287109375, -6.6522216796875, -6.375732421875, -6.0992431640625, -5.82275390625, -5.5462646484375, -5.269775390625, -4.9932861328125, -4.716796875, -4.4403076171875, -4.163818359375, -3.8873291015625, -3.61083984375, -3.3343505859375, -3.057861328125, -2.7813720703125, -2.5048828125, -2.2283935546875, -1.951904296875, -1.6754150390625, -1.39892578125, -1.1224365234375, -0.845947265625, -0.5694580078125, -0.29296875, -0.0164794921875, 0.260009765625, 0.5364990234375, 0.81298828125, 1.0894775390625, 1.365966796875, 1.6424560546875, 1.9189453125, 2.1954345703125, 2.471923828125, 2.7484130859375, 3.02490234375, 3.3013916015625, 3.577880859375, 3.8543701171875, 4.130859375, 4.4073486328125, 4.683837890625, 4.9603271484375, 5.23681640625, 5.5133056640625, 5.789794921875, 6.0662841796875, 6.3427734375, 6.6192626953125, 6.895751953125, 7.1722412109375, 7.44873046875, 7.7252197265625, 8.001708984375, 8.2781982421875, 8.5546875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 6.0, 22.0, 43.0, 182.0, 298.0, 248.0, 136.0, 48.0, 13.0, 7.0, 2.0, 2.0, 5.0, 1.0, 1.0], "bins": [-263.59991455078125, -258.6690673828125, -253.73825073242188, -248.8074188232422, -243.8765869140625, -238.94573974609375, -234.01492309570312, -229.08407592773438, -224.1532440185547, -219.222412109375, -214.2915802001953, -209.36074829101562, -204.42991638183594, -199.49908447265625, -194.5682373046875, -189.6374053955078, -184.70657348632812, -179.77574157714844, -174.84490966796875, -169.91407775878906, -164.98324584960938, -160.05239868164062, -155.12158203125, -150.19073486328125, -145.25991821289062, -140.32908630371094, -135.39825439453125, -130.46742248535156, -125.53658294677734, -120.60575103759766, -115.67491912841797, -110.74407958984375, -105.81324768066406, -100.88241577148438, -95.95158386230469, -91.020751953125, -86.08991241455078, -81.1590805053711, -76.2282485961914, -71.29740905761719, -66.36658477783203, -61.435752868652344, -56.50491714477539, -51.5740852355957, -46.64324951171875, -41.71241760253906, -36.781585693359375, -31.850749969482422, -26.919918060302734, -21.989084243774414, -17.058250427246094, -12.127418518066406, -7.196584701538086, -2.2657508850097656, 2.665081024169922, 7.595916748046875, 12.526748657226562, 17.457582473754883, 22.388416290283203, 27.31924819946289, 32.250083923339844, 37.18091583251953, 42.11174774169922, 47.04258346557617, 51.97341537475586]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 1.0, 6.0, 6.0, 8.0, 7.0, 10.0, 17.0, 8.0, 19.0, 17.0, 17.0, 20.0, 16.0, 20.0, 31.0, 37.0, 46.0, 28.0, 36.0, 41.0, 41.0, 46.0, 66.0, 47.0, 40.0, 46.0, 38.0, 32.0, 36.0, 32.0, 34.0, 27.0, 20.0, 20.0, 13.0, 13.0, 12.0, 6.0, 9.0, 9.0, 5.0, 3.0, 4.0, 4.0, 4.0, 2.0, 6.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.58829879760742, -51.93267822265625, -50.27705764770508, -48.621437072753906, -46.9658203125, -45.31019973754883, -43.654579162597656, -41.998958587646484, -40.34333801269531, -38.68771743774414, -37.03209686279297, -35.37648010253906, -33.72085952758789, -32.06523895263672, -30.409618377685547, -28.753997802734375, -27.09838104248047, -25.442760467529297, -23.787141799926758, -22.131521224975586, -20.475902557373047, -18.820281982421875, -17.164661407470703, -15.509041786193848, -13.853422164916992, -12.197802543640137, -10.542182922363281, -8.88656234741211, -7.230942726135254, -5.575323104858398, -3.9197025299072266, -2.264082908630371, -0.60845947265625, 1.0471603870391846, 2.702780246734619, 4.358400344848633, 6.014019966125488, 7.669639587402344, 9.325260162353516, 10.980879783630371, 12.636499404907227, 14.292119026184082, 15.947738647460938, 17.60335922241211, 19.25897979736328, 20.91459846496582, 22.570219039916992, 24.22583770751953, 25.881458282470703, 27.537078857421875, 29.192697525024414, 30.848318099975586, 32.503936767578125, 34.1595573425293, 35.81517791748047, 37.47079849243164, 39.12641906738281, 40.782039642333984, 42.437660217285156, 44.09327697753906, 45.748897552490234, 47.404518127441406, 49.06013870239258, 50.71575927734375, 52.371376037597656]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 1.0, 9.0, 1.0, 5.0, 4.0, 6.0, 11.0, 10.0, 26.0, 21.0, 45.0, 93.0, 150.0, 267.0, 573.0, 1236.0, 3414.0, 14815.0, 3794354.0, 361048.0, 12636.0, 3115.0, 1162.0, 570.0, 290.0, 178.0, 95.0, 53.0, 29.0, 18.0, 16.0, 13.0, 10.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-26.0, -25.394775390625, -24.78955078125, -24.184326171875, -23.5791015625, -22.973876953125, -22.36865234375, -21.763427734375, -21.158203125, -20.552978515625, -19.94775390625, -19.342529296875, -18.7373046875, -18.132080078125, -17.52685546875, -16.921630859375, -16.31640625, -15.711181640625, -15.10595703125, -14.500732421875, -13.8955078125, -13.290283203125, -12.68505859375, -12.079833984375, -11.474609375, -10.869384765625, -10.26416015625, -9.658935546875, -9.0537109375, -8.448486328125, -7.84326171875, -7.238037109375, -6.6328125, -6.027587890625, -5.42236328125, -4.817138671875, -4.2119140625, -3.606689453125, -3.00146484375, -2.396240234375, -1.791015625, -1.185791015625, -0.58056640625, 0.024658203125, 0.6298828125, 1.235107421875, 1.84033203125, 2.445556640625, 3.05078125, 3.656005859375, 4.26123046875, 4.866455078125, 5.4716796875, 6.076904296875, 6.68212890625, 7.287353515625, 7.892578125, 8.497802734375, 9.10302734375, 9.708251953125, 10.3134765625, 10.918701171875, 11.52392578125, 12.129150390625, 12.734375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 4.0, 2.0, 7.0, 4.0, 7.0, 15.0, 4.0, 16.0, 16.0, 17.0, 16.0, 24.0, 40.0, 47.0, 45.0, 41.0, 43.0, 48.0, 43.0, 48.0, 48.0, 52.0, 43.0, 45.0, 35.0, 40.0, 35.0, 29.0, 23.0, 23.0, 27.0, 21.0, 11.0, 11.0, 12.0, 15.0, 10.0, 7.0, 10.0, 3.0, 3.0, 3.0, 6.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-3.119140625, -3.03076171875, -2.9423828125, -2.85400390625, -2.765625, -2.67724609375, -2.5888671875, -2.50048828125, -2.412109375, -2.32373046875, -2.2353515625, -2.14697265625, -2.05859375, -1.97021484375, -1.8818359375, -1.79345703125, -1.705078125, -1.61669921875, -1.5283203125, -1.43994140625, -1.3515625, -1.26318359375, -1.1748046875, -1.08642578125, -0.998046875, -0.90966796875, -0.8212890625, -0.73291015625, -0.64453125, -0.55615234375, -0.4677734375, -0.37939453125, -0.291015625, -0.20263671875, -0.1142578125, -0.02587890625, 0.0625, 0.15087890625, 0.2392578125, 0.32763671875, 0.416015625, 0.50439453125, 0.5927734375, 0.68115234375, 0.76953125, 0.85791015625, 0.9462890625, 1.03466796875, 1.123046875, 1.21142578125, 1.2998046875, 1.38818359375, 1.4765625, 1.56494140625, 1.6533203125, 1.74169921875, 1.830078125, 1.91845703125, 2.0068359375, 2.09521484375, 2.18359375, 2.27197265625, 2.3603515625, 2.44873046875, 2.537109375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 2.0, 1.0, 8.0, 6.0, 7.0, 9.0, 8.0, 11.0, 16.0, 25.0, 12.0, 18.0, 39.0, 63.0, 99.0, 143.0, 212.0, 472.0, 865.0, 2026.0, 5913.0, 25818.0, 758550.0, 3361882.0, 27688.0, 6198.0, 2117.0, 903.0, 450.0, 235.0, 130.0, 92.0, 67.0, 54.0, 34.0, 28.0, 14.0, 17.0, 12.0, 11.0, 7.0, 5.0, 6.0, 3.0, 0.0, 2.0, 0.0, 4.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.6328125, -10.2900390625, -9.947265625, -9.6044921875, -9.26171875, -8.9189453125, -8.576171875, -8.2333984375, -7.890625, -7.5478515625, -7.205078125, -6.8623046875, -6.51953125, -6.1767578125, -5.833984375, -5.4912109375, -5.1484375, -4.8056640625, -4.462890625, -4.1201171875, -3.77734375, -3.4345703125, -3.091796875, -2.7490234375, -2.40625, -2.0634765625, -1.720703125, -1.3779296875, -1.03515625, -0.6923828125, -0.349609375, -0.0068359375, 0.3359375, 0.6787109375, 1.021484375, 1.3642578125, 1.70703125, 2.0498046875, 2.392578125, 2.7353515625, 3.078125, 3.4208984375, 3.763671875, 4.1064453125, 4.44921875, 4.7919921875, 5.134765625, 5.4775390625, 5.8203125, 6.1630859375, 6.505859375, 6.8486328125, 7.19140625, 7.5341796875, 7.876953125, 8.2197265625, 8.5625, 8.9052734375, 9.248046875, 9.5908203125, 9.93359375, 10.2763671875, 10.619140625, 10.9619140625, 11.3046875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 9.0, 5.0, 13.0, 15.0, 23.0, 24.0, 61.0, 152.0, 3039.0, 470.0, 134.0, 51.0, 27.0, 13.0, 11.0, 13.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.431640625, -2.359710693359375, -2.28778076171875, -2.215850830078125, -2.1439208984375, -2.071990966796875, -2.00006103515625, -1.928131103515625, -1.856201171875, -1.784271240234375, -1.71234130859375, -1.640411376953125, -1.5684814453125, -1.496551513671875, -1.42462158203125, -1.352691650390625, -1.28076171875, -1.208831787109375, -1.13690185546875, -1.064971923828125, -0.9930419921875, -0.921112060546875, -0.84918212890625, -0.777252197265625, -0.705322265625, -0.633392333984375, -0.56146240234375, -0.489532470703125, -0.4176025390625, -0.345672607421875, -0.27374267578125, -0.201812744140625, -0.1298828125, -0.057952880859375, 0.01397705078125, 0.085906982421875, 0.1578369140625, 0.229766845703125, 0.30169677734375, 0.373626708984375, 0.445556640625, 0.517486572265625, 0.58941650390625, 0.661346435546875, 0.7332763671875, 0.805206298828125, 0.87713623046875, 0.949066162109375, 1.02099609375, 1.092926025390625, 1.16485595703125, 1.236785888671875, 1.3087158203125, 1.380645751953125, 1.45257568359375, 1.524505615234375, 1.596435546875, 1.668365478515625, 1.74029541015625, 1.812225341796875, 1.8841552734375, 1.956085205078125, 2.02801513671875, 2.099945068359375, 2.171875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 7.0, 1.0, 3.0, 3.0, 12.0, 10.0, 11.0, 26.0, 49.0, 73.0, 68.0, 114.0, 146.0, 137.0, 107.0, 80.0, 58.0, 43.0, 20.0, 17.0, 14.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.597040176391602, -9.328974723815918, -9.06091022491455, -8.792844772338867, -8.5247802734375, -8.256714820861816, -7.988649368286133, -7.720584392547607, -7.452519416809082, -7.184454441070557, -6.916389465332031, -6.648324012756348, -6.380259037017822, -6.112194061279297, -5.844128608703613, -5.576063632965088, -5.3079986572265625, -5.039933681488037, -4.771868705749512, -4.503803253173828, -4.235738277435303, -3.9676733016967773, -3.699608087539673, -3.4315428733825684, -3.163477897644043, -2.8954129219055176, -2.627347707748413, -2.3592824935913086, -2.091217517852783, -1.8231524229049683, -1.5550873279571533, -1.2870222330093384, -1.0189571380615234, -0.7508920431137085, -0.48282694816589355, -0.2147618532180786, 0.05330324172973633, 0.32136833667755127, 0.5894334316253662, 0.8574985265731812, 1.125563621520996, 1.393628716468811, 1.661693811416626, 1.929758906364441, 2.197824001312256, 2.4658889770507812, 2.7339541912078857, 3.0020194053649902, 3.2700843811035156, 3.538149356842041, 3.8062145709991455, 4.07427978515625, 4.342344760894775, 4.610409736633301, 4.878475189208984, 5.14654016494751, 5.414605140686035, 5.6826701164245605, 5.950735092163086, 6.2188005447387695, 6.486865520477295, 6.75493049621582, 7.022995948791504, 7.291060924530029, 7.559125900268555]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 0.0, 10.0, 6.0, 8.0, 14.0, 11.0, 20.0, 20.0, 16.0, 19.0, 16.0, 23.0, 30.0, 27.0, 31.0, 42.0, 36.0, 34.0, 34.0, 49.0, 30.0, 33.0, 31.0, 49.0, 40.0, 33.0, 40.0, 27.0, 33.0, 24.0, 32.0, 26.0, 23.0, 28.0, 14.0, 17.0, 11.0, 6.0, 13.0, 10.0, 7.0, 4.0, 3.0, 3.0, 10.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.6032822132110596, -3.4946224689483643, -3.385962724685669, -3.2773029804229736, -3.1686432361602783, -3.059983491897583, -2.951323986053467, -2.8426642417907715, -2.734004497528076, -2.625344753265381, -2.5166850090026855, -2.4080252647399902, -2.299365520477295, -2.1907057762145996, -2.0820460319519043, -1.9733864068984985, -1.8647265434265137, -1.7560667991638184, -1.647407054901123, -1.5387473106384277, -1.4300875663757324, -1.321427822113037, -1.2127681970596313, -1.104108452796936, -0.9954487085342407, -0.8867889642715454, -0.7781292200088501, -0.6694695353507996, -0.5608097910881042, -0.45215004682540894, -0.3434903621673584, -0.23483061790466309, -0.12617111206054688, -0.017511382699012756, 0.09114834666252136, 0.1998080611228943, 0.3084678053855896, 0.4171275496482849, 0.5257872343063354, 0.6344469785690308, 0.7431067228317261, 0.8517664670944214, 0.9604262113571167, 1.0690858364105225, 1.1777455806732178, 1.286405324935913, 1.3950650691986084, 1.5037248134613037, 1.612384557723999, 1.7210443019866943, 1.8297040462493896, 1.938363790512085, 2.0470235347747803, 2.1556832790374756, 2.264342784881592, 2.373002529144287, 2.4816622734069824, 2.5903220176696777, 2.698981761932373, 2.8076415061950684, 2.9163012504577637, 3.024960994720459, 3.1336207389831543, 3.2422804832458496, 3.350940227508545]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 7.0, 9.0, 13.0, 32.0, 35.0, 51.0, 83.0, 106.0, 205.0, 297.0, 482.0, 854.0, 1503.0, 2556.0, 4824.0, 9263.0, 19900.0, 45384.0, 112130.0, 267685.0, 320571.0, 151500.0, 60303.0, 25591.0, 11730.0, 5936.0, 3181.0, 1761.0, 1032.0, 613.0, 328.0, 227.0, 129.0, 72.0, 53.0, 38.0, 22.0, 11.0, 11.0, 13.0, 2.0, 7.0, 6.0, 5.0, 0.0, 3.0, 0.0, 1.0], "bins": [-5.94140625, -5.777099609375, -5.61279296875, -5.448486328125, -5.2841796875, -5.119873046875, -4.95556640625, -4.791259765625, -4.626953125, -4.462646484375, -4.29833984375, -4.134033203125, -3.9697265625, -3.805419921875, -3.64111328125, -3.476806640625, -3.3125, -3.148193359375, -2.98388671875, -2.819580078125, -2.6552734375, -2.490966796875, -2.32666015625, -2.162353515625, -1.998046875, -1.833740234375, -1.66943359375, -1.505126953125, -1.3408203125, -1.176513671875, -1.01220703125, -0.847900390625, -0.68359375, -0.519287109375, -0.35498046875, -0.190673828125, -0.0263671875, 0.137939453125, 0.30224609375, 0.466552734375, 0.630859375, 0.795166015625, 0.95947265625, 1.123779296875, 1.2880859375, 1.452392578125, 1.61669921875, 1.781005859375, 1.9453125, 2.109619140625, 2.27392578125, 2.438232421875, 2.6025390625, 2.766845703125, 2.93115234375, 3.095458984375, 3.259765625, 3.424072265625, 3.58837890625, 3.752685546875, 3.9169921875, 4.081298828125, 4.24560546875, 4.409912109375, 4.57421875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 5.0, 6.0, 6.0, 3.0, 8.0, 10.0, 14.0, 15.0, 18.0, 24.0, 29.0, 20.0, 23.0, 30.0, 41.0, 46.0, 51.0, 34.0, 43.0, 47.0, 65.0, 42.0, 37.0, 50.0, 39.0, 31.0, 32.0, 30.0, 26.0, 27.0, 18.0, 30.0, 15.0, 16.0, 14.0, 7.0, 9.0, 6.0, 10.0, 10.0, 7.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.123046875, -3.034820556640625, -2.94659423828125, -2.858367919921875, -2.7701416015625, -2.681915283203125, -2.59368896484375, -2.505462646484375, -2.417236328125, -2.329010009765625, -2.24078369140625, -2.152557373046875, -2.0643310546875, -1.976104736328125, -1.88787841796875, -1.799652099609375, -1.71142578125, -1.623199462890625, -1.53497314453125, -1.446746826171875, -1.3585205078125, -1.270294189453125, -1.18206787109375, -1.093841552734375, -1.005615234375, -0.917388916015625, -0.82916259765625, -0.740936279296875, -0.6527099609375, -0.564483642578125, -0.47625732421875, -0.388031005859375, -0.2998046875, -0.211578369140625, -0.12335205078125, -0.035125732421875, 0.0531005859375, 0.141326904296875, 0.22955322265625, 0.317779541015625, 0.406005859375, 0.494232177734375, 0.58245849609375, 0.670684814453125, 0.7589111328125, 0.847137451171875, 0.93536376953125, 1.023590087890625, 1.11181640625, 1.200042724609375, 1.28826904296875, 1.376495361328125, 1.4647216796875, 1.552947998046875, 1.64117431640625, 1.729400634765625, 1.817626953125, 1.905853271484375, 1.99407958984375, 2.082305908203125, 2.1705322265625, 2.258758544921875, 2.34698486328125, 2.435211181640625, 2.5234375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 5.0, 9.0, 0.0, 9.0, 10.0, 13.0, 22.0, 38.0, 47.0, 90.0, 129.0, 235.0, 399.0, 746.0, 1503.0, 3384.0, 9018.0, 30596.0, 162973.0, 633884.0, 159930.0, 30192.0, 8800.0, 3311.0, 1441.0, 748.0, 443.0, 225.0, 115.0, 71.0, 51.0, 44.0, 26.0, 16.0, 13.0, 9.0, 6.0, 8.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0078125, -8.7218017578125, -8.435791015625, -8.1497802734375, -7.86376953125, -7.5777587890625, -7.291748046875, -7.0057373046875, -6.7197265625, -6.4337158203125, -6.147705078125, -5.8616943359375, -5.57568359375, -5.2896728515625, -5.003662109375, -4.7176513671875, -4.431640625, -4.1456298828125, -3.859619140625, -3.5736083984375, -3.28759765625, -3.0015869140625, -2.715576171875, -2.4295654296875, -2.1435546875, -1.8575439453125, -1.571533203125, -1.2855224609375, -0.99951171875, -0.7135009765625, -0.427490234375, -0.1414794921875, 0.14453125, 0.4305419921875, 0.716552734375, 1.0025634765625, 1.28857421875, 1.5745849609375, 1.860595703125, 2.1466064453125, 2.4326171875, 2.7186279296875, 3.004638671875, 3.2906494140625, 3.57666015625, 3.8626708984375, 4.148681640625, 4.4346923828125, 4.720703125, 5.0067138671875, 5.292724609375, 5.5787353515625, 5.86474609375, 6.1507568359375, 6.436767578125, 6.7227783203125, 7.0087890625, 7.2947998046875, 7.580810546875, 7.8668212890625, 8.15283203125, 8.4388427734375, 8.724853515625, 9.0108642578125, 9.296875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 1.0, 4.0, 6.0, 6.0, 13.0, 10.0, 12.0, 17.0, 16.0, 20.0, 32.0, 31.0, 44.0, 35.0, 39.0, 45.0, 52.0, 58.0, 57.0, 44.0, 70.0, 51.0, 48.0, 50.0, 47.0, 39.0, 34.0, 21.0, 16.0, 13.0, 22.0, 12.0, 9.0, 8.0, 7.0, 6.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.0625, -14.5595703125, -14.056640625, -13.5537109375, -13.05078125, -12.5478515625, -12.044921875, -11.5419921875, -11.0390625, -10.5361328125, -10.033203125, -9.5302734375, -9.02734375, -8.5244140625, -8.021484375, -7.5185546875, -7.015625, -6.5126953125, -6.009765625, -5.5068359375, -5.00390625, -4.5009765625, -3.998046875, -3.4951171875, -2.9921875, -2.4892578125, -1.986328125, -1.4833984375, -0.98046875, -0.4775390625, 0.025390625, 0.5283203125, 1.03125, 1.5341796875, 2.037109375, 2.5400390625, 3.04296875, 3.5458984375, 4.048828125, 4.5517578125, 5.0546875, 5.5576171875, 6.060546875, 6.5634765625, 7.06640625, 7.5693359375, 8.072265625, 8.5751953125, 9.078125, 9.5810546875, 10.083984375, 10.5869140625, 11.08984375, 11.5927734375, 12.095703125, 12.5986328125, 13.1015625, 13.6044921875, 14.107421875, 14.6103515625, 15.11328125, 15.6162109375, 16.119140625, 16.6220703125, 17.125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 3.0, 5.0, 15.0, 15.0, 14.0, 21.0, 22.0, 48.0, 62.0, 99.0, 121.0, 217.0, 378.0, 669.0, 1422.0, 3423.0, 11622.0, 56943.0, 403221.0, 483966.0, 66109.0, 13218.0, 3793.0, 1407.0, 704.0, 347.0, 229.0, 154.0, 86.0, 51.0, 51.0, 19.0, 21.0, 17.0, 17.0, 10.0, 11.0, 7.0, 7.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-3.779296875, -3.6649169921875, -3.550537109375, -3.4361572265625, -3.32177734375, -3.2073974609375, -3.093017578125, -2.9786376953125, -2.8642578125, -2.7498779296875, -2.635498046875, -2.5211181640625, -2.40673828125, -2.2923583984375, -2.177978515625, -2.0635986328125, -1.94921875, -1.8348388671875, -1.720458984375, -1.6060791015625, -1.49169921875, -1.3773193359375, -1.262939453125, -1.1485595703125, -1.0341796875, -0.9197998046875, -0.805419921875, -0.6910400390625, -0.57666015625, -0.4622802734375, -0.347900390625, -0.2335205078125, -0.119140625, -0.0047607421875, 0.109619140625, 0.2239990234375, 0.33837890625, 0.4527587890625, 0.567138671875, 0.6815185546875, 0.7958984375, 0.9102783203125, 1.024658203125, 1.1390380859375, 1.25341796875, 1.3677978515625, 1.482177734375, 1.5965576171875, 1.7109375, 1.8253173828125, 1.939697265625, 2.0540771484375, 2.16845703125, 2.2828369140625, 2.397216796875, 2.5115966796875, 2.6259765625, 2.7403564453125, 2.854736328125, 2.9691162109375, 3.08349609375, 3.1978759765625, 3.312255859375, 3.4266357421875, 3.541015625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 8.0, 7.0, 13.0, 11.0, 32.0, 33.0, 49.0, 75.0, 101.0, 161.0, 160.0, 108.0, 82.0, 44.0, 48.0, 23.0, 15.0, 13.0, 4.0, 5.0, 7.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007777214050292969, -0.0007560625672340393, -0.0007344037294387817, -0.0007127448916435242, -0.0006910860538482666, -0.000669427216053009, -0.0006477683782577515, -0.0006261095404624939, -0.0006044507026672363, -0.0005827918648719788, -0.0005611330270767212, -0.0005394741892814636, -0.0005178153514862061, -0.0004961565136909485, -0.0004744976758956909, -0.00045283883810043335, -0.0004311800003051758, -0.0004095211625099182, -0.00038786232471466064, -0.0003662034869194031, -0.0003445446491241455, -0.00032288581132888794, -0.00030122697353363037, -0.0002795681357383728, -0.00025790929794311523, -0.00023625046014785767, -0.0002145916223526001, -0.00019293278455734253, -0.00017127394676208496, -0.0001496151089668274, -0.00012795627117156982, -0.00010629743337631226, -8.463859558105469e-05, -6.297975778579712e-05, -4.132091999053955e-05, -1.9662082195281982e-05, 1.996755599975586e-06, 2.3655593395233154e-05, 4.531443119049072e-05, 6.697326898574829e-05, 8.863210678100586e-05, 0.00011029094457626343, 0.000131949782371521, 0.00015360862016677856, 0.00017526745796203613, 0.0001969262957572937, 0.00021858513355255127, 0.00024024397134780884, 0.0002619028091430664, 0.000283561646938324, 0.00030522048473358154, 0.0003268793225288391, 0.0003485381603240967, 0.00037019699811935425, 0.0003918558359146118, 0.0004135146737098694, 0.00043517351150512695, 0.0004568323493003845, 0.0004784911870956421, 0.0005001500248908997, 0.0005218088626861572, 0.0005434677004814148, 0.0005651265382766724, 0.0005867853760719299, 0.0006084442138671875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 3.0, 8.0, 4.0, 7.0, 7.0, 7.0, 14.0, 27.0, 31.0, 49.0, 72.0, 111.0, 225.0, 380.0, 731.0, 1482.0, 3711.0, 11661.0, 56787.0, 461039.0, 438641.0, 55380.0, 11412.0, 3591.0, 1485.0, 703.0, 400.0, 220.0, 137.0, 77.0, 54.0, 29.0, 12.0, 17.0, 9.0, 4.0, 6.0, 7.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-3.865234375, -3.736358642578125, -3.60748291015625, -3.478607177734375, -3.3497314453125, -3.220855712890625, -3.09197998046875, -2.963104248046875, -2.834228515625, -2.705352783203125, -2.57647705078125, -2.447601318359375, -2.3187255859375, -2.189849853515625, -2.06097412109375, -1.932098388671875, -1.80322265625, -1.674346923828125, -1.54547119140625, -1.416595458984375, -1.2877197265625, -1.158843994140625, -1.02996826171875, -0.901092529296875, -0.772216796875, -0.643341064453125, -0.51446533203125, -0.385589599609375, -0.2567138671875, -0.127838134765625, 0.00103759765625, 0.129913330078125, 0.2587890625, 0.387664794921875, 0.51654052734375, 0.645416259765625, 0.7742919921875, 0.903167724609375, 1.03204345703125, 1.160919189453125, 1.289794921875, 1.418670654296875, 1.54754638671875, 1.676422119140625, 1.8052978515625, 1.934173583984375, 2.06304931640625, 2.191925048828125, 2.32080078125, 2.449676513671875, 2.57855224609375, 2.707427978515625, 2.8363037109375, 2.965179443359375, 3.09405517578125, 3.222930908203125, 3.351806640625, 3.480682373046875, 3.60955810546875, 3.738433837890625, 3.8673095703125, 3.996185302734375, 4.12506103515625, 4.253936767578125, 4.3828125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 9.0, 14.0, 15.0, 20.0, 23.0, 33.0, 63.0, 91.0, 97.0, 120.0, 133.0, 82.0, 105.0, 65.0, 48.0, 32.0, 17.0, 9.0, 12.0, 7.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-6.0078125, -5.84600830078125, -5.6842041015625, -5.52239990234375, -5.360595703125, -5.19879150390625, -5.0369873046875, -4.87518310546875, -4.71337890625, -4.55157470703125, -4.3897705078125, -4.22796630859375, -4.066162109375, -3.90435791015625, -3.7425537109375, -3.58074951171875, -3.4189453125, -3.25714111328125, -3.0953369140625, -2.93353271484375, -2.771728515625, -2.60992431640625, -2.4481201171875, -2.28631591796875, -2.12451171875, -1.96270751953125, -1.8009033203125, -1.63909912109375, -1.477294921875, -1.31549072265625, -1.1536865234375, -0.99188232421875, -0.830078125, -0.66827392578125, -0.5064697265625, -0.34466552734375, -0.182861328125, -0.02105712890625, 0.1407470703125, 0.30255126953125, 0.46435546875, 0.62615966796875, 0.7879638671875, 0.94976806640625, 1.111572265625, 1.27337646484375, 1.4351806640625, 1.59698486328125, 1.7587890625, 1.92059326171875, 2.0823974609375, 2.24420166015625, 2.406005859375, 2.56781005859375, 2.7296142578125, 2.89141845703125, 3.05322265625, 3.21502685546875, 3.3768310546875, 3.53863525390625, 3.700439453125, 3.86224365234375, 4.0240478515625, 4.18585205078125, 4.34765625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 9.0, 22.0, 49.0, 75.0, 166.0, 226.0, 187.0, 120.0, 59.0, 39.0, 24.0, 10.0, 7.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.91593933105469, -69.8342514038086, -66.7525634765625, -63.670875549316406, -60.58918762207031, -57.50749969482422, -54.42581558227539, -51.3441276550293, -48.2624397277832, -45.18075180053711, -42.099063873291016, -39.01737976074219, -35.935691833496094, -32.85400390625, -29.772315979003906, -26.690628051757812, -23.60894012451172, -20.527252197265625, -17.44556427001953, -14.36387825012207, -11.282190322875977, -8.200502395629883, -5.118816375732422, -2.037128448486328, 1.0445594787597656, 4.126246929168701, 7.207934379577637, 10.289621353149414, 13.371309280395508, 16.4529972076416, 19.534683227539062, 22.616371154785156, 25.69805908203125, 28.779747009277344, 31.861434936523438, 34.94312286376953, 38.024810791015625, 41.10649871826172, 44.18818283081055, 47.26987075805664, 50.351558685302734, 53.43324661254883, 56.51493453979492, 59.59661865234375, 62.678306579589844, 65.75999450683594, 68.84168243408203, 71.92337036132812, 75.00505828857422, 78.08674621582031, 81.1684341430664, 84.2501220703125, 87.3318099975586, 90.41349792480469, 93.49517822265625, 96.57687377929688, 99.65855407714844, 102.74024200439453, 105.82192993164062, 108.90361785888672, 111.98530578613281, 115.0669937133789, 118.148681640625, 121.23036193847656, 124.31205749511719]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 4.0, 1.0, 6.0, 2.0, 2.0, 5.0, 12.0, 10.0, 7.0, 11.0, 9.0, 9.0, 27.0, 25.0, 30.0, 29.0, 38.0, 45.0, 43.0, 48.0, 54.0, 72.0, 64.0, 54.0, 44.0, 66.0, 36.0, 42.0, 39.0, 33.0, 20.0, 31.0, 28.0, 19.0, 16.0, 7.0, 6.0, 4.0, 1.0, 1.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-72.47904968261719, -70.36177062988281, -68.24449157714844, -66.12721252441406, -64.00993347167969, -61.89265060424805, -59.775367736816406, -57.65808868408203, -55.540809631347656, -53.42353057861328, -51.306251525878906, -49.188968658447266, -47.07168960571289, -44.954410552978516, -42.837127685546875, -40.7198486328125, -38.602569580078125, -36.48529052734375, -34.368011474609375, -32.250728607177734, -30.13344955444336, -28.016170501708984, -25.898889541625977, -23.78160858154297, -21.664329528808594, -19.54705047607422, -17.42976951599121, -15.31248950958252, -13.195209503173828, -11.077929496765137, -8.960649490356445, -6.843369483947754, -4.726097106933594, -2.6088171005249023, -0.49153709411621094, 1.6257429122924805, 3.743022918701172, 5.860302925109863, 7.977582931518555, 10.094862937927246, 12.212142944335938, 14.329422950744629, 16.44670295715332, 18.563983917236328, 20.681262969970703, 22.798542022705078, 24.915822982788086, 27.033103942871094, 29.15038299560547, 31.267662048339844, 33.38494110107422, 35.50222396850586, 37.619503021240234, 39.73678207397461, 41.85406494140625, 43.971343994140625, 46.088623046875, 48.205902099609375, 50.32318115234375, 52.44046401977539, 54.557743072509766, 56.67502212524414, 58.79230499267578, 60.909584045410156, 63.02686309814453]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 3.0, 8.0, 5.0, 8.0, 9.0, 10.0, 19.0, 34.0, 33.0, 57.0, 74.0, 142.0, 230.0, 399.0, 795.0, 1606.0, 4124.0, 14049.0, 216250.0, 3921754.0, 24917.0, 5489.0, 2126.0, 911.0, 497.0, 249.0, 189.0, 102.0, 75.0, 35.0, 21.0, 20.0, 18.0, 3.0, 8.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0], "bins": [-25.640625, -25.017578125, -24.39453125, -23.771484375, -23.1484375, -22.525390625, -21.90234375, -21.279296875, -20.65625, -20.033203125, -19.41015625, -18.787109375, -18.1640625, -17.541015625, -16.91796875, -16.294921875, -15.671875, -15.048828125, -14.42578125, -13.802734375, -13.1796875, -12.556640625, -11.93359375, -11.310546875, -10.6875, -10.064453125, -9.44140625, -8.818359375, -8.1953125, -7.572265625, -6.94921875, -6.326171875, -5.703125, -5.080078125, -4.45703125, -3.833984375, -3.2109375, -2.587890625, -1.96484375, -1.341796875, -0.71875, -0.095703125, 0.52734375, 1.150390625, 1.7734375, 2.396484375, 3.01953125, 3.642578125, 4.265625, 4.888671875, 5.51171875, 6.134765625, 6.7578125, 7.380859375, 8.00390625, 8.626953125, 9.25, 9.873046875, 10.49609375, 11.119140625, 11.7421875, 12.365234375, 12.98828125, 13.611328125, 14.234375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 1.0, 5.0, 4.0, 3.0, 20.0, 16.0, 23.0, 40.0, 40.0, 47.0, 55.0, 72.0, 81.0, 73.0, 78.0, 70.0, 61.0, 55.0, 50.0, 53.0, 32.0, 31.0, 30.0, 18.0, 8.0, 16.0, 8.0, 7.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-5.50390625, -5.37677001953125, -5.2496337890625, -5.12249755859375, -4.995361328125, -4.86822509765625, -4.7410888671875, -4.61395263671875, -4.48681640625, -4.35968017578125, -4.2325439453125, -4.10540771484375, -3.978271484375, -3.85113525390625, -3.7239990234375, -3.59686279296875, -3.4697265625, -3.34259033203125, -3.2154541015625, -3.08831787109375, -2.961181640625, -2.83404541015625, -2.7069091796875, -2.57977294921875, -2.45263671875, -2.32550048828125, -2.1983642578125, -2.07122802734375, -1.944091796875, -1.81695556640625, -1.6898193359375, -1.56268310546875, -1.435546875, -1.30841064453125, -1.1812744140625, -1.05413818359375, -0.927001953125, -0.79986572265625, -0.6727294921875, -0.54559326171875, -0.41845703125, -0.29132080078125, -0.1641845703125, -0.03704833984375, 0.090087890625, 0.21722412109375, 0.3443603515625, 0.47149658203125, 0.5986328125, 0.72576904296875, 0.8529052734375, 0.98004150390625, 1.107177734375, 1.23431396484375, 1.3614501953125, 1.48858642578125, 1.61572265625, 1.74285888671875, 1.8699951171875, 1.99713134765625, 2.124267578125, 2.25140380859375, 2.3785400390625, 2.50567626953125, 2.6328125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 10.0, 6.0, 7.0, 6.0, 9.0, 11.0, 21.0, 26.0, 21.0, 47.0, 38.0, 53.0, 94.0, 171.0, 291.0, 526.0, 894.0, 1886.0, 4110.0, 11310.0, 48773.0, 3749394.0, 333932.0, 27934.0, 8149.0, 3227.0, 1485.0, 769.0, 389.0, 229.0, 123.0, 101.0, 62.0, 36.0, 46.0, 29.0, 16.0, 9.0, 9.0, 7.0, 3.0, 5.0, 7.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-9.171875, -8.864501953125, -8.55712890625, -8.249755859375, -7.9423828125, -7.635009765625, -7.32763671875, -7.020263671875, -6.712890625, -6.405517578125, -6.09814453125, -5.790771484375, -5.4833984375, -5.176025390625, -4.86865234375, -4.561279296875, -4.25390625, -3.946533203125, -3.63916015625, -3.331787109375, -3.0244140625, -2.717041015625, -2.40966796875, -2.102294921875, -1.794921875, -1.487548828125, -1.18017578125, -0.872802734375, -0.5654296875, -0.258056640625, 0.04931640625, 0.356689453125, 0.6640625, 0.971435546875, 1.27880859375, 1.586181640625, 1.8935546875, 2.200927734375, 2.50830078125, 2.815673828125, 3.123046875, 3.430419921875, 3.73779296875, 4.045166015625, 4.3525390625, 4.659912109375, 4.96728515625, 5.274658203125, 5.58203125, 5.889404296875, 6.19677734375, 6.504150390625, 6.8115234375, 7.118896484375, 7.42626953125, 7.733642578125, 8.041015625, 8.348388671875, 8.65576171875, 8.963134765625, 9.2705078125, 9.577880859375, 9.88525390625, 10.192626953125, 10.5]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 7.0, 6.0, 10.0, 11.0, 29.0, 74.0, 411.0, 3236.0, 176.0, 54.0, 31.0, 13.0, 6.0, 3.0, 3.0, 5.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.0, -8.7764892578125, -8.552978515625, -8.3294677734375, -8.10595703125, -7.8824462890625, -7.658935546875, -7.4354248046875, -7.2119140625, -6.9884033203125, -6.764892578125, -6.5413818359375, -6.31787109375, -6.0943603515625, -5.870849609375, -5.6473388671875, -5.423828125, -5.2003173828125, -4.976806640625, -4.7532958984375, -4.52978515625, -4.3062744140625, -4.082763671875, -3.8592529296875, -3.6357421875, -3.4122314453125, -3.188720703125, -2.9652099609375, -2.74169921875, -2.5181884765625, -2.294677734375, -2.0711669921875, -1.84765625, -1.6241455078125, -1.400634765625, -1.1771240234375, -0.95361328125, -0.7301025390625, -0.506591796875, -0.2830810546875, -0.0595703125, 0.1639404296875, 0.387451171875, 0.6109619140625, 0.83447265625, 1.0579833984375, 1.281494140625, 1.5050048828125, 1.728515625, 1.9520263671875, 2.175537109375, 2.3990478515625, 2.62255859375, 2.8460693359375, 3.069580078125, 3.2930908203125, 3.5166015625, 3.7401123046875, 3.963623046875, 4.1871337890625, 4.41064453125, 4.6341552734375, 4.857666015625, 5.0811767578125, 5.3046875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 4.0, 7.0, 7.0, 14.0, 23.0, 36.0, 59.0, 74.0, 114.0, 138.0, 131.0, 122.0, 92.0, 64.0, 43.0, 21.0, 11.0, 12.0, 10.0, 4.0, 5.0, 2.0, 7.0, 2.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.669036865234375, -9.156133651733398, -8.643230438232422, -8.130327224731445, -7.617423057556152, -7.104519844055176, -6.591616630554199, -6.078713417053223, -5.565809726715088, -5.052906513214111, -4.540002822875977, -4.027099609375, -3.5141961574554443, -3.0012927055358887, -2.488389492034912, -1.9754860401153564, -1.4625825881958008, -0.9496791958808899, -0.436775803565979, 0.07612752914428711, 0.5890309810638428, 1.1019344329833984, 1.614837646484375, 2.1277410984039307, 2.6406445503234863, 3.153548002243042, 3.6664514541625977, 4.179354667663574, 4.692257881164551, 5.2051615715026855, 5.718064785003662, 6.230968475341797, 6.743871688842773, 7.25677490234375, 7.769678592681885, 8.282581329345703, 8.795485496520996, 9.308388710021973, 9.82129192352295, 10.334195137023926, 10.847099304199219, 11.360002517700195, 11.872905731201172, 12.385808944702148, 12.898713111877441, 13.411616325378418, 13.924519538879395, 14.437422752380371, 14.950325965881348, 15.463229179382324, 15.9761323928833, 16.489036560058594, 17.00193977355957, 17.514842987060547, 18.027746200561523, 18.5406494140625, 19.053552627563477, 19.566455841064453, 20.07935905456543, 20.592262268066406, 21.105165481567383, 21.61806869506836, 22.13097381591797, 22.643877029418945, 23.156780242919922]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 6.0, 4.0, 2.0, 8.0, 8.0, 10.0, 16.0, 15.0, 20.0, 25.0, 29.0, 35.0, 25.0, 31.0, 45.0, 44.0, 46.0, 50.0, 48.0, 58.0, 64.0, 52.0, 47.0, 48.0, 43.0, 36.0, 35.0, 28.0, 23.0, 25.0, 13.0, 20.0, 15.0, 11.0, 9.0, 5.0, 5.0, 3.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.150428771972656, -9.795211791992188, -9.439994812011719, -9.084778785705566, -8.729561805725098, -8.374344825744629, -8.019128799438477, -7.663911819458008, -7.308694839477539, -6.95347785949707, -6.59826135635376, -6.243044853210449, -5.8878278732299805, -5.532610893249512, -5.177394390106201, -4.822177886962891, -4.466960906982422, -4.111743927001953, -3.7565274238586426, -3.401310682296753, -3.0460939407348633, -2.6908771991729736, -2.335660457611084, -1.9804437160491943, -1.6252269744873047, -1.270010232925415, -0.9147934913635254, -0.5595767498016357, -0.2043600082397461, 0.15085673332214355, 0.5060734748840332, 0.8612902164459229, 1.216507911682129, 1.5717246532440186, 1.9269413948059082, 2.282158136367798, 2.6373748779296875, 2.992591619491577, 3.347808361053467, 3.7030251026153564, 4.058241844177246, 4.413458824157715, 4.768675327301025, 5.123891830444336, 5.479108810424805, 5.834325790405273, 6.189542293548584, 6.5447587966918945, 6.899975776672363, 7.255192756652832, 7.610409259796143, 7.965625762939453, 8.320842742919922, 8.67605972290039, 9.03127670288086, 9.386492729187012, 9.74170970916748, 10.09692668914795, 10.452142715454102, 10.80735969543457, 11.162576675415039, 11.517793655395508, 11.873010635375977, 12.228226661682129, 12.583443641662598]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 5.0, 6.0, 6.0, 15.0, 18.0, 24.0, 48.0, 60.0, 71.0, 126.0, 186.0, 282.0, 494.0, 724.0, 1464.0, 2696.0, 6395.0, 15954.0, 44749.0, 132914.0, 356906.0, 315059.0, 108806.0, 36967.0, 13595.0, 5461.0, 2411.0, 1211.0, 650.0, 415.0, 261.0, 188.0, 104.0, 76.0, 62.0, 36.0, 30.0, 18.0, 13.0, 14.0, 9.0, 7.0, 1.0, 5.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-6.1796875, -5.9659423828125, -5.752197265625, -5.5384521484375, -5.32470703125, -5.1109619140625, -4.897216796875, -4.6834716796875, -4.4697265625, -4.2559814453125, -4.042236328125, -3.8284912109375, -3.61474609375, -3.4010009765625, -3.187255859375, -2.9735107421875, -2.759765625, -2.5460205078125, -2.332275390625, -2.1185302734375, -1.90478515625, -1.6910400390625, -1.477294921875, -1.2635498046875, -1.0498046875, -0.8360595703125, -0.622314453125, -0.4085693359375, -0.19482421875, 0.0189208984375, 0.232666015625, 0.4464111328125, 0.66015625, 0.8739013671875, 1.087646484375, 1.3013916015625, 1.51513671875, 1.7288818359375, 1.942626953125, 2.1563720703125, 2.3701171875, 2.5838623046875, 2.797607421875, 3.0113525390625, 3.22509765625, 3.4388427734375, 3.652587890625, 3.8663330078125, 4.080078125, 4.2938232421875, 4.507568359375, 4.7213134765625, 4.93505859375, 5.1488037109375, 5.362548828125, 5.5762939453125, 5.7900390625, 6.0037841796875, 6.217529296875, 6.4312744140625, 6.64501953125, 6.8587646484375, 7.072509765625, 7.2862548828125, 7.5]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 4.0, 4.0, 5.0, 4.0, 14.0, 17.0, 16.0, 24.0, 34.0, 33.0, 54.0, 43.0, 50.0, 56.0, 62.0, 62.0, 57.0, 69.0, 50.0, 61.0, 57.0, 33.0, 38.0, 38.0, 27.0, 19.0, 15.0, 13.0, 11.0, 12.0, 7.0, 7.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0], "bins": [-4.7578125, -4.64483642578125, -4.5318603515625, -4.41888427734375, -4.305908203125, -4.19293212890625, -4.0799560546875, -3.96697998046875, -3.85400390625, -3.74102783203125, -3.6280517578125, -3.51507568359375, -3.402099609375, -3.28912353515625, -3.1761474609375, -3.06317138671875, -2.9501953125, -2.83721923828125, -2.7242431640625, -2.61126708984375, -2.498291015625, -2.38531494140625, -2.2723388671875, -2.15936279296875, -2.04638671875, -1.93341064453125, -1.8204345703125, -1.70745849609375, -1.594482421875, -1.48150634765625, -1.3685302734375, -1.25555419921875, -1.142578125, -1.02960205078125, -0.9166259765625, -0.80364990234375, -0.690673828125, -0.57769775390625, -0.4647216796875, -0.35174560546875, -0.23876953125, -0.12579345703125, -0.0128173828125, 0.10015869140625, 0.213134765625, 0.32611083984375, 0.4390869140625, 0.55206298828125, 0.6650390625, 0.77801513671875, 0.8909912109375, 1.00396728515625, 1.116943359375, 1.22991943359375, 1.3428955078125, 1.45587158203125, 1.56884765625, 1.68182373046875, 1.7947998046875, 1.90777587890625, 2.020751953125, 2.13372802734375, 2.2467041015625, 2.35968017578125, 2.47265625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 7.0, 7.0, 10.0, 7.0, 15.0, 20.0, 18.0, 32.0, 48.0, 83.0, 106.0, 162.0, 237.0, 437.0, 785.0, 1735.0, 4374.0, 16266.0, 90690.0, 600648.0, 279451.0, 39083.0, 8654.0, 2835.0, 1205.0, 645.0, 345.0, 210.0, 147.0, 77.0, 62.0, 37.0, 26.0, 34.0, 19.0, 6.0, 8.0, 7.0, 3.0, 6.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-8.828125, -8.51025390625, -8.1923828125, -7.87451171875, -7.556640625, -7.23876953125, -6.9208984375, -6.60302734375, -6.28515625, -5.96728515625, -5.6494140625, -5.33154296875, -5.013671875, -4.69580078125, -4.3779296875, -4.06005859375, -3.7421875, -3.42431640625, -3.1064453125, -2.78857421875, -2.470703125, -2.15283203125, -1.8349609375, -1.51708984375, -1.19921875, -0.88134765625, -0.5634765625, -0.24560546875, 0.072265625, 0.39013671875, 0.7080078125, 1.02587890625, 1.34375, 1.66162109375, 1.9794921875, 2.29736328125, 2.615234375, 2.93310546875, 3.2509765625, 3.56884765625, 3.88671875, 4.20458984375, 4.5224609375, 4.84033203125, 5.158203125, 5.47607421875, 5.7939453125, 6.11181640625, 6.4296875, 6.74755859375, 7.0654296875, 7.38330078125, 7.701171875, 8.01904296875, 8.3369140625, 8.65478515625, 8.97265625, 9.29052734375, 9.6083984375, 9.92626953125, 10.244140625, 10.56201171875, 10.8798828125, 11.19775390625, 11.515625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 5.0, 3.0, 5.0, 8.0, 5.0, 11.0, 13.0, 11.0, 26.0, 27.0, 39.0, 28.0, 29.0, 33.0, 30.0, 55.0, 57.0, 37.0, 47.0, 49.0, 51.0, 63.0, 57.0, 53.0, 35.0, 37.0, 27.0, 26.0, 35.0, 24.0, 20.0, 13.0, 6.0, 7.0, 7.0, 8.0, 5.0, 3.0, 6.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.21875, -13.77978515625, -13.3408203125, -12.90185546875, -12.462890625, -12.02392578125, -11.5849609375, -11.14599609375, -10.70703125, -10.26806640625, -9.8291015625, -9.39013671875, -8.951171875, -8.51220703125, -8.0732421875, -7.63427734375, -7.1953125, -6.75634765625, -6.3173828125, -5.87841796875, -5.439453125, -5.00048828125, -4.5615234375, -4.12255859375, -3.68359375, -3.24462890625, -2.8056640625, -2.36669921875, -1.927734375, -1.48876953125, -1.0498046875, -0.61083984375, -0.171875, 0.26708984375, 0.7060546875, 1.14501953125, 1.583984375, 2.02294921875, 2.4619140625, 2.90087890625, 3.33984375, 3.77880859375, 4.2177734375, 4.65673828125, 5.095703125, 5.53466796875, 5.9736328125, 6.41259765625, 6.8515625, 7.29052734375, 7.7294921875, 8.16845703125, 8.607421875, 9.04638671875, 9.4853515625, 9.92431640625, 10.36328125, 10.80224609375, 11.2412109375, 11.68017578125, 12.119140625, 12.55810546875, 12.9970703125, 13.43603515625, 13.875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 7.0, 3.0, 7.0, 7.0, 24.0, 26.0, 40.0, 75.0, 107.0, 158.0, 359.0, 776.0, 2488.0, 13463.0, 289618.0, 707504.0, 28007.0, 3860.0, 1057.0, 420.0, 226.0, 113.0, 74.0, 41.0, 27.0, 17.0, 16.0, 10.0, 11.0, 3.0, 3.0, 6.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-8.234375, -8.0240478515625, -7.813720703125, -7.6033935546875, -7.39306640625, -7.1827392578125, -6.972412109375, -6.7620849609375, -6.5517578125, -6.3414306640625, -6.131103515625, -5.9207763671875, -5.71044921875, -5.5001220703125, -5.289794921875, -5.0794677734375, -4.869140625, -4.6588134765625, -4.448486328125, -4.2381591796875, -4.02783203125, -3.8175048828125, -3.607177734375, -3.3968505859375, -3.1865234375, -2.9761962890625, -2.765869140625, -2.5555419921875, -2.34521484375, -2.1348876953125, -1.924560546875, -1.7142333984375, -1.50390625, -1.2935791015625, -1.083251953125, -0.8729248046875, -0.66259765625, -0.4522705078125, -0.241943359375, -0.0316162109375, 0.1787109375, 0.3890380859375, 0.599365234375, 0.8096923828125, 1.02001953125, 1.2303466796875, 1.440673828125, 1.6510009765625, 1.861328125, 2.0716552734375, 2.281982421875, 2.4923095703125, 2.70263671875, 2.9129638671875, 3.123291015625, 3.3336181640625, 3.5439453125, 3.7542724609375, 3.964599609375, 4.1749267578125, 4.38525390625, 4.5955810546875, 4.805908203125, 5.0162353515625, 5.2265625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 4.0, 7.0, 9.0, 11.0, 12.0, 12.0, 15.0, 40.0, 32.0, 41.0, 60.0, 65.0, 79.0, 76.0, 111.0, 105.0, 64.0, 58.0, 32.0, 34.0, 28.0, 32.0, 10.0, 15.0, 13.0, 12.0, 6.0, 8.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000579833984375, -0.0005617290735244751, -0.0005436241626739502, -0.0005255192518234253, -0.0005074143409729004, -0.0004893094301223755, -0.0004712045192718506, -0.0004530996084213257, -0.0004349946975708008, -0.0004168897867202759, -0.000398784875869751, -0.0003806799650192261, -0.00036257505416870117, -0.00034447014331817627, -0.00032636523246765137, -0.00030826032161712646, -0.00029015541076660156, -0.00027205049991607666, -0.00025394558906555176, -0.00023584067821502686, -0.00021773576736450195, -0.00019963085651397705, -0.00018152594566345215, -0.00016342103481292725, -0.00014531612396240234, -0.00012721121311187744, -0.00010910630226135254, -9.100139141082764e-05, -7.289648056030273e-05, -5.479156970977783e-05, -3.668665885925293e-05, -1.8581748008728027e-05, -4.76837158203125e-07, 1.7628073692321777e-05, 3.573298454284668e-05, 5.383789539337158e-05, 7.194280624389648e-05, 9.004771709442139e-05, 0.00010815262794494629, 0.0001262575387954712, 0.0001443624496459961, 0.000162467360496521, 0.0001805722713470459, 0.0001986771821975708, 0.0002167820930480957, 0.0002348870038986206, 0.0002529919147491455, 0.0002710968255996704, 0.0002892017364501953, 0.0003073066473007202, 0.0003254115581512451, 0.00034351646900177, 0.0003616213798522949, 0.0003797262907028198, 0.0003978312015533447, 0.00041593611240386963, 0.00043404102325439453, 0.00045214593410491943, 0.00047025084495544434, 0.0004883557558059692, 0.0005064606666564941, 0.000524565577507019, 0.0005426704883575439, 0.0005607753992080688, 0.0005788803100585938]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 6.0, 5.0, 3.0, 10.0, 16.0, 24.0, 44.0, 77.0, 164.0, 316.0, 818.0, 2702.0, 19018.0, 743110.0, 269731.0, 9420.0, 1824.0, 663.0, 290.0, 124.0, 75.0, 42.0, 25.0, 19.0, 6.0, 7.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.61328125, -7.34942626953125, -7.0855712890625, -6.82171630859375, -6.557861328125, -6.29400634765625, -6.0301513671875, -5.76629638671875, -5.50244140625, -5.23858642578125, -4.9747314453125, -4.71087646484375, -4.447021484375, -4.18316650390625, -3.9193115234375, -3.65545654296875, -3.3916015625, -3.12774658203125, -2.8638916015625, -2.60003662109375, -2.336181640625, -2.07232666015625, -1.8084716796875, -1.54461669921875, -1.28076171875, -1.01690673828125, -0.7530517578125, -0.48919677734375, -0.225341796875, 0.03851318359375, 0.3023681640625, 0.56622314453125, 0.830078125, 1.09393310546875, 1.3577880859375, 1.62164306640625, 1.885498046875, 2.14935302734375, 2.4132080078125, 2.67706298828125, 2.94091796875, 3.20477294921875, 3.4686279296875, 3.73248291015625, 3.996337890625, 4.26019287109375, 4.5240478515625, 4.78790283203125, 5.0517578125, 5.31561279296875, 5.5794677734375, 5.84332275390625, 6.107177734375, 6.37103271484375, 6.6348876953125, 6.89874267578125, 7.16259765625, 7.42645263671875, 7.6903076171875, 7.95416259765625, 8.218017578125, 8.48187255859375, 8.7457275390625, 9.00958251953125, 9.2734375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 6.0, 17.0, 31.0, 54.0, 104.0, 178.0, 215.0, 161.0, 105.0, 54.0, 37.0, 13.0, 12.0, 9.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.30078125, -4.00250244140625, -3.7042236328125, -3.40594482421875, -3.107666015625, -2.80938720703125, -2.5111083984375, -2.21282958984375, -1.91455078125, -1.61627197265625, -1.3179931640625, -1.01971435546875, -0.721435546875, -0.42315673828125, -0.1248779296875, 0.17340087890625, 0.4716796875, 0.76995849609375, 1.0682373046875, 1.36651611328125, 1.664794921875, 1.96307373046875, 2.2613525390625, 2.55963134765625, 2.85791015625, 3.15618896484375, 3.4544677734375, 3.75274658203125, 4.051025390625, 4.34930419921875, 4.6475830078125, 4.94586181640625, 5.244140625, 5.54241943359375, 5.8406982421875, 6.13897705078125, 6.437255859375, 6.73553466796875, 7.0338134765625, 7.33209228515625, 7.63037109375, 7.92864990234375, 8.2269287109375, 8.52520751953125, 8.823486328125, 9.12176513671875, 9.4200439453125, 9.71832275390625, 10.0166015625, 10.31488037109375, 10.6131591796875, 10.91143798828125, 11.209716796875, 11.50799560546875, 11.8062744140625, 12.10455322265625, 12.40283203125, 12.70111083984375, 12.9993896484375, 13.29766845703125, 13.595947265625, 13.89422607421875, 14.1925048828125, 14.49078369140625, 14.7890625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 7.0, 6.0, 14.0, 22.0, 55.0, 90.0, 152.0, 192.0, 173.0, 136.0, 76.0, 37.0, 19.0, 12.0, 9.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-109.3922119140625, -106.1424560546875, -102.89270782470703, -99.64295196533203, -96.39320373535156, -93.14344787597656, -89.8936996459961, -86.6439437866211, -83.39419555664062, -80.14443969726562, -76.89469146728516, -73.64493560791016, -70.39518737792969, -67.14543151855469, -63.89568328857422, -60.64592742919922, -57.396175384521484, -54.14642333984375, -50.896671295166016, -47.64691925048828, -44.39716720581055, -41.14741516113281, -37.89765930175781, -34.647911071777344, -31.398157119750977, -28.148405075073242, -24.898653030395508, -21.64889907836914, -18.399147033691406, -15.149394989013672, -11.899642944335938, -8.649890899658203, -5.400138854980469, -2.1503865718841553, 1.0993657112121582, 4.349118232727051, 7.598870277404785, 10.848623275756836, 14.09837532043457, 17.348127365112305, 20.59787940979004, 23.847631454467773, 27.097383499145508, 30.347137451171875, 33.59688949584961, 36.846641540527344, 40.09639358520508, 43.34614562988281, 46.59589767456055, 49.84564971923828, 53.095401763916016, 56.34515380859375, 59.594905853271484, 62.84465789794922, 66.09441375732422, 69.34416198730469, 72.59391784667969, 75.84367370605469, 79.09342193603516, 82.34317779541016, 85.59292602539062, 88.84268188476562, 92.0924301147461, 95.3421859741211, 98.59193420410156]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 6.0, 4.0, 7.0, 5.0, 13.0, 13.0, 26.0, 29.0, 34.0, 37.0, 54.0, 60.0, 76.0, 75.0, 67.0, 85.0, 53.0, 67.0, 53.0, 41.0, 40.0, 32.0, 26.0, 27.0, 12.0, 11.0, 9.0, 12.0, 4.0, 7.0, 4.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-85.17947387695312, -82.43815612792969, -79.69683837890625, -76.95552062988281, -74.21419525146484, -71.4728775024414, -68.73155975341797, -65.99024200439453, -63.24892044067383, -60.50760269165039, -57.76628112792969, -55.02496337890625, -52.28364562988281, -49.54232406616211, -46.80100631713867, -44.05968475341797, -41.31836700439453, -38.577049255371094, -35.83572769165039, -33.09440994262695, -30.353090286254883, -27.611770629882812, -24.870452880859375, -22.129133224487305, -19.387813568115234, -16.646493911743164, -13.90517520904541, -11.163856506347656, -8.422536849975586, -5.681217193603516, -2.939899444580078, -0.1985797882080078, 2.5427398681640625, 5.284059047698975, 8.025378227233887, 10.76669692993164, 13.508016586303711, 16.24933624267578, 18.99065399169922, 21.73197364807129, 24.47329330444336, 27.21461296081543, 29.9559326171875, 32.69725036621094, 35.438568115234375, 38.17988967895508, 40.921207427978516, 43.66252899169922, 46.403846740722656, 49.145164489746094, 51.8864860534668, 54.627803802490234, 57.36912536621094, 60.110443115234375, 62.85176086425781, 65.59307861328125, 68.33439636230469, 71.07571411132812, 73.81703186035156, 76.558349609375, 79.29967498779297, 82.0409927368164, 84.78231048583984, 87.52362823486328, 90.26495361328125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 0.0, 3.0, 3.0, 2.0, 5.0, 10.0, 4.0, 19.0, 20.0, 40.0, 61.0, 77.0, 120.0, 208.0, 358.0, 710.0, 1278.0, 2859.0, 6764.0, 19459.0, 80764.0, 1322076.0, 2601593.0, 118478.0, 24450.0, 8222.0, 3293.0, 1607.0, 751.0, 409.0, 233.0, 138.0, 83.0, 67.0, 39.0, 23.0, 17.0, 7.0, 13.0, 6.0, 4.0, 8.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.79296875, -6.60479736328125, -6.4166259765625, -6.22845458984375, -6.040283203125, -5.85211181640625, -5.6639404296875, -5.47576904296875, -5.28759765625, -5.09942626953125, -4.9112548828125, -4.72308349609375, -4.534912109375, -4.34674072265625, -4.1585693359375, -3.97039794921875, -3.7822265625, -3.59405517578125, -3.4058837890625, -3.21771240234375, -3.029541015625, -2.84136962890625, -2.6531982421875, -2.46502685546875, -2.27685546875, -2.08868408203125, -1.9005126953125, -1.71234130859375, -1.524169921875, -1.33599853515625, -1.1478271484375, -0.95965576171875, -0.771484375, -0.58331298828125, -0.3951416015625, -0.20697021484375, -0.018798828125, 0.16937255859375, 0.3575439453125, 0.54571533203125, 0.73388671875, 0.92205810546875, 1.1102294921875, 1.29840087890625, 1.486572265625, 1.67474365234375, 1.8629150390625, 2.05108642578125, 2.2392578125, 2.42742919921875, 2.6156005859375, 2.80377197265625, 2.991943359375, 3.18011474609375, 3.3682861328125, 3.55645751953125, 3.74462890625, 3.93280029296875, 4.1209716796875, 4.30914306640625, 4.497314453125, 4.68548583984375, 4.8736572265625, 5.06182861328125, 5.25]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 5.0, 2.0, 6.0, 12.0, 9.0, 17.0, 19.0, 28.0, 36.0, 36.0, 45.0, 57.0, 64.0, 65.0, 64.0, 75.0, 68.0, 59.0, 58.0, 40.0, 46.0, 45.0, 29.0, 32.0, 21.0, 14.0, 15.0, 11.0, 7.0, 4.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1328125, -3.0142822265625, -2.895751953125, -2.7772216796875, -2.65869140625, -2.5401611328125, -2.421630859375, -2.3031005859375, -2.1845703125, -2.0660400390625, -1.947509765625, -1.8289794921875, -1.71044921875, -1.5919189453125, -1.473388671875, -1.3548583984375, -1.236328125, -1.1177978515625, -0.999267578125, -0.8807373046875, -0.76220703125, -0.6436767578125, -0.525146484375, -0.4066162109375, -0.2880859375, -0.1695556640625, -0.051025390625, 0.0675048828125, 0.18603515625, 0.3045654296875, 0.423095703125, 0.5416259765625, 0.66015625, 0.7786865234375, 0.897216796875, 1.0157470703125, 1.13427734375, 1.2528076171875, 1.371337890625, 1.4898681640625, 1.6083984375, 1.7269287109375, 1.845458984375, 1.9639892578125, 2.08251953125, 2.2010498046875, 2.319580078125, 2.4381103515625, 2.556640625, 2.6751708984375, 2.793701171875, 2.9122314453125, 3.03076171875, 3.1492919921875, 3.267822265625, 3.3863525390625, 3.5048828125, 3.6234130859375, 3.741943359375, 3.8604736328125, 3.97900390625, 4.0975341796875, 4.216064453125, 4.3345947265625, 4.453125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 3.0, 6.0, 6.0, 6.0, 17.0, 9.0, 15.0, 36.0, 50.0, 74.0, 131.0, 277.0, 469.0, 1013.0, 2351.0, 6231.0, 20469.0, 102875.0, 2643385.0, 1316428.0, 75806.0, 16247.0, 4970.0, 1819.0, 782.0, 340.0, 185.0, 93.0, 60.0, 29.0, 25.0, 15.0, 15.0, 10.0, 11.0, 4.0, 5.0, 4.0, 1.0, 4.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.62890625, -7.39715576171875, -7.1654052734375, -6.93365478515625, -6.701904296875, -6.47015380859375, -6.2384033203125, -6.00665283203125, -5.77490234375, -5.54315185546875, -5.3114013671875, -5.07965087890625, -4.847900390625, -4.61614990234375, -4.3843994140625, -4.15264892578125, -3.9208984375, -3.68914794921875, -3.4573974609375, -3.22564697265625, -2.993896484375, -2.76214599609375, -2.5303955078125, -2.29864501953125, -2.06689453125, -1.83514404296875, -1.6033935546875, -1.37164306640625, -1.139892578125, -0.90814208984375, -0.6763916015625, -0.44464111328125, -0.212890625, 0.01885986328125, 0.2506103515625, 0.48236083984375, 0.714111328125, 0.94586181640625, 1.1776123046875, 1.40936279296875, 1.64111328125, 1.87286376953125, 2.1046142578125, 2.33636474609375, 2.568115234375, 2.79986572265625, 3.0316162109375, 3.26336669921875, 3.4951171875, 3.72686767578125, 3.9586181640625, 4.19036865234375, 4.422119140625, 4.65386962890625, 4.8856201171875, 5.11737060546875, 5.34912109375, 5.58087158203125, 5.8126220703125, 6.04437255859375, 6.276123046875, 6.50787353515625, 6.7396240234375, 6.97137451171875, 7.203125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 7.0, 7.0, 4.0, 4.0, 1.0, 9.0, 7.0, 12.0, 16.0, 15.0, 16.0, 21.0, 25.0, 52.0, 67.0, 94.0, 148.0, 263.0, 579.0, 903.0, 833.0, 384.0, 184.0, 118.0, 76.0, 58.0, 46.0, 32.0, 21.0, 23.0, 13.0, 10.0, 4.0, 3.0, 2.0, 4.0, 6.0, 0.0, 3.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0], "bins": [-7.5703125, -7.37481689453125, -7.1793212890625, -6.98382568359375, -6.788330078125, -6.59283447265625, -6.3973388671875, -6.20184326171875, -6.00634765625, -5.81085205078125, -5.6153564453125, -5.41986083984375, -5.224365234375, -5.02886962890625, -4.8333740234375, -4.63787841796875, -4.4423828125, -4.24688720703125, -4.0513916015625, -3.85589599609375, -3.660400390625, -3.46490478515625, -3.2694091796875, -3.07391357421875, -2.87841796875, -2.68292236328125, -2.4874267578125, -2.29193115234375, -2.096435546875, -1.90093994140625, -1.7054443359375, -1.50994873046875, -1.314453125, -1.11895751953125, -0.9234619140625, -0.72796630859375, -0.532470703125, -0.33697509765625, -0.1414794921875, 0.05401611328125, 0.24951171875, 0.44500732421875, 0.6405029296875, 0.83599853515625, 1.031494140625, 1.22698974609375, 1.4224853515625, 1.61798095703125, 1.8134765625, 2.00897216796875, 2.2044677734375, 2.39996337890625, 2.595458984375, 2.79095458984375, 2.9864501953125, 3.18194580078125, 3.37744140625, 3.57293701171875, 3.7684326171875, 3.96392822265625, 4.159423828125, 4.35491943359375, 4.5504150390625, 4.74591064453125, 4.94140625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 6.0, 5.0, 4.0, 6.0, 10.0, 34.0, 63.0, 85.0, 163.0, 182.0, 181.0, 112.0, 70.0, 36.0, 20.0, 9.0, 6.0, 4.0, 1.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.44771575927734, -63.25919723510742, -61.0706787109375, -58.88215637207031, -56.69363784790039, -54.50511932373047, -52.31659698486328, -50.12807846069336, -47.93955993652344, -45.751041412353516, -43.562522888183594, -41.374000549316406, -39.185482025146484, -36.99696350097656, -34.808441162109375, -32.61992263793945, -30.43140411376953, -28.24288558959961, -26.054365158081055, -23.8658447265625, -21.677326202392578, -19.488807678222656, -17.3002872467041, -15.111767768859863, -12.923248291015625, -10.734728813171387, -8.546209335327148, -6.35768985748291, -4.169170379638672, -1.9806509017944336, 0.2078685760498047, 2.396388053894043, 4.5849151611328125, 6.773434638977051, 8.961954116821289, 11.150473594665527, 13.338993072509766, 15.527512550354004, 17.716032028198242, 19.904552459716797, 22.09307098388672, 24.28158950805664, 26.470109939575195, 28.65863037109375, 30.847148895263672, 33.035667419433594, 35.22418975830078, 37.4127082824707, 39.601226806640625, 41.78974533081055, 43.97826385498047, 46.166786193847656, 48.35530471801758, 50.5438232421875, 52.73234558105469, 54.92086410522461, 57.10938262939453, 59.29790115356445, 61.486419677734375, 63.67494201660156, 65.86346435546875, 68.0519790649414, 70.2405014038086, 72.42901611328125, 74.61753845214844]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 2.0, 4.0, 3.0, 3.0, 4.0, 4.0, 4.0, 5.0, 7.0, 12.0, 11.0, 14.0, 15.0, 15.0, 26.0, 25.0, 31.0, 33.0, 30.0, 34.0, 47.0, 45.0, 44.0, 71.0, 46.0, 49.0, 46.0, 49.0, 50.0, 41.0, 29.0, 31.0, 32.0, 16.0, 26.0, 21.0, 17.0, 13.0, 11.0, 3.0, 7.0, 10.0, 4.0, 4.0, 3.0, 1.0, 3.0, 4.0, 1.0, 3.0, 0.0, 2.0, 2.0], "bins": [-35.73024368286133, -34.7208251953125, -33.71140670776367, -32.701988220214844, -31.69257164001465, -30.683155059814453, -29.673736572265625, -28.664318084716797, -27.65489959716797, -26.64548110961914, -25.636064529418945, -24.626646041870117, -23.61722755432129, -22.607810974121094, -21.598392486572266, -20.588973999023438, -19.579557418823242, -18.570138931274414, -17.56072235107422, -16.55130386352539, -15.541885375976562, -14.53246784210205, -13.523050308227539, -12.513631820678711, -11.5042142868042, -10.494796752929688, -9.48537826538086, -8.475960731506348, -7.466542720794678, -6.457124710083008, -5.447707176208496, -4.438289165496826, -3.4288711547851562, -2.4194531440734863, -1.4100353717803955, -0.4006175994873047, 0.6088004112243652, 1.6182184219360352, 2.627635955810547, 3.637053966522217, 4.646471977233887, 5.655889987945557, 6.665307998657227, 7.674725532531738, 8.68414306640625, 9.693561553955078, 10.70297908782959, 11.712396621704102, 12.72181510925293, 13.731232643127441, 14.74065113067627, 15.750068664550781, 16.75948715209961, 17.768905639648438, 18.778322219848633, 19.78774070739746, 20.797157287597656, 21.806575775146484, 22.81599235534668, 23.825410842895508, 24.834829330444336, 25.84424591064453, 26.85366439819336, 27.863082885742188, 28.872501373291016]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 2.0, 3.0, 6.0, 8.0, 23.0, 29.0, 35.0, 57.0, 87.0, 146.0, 279.0, 511.0, 950.0, 1647.0, 3116.0, 6234.0, 13303.0, 30117.0, 71619.0, 174305.0, 348594.0, 230840.0, 94007.0, 39248.0, 17300.0, 7973.0, 3721.0, 1944.0, 1031.0, 575.0, 361.0, 190.0, 110.0, 64.0, 42.0, 31.0, 17.0, 16.0, 6.0, 3.0, 7.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.421875, -4.27276611328125, -4.1236572265625, -3.97454833984375, -3.825439453125, -3.67633056640625, -3.5272216796875, -3.37811279296875, -3.22900390625, -3.07989501953125, -2.9307861328125, -2.78167724609375, -2.632568359375, -2.48345947265625, -2.3343505859375, -2.18524169921875, -2.0361328125, -1.88702392578125, -1.7379150390625, -1.58880615234375, -1.439697265625, -1.29058837890625, -1.1414794921875, -0.99237060546875, -0.84326171875, -0.69415283203125, -0.5450439453125, -0.39593505859375, -0.246826171875, -0.09771728515625, 0.0513916015625, 0.20050048828125, 0.349609375, 0.49871826171875, 0.6478271484375, 0.79693603515625, 0.946044921875, 1.09515380859375, 1.2442626953125, 1.39337158203125, 1.54248046875, 1.69158935546875, 1.8406982421875, 1.98980712890625, 2.138916015625, 2.28802490234375, 2.4371337890625, 2.58624267578125, 2.7353515625, 2.88446044921875, 3.0335693359375, 3.18267822265625, 3.331787109375, 3.48089599609375, 3.6300048828125, 3.77911376953125, 3.92822265625, 4.07733154296875, 4.2264404296875, 4.37554931640625, 4.524658203125, 4.67376708984375, 4.8228759765625, 4.97198486328125, 5.12109375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 8.0, 2.0, 5.0, 6.0, 12.0, 18.0, 14.0, 23.0, 27.0, 17.0, 25.0, 31.0, 33.0, 33.0, 54.0, 49.0, 58.0, 47.0, 37.0, 37.0, 39.0, 55.0, 56.0, 31.0, 47.0, 37.0, 30.0, 32.0, 25.0, 27.0, 14.0, 8.0, 12.0, 14.0, 8.0, 5.0, 6.0, 6.0, 4.0, 7.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.10546875, -3.019134521484375, -2.93280029296875, -2.846466064453125, -2.7601318359375, -2.673797607421875, -2.58746337890625, -2.501129150390625, -2.414794921875, -2.328460693359375, -2.24212646484375, -2.155792236328125, -2.0694580078125, -1.983123779296875, -1.89678955078125, -1.810455322265625, -1.72412109375, -1.637786865234375, -1.55145263671875, -1.465118408203125, -1.3787841796875, -1.292449951171875, -1.20611572265625, -1.119781494140625, -1.033447265625, -0.947113037109375, -0.86077880859375, -0.774444580078125, -0.6881103515625, -0.601776123046875, -0.51544189453125, -0.429107666015625, -0.3427734375, -0.256439208984375, -0.17010498046875, -0.083770751953125, 0.0025634765625, 0.088897705078125, 0.17523193359375, 0.261566162109375, 0.347900390625, 0.434234619140625, 0.52056884765625, 0.606903076171875, 0.6932373046875, 0.779571533203125, 0.86590576171875, 0.952239990234375, 1.03857421875, 1.124908447265625, 1.21124267578125, 1.297576904296875, 1.3839111328125, 1.470245361328125, 1.55657958984375, 1.642913818359375, 1.729248046875, 1.815582275390625, 1.90191650390625, 1.988250732421875, 2.0745849609375, 2.160919189453125, 2.24725341796875, 2.333587646484375, 2.419921875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 9.0, 2.0, 4.0, 5.0, 13.0, 17.0, 14.0, 31.0, 55.0, 67.0, 131.0, 163.0, 345.0, 575.0, 1178.0, 2784.0, 9576.0, 55982.0, 635469.0, 300504.0, 30957.0, 6325.0, 2162.0, 952.0, 471.0, 271.0, 171.0, 104.0, 69.0, 46.0, 39.0, 24.0, 7.0, 12.0, 10.0, 2.0, 6.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.90625, -11.5438232421875, -11.181396484375, -10.8189697265625, -10.45654296875, -10.0941162109375, -9.731689453125, -9.3692626953125, -9.0068359375, -8.6444091796875, -8.281982421875, -7.9195556640625, -7.55712890625, -7.1947021484375, -6.832275390625, -6.4698486328125, -6.107421875, -5.7449951171875, -5.382568359375, -5.0201416015625, -4.65771484375, -4.2952880859375, -3.932861328125, -3.5704345703125, -3.2080078125, -2.8455810546875, -2.483154296875, -2.1207275390625, -1.75830078125, -1.3958740234375, -1.033447265625, -0.6710205078125, -0.30859375, 0.0538330078125, 0.416259765625, 0.7786865234375, 1.14111328125, 1.5035400390625, 1.865966796875, 2.2283935546875, 2.5908203125, 2.9532470703125, 3.315673828125, 3.6781005859375, 4.04052734375, 4.4029541015625, 4.765380859375, 5.1278076171875, 5.490234375, 5.8526611328125, 6.215087890625, 6.5775146484375, 6.93994140625, 7.3023681640625, 7.664794921875, 8.0272216796875, 8.3896484375, 8.7520751953125, 9.114501953125, 9.4769287109375, 9.83935546875, 10.2017822265625, 10.564208984375, 10.9266357421875, 11.2890625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 2.0, 6.0, 4.0, 7.0, 5.0, 8.0, 10.0, 9.0, 17.0, 27.0, 17.0, 20.0, 25.0, 24.0, 44.0, 41.0, 45.0, 47.0, 47.0, 45.0, 54.0, 57.0, 52.0, 60.0, 53.0, 33.0, 36.0, 39.0, 23.0, 25.0, 27.0, 19.0, 14.0, 14.0, 9.0, 5.0, 4.0, 9.0, 8.0, 2.0, 3.0, 6.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-14.53125, -14.1326904296875, -13.734130859375, -13.3355712890625, -12.93701171875, -12.5384521484375, -12.139892578125, -11.7413330078125, -11.3427734375, -10.9442138671875, -10.545654296875, -10.1470947265625, -9.74853515625, -9.3499755859375, -8.951416015625, -8.5528564453125, -8.154296875, -7.7557373046875, -7.357177734375, -6.9586181640625, -6.56005859375, -6.1614990234375, -5.762939453125, -5.3643798828125, -4.9658203125, -4.5672607421875, -4.168701171875, -3.7701416015625, -3.37158203125, -2.9730224609375, -2.574462890625, -2.1759033203125, -1.77734375, -1.3787841796875, -0.980224609375, -0.5816650390625, -0.18310546875, 0.2154541015625, 0.614013671875, 1.0125732421875, 1.4111328125, 1.8096923828125, 2.208251953125, 2.6068115234375, 3.00537109375, 3.4039306640625, 3.802490234375, 4.2010498046875, 4.599609375, 4.9981689453125, 5.396728515625, 5.7952880859375, 6.19384765625, 6.5924072265625, 6.990966796875, 7.3895263671875, 7.7880859375, 8.1866455078125, 8.585205078125, 8.9837646484375, 9.38232421875, 9.7808837890625, 10.179443359375, 10.5780029296875, 10.9765625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 4.0, 4.0, 2.0, 5.0, 3.0, 3.0, 9.0, 17.0, 31.0, 41.0, 91.0, 198.0, 465.0, 1789.0, 12014.0, 328913.0, 683697.0, 17959.0, 2235.0, 636.0, 216.0, 110.0, 48.0, 19.0, 13.0, 12.0, 13.0, 5.0, 7.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.8671875, -7.655029296875, -7.44287109375, -7.230712890625, -7.0185546875, -6.806396484375, -6.59423828125, -6.382080078125, -6.169921875, -5.957763671875, -5.74560546875, -5.533447265625, -5.3212890625, -5.109130859375, -4.89697265625, -4.684814453125, -4.47265625, -4.260498046875, -4.04833984375, -3.836181640625, -3.6240234375, -3.411865234375, -3.19970703125, -2.987548828125, -2.775390625, -2.563232421875, -2.35107421875, -2.138916015625, -1.9267578125, -1.714599609375, -1.50244140625, -1.290283203125, -1.078125, -0.865966796875, -0.65380859375, -0.441650390625, -0.2294921875, -0.017333984375, 0.19482421875, 0.406982421875, 0.619140625, 0.831298828125, 1.04345703125, 1.255615234375, 1.4677734375, 1.679931640625, 1.89208984375, 2.104248046875, 2.31640625, 2.528564453125, 2.74072265625, 2.952880859375, 3.1650390625, 3.377197265625, 3.58935546875, 3.801513671875, 4.013671875, 4.225830078125, 4.43798828125, 4.650146484375, 4.8623046875, 5.074462890625, 5.28662109375, 5.498779296875, 5.7109375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 3.0, 4.0, 3.0, 8.0, 7.0, 19.0, 23.0, 26.0, 24.0, 30.0, 40.0, 47.0, 74.0, 98.0, 126.0, 95.0, 79.0, 60.0, 48.0, 42.0, 20.0, 23.0, 17.0, 16.0, 16.0, 8.0, 4.0, 6.0, 7.0, 10.0, 2.0, 5.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0005321502685546875, -0.0005157887935638428, -0.000499427318572998, -0.0004830658435821533, -0.0004667043685913086, -0.00045034289360046387, -0.00043398141860961914, -0.0004176199436187744, -0.0004012584686279297, -0.00038489699363708496, -0.00036853551864624023, -0.0003521740436553955, -0.0003358125686645508, -0.00031945109367370605, -0.00030308961868286133, -0.0002867281436920166, -0.0002703666687011719, -0.00025400519371032715, -0.00023764371871948242, -0.0002212822437286377, -0.00020492076873779297, -0.00018855929374694824, -0.00017219781875610352, -0.0001558363437652588, -0.00013947486877441406, -0.00012311339378356934, -0.00010675191879272461, -9.039044380187988e-05, -7.402896881103516e-05, -5.766749382019043e-05, -4.13060188293457e-05, -2.4944543838500977e-05, -8.58306884765625e-06, 7.778406143188477e-06, 2.4139881134033203e-05, 4.050135612487793e-05, 5.6862831115722656e-05, 7.322430610656738e-05, 8.958578109741211e-05, 0.00010594725608825684, 0.00012230873107910156, 0.0001386702060699463, 0.00015503168106079102, 0.00017139315605163574, 0.00018775463104248047, 0.0002041161060333252, 0.00022047758102416992, 0.00023683905601501465, 0.0002532005310058594, 0.0002695620059967041, 0.00028592348098754883, 0.00030228495597839355, 0.0003186464309692383, 0.000335007905960083, 0.00035136938095092773, 0.00036773085594177246, 0.0003840923309326172, 0.0004004538059234619, 0.00041681528091430664, 0.00043317675590515137, 0.0004495382308959961, 0.0004658997058868408, 0.00048226118087768555, 0.0004986226558685303, 0.000514984130859375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 3.0, 3.0, 6.0, 7.0, 12.0, 13.0, 15.0, 22.0, 41.0, 67.0, 91.0, 128.0, 216.0, 306.0, 561.0, 1038.0, 2178.0, 5536.0, 18852.0, 92937.0, 629639.0, 241762.0, 38858.0, 9664.0, 3290.0, 1434.0, 746.0, 389.0, 260.0, 144.0, 108.0, 72.0, 30.0, 34.0, 25.0, 24.0, 10.0, 13.0, 3.0, 6.0, 9.0, 0.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.298828125, -3.1915283203125, -3.084228515625, -2.9769287109375, -2.86962890625, -2.7623291015625, -2.655029296875, -2.5477294921875, -2.4404296875, -2.3331298828125, -2.225830078125, -2.1185302734375, -2.01123046875, -1.9039306640625, -1.796630859375, -1.6893310546875, -1.58203125, -1.4747314453125, -1.367431640625, -1.2601318359375, -1.15283203125, -1.0455322265625, -0.938232421875, -0.8309326171875, -0.7236328125, -0.6163330078125, -0.509033203125, -0.4017333984375, -0.29443359375, -0.1871337890625, -0.079833984375, 0.0274658203125, 0.134765625, 0.2420654296875, 0.349365234375, 0.4566650390625, 0.56396484375, 0.6712646484375, 0.778564453125, 0.8858642578125, 0.9931640625, 1.1004638671875, 1.207763671875, 1.3150634765625, 1.42236328125, 1.5296630859375, 1.636962890625, 1.7442626953125, 1.8515625, 1.9588623046875, 2.066162109375, 2.1734619140625, 2.28076171875, 2.3880615234375, 2.495361328125, 2.6026611328125, 2.7099609375, 2.8172607421875, 2.924560546875, 3.0318603515625, 3.13916015625, 3.2464599609375, 3.353759765625, 3.4610595703125, 3.568359375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 7.0, 6.0, 8.0, 10.0, 14.0, 13.0, 28.0, 46.0, 64.0, 82.0, 94.0, 116.0, 117.0, 99.0, 79.0, 59.0, 60.0, 40.0, 23.0, 17.0, 9.0, 5.0, 6.0, 2.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.96484375, -2.80120849609375, -2.6375732421875, -2.47393798828125, -2.310302734375, -2.14666748046875, -1.9830322265625, -1.81939697265625, -1.65576171875, -1.49212646484375, -1.3284912109375, -1.16485595703125, -1.001220703125, -0.83758544921875, -0.6739501953125, -0.51031494140625, -0.3466796875, -0.18304443359375, -0.0194091796875, 0.14422607421875, 0.307861328125, 0.47149658203125, 0.6351318359375, 0.79876708984375, 0.96240234375, 1.12603759765625, 1.2896728515625, 1.45330810546875, 1.616943359375, 1.78057861328125, 1.9442138671875, 2.10784912109375, 2.271484375, 2.43511962890625, 2.5987548828125, 2.76239013671875, 2.926025390625, 3.08966064453125, 3.2532958984375, 3.41693115234375, 3.58056640625, 3.74420166015625, 3.9078369140625, 4.07147216796875, 4.235107421875, 4.39874267578125, 4.5623779296875, 4.72601318359375, 4.8896484375, 5.05328369140625, 5.2169189453125, 5.38055419921875, 5.544189453125, 5.70782470703125, 5.8714599609375, 6.03509521484375, 6.19873046875, 6.36236572265625, 6.5260009765625, 6.68963623046875, 6.853271484375, 7.01690673828125, 7.1805419921875, 7.34417724609375, 7.5078125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0, 4.0, 8.0, 5.0, 10.0, 21.0, 32.0, 52.0, 103.0, 156.0, 211.0, 142.0, 108.0, 72.0, 23.0, 27.0, 9.0, 8.0, 2.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-78.68687438964844, -76.40668487548828, -74.1264877319336, -71.84629821777344, -69.56610870361328, -67.2859115600586, -65.00572204589844, -62.725528717041016, -60.445335388183594, -58.16514205932617, -55.884952545166016, -53.604759216308594, -51.32456588745117, -49.04437255859375, -46.764183044433594, -44.48398971557617, -42.203800201416016, -39.923606872558594, -37.64341735839844, -35.363224029541016, -33.083030700683594, -30.802839279174805, -28.522647857666016, -26.242454528808594, -23.962263107299805, -21.682071685791016, -19.401878356933594, -17.121686935424805, -14.8414945602417, -12.561302185058594, -10.281110763549805, -8.0009183883667, -5.720726013183594, -3.4405338764190674, -1.160341739654541, 1.1198501586914062, 3.4000425338745117, 5.680234909057617, 7.960426330566406, 10.240618705749512, 12.520811080932617, 14.801003456115723, 17.081195831298828, 19.361387252807617, 21.641578674316406, 23.921772003173828, 26.201963424682617, 28.482154846191406, 30.762348175048828, 33.04254150390625, 35.322731018066406, 37.60292434692383, 39.88311767578125, 42.163307189941406, 44.44350051879883, 46.72369384765625, 49.003883361816406, 51.28407669067383, 53.564266204833984, 55.844459533691406, 58.12465286254883, 60.40484619140625, 62.685035705566406, 64.96522521972656, 67.24542236328125]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 3.0, 5.0, 3.0, 6.0, 8.0, 12.0, 11.0, 18.0, 20.0, 22.0, 28.0, 29.0, 35.0, 38.0, 34.0, 42.0, 57.0, 53.0, 70.0, 48.0, 40.0, 52.0, 52.0, 30.0, 43.0, 31.0, 31.0, 29.0, 31.0, 22.0, 17.0, 24.0, 11.0, 12.0, 11.0, 7.0, 2.0, 6.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-44.118587493896484, -42.56791687011719, -41.017242431640625, -39.46657180786133, -37.915897369384766, -36.36522674560547, -34.814552307128906, -33.26388168334961, -31.713211059570312, -30.162538528442383, -28.611865997314453, -27.061195373535156, -25.510522842407227, -23.959850311279297, -22.409177780151367, -20.858505249023438, -19.307832717895508, -17.757160186767578, -16.20648765563965, -14.655816078186035, -13.105144500732422, -11.554471969604492, -10.003799438476562, -8.45312786102295, -6.9024553298950195, -5.351783275604248, -3.8011109828948975, -2.250438690185547, -0.6997666358947754, 0.8509054183959961, 2.401577949523926, 3.952249526977539, 5.502922058105469, 7.05359411239624, 8.604266166687012, 10.154938697814941, 11.705610275268555, 13.256282806396484, 14.806955337524414, 16.357627868652344, 17.90829849243164, 19.45897102355957, 21.0096435546875, 22.560314178466797, 24.110986709594727, 25.661659240722656, 27.212331771850586, 28.763004302978516, 30.313676834106445, 31.864349365234375, 33.41501998901367, 34.965694427490234, 36.51636505126953, 38.067039489746094, 39.61771011352539, 41.16838073730469, 42.71905517578125, 44.26972579956055, 45.82040023803711, 47.371070861816406, 48.92174530029297, 50.472415924072266, 52.02308654785156, 53.573760986328125, 55.12443161010742]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 7.0, 10.0, 6.0, 17.0, 23.0, 32.0, 37.0, 52.0, 76.0, 145.0, 187.0, 536.0, 2256.0, 41275.0, 4114328.0, 32271.0, 1946.0, 493.0, 217.0, 119.0, 70.0, 48.0, 44.0, 26.0, 16.0, 12.0, 12.0, 9.0, 5.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.515625, -16.85400390625, -16.1923828125, -15.53076171875, -14.869140625, -14.20751953125, -13.5458984375, -12.88427734375, -12.22265625, -11.56103515625, -10.8994140625, -10.23779296875, -9.576171875, -8.91455078125, -8.2529296875, -7.59130859375, -6.9296875, -6.26806640625, -5.6064453125, -4.94482421875, -4.283203125, -3.62158203125, -2.9599609375, -2.29833984375, -1.63671875, -0.97509765625, -0.3134765625, 0.34814453125, 1.009765625, 1.67138671875, 2.3330078125, 2.99462890625, 3.65625, 4.31787109375, 4.9794921875, 5.64111328125, 6.302734375, 6.96435546875, 7.6259765625, 8.28759765625, 8.94921875, 9.61083984375, 10.2724609375, 10.93408203125, 11.595703125, 12.25732421875, 12.9189453125, 13.58056640625, 14.2421875, 14.90380859375, 15.5654296875, 16.22705078125, 16.888671875, 17.55029296875, 18.2119140625, 18.87353515625, 19.53515625, 20.19677734375, 20.8583984375, 21.52001953125, 22.181640625, 22.84326171875, 23.5048828125, 24.16650390625, 24.828125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 7.0, 6.0, 12.0, 16.0, 26.0, 29.0, 38.0, 64.0, 66.0, 82.0, 87.0, 83.0, 103.0, 84.0, 73.0, 64.0, 46.0, 34.0, 29.0, 21.0, 12.0, 10.0, 4.0, 9.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.134765625, -2.983428955078125, -2.83209228515625, -2.680755615234375, -2.5294189453125, -2.378082275390625, -2.22674560546875, -2.075408935546875, -1.924072265625, -1.772735595703125, -1.62139892578125, -1.470062255859375, -1.3187255859375, -1.167388916015625, -1.01605224609375, -0.864715576171875, -0.71337890625, -0.562042236328125, -0.41070556640625, -0.259368896484375, -0.1080322265625, 0.043304443359375, 0.19464111328125, 0.345977783203125, 0.497314453125, 0.648651123046875, 0.79998779296875, 0.951324462890625, 1.1026611328125, 1.253997802734375, 1.40533447265625, 1.556671142578125, 1.7080078125, 1.859344482421875, 2.01068115234375, 2.162017822265625, 2.3133544921875, 2.464691162109375, 2.61602783203125, 2.767364501953125, 2.918701171875, 3.070037841796875, 3.22137451171875, 3.372711181640625, 3.5240478515625, 3.675384521484375, 3.82672119140625, 3.978057861328125, 4.12939453125, 4.280731201171875, 4.43206787109375, 4.583404541015625, 4.7347412109375, 4.886077880859375, 5.03741455078125, 5.188751220703125, 5.340087890625, 5.491424560546875, 5.64276123046875, 5.794097900390625, 5.9454345703125, 6.096771240234375, 6.24810791015625, 6.399444580078125, 6.55078125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 8.0, 10.0, 8.0, 17.0, 22.0, 37.0, 57.0, 97.0, 129.0, 187.0, 367.0, 745.0, 1593.0, 4466.0, 15344.0, 73481.0, 1377170.0, 2586978.0, 103796.0, 19844.0, 5944.0, 2142.0, 888.0, 416.0, 223.0, 118.0, 85.0, 38.0, 29.0, 19.0, 8.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.8125, -7.59600830078125, -7.3795166015625, -7.16302490234375, -6.946533203125, -6.73004150390625, -6.5135498046875, -6.29705810546875, -6.08056640625, -5.86407470703125, -5.6475830078125, -5.43109130859375, -5.214599609375, -4.99810791015625, -4.7816162109375, -4.56512451171875, -4.3486328125, -4.13214111328125, -3.9156494140625, -3.69915771484375, -3.482666015625, -3.26617431640625, -3.0496826171875, -2.83319091796875, -2.61669921875, -2.40020751953125, -2.1837158203125, -1.96722412109375, -1.750732421875, -1.53424072265625, -1.3177490234375, -1.10125732421875, -0.884765625, -0.66827392578125, -0.4517822265625, -0.23529052734375, -0.018798828125, 0.19769287109375, 0.4141845703125, 0.63067626953125, 0.84716796875, 1.06365966796875, 1.2801513671875, 1.49664306640625, 1.713134765625, 1.92962646484375, 2.1461181640625, 2.36260986328125, 2.5791015625, 2.79559326171875, 3.0120849609375, 3.22857666015625, 3.445068359375, 3.66156005859375, 3.8780517578125, 4.09454345703125, 4.31103515625, 4.52752685546875, 4.7440185546875, 4.96051025390625, 5.177001953125, 5.39349365234375, 5.6099853515625, 5.82647705078125, 6.04296875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 7.0, 11.0, 6.0, 26.0, 29.0, 45.0, 67.0, 136.0, 252.0, 592.0, 1069.0, 915.0, 446.0, 192.0, 98.0, 55.0, 30.0, 32.0, 11.0, 17.0, 6.0, 8.0, 3.0, 6.0, 2.0, 4.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.4296875, -7.19610595703125, -6.9625244140625, -6.72894287109375, -6.495361328125, -6.26177978515625, -6.0281982421875, -5.79461669921875, -5.56103515625, -5.32745361328125, -5.0938720703125, -4.86029052734375, -4.626708984375, -4.39312744140625, -4.1595458984375, -3.92596435546875, -3.6923828125, -3.45880126953125, -3.2252197265625, -2.99163818359375, -2.758056640625, -2.52447509765625, -2.2908935546875, -2.05731201171875, -1.82373046875, -1.59014892578125, -1.3565673828125, -1.12298583984375, -0.889404296875, -0.65582275390625, -0.4222412109375, -0.18865966796875, 0.044921875, 0.27850341796875, 0.5120849609375, 0.74566650390625, 0.979248046875, 1.21282958984375, 1.4464111328125, 1.67999267578125, 1.91357421875, 2.14715576171875, 2.3807373046875, 2.61431884765625, 2.847900390625, 3.08148193359375, 3.3150634765625, 3.54864501953125, 3.7822265625, 4.01580810546875, 4.2493896484375, 4.48297119140625, 4.716552734375, 4.95013427734375, 5.1837158203125, 5.41729736328125, 5.65087890625, 5.88446044921875, 6.1180419921875, 6.35162353515625, 6.585205078125, 6.81878662109375, 7.0523681640625, 7.28594970703125, 7.51953125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 5.0, 5.0, 8.0, 15.0, 18.0, 59.0, 182.0, 274.0, 238.0, 131.0, 33.0, 13.0, 9.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.50408172607422, -78.79768371582031, -76.09129333496094, -73.38489532470703, -70.67850494384766, -67.97210693359375, -65.26571655273438, -62.55931854248047, -59.85292434692383, -57.14653015136719, -54.44013595581055, -51.733741760253906, -49.02734375, -46.320953369140625, -43.61455535888672, -40.90816116333008, -38.20176696777344, -35.4953727722168, -32.788978576660156, -30.082582473754883, -27.376188278198242, -24.6697940826416, -21.963397979736328, -19.257003784179688, -16.550609588623047, -13.844215393066406, -11.13782024383545, -8.431425094604492, -5.725030899047852, -3.018636703491211, -0.3122406005859375, 2.394153594970703, 5.100555419921875, 7.806950092315674, 10.513344764709473, 13.21973991394043, 15.92613410949707, 18.63252830505371, 21.338924407958984, 24.045318603515625, 26.751712799072266, 29.458106994628906, 32.16450119018555, 34.87089538574219, 37.577293395996094, 40.28368377685547, 42.990081787109375, 45.696475982666016, 48.402870178222656, 51.1092643737793, 53.81565856933594, 56.522056579589844, 59.22844696044922, 61.934844970703125, 64.6412353515625, 67.3476333618164, 70.05403137207031, 72.76042938232422, 75.4668197631836, 78.1732177734375, 80.87960815429688, 83.58600616455078, 86.29240417480469, 88.99879455566406, 91.70518493652344]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 2.0, 3.0, 5.0, 4.0, 5.0, 3.0, 20.0, 20.0, 18.0, 27.0, 42.0, 45.0, 41.0, 48.0, 43.0, 58.0, 70.0, 61.0, 54.0, 75.0, 52.0, 44.0, 44.0, 34.0, 31.0, 38.0, 25.0, 22.0, 14.0, 9.0, 17.0, 7.0, 6.0, 5.0, 1.0, 3.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.87779235839844, -33.782325744628906, -32.686859130859375, -31.591392517089844, -30.495925903320312, -29.40045928955078, -28.30499267578125, -27.20952606201172, -26.114059448242188, -25.018592834472656, -23.923126220703125, -22.827659606933594, -21.732192993164062, -20.63672637939453, -19.541259765625, -18.44579315185547, -17.35032844543457, -16.25486183166504, -15.159395217895508, -14.063928604125977, -12.968461990356445, -11.872995376586914, -10.7775297164917, -9.682063102722168, -8.586596488952637, -7.4911298751831055, -6.395663261413574, -5.300197124481201, -4.20473051071167, -3.1092638969421387, -2.0137977600097656, -0.9183311462402344, 0.17713546752929688, 1.2726019620895386, 2.3680684566497803, 3.4635348320007324, 4.559001445770264, 5.654468059539795, 6.749934196472168, 7.845400810241699, 8.94086742401123, 10.036334037780762, 11.131800651550293, 12.227266311645508, 13.322732925415039, 14.41819953918457, 15.513666152954102, 16.609132766723633, 17.704599380493164, 18.800065994262695, 19.895532608032227, 20.990999221801758, 22.08646583557129, 23.18193244934082, 24.27739715576172, 25.37286376953125, 26.46833038330078, 27.563796997070312, 28.659263610839844, 29.754730224609375, 30.850196838378906, 31.945663452148438, 33.04113006591797, 34.1365966796875, 35.23206329345703]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 2.0, 12.0, 13.0, 19.0, 22.0, 48.0, 66.0, 106.0, 202.0, 345.0, 637.0, 1195.0, 2188.0, 4690.0, 9831.0, 21773.0, 51898.0, 135916.0, 342105.0, 291853.0, 108566.0, 42343.0, 18332.0, 8176.0, 3975.0, 1948.0, 1008.0, 574.0, 293.0, 165.0, 114.0, 56.0, 35.0, 17.0, 13.0, 6.0, 7.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.28515625, -5.1336669921875, -4.982177734375, -4.8306884765625, -4.67919921875, -4.5277099609375, -4.376220703125, -4.2247314453125, -4.0732421875, -3.9217529296875, -3.770263671875, -3.6187744140625, -3.46728515625, -3.3157958984375, -3.164306640625, -3.0128173828125, -2.861328125, -2.7098388671875, -2.558349609375, -2.4068603515625, -2.25537109375, -2.1038818359375, -1.952392578125, -1.8009033203125, -1.6494140625, -1.4979248046875, -1.346435546875, -1.1949462890625, -1.04345703125, -0.8919677734375, -0.740478515625, -0.5889892578125, -0.4375, -0.2860107421875, -0.134521484375, 0.0169677734375, 0.16845703125, 0.3199462890625, 0.471435546875, 0.6229248046875, 0.7744140625, 0.9259033203125, 1.077392578125, 1.2288818359375, 1.38037109375, 1.5318603515625, 1.683349609375, 1.8348388671875, 1.986328125, 2.1378173828125, 2.289306640625, 2.4407958984375, 2.59228515625, 2.7437744140625, 2.895263671875, 3.0467529296875, 3.1982421875, 3.3497314453125, 3.501220703125, 3.6527099609375, 3.80419921875, 3.9556884765625, 4.107177734375, 4.2586669921875, 4.41015625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 5.0, 8.0, 6.0, 6.0, 9.0, 8.0, 13.0, 13.0, 18.0, 31.0, 21.0, 34.0, 27.0, 27.0, 42.0, 48.0, 59.0, 47.0, 50.0, 53.0, 50.0, 44.0, 46.0, 37.0, 42.0, 47.0, 37.0, 26.0, 27.0, 26.0, 21.0, 16.0, 10.0, 17.0, 6.0, 7.0, 6.0, 2.0, 2.0, 5.0, 3.0, 0.0, 2.0, 4.0, 0.0, 3.0, 0.0, 1.0], "bins": [-3.11328125, -3.025909423828125, -2.93853759765625, -2.851165771484375, -2.7637939453125, -2.676422119140625, -2.58905029296875, -2.501678466796875, -2.414306640625, -2.326934814453125, -2.23956298828125, -2.152191162109375, -2.0648193359375, -1.977447509765625, -1.89007568359375, -1.802703857421875, -1.71533203125, -1.627960205078125, -1.54058837890625, -1.453216552734375, -1.3658447265625, -1.278472900390625, -1.19110107421875, -1.103729248046875, -1.016357421875, -0.928985595703125, -0.84161376953125, -0.754241943359375, -0.6668701171875, -0.579498291015625, -0.49212646484375, -0.404754638671875, -0.3173828125, -0.230010986328125, -0.14263916015625, -0.055267333984375, 0.0321044921875, 0.119476318359375, 0.20684814453125, 0.294219970703125, 0.381591796875, 0.468963623046875, 0.55633544921875, 0.643707275390625, 0.7310791015625, 0.818450927734375, 0.90582275390625, 0.993194580078125, 1.08056640625, 1.167938232421875, 1.25531005859375, 1.342681884765625, 1.4300537109375, 1.517425537109375, 1.60479736328125, 1.692169189453125, 1.779541015625, 1.866912841796875, 1.95428466796875, 2.041656494140625, 2.1290283203125, 2.216400146484375, 2.30377197265625, 2.391143798828125, 2.478515625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 12.0, 9.0, 14.0, 16.0, 21.0, 41.0, 56.0, 90.0, 163.0, 297.0, 542.0, 1035.0, 2681.0, 8240.0, 37604.0, 278216.0, 625977.0, 72647.0, 14078.0, 3871.0, 1386.0, 680.0, 336.0, 193.0, 117.0, 70.0, 54.0, 32.0, 20.0, 14.0, 7.0, 10.0, 3.0, 4.0, 4.0, 7.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.3046875, -9.9742431640625, -9.643798828125, -9.3133544921875, -8.98291015625, -8.6524658203125, -8.322021484375, -7.9915771484375, -7.6611328125, -7.3306884765625, -7.000244140625, -6.6697998046875, -6.33935546875, -6.0089111328125, -5.678466796875, -5.3480224609375, -5.017578125, -4.6871337890625, -4.356689453125, -4.0262451171875, -3.69580078125, -3.3653564453125, -3.034912109375, -2.7044677734375, -2.3740234375, -2.0435791015625, -1.713134765625, -1.3826904296875, -1.05224609375, -0.7218017578125, -0.391357421875, -0.0609130859375, 0.26953125, 0.5999755859375, 0.930419921875, 1.2608642578125, 1.59130859375, 1.9217529296875, 2.252197265625, 2.5826416015625, 2.9130859375, 3.2435302734375, 3.573974609375, 3.9044189453125, 4.23486328125, 4.5653076171875, 4.895751953125, 5.2261962890625, 5.556640625, 5.8870849609375, 6.217529296875, 6.5479736328125, 6.87841796875, 7.2088623046875, 7.539306640625, 7.8697509765625, 8.2001953125, 8.5306396484375, 8.861083984375, 9.1915283203125, 9.52197265625, 9.8524169921875, 10.182861328125, 10.5133056640625, 10.84375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 1.0, 8.0, 4.0, 9.0, 16.0, 9.0, 13.0, 20.0, 19.0, 17.0, 27.0, 29.0, 32.0, 27.0, 43.0, 47.0, 53.0, 59.0, 26.0, 43.0, 50.0, 39.0, 55.0, 53.0, 47.0, 42.0, 39.0, 25.0, 26.0, 22.0, 21.0, 23.0, 12.0, 9.0, 9.0, 3.0, 3.0, 4.0, 5.0, 2.0, 1.0, 4.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.328125, -9.9725341796875, -9.616943359375, -9.2613525390625, -8.90576171875, -8.5501708984375, -8.194580078125, -7.8389892578125, -7.4833984375, -7.1278076171875, -6.772216796875, -6.4166259765625, -6.06103515625, -5.7054443359375, -5.349853515625, -4.9942626953125, -4.638671875, -4.2830810546875, -3.927490234375, -3.5718994140625, -3.21630859375, -2.8607177734375, -2.505126953125, -2.1495361328125, -1.7939453125, -1.4383544921875, -1.082763671875, -0.7271728515625, -0.37158203125, -0.0159912109375, 0.339599609375, 0.6951904296875, 1.05078125, 1.4063720703125, 1.761962890625, 2.1175537109375, 2.47314453125, 2.8287353515625, 3.184326171875, 3.5399169921875, 3.8955078125, 4.2510986328125, 4.606689453125, 4.9622802734375, 5.31787109375, 5.6734619140625, 6.029052734375, 6.3846435546875, 6.740234375, 7.0958251953125, 7.451416015625, 7.8070068359375, 8.16259765625, 8.5181884765625, 8.873779296875, 9.2293701171875, 9.5849609375, 9.9405517578125, 10.296142578125, 10.6517333984375, 11.00732421875, 11.3629150390625, 11.718505859375, 12.0740966796875, 12.4296875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 2.0, 4.0, 1.0, 2.0, 14.0, 14.0, 18.0, 37.0, 58.0, 123.0, 341.0, 1281.0, 9043.0, 661173.0, 367618.0, 7148.0, 1115.0, 300.0, 125.0, 49.0, 31.0, 20.0, 13.0, 4.0, 9.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-10.4453125, -10.146484375, -9.84765625, -9.548828125, -9.25, -8.951171875, -8.65234375, -8.353515625, -8.0546875, -7.755859375, -7.45703125, -7.158203125, -6.859375, -6.560546875, -6.26171875, -5.962890625, -5.6640625, -5.365234375, -5.06640625, -4.767578125, -4.46875, -4.169921875, -3.87109375, -3.572265625, -3.2734375, -2.974609375, -2.67578125, -2.376953125, -2.078125, -1.779296875, -1.48046875, -1.181640625, -0.8828125, -0.583984375, -0.28515625, 0.013671875, 0.3125, 0.611328125, 0.91015625, 1.208984375, 1.5078125, 1.806640625, 2.10546875, 2.404296875, 2.703125, 3.001953125, 3.30078125, 3.599609375, 3.8984375, 4.197265625, 4.49609375, 4.794921875, 5.09375, 5.392578125, 5.69140625, 5.990234375, 6.2890625, 6.587890625, 6.88671875, 7.185546875, 7.484375, 7.783203125, 8.08203125, 8.380859375, 8.6796875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 9.0, 7.0, 8.0, 12.0, 8.0, 14.0, 21.0, 33.0, 44.0, 81.0, 113.0, 137.0, 153.0, 98.0, 79.0, 50.0, 38.0, 21.0, 22.0, 15.0, 9.0, 4.0, 9.0, 9.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006747245788574219, -0.0006507784128189087, -0.0006268322467803955, -0.0006028860807418823, -0.0005789399147033691, -0.000554993748664856, -0.0005310475826263428, -0.0005071014165878296, -0.0004831552505493164, -0.0004592090845108032, -0.00043526291847229004, -0.00041131675243377686, -0.00038737058639526367, -0.0003634244203567505, -0.0003394782543182373, -0.0003155320882797241, -0.00029158592224121094, -0.00026763975620269775, -0.00024369359016418457, -0.0002197474241256714, -0.0001958012580871582, -0.00017185509204864502, -0.00014790892601013184, -0.00012396275997161865, -0.00010001659393310547, -7.607042789459229e-05, -5.21242618560791e-05, -2.8178095817565918e-05, -4.231929779052734e-06, 1.971423625946045e-05, 4.366040229797363e-05, 6.760656833648682e-05, 9.1552734375e-05, 0.00011549890041351318, 0.00013944506645202637, 0.00016339123249053955, 0.00018733739852905273, 0.00021128356456756592, 0.0002352297306060791, 0.0002591758966445923, 0.00028312206268310547, 0.00030706822872161865, 0.00033101439476013184, 0.000354960560798645, 0.0003789067268371582, 0.0004028528928756714, 0.00042679905891418457, 0.00045074522495269775, 0.00047469139099121094, 0.0004986375570297241, 0.0005225837230682373, 0.0005465298891067505, 0.0005704760551452637, 0.0005944222211837769, 0.00061836838722229, 0.0006423145532608032, 0.0006662607192993164, 0.0006902068853378296, 0.0007141530513763428, 0.000738099217414856, 0.0007620453834533691, 0.0007859915494918823, 0.0008099377155303955, 0.0008338838815689087, 0.0008578300476074219]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 0.0, 1.0, 3.0, 3.0, 4.0, 7.0, 4.0, 9.0, 17.0, 25.0, 31.0, 57.0, 76.0, 134.0, 230.0, 417.0, 882.0, 2062.0, 6248.0, 28239.0, 256099.0, 670544.0, 66407.0, 11328.0, 3260.0, 1211.0, 577.0, 263.0, 157.0, 87.0, 59.0, 40.0, 20.0, 10.0, 14.0, 14.0, 5.0, 3.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.96875, -3.84161376953125, -3.7144775390625, -3.58734130859375, -3.460205078125, -3.33306884765625, -3.2059326171875, -3.07879638671875, -2.95166015625, -2.82452392578125, -2.6973876953125, -2.57025146484375, -2.443115234375, -2.31597900390625, -2.1888427734375, -2.06170654296875, -1.9345703125, -1.80743408203125, -1.6802978515625, -1.55316162109375, -1.426025390625, -1.29888916015625, -1.1717529296875, -1.04461669921875, -0.91748046875, -0.79034423828125, -0.6632080078125, -0.53607177734375, -0.408935546875, -0.28179931640625, -0.1546630859375, -0.02752685546875, 0.099609375, 0.22674560546875, 0.3538818359375, 0.48101806640625, 0.608154296875, 0.73529052734375, 0.8624267578125, 0.98956298828125, 1.11669921875, 1.24383544921875, 1.3709716796875, 1.49810791015625, 1.625244140625, 1.75238037109375, 1.8795166015625, 2.00665283203125, 2.1337890625, 2.26092529296875, 2.3880615234375, 2.51519775390625, 2.642333984375, 2.76947021484375, 2.8966064453125, 3.02374267578125, 3.15087890625, 3.27801513671875, 3.4051513671875, 3.53228759765625, 3.659423828125, 3.78656005859375, 3.9136962890625, 4.04083251953125, 4.16796875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 5.0, 1.0, 2.0, 4.0, 2.0, 2.0, 10.0, 6.0, 4.0, 23.0, 18.0, 23.0, 32.0, 30.0, 46.0, 59.0, 68.0, 75.0, 75.0, 66.0, 75.0, 63.0, 55.0, 53.0, 48.0, 29.0, 20.0, 25.0, 17.0, 13.0, 12.0, 8.0, 11.0, 8.0, 5.0, 5.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.244140625, -3.150115966796875, -3.05609130859375, -2.962066650390625, -2.8680419921875, -2.774017333984375, -2.67999267578125, -2.585968017578125, -2.491943359375, -2.397918701171875, -2.30389404296875, -2.209869384765625, -2.1158447265625, -2.021820068359375, -1.92779541015625, -1.833770751953125, -1.73974609375, -1.645721435546875, -1.55169677734375, -1.457672119140625, -1.3636474609375, -1.269622802734375, -1.17559814453125, -1.081573486328125, -0.987548828125, -0.893524169921875, -0.79949951171875, -0.705474853515625, -0.6114501953125, -0.517425537109375, -0.42340087890625, -0.329376220703125, -0.2353515625, -0.141326904296875, -0.04730224609375, 0.046722412109375, 0.1407470703125, 0.234771728515625, 0.32879638671875, 0.422821044921875, 0.516845703125, 0.610870361328125, 0.70489501953125, 0.798919677734375, 0.8929443359375, 0.986968994140625, 1.08099365234375, 1.175018310546875, 1.26904296875, 1.363067626953125, 1.45709228515625, 1.551116943359375, 1.6451416015625, 1.739166259765625, 1.83319091796875, 1.927215576171875, 2.021240234375, 2.115264892578125, 2.20928955078125, 2.303314208984375, 2.3973388671875, 2.491363525390625, 2.58538818359375, 2.679412841796875, 2.7734375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 8.0, 15.0, 33.0, 85.0, 177.0, 372.0, 187.0, 85.0, 16.0, 11.0, 3.0, 4.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-166.338134765625, -162.68104553222656, -159.02395629882812, -155.3668670654297, -151.70977783203125, -148.05267333984375, -144.3955841064453, -140.73849487304688, -137.08140563964844, -133.42431640625, -129.76722717285156, -126.1101303100586, -122.45304107666016, -118.79595184326172, -115.13885498046875, -111.48176574707031, -107.82467651367188, -104.16758728027344, -100.510498046875, -96.85340118408203, -93.1963119506836, -89.53922271728516, -85.88212585449219, -82.22503662109375, -78.56794738769531, -74.91085815429688, -71.25376892089844, -67.59667205810547, -63.93958282470703, -60.282493591308594, -56.62540054321289, -52.96830749511719, -49.31121826171875, -45.65412902832031, -41.99703598022461, -38.339942932128906, -34.68285369873047, -31.0257625579834, -27.368671417236328, -23.711580276489258, -20.054489135742188, -16.397397994995117, -12.740306854248047, -9.083215713500977, -5.426124572753906, -1.769033432006836, 1.8880577087402344, 5.545148849487305, 9.202239990234375, 12.859331130981445, 16.516422271728516, 20.173513412475586, 23.830604553222656, 27.487695693969727, 31.144786834716797, 34.8018798828125, 38.45896911621094, 42.116058349609375, 45.77315139770508, 49.43024444580078, 53.08733367919922, 56.744422912597656, 60.40151596069336, 64.05860900878906, 67.7156982421875]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 2.0, 6.0, 7.0, 6.0, 8.0, 11.0, 13.0, 10.0, 22.0, 20.0, 14.0, 26.0, 24.0, 31.0, 27.0, 29.0, 26.0, 39.0, 57.0, 73.0, 59.0, 62.0, 54.0, 54.0, 25.0, 42.0, 42.0, 29.0, 27.0, 29.0, 15.0, 21.0, 19.0, 10.0, 10.0, 9.0, 13.0, 5.0, 8.0, 6.0, 6.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-49.859710693359375, -48.500267028808594, -47.14082717895508, -45.7813835144043, -44.421939849853516, -43.0625, -41.70305633544922, -40.34361267089844, -38.984169006347656, -37.624725341796875, -36.26528549194336, -34.90584182739258, -33.5463981628418, -32.18695831298828, -30.8275146484375, -29.46807098388672, -28.108631134033203, -26.749189376831055, -25.389745712280273, -24.030303955078125, -22.670860290527344, -21.311418533325195, -19.951976776123047, -18.592533111572266, -17.233091354370117, -15.873648643493652, -14.514205932617188, -13.154764175415039, -11.795321464538574, -10.43587875366211, -9.076436996459961, -7.716994285583496, -6.357551574707031, -4.998108863830566, -3.6386666297912598, -2.279224395751953, -0.9197816848754883, 0.43966102600097656, 1.799102783203125, 3.15854549407959, 4.517988204956055, 5.8774309158325195, 7.236873149871826, 8.596315383911133, 9.955758094787598, 11.315200805664062, 12.674642562866211, 14.034085273742676, 15.39352798461914, 16.75296974182129, 18.11241340637207, 19.47185516357422, 20.831298828125, 22.19074058532715, 23.550182342529297, 24.909626007080078, 26.269067764282227, 27.628509521484375, 28.987953186035156, 30.347394943237305, 31.706836700439453, 33.066280364990234, 34.42572021484375, 35.78516387939453, 37.14460754394531]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 4.0, 3.0, 11.0, 14.0, 22.0, 14.0, 43.0, 65.0, 91.0, 133.0, 231.0, 426.0, 815.0, 1552.0, 3495.0, 8664.0, 26236.0, 114504.0, 990481.0, 2603335.0, 359707.0, 57667.0, 15895.0, 5804.0, 2471.0, 1187.0, 593.0, 304.0, 192.0, 99.0, 83.0, 52.0, 32.0, 20.0, 12.0, 10.0, 8.0, 4.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.0078125, -3.87969970703125, -3.7515869140625, -3.62347412109375, -3.495361328125, -3.36724853515625, -3.2391357421875, -3.11102294921875, -2.98291015625, -2.85479736328125, -2.7266845703125, -2.59857177734375, -2.470458984375, -2.34234619140625, -2.2142333984375, -2.08612060546875, -1.9580078125, -1.82989501953125, -1.7017822265625, -1.57366943359375, -1.445556640625, -1.31744384765625, -1.1893310546875, -1.06121826171875, -0.93310546875, -0.80499267578125, -0.6768798828125, -0.54876708984375, -0.420654296875, -0.29254150390625, -0.1644287109375, -0.03631591796875, 0.091796875, 0.21990966796875, 0.3480224609375, 0.47613525390625, 0.604248046875, 0.73236083984375, 0.8604736328125, 0.98858642578125, 1.11669921875, 1.24481201171875, 1.3729248046875, 1.50103759765625, 1.629150390625, 1.75726318359375, 1.8853759765625, 2.01348876953125, 2.1416015625, 2.26971435546875, 2.3978271484375, 2.52593994140625, 2.654052734375, 2.78216552734375, 2.9102783203125, 3.03839111328125, 3.16650390625, 3.29461669921875, 3.4227294921875, 3.55084228515625, 3.678955078125, 3.80706787109375, 3.9351806640625, 4.06329345703125, 4.19140625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 4.0, 3.0, 6.0, 9.0, 13.0, 13.0, 29.0, 23.0, 23.0, 32.0, 38.0, 34.0, 47.0, 48.0, 54.0, 60.0, 71.0, 79.0, 62.0, 55.0, 56.0, 31.0, 37.0, 35.0, 27.0, 30.0, 20.0, 15.0, 17.0, 10.0, 6.0, 10.0, 5.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.123046875, -3.024627685546875, -2.92620849609375, -2.827789306640625, -2.7293701171875, -2.630950927734375, -2.53253173828125, -2.434112548828125, -2.335693359375, -2.237274169921875, -2.13885498046875, -2.040435791015625, -1.9420166015625, -1.843597412109375, -1.74517822265625, -1.646759033203125, -1.54833984375, -1.449920654296875, -1.35150146484375, -1.253082275390625, -1.1546630859375, -1.056243896484375, -0.95782470703125, -0.859405517578125, -0.760986328125, -0.662567138671875, -0.56414794921875, -0.465728759765625, -0.3673095703125, -0.268890380859375, -0.17047119140625, -0.072052001953125, 0.0263671875, 0.124786376953125, 0.22320556640625, 0.321624755859375, 0.4200439453125, 0.518463134765625, 0.61688232421875, 0.715301513671875, 0.813720703125, 0.912139892578125, 1.01055908203125, 1.108978271484375, 1.2073974609375, 1.305816650390625, 1.40423583984375, 1.502655029296875, 1.60107421875, 1.699493408203125, 1.79791259765625, 1.896331787109375, 1.9947509765625, 2.093170166015625, 2.19158935546875, 2.290008544921875, 2.388427734375, 2.486846923828125, 2.58526611328125, 2.683685302734375, 2.7821044921875, 2.880523681640625, 2.97894287109375, 3.077362060546875, 3.17578125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 12.0, 21.0, 24.0, 41.0, 79.0, 116.0, 262.0, 615.0, 1467.0, 5231.0, 34368.0, 1477983.0, 2613834.0, 49424.0, 7441.0, 2091.0, 687.0, 286.0, 129.0, 70.0, 34.0, 22.0, 7.0, 6.0, 10.0, 5.0, 4.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-14.7109375, -14.3243408203125, -13.937744140625, -13.5511474609375, -13.16455078125, -12.7779541015625, -12.391357421875, -12.0047607421875, -11.6181640625, -11.2315673828125, -10.844970703125, -10.4583740234375, -10.07177734375, -9.6851806640625, -9.298583984375, -8.9119873046875, -8.525390625, -8.1387939453125, -7.752197265625, -7.3656005859375, -6.97900390625, -6.5924072265625, -6.205810546875, -5.8192138671875, -5.4326171875, -5.0460205078125, -4.659423828125, -4.2728271484375, -3.88623046875, -3.4996337890625, -3.113037109375, -2.7264404296875, -2.33984375, -1.9532470703125, -1.566650390625, -1.1800537109375, -0.79345703125, -0.4068603515625, -0.020263671875, 0.3663330078125, 0.7529296875, 1.1395263671875, 1.526123046875, 1.9127197265625, 2.29931640625, 2.6859130859375, 3.072509765625, 3.4591064453125, 3.845703125, 4.2322998046875, 4.618896484375, 5.0054931640625, 5.39208984375, 5.7786865234375, 6.165283203125, 6.5518798828125, 6.9384765625, 7.3250732421875, 7.711669921875, 8.0982666015625, 8.48486328125, 8.8714599609375, 9.258056640625, 9.6446533203125, 10.03125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 4.0, 4.0, 3.0, 2.0, 12.0, 11.0, 15.0, 18.0, 34.0, 46.0, 84.0, 123.0, 270.0, 494.0, 912.0, 874.0, 482.0, 246.0, 148.0, 93.0, 47.0, 43.0, 28.0, 18.0, 13.0, 14.0, 11.0, 6.0, 7.0, 7.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.9609375, -9.6766357421875, -9.392333984375, -9.1080322265625, -8.82373046875, -8.5394287109375, -8.255126953125, -7.9708251953125, -7.6865234375, -7.4022216796875, -7.117919921875, -6.8336181640625, -6.54931640625, -6.2650146484375, -5.980712890625, -5.6964111328125, -5.412109375, -5.1278076171875, -4.843505859375, -4.5592041015625, -4.27490234375, -3.9906005859375, -3.706298828125, -3.4219970703125, -3.1376953125, -2.8533935546875, -2.569091796875, -2.2847900390625, -2.00048828125, -1.7161865234375, -1.431884765625, -1.1475830078125, -0.86328125, -0.5789794921875, -0.294677734375, -0.0103759765625, 0.27392578125, 0.5582275390625, 0.842529296875, 1.1268310546875, 1.4111328125, 1.6954345703125, 1.979736328125, 2.2640380859375, 2.54833984375, 2.8326416015625, 3.116943359375, 3.4012451171875, 3.685546875, 3.9698486328125, 4.254150390625, 4.5384521484375, 4.82275390625, 5.1070556640625, 5.391357421875, 5.6756591796875, 5.9599609375, 6.2442626953125, 6.528564453125, 6.8128662109375, 7.09716796875, 7.3814697265625, 7.665771484375, 7.9500732421875, 8.234375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 0.0, 7.0, 15.0, 29.0, 57.0, 93.0, 190.0, 210.0, 182.0, 101.0, 50.0, 22.0, 17.0, 8.0, 4.0, 3.0, 2.0, 1.0, 4.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.16450500488281, -102.4997329711914, -99.8349609375, -97.17018127441406, -94.50540924072266, -91.84063720703125, -89.17586517333984, -86.51109313964844, -83.8463134765625, -81.1815414428711, -78.51676940917969, -75.85198974609375, -73.18721771240234, -70.52244567871094, -67.85767364501953, -65.19290161132812, -62.52812957763672, -59.86335754394531, -57.19858169555664, -54.533809661865234, -51.86903381347656, -49.204261779785156, -46.53948974609375, -43.874717712402344, -41.20994186401367, -38.545169830322266, -35.880393981933594, -33.21562194824219, -30.55084800720215, -27.88607406616211, -25.221302032470703, -22.556528091430664, -19.891754150390625, -17.226980209350586, -14.562207221984863, -11.89743423461914, -9.232660293579102, -6.5678863525390625, -3.90311336517334, -1.2383403778076172, 1.4264335632324219, 4.091207027435303, 6.755980491638184, 9.420753479003906, 12.085527420043945, 14.750301361083984, 17.41507339477539, 20.07984733581543, 22.74462127685547, 25.409395217895508, 28.074169158935547, 30.738941192626953, 33.403717041015625, 36.06848907470703, 38.73326110839844, 41.398033142089844, 44.062808990478516, 46.72758102416992, 49.392356872558594, 52.05712890625, 54.721900939941406, 57.38667678833008, 60.051448822021484, 62.716224670410156, 65.38099670410156]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 6.0, 4.0, 11.0, 9.0, 13.0, 8.0, 14.0, 24.0, 19.0, 36.0, 36.0, 32.0, 41.0, 51.0, 30.0, 47.0, 56.0, 44.0, 50.0, 46.0, 51.0, 41.0, 35.0, 45.0, 43.0, 30.0, 27.0, 27.0, 25.0, 22.0, 13.0, 21.0, 12.0, 6.0, 5.0, 10.0, 8.0, 2.0, 3.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-48.99749755859375, -47.688289642333984, -46.37908172607422, -45.06987380981445, -43.76066589355469, -42.45145797729492, -41.142250061035156, -39.833045959472656, -38.523834228515625, -37.21462631225586, -35.905418395996094, -34.59621047973633, -33.28700256347656, -31.977794647216797, -30.668588638305664, -29.3593807220459, -28.050174713134766, -26.740966796875, -25.431758880615234, -24.12255096435547, -22.813343048095703, -21.504135131835938, -20.194929122924805, -18.88572120666504, -17.576513290405273, -16.267305374145508, -14.958097457885742, -13.648890495300293, -12.339682579040527, -11.030474662780762, -9.721267700195312, -8.412059783935547, -7.102851867675781, -5.793643951416016, -4.484436511993408, -3.1752288341522217, -1.8660211563110352, -0.5568132400512695, 0.7523941993713379, 2.0616016387939453, 3.370809555053711, 4.680017471313477, 5.989224910736084, 7.298432350158691, 8.607640266418457, 9.916848182678223, 11.226055145263672, 12.535263061523438, 13.844470977783203, 15.153678894042969, 16.462886810302734, 17.7720947265625, 19.081302642822266, 20.39051055908203, 21.699716567993164, 23.00892448425293, 24.318132400512695, 25.62734031677246, 26.936548233032227, 28.245756149291992, 29.554962158203125, 30.86417007446289, 32.173377990722656, 33.48258590698242, 34.79179382324219]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 6.0, 7.0, 10.0, 14.0, 19.0, 34.0, 36.0, 61.0, 117.0, 185.0, 347.0, 594.0, 1170.0, 2313.0, 4562.0, 9549.0, 20966.0, 47598.0, 111186.0, 248225.0, 311919.0, 163217.0, 70097.0, 30072.0, 13422.0, 6318.0, 3036.0, 1588.0, 813.0, 430.0, 255.0, 135.0, 85.0, 59.0, 36.0, 32.0, 14.0, 11.0, 9.0, 4.0, 7.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.71484375, -4.57708740234375, -4.4393310546875, -4.30157470703125, -4.163818359375, -4.02606201171875, -3.8883056640625, -3.75054931640625, -3.61279296875, -3.47503662109375, -3.3372802734375, -3.19952392578125, -3.061767578125, -2.92401123046875, -2.7862548828125, -2.64849853515625, -2.5107421875, -2.37298583984375, -2.2352294921875, -2.09747314453125, -1.959716796875, -1.82196044921875, -1.6842041015625, -1.54644775390625, -1.40869140625, -1.27093505859375, -1.1331787109375, -0.99542236328125, -0.857666015625, -0.71990966796875, -0.5821533203125, -0.44439697265625, -0.306640625, -0.16888427734375, -0.0311279296875, 0.10662841796875, 0.244384765625, 0.38214111328125, 0.5198974609375, 0.65765380859375, 0.79541015625, 0.93316650390625, 1.0709228515625, 1.20867919921875, 1.346435546875, 1.48419189453125, 1.6219482421875, 1.75970458984375, 1.8974609375, 2.03521728515625, 2.1729736328125, 2.31072998046875, 2.448486328125, 2.58624267578125, 2.7239990234375, 2.86175537109375, 2.99951171875, 3.13726806640625, 3.2750244140625, 3.41278076171875, 3.550537109375, 3.68829345703125, 3.8260498046875, 3.96380615234375, 4.1015625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 7.0, 4.0, 6.0, 8.0, 3.0, 11.0, 16.0, 16.0, 19.0, 31.0, 17.0, 32.0, 27.0, 35.0, 39.0, 44.0, 45.0, 40.0, 48.0, 53.0, 58.0, 48.0, 41.0, 61.0, 38.0, 42.0, 33.0, 26.0, 27.0, 26.0, 14.0, 17.0, 17.0, 13.0, 9.0, 5.0, 5.0, 11.0, 6.0, 5.0, 2.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-3.099609375, -3.01336669921875, -2.9271240234375, -2.84088134765625, -2.754638671875, -2.66839599609375, -2.5821533203125, -2.49591064453125, -2.40966796875, -2.32342529296875, -2.2371826171875, -2.15093994140625, -2.064697265625, -1.97845458984375, -1.8922119140625, -1.80596923828125, -1.7197265625, -1.63348388671875, -1.5472412109375, -1.46099853515625, -1.374755859375, -1.28851318359375, -1.2022705078125, -1.11602783203125, -1.02978515625, -0.94354248046875, -0.8572998046875, -0.77105712890625, -0.684814453125, -0.59857177734375, -0.5123291015625, -0.42608642578125, -0.33984375, -0.25360107421875, -0.1673583984375, -0.08111572265625, 0.005126953125, 0.09136962890625, 0.1776123046875, 0.26385498046875, 0.35009765625, 0.43634033203125, 0.5225830078125, 0.60882568359375, 0.695068359375, 0.78131103515625, 0.8675537109375, 0.95379638671875, 1.0400390625, 1.12628173828125, 1.2125244140625, 1.29876708984375, 1.385009765625, 1.47125244140625, 1.5574951171875, 1.64373779296875, 1.72998046875, 1.81622314453125, 1.9024658203125, 1.98870849609375, 2.074951171875, 2.16119384765625, 2.2474365234375, 2.33367919921875, 2.419921875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 1.0, 6.0, 8.0, 10.0, 16.0, 17.0, 34.0, 62.0, 67.0, 105.0, 134.0, 238.0, 358.0, 579.0, 1011.0, 2146.0, 6565.0, 36835.0, 611377.0, 351375.0, 27733.0, 5481.0, 2002.0, 916.0, 512.0, 321.0, 203.0, 151.0, 94.0, 62.0, 46.0, 30.0, 15.0, 12.0, 7.0, 10.0, 3.0, 4.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.8828125, -15.4407958984375, -14.998779296875, -14.5567626953125, -14.11474609375, -13.6727294921875, -13.230712890625, -12.7886962890625, -12.3466796875, -11.9046630859375, -11.462646484375, -11.0206298828125, -10.57861328125, -10.1365966796875, -9.694580078125, -9.2525634765625, -8.810546875, -8.3685302734375, -7.926513671875, -7.4844970703125, -7.04248046875, -6.6004638671875, -6.158447265625, -5.7164306640625, -5.2744140625, -4.8323974609375, -4.390380859375, -3.9483642578125, -3.50634765625, -3.0643310546875, -2.622314453125, -2.1802978515625, -1.73828125, -1.2962646484375, -0.854248046875, -0.4122314453125, 0.02978515625, 0.4718017578125, 0.913818359375, 1.3558349609375, 1.7978515625, 2.2398681640625, 2.681884765625, 3.1239013671875, 3.56591796875, 4.0079345703125, 4.449951171875, 4.8919677734375, 5.333984375, 5.7760009765625, 6.218017578125, 6.6600341796875, 7.10205078125, 7.5440673828125, 7.986083984375, 8.4281005859375, 8.8701171875, 9.3121337890625, 9.754150390625, 10.1961669921875, 10.63818359375, 11.0802001953125, 11.522216796875, 11.9642333984375, 12.40625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 5.0, 11.0, 6.0, 5.0, 12.0, 13.0, 14.0, 17.0, 28.0, 23.0, 47.0, 49.0, 55.0, 60.0, 84.0, 64.0, 69.0, 77.0, 62.0, 65.0, 58.0, 42.0, 34.0, 28.0, 19.0, 15.0, 17.0, 9.0, 6.0, 6.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.234375, -21.6470947265625, -21.059814453125, -20.4725341796875, -19.88525390625, -19.2979736328125, -18.710693359375, -18.1234130859375, -17.5361328125, -16.9488525390625, -16.361572265625, -15.7742919921875, -15.18701171875, -14.5997314453125, -14.012451171875, -13.4251708984375, -12.837890625, -12.2506103515625, -11.663330078125, -11.0760498046875, -10.48876953125, -9.9014892578125, -9.314208984375, -8.7269287109375, -8.1396484375, -7.5523681640625, -6.965087890625, -6.3778076171875, -5.79052734375, -5.2032470703125, -4.615966796875, -4.0286865234375, -3.44140625, -2.8541259765625, -2.266845703125, -1.6795654296875, -1.09228515625, -0.5050048828125, 0.082275390625, 0.6695556640625, 1.2568359375, 1.8441162109375, 2.431396484375, 3.0186767578125, 3.60595703125, 4.1932373046875, 4.780517578125, 5.3677978515625, 5.955078125, 6.5423583984375, 7.129638671875, 7.7169189453125, 8.30419921875, 8.8914794921875, 9.478759765625, 10.0660400390625, 10.6533203125, 11.2406005859375, 11.827880859375, 12.4151611328125, 13.00244140625, 13.5897216796875, 14.177001953125, 14.7642822265625, 15.3515625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 4.0, 3.0, 8.0, 7.0, 10.0, 10.0, 11.0, 23.0, 35.0, 54.0, 84.0, 142.0, 229.0, 485.0, 1086.0, 3051.0, 13109.0, 95687.0, 764610.0, 145556.0, 18083.0, 3812.0, 1191.0, 559.0, 260.0, 155.0, 94.0, 54.0, 46.0, 27.0, 23.0, 21.0, 8.0, 5.0, 11.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.484375, -4.354736328125, -4.22509765625, -4.095458984375, -3.9658203125, -3.836181640625, -3.70654296875, -3.576904296875, -3.447265625, -3.317626953125, -3.18798828125, -3.058349609375, -2.9287109375, -2.799072265625, -2.66943359375, -2.539794921875, -2.41015625, -2.280517578125, -2.15087890625, -2.021240234375, -1.8916015625, -1.761962890625, -1.63232421875, -1.502685546875, -1.373046875, -1.243408203125, -1.11376953125, -0.984130859375, -0.8544921875, -0.724853515625, -0.59521484375, -0.465576171875, -0.3359375, -0.206298828125, -0.07666015625, 0.052978515625, 0.1826171875, 0.312255859375, 0.44189453125, 0.571533203125, 0.701171875, 0.830810546875, 0.96044921875, 1.090087890625, 1.2197265625, 1.349365234375, 1.47900390625, 1.608642578125, 1.73828125, 1.867919921875, 1.99755859375, 2.127197265625, 2.2568359375, 2.386474609375, 2.51611328125, 2.645751953125, 2.775390625, 2.905029296875, 3.03466796875, 3.164306640625, 3.2939453125, 3.423583984375, 3.55322265625, 3.682861328125, 3.8125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 3.0, 4.0, 3.0, 4.0, 9.0, 5.0, 14.0, 11.0, 17.0, 15.0, 26.0, 24.0, 24.0, 46.0, 36.0, 52.0, 97.0, 105.0, 114.0, 86.0, 63.0, 35.0, 39.0, 30.0, 23.0, 20.0, 20.0, 21.0, 11.0, 8.0, 8.0, 5.0, 5.0, 7.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.000713348388671875, -0.0006923377513885498, -0.0006713271141052246, -0.0006503164768218994, -0.0006293058395385742, -0.000608295202255249, -0.0005872845649719238, -0.0005662739276885986, -0.0005452632904052734, -0.0005242526531219482, -0.000503242015838623, -0.00048223137855529785, -0.00046122074127197266, -0.00044021010398864746, -0.00041919946670532227, -0.00039818882942199707, -0.0003771781921386719, -0.0003561675548553467, -0.0003351569175720215, -0.0003141462802886963, -0.0002931356430053711, -0.0002721250057220459, -0.0002511143684387207, -0.0002301037311553955, -0.0002090930938720703, -0.00018808245658874512, -0.00016707181930541992, -0.00014606118202209473, -0.00012505054473876953, -0.00010403990745544434, -8.302927017211914e-05, -6.201863288879395e-05, -4.100799560546875e-05, -1.9997358322143555e-05, 1.0132789611816406e-06, 2.2023916244506836e-05, 4.303455352783203e-05, 6.404519081115723e-05, 8.505582809448242e-05, 0.00010606646537780762, 0.0001270771026611328, 0.000148087739944458, 0.0001690983772277832, 0.0001901090145111084, 0.0002111196517944336, 0.0002321302890777588, 0.000253140926361084, 0.0002741515636444092, 0.0002951622009277344, 0.00031617283821105957, 0.00033718347549438477, 0.00035819411277770996, 0.00037920475006103516, 0.00040021538734436035, 0.00042122602462768555, 0.00044223666191101074, 0.00046324729919433594, 0.00048425793647766113, 0.0005052685737609863, 0.0005262792110443115, 0.0005472898483276367, 0.0005683004856109619, 0.0005893111228942871, 0.0006103217601776123, 0.0006313323974609375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 7.0, 3.0, 3.0, 11.0, 14.0, 14.0, 21.0, 38.0, 60.0, 93.0, 179.0, 324.0, 548.0, 1138.0, 2762.0, 9717.0, 61085.0, 715599.0, 224465.0, 23658.0, 5179.0, 1839.0, 815.0, 400.0, 244.0, 140.0, 87.0, 34.0, 28.0, 20.0, 19.0, 9.0, 1.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6484375, -3.51214599609375, -3.3758544921875, -3.23956298828125, -3.103271484375, -2.96697998046875, -2.8306884765625, -2.69439697265625, -2.55810546875, -2.42181396484375, -2.2855224609375, -2.14923095703125, -2.012939453125, -1.87664794921875, -1.7403564453125, -1.60406494140625, -1.4677734375, -1.33148193359375, -1.1951904296875, -1.05889892578125, -0.922607421875, -0.78631591796875, -0.6500244140625, -0.51373291015625, -0.37744140625, -0.24114990234375, -0.1048583984375, 0.03143310546875, 0.167724609375, 0.30401611328125, 0.4403076171875, 0.57659912109375, 0.712890625, 0.84918212890625, 0.9854736328125, 1.12176513671875, 1.258056640625, 1.39434814453125, 1.5306396484375, 1.66693115234375, 1.80322265625, 1.93951416015625, 2.0758056640625, 2.21209716796875, 2.348388671875, 2.48468017578125, 2.6209716796875, 2.75726318359375, 2.8935546875, 3.02984619140625, 3.1661376953125, 3.30242919921875, 3.438720703125, 3.57501220703125, 3.7113037109375, 3.84759521484375, 3.98388671875, 4.12017822265625, 4.2564697265625, 4.39276123046875, 4.529052734375, 4.66534423828125, 4.8016357421875, 4.93792724609375, 5.07421875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 7.0, 5.0, 3.0, 5.0, 1.0, 2.0, 3.0, 11.0, 12.0, 11.0, 12.0, 14.0, 23.0, 24.0, 31.0, 42.0, 42.0, 43.0, 55.0, 57.0, 65.0, 67.0, 74.0, 55.0, 60.0, 48.0, 41.0, 32.0, 31.0, 22.0, 10.0, 19.0, 20.0, 7.0, 5.0, 12.0, 9.0, 8.0, 5.0, 7.0, 2.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.744140625, -2.662750244140625, -2.58135986328125, -2.499969482421875, -2.4185791015625, -2.337188720703125, -2.25579833984375, -2.174407958984375, -2.093017578125, -2.011627197265625, -1.93023681640625, -1.848846435546875, -1.7674560546875, -1.686065673828125, -1.60467529296875, -1.523284912109375, -1.44189453125, -1.360504150390625, -1.27911376953125, -1.197723388671875, -1.1163330078125, -1.034942626953125, -0.95355224609375, -0.872161865234375, -0.790771484375, -0.709381103515625, -0.62799072265625, -0.546600341796875, -0.4652099609375, -0.383819580078125, -0.30242919921875, -0.221038818359375, -0.1396484375, -0.058258056640625, 0.02313232421875, 0.104522705078125, 0.1859130859375, 0.267303466796875, 0.34869384765625, 0.430084228515625, 0.511474609375, 0.592864990234375, 0.67425537109375, 0.755645751953125, 0.8370361328125, 0.918426513671875, 0.99981689453125, 1.081207275390625, 1.16259765625, 1.243988037109375, 1.32537841796875, 1.406768798828125, 1.4881591796875, 1.569549560546875, 1.65093994140625, 1.732330322265625, 1.813720703125, 1.895111083984375, 1.97650146484375, 2.057891845703125, 2.1392822265625, 2.220672607421875, 2.30206298828125, 2.383453369140625, 2.46484375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 1.0, 1.0, 4.0, 6.0, 8.0, 22.0, 61.0, 167.0, 397.0, 251.0, 57.0, 25.0, 4.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-141.18692016601562, -136.439453125, -131.69198608398438, -126.94451141357422, -122.1970443725586, -117.44957733154297, -112.70210266113281, -107.95463562011719, -103.20716857910156, -98.45970153808594, -93.71223449707031, -88.96475982666016, -84.21729278564453, -79.4698257446289, -74.72235107421875, -69.97488403320312, -65.2274169921875, -60.479949951171875, -55.732479095458984, -50.985008239746094, -46.23754119873047, -41.490074157714844, -36.74260330200195, -31.995132446289062, -27.247665405273438, -22.50019645690918, -17.752727508544922, -13.005258560180664, -8.257789611816406, -3.5103206634521484, 1.2371482849121094, 5.984619140625, 10.732086181640625, 15.479555130004883, 20.22702407836914, 24.9744930267334, 29.721961975097656, 34.46942901611328, 39.21689987182617, 43.96437072753906, 48.71183776855469, 53.45930480957031, 58.2067756652832, 62.954246520996094, 67.70171356201172, 72.44918060302734, 77.1966552734375, 81.94412231445312, 86.69158935546875, 91.43905639648438, 96.1865234375, 100.93399810791016, 105.68146514892578, 110.4289321899414, 115.17640686035156, 119.92387390136719, 124.67134094238281, 129.41880798339844, 134.16627502441406, 138.9137420654297, 143.66122436523438, 148.40869140625, 153.15615844726562, 157.90362548828125, 162.65109252929688]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 7.0, 4.0, 8.0, 8.0, 9.0, 7.0, 10.0, 17.0, 14.0, 6.0, 21.0, 26.0, 21.0, 18.0, 37.0, 35.0, 45.0, 42.0, 74.0, 55.0, 89.0, 63.0, 52.0, 39.0, 25.0, 47.0, 31.0, 30.0, 26.0, 26.0, 21.0, 15.0, 15.0, 11.0, 5.0, 9.0, 3.0, 11.0, 3.0, 5.0, 4.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-55.543853759765625, -53.96034622192383, -52.3768424987793, -50.7933349609375, -49.2098274230957, -47.62632369995117, -46.042816162109375, -44.459312438964844, -42.87580490112305, -41.29229736328125, -39.70879364013672, -38.12528610229492, -36.541778564453125, -34.958274841308594, -33.3747673034668, -31.791261672973633, -30.207754135131836, -28.624248504638672, -27.040740966796875, -25.45723533630371, -23.873729705810547, -22.29022216796875, -20.706716537475586, -19.123210906982422, -17.539703369140625, -15.956196784973145, -14.37269115447998, -12.7891845703125, -11.205678939819336, -9.622172355651855, -8.038665771484375, -6.455160140991211, -4.871654510498047, -3.2881484031677246, -1.7046420574188232, -0.12113571166992188, 1.4623703956604004, 3.0458765029907227, 4.629383087158203, 6.212888717651367, 7.796395301818848, 9.379901885986328, 10.963407516479492, 12.546914100646973, 14.130420684814453, 15.713926315307617, 17.29743194580078, 18.880939483642578, 20.464445114135742, 22.047950744628906, 23.631458282470703, 25.214963912963867, 26.79846954345703, 28.381977081298828, 29.965482711791992, 31.548988342285156, 33.13249588012695, 34.71600341796875, 36.29950714111328, 37.88301467895508, 39.466522216796875, 41.050025939941406, 42.6335334777832, 44.217041015625, 45.80054473876953]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 6.0, 8.0, 25.0, 22.0, 26.0, 38.0, 69.0, 109.0, 165.0, 262.0, 457.0, 837.0, 1568.0, 3137.0, 6547.0, 16142.0, 50738.0, 251196.0, 1875495.0, 1688229.0, 224300.0, 46688.0, 15436.0, 6310.0, 2908.0, 1494.0, 828.0, 480.0, 300.0, 185.0, 91.0, 57.0, 50.0, 31.0, 13.0, 24.0, 3.0, 7.0, 1.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.75390625, -3.640045166015625, -3.52618408203125, -3.412322998046875, -3.2984619140625, -3.184600830078125, -3.07073974609375, -2.956878662109375, -2.843017578125, -2.729156494140625, -2.61529541015625, -2.501434326171875, -2.3875732421875, -2.273712158203125, -2.15985107421875, -2.045989990234375, -1.93212890625, -1.818267822265625, -1.70440673828125, -1.590545654296875, -1.4766845703125, -1.362823486328125, -1.24896240234375, -1.135101318359375, -1.021240234375, -0.907379150390625, -0.79351806640625, -0.679656982421875, -0.5657958984375, -0.451934814453125, -0.33807373046875, -0.224212646484375, -0.1103515625, 0.003509521484375, 0.11737060546875, 0.231231689453125, 0.3450927734375, 0.458953857421875, 0.57281494140625, 0.686676025390625, 0.800537109375, 0.914398193359375, 1.02825927734375, 1.142120361328125, 1.2559814453125, 1.369842529296875, 1.48370361328125, 1.597564697265625, 1.71142578125, 1.825286865234375, 1.93914794921875, 2.053009033203125, 2.1668701171875, 2.280731201171875, 2.39459228515625, 2.508453369140625, 2.622314453125, 2.736175537109375, 2.85003662109375, 2.963897705078125, 3.0777587890625, 3.191619873046875, 3.30548095703125, 3.419342041015625, 3.533203125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 3.0, 9.0, 7.0, 10.0, 6.0, 21.0, 24.0, 27.0, 30.0, 50.0, 45.0, 56.0, 62.0, 71.0, 43.0, 76.0, 88.0, 69.0, 68.0, 40.0, 46.0, 38.0, 25.0, 29.0, 19.0, 11.0, 11.0, 9.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.38671875, -4.26190185546875, -4.1370849609375, -4.01226806640625, -3.887451171875, -3.76263427734375, -3.6378173828125, -3.51300048828125, -3.38818359375, -3.26336669921875, -3.1385498046875, -3.01373291015625, -2.888916015625, -2.76409912109375, -2.6392822265625, -2.51446533203125, -2.3896484375, -2.26483154296875, -2.1400146484375, -2.01519775390625, -1.890380859375, -1.76556396484375, -1.6407470703125, -1.51593017578125, -1.39111328125, -1.26629638671875, -1.1414794921875, -1.01666259765625, -0.891845703125, -0.76702880859375, -0.6422119140625, -0.51739501953125, -0.392578125, -0.26776123046875, -0.1429443359375, -0.01812744140625, 0.106689453125, 0.23150634765625, 0.3563232421875, 0.48114013671875, 0.60595703125, 0.73077392578125, 0.8555908203125, 0.98040771484375, 1.105224609375, 1.23004150390625, 1.3548583984375, 1.47967529296875, 1.6044921875, 1.72930908203125, 1.8541259765625, 1.97894287109375, 2.103759765625, 2.22857666015625, 2.3533935546875, 2.47821044921875, 2.60302734375, 2.72784423828125, 2.8526611328125, 2.97747802734375, 3.102294921875, 3.22711181640625, 3.3519287109375, 3.47674560546875, 3.6015625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 5.0, 1.0, 3.0, 3.0, 4.0, 8.0, 7.0, 18.0, 29.0, 38.0, 53.0, 66.0, 139.0, 230.0, 347.0, 665.0, 1304.0, 2763.0, 7495.0, 25119.0, 138136.0, 3043321.0, 871731.0, 73236.0, 18230.0, 6285.0, 2493.0, 1183.0, 583.0, 308.0, 167.0, 108.0, 84.0, 33.0, 22.0, 26.0, 10.0, 8.0, 7.0, 8.0, 5.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-9.109375, -8.868408203125, -8.62744140625, -8.386474609375, -8.1455078125, -7.904541015625, -7.66357421875, -7.422607421875, -7.181640625, -6.940673828125, -6.69970703125, -6.458740234375, -6.2177734375, -5.976806640625, -5.73583984375, -5.494873046875, -5.25390625, -5.012939453125, -4.77197265625, -4.531005859375, -4.2900390625, -4.049072265625, -3.80810546875, -3.567138671875, -3.326171875, -3.085205078125, -2.84423828125, -2.603271484375, -2.3623046875, -2.121337890625, -1.88037109375, -1.639404296875, -1.3984375, -1.157470703125, -0.91650390625, -0.675537109375, -0.4345703125, -0.193603515625, 0.04736328125, 0.288330078125, 0.529296875, 0.770263671875, 1.01123046875, 1.252197265625, 1.4931640625, 1.734130859375, 1.97509765625, 2.216064453125, 2.45703125, 2.697998046875, 2.93896484375, 3.179931640625, 3.4208984375, 3.661865234375, 3.90283203125, 4.143798828125, 4.384765625, 4.625732421875, 4.86669921875, 5.107666015625, 5.3486328125, 5.589599609375, 5.83056640625, 6.071533203125, 6.3125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 14.0, 14.0, 16.0, 40.0, 36.0, 66.0, 120.0, 260.0, 540.0, 938.0, 883.0, 486.0, 248.0, 113.0, 82.0, 51.0, 41.0, 28.0, 22.0, 12.0, 13.0, 12.0, 6.0, 5.0, 4.0, 1.0, 2.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.6875, -8.3974609375, -8.107421875, -7.8173828125, -7.52734375, -7.2373046875, -6.947265625, -6.6572265625, -6.3671875, -6.0771484375, -5.787109375, -5.4970703125, -5.20703125, -4.9169921875, -4.626953125, -4.3369140625, -4.046875, -3.7568359375, -3.466796875, -3.1767578125, -2.88671875, -2.5966796875, -2.306640625, -2.0166015625, -1.7265625, -1.4365234375, -1.146484375, -0.8564453125, -0.56640625, -0.2763671875, 0.013671875, 0.3037109375, 0.59375, 0.8837890625, 1.173828125, 1.4638671875, 1.75390625, 2.0439453125, 2.333984375, 2.6240234375, 2.9140625, 3.2041015625, 3.494140625, 3.7841796875, 4.07421875, 4.3642578125, 4.654296875, 4.9443359375, 5.234375, 5.5244140625, 5.814453125, 6.1044921875, 6.39453125, 6.6845703125, 6.974609375, 7.2646484375, 7.5546875, 7.8447265625, 8.134765625, 8.4248046875, 8.71484375, 9.0048828125, 9.294921875, 9.5849609375, 9.875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 8.0, 14.0, 37.0, 68.0, 135.0, 214.0, 209.0, 137.0, 75.0, 47.0, 16.0, 10.0, 8.0, 7.0, 7.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.62507247924805, -52.95558166503906, -50.286094665527344, -47.61660385131836, -44.947113037109375, -42.277626037597656, -39.60813522338867, -36.93864440917969, -34.26915740966797, -31.599668502807617, -28.930177688598633, -26.26068878173828, -23.591197967529297, -20.921709060668945, -18.252220153808594, -15.58272933959961, -12.913238525390625, -10.243748664855957, -7.574259281158447, -4.9047698974609375, -2.2352800369262695, 0.43420982360839844, 3.10369873046875, 5.773189544677734, 8.442678451538086, 11.112168312072754, 13.781658172607422, 16.451147079467773, 19.120635986328125, 21.79012680053711, 24.45961570739746, 27.129106521606445, 29.798599243164062, 32.46809005737305, 35.137577056884766, 37.80706787109375, 40.476558685302734, 43.14604949951172, 45.81553649902344, 48.48502731323242, 51.154518127441406, 53.82400894165039, 56.49349594116211, 59.162986755371094, 61.83247756958008, 64.50196838378906, 67.17145538330078, 69.8409423828125, 72.51043701171875, 75.17992401123047, 77.84941864013672, 80.51890563964844, 83.18839263916016, 85.8578872680664, 88.52737426757812, 91.19686889648438, 93.86634826660156, 96.53583526611328, 99.20532989501953, 101.87481689453125, 104.54430389404297, 107.21379852294922, 109.88328552246094, 112.55278015136719, 115.2222671508789]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 2.0, 4.0, 3.0, 7.0, 15.0, 11.0, 10.0, 11.0, 12.0, 28.0, 32.0, 45.0, 32.0, 44.0, 29.0, 53.0, 66.0, 47.0, 49.0, 62.0, 47.0, 36.0, 44.0, 45.0, 52.0, 39.0, 38.0, 24.0, 28.0, 18.0, 18.0, 13.0, 5.0, 12.0, 8.0, 7.0, 6.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.58109664916992, -40.25056457519531, -38.9200325012207, -37.589500427246094, -36.258968353271484, -34.928436279296875, -33.597904205322266, -32.267372131347656, -30.936840057373047, -29.606307983398438, -28.275775909423828, -26.94524383544922, -25.61471176147461, -24.2841796875, -22.95364761352539, -21.62311553955078, -20.292585372924805, -18.962053298950195, -17.631521224975586, -16.300989151000977, -14.970457077026367, -13.639925003051758, -12.309393882751465, -10.978861808776855, -9.648329734802246, -8.317797660827637, -6.987265586853027, -5.656733989715576, -4.326201915740967, -2.9956698417663574, -1.6651382446289062, -0.3346061706542969, 0.9959259033203125, 2.326457977294922, 3.656989812850952, 4.987521648406982, 6.318053722381592, 7.648585796356201, 8.979117393493652, 10.309649467468262, 11.640181541442871, 12.97071361541748, 14.30124568939209, 15.631776809692383, 16.962308883666992, 18.2928409576416, 19.62337303161621, 20.95390510559082, 22.28443717956543, 23.61496925354004, 24.94550132751465, 26.276033401489258, 27.606565475463867, 28.937097549438477, 30.267627716064453, 31.598159790039062, 32.92869186401367, 34.25922393798828, 35.58975601196289, 36.9202880859375, 38.25082015991211, 39.58135223388672, 40.91188430786133, 42.24241638183594, 43.57294845581055]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 8.0, 13.0, 17.0, 22.0, 41.0, 53.0, 50.0, 78.0, 142.0, 182.0, 322.0, 444.0, 769.0, 1326.0, 2145.0, 3819.0, 7143.0, 14110.0, 28659.0, 61832.0, 134294.0, 265653.0, 268652.0, 136708.0, 62017.0, 28932.0, 14372.0, 7175.0, 3910.0, 2190.0, 1352.0, 752.0, 498.0, 292.0, 172.0, 122.0, 98.0, 66.0, 42.0, 26.0, 27.0, 14.0, 8.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.935546875, -3.812591552734375, -3.68963623046875, -3.566680908203125, -3.4437255859375, -3.320770263671875, -3.19781494140625, -3.074859619140625, -2.951904296875, -2.828948974609375, -2.70599365234375, -2.583038330078125, -2.4600830078125, -2.337127685546875, -2.21417236328125, -2.091217041015625, -1.96826171875, -1.845306396484375, -1.72235107421875, -1.599395751953125, -1.4764404296875, -1.353485107421875, -1.23052978515625, -1.107574462890625, -0.984619140625, -0.861663818359375, -0.73870849609375, -0.615753173828125, -0.4927978515625, -0.369842529296875, -0.24688720703125, -0.123931884765625, -0.0009765625, 0.121978759765625, 0.24493408203125, 0.367889404296875, 0.4908447265625, 0.613800048828125, 0.73675537109375, 0.859710693359375, 0.982666015625, 1.105621337890625, 1.22857666015625, 1.351531982421875, 1.4744873046875, 1.597442626953125, 1.72039794921875, 1.843353271484375, 1.96630859375, 2.089263916015625, 2.21221923828125, 2.335174560546875, 2.4581298828125, 2.581085205078125, 2.70404052734375, 2.826995849609375, 2.949951171875, 3.072906494140625, 3.19586181640625, 3.318817138671875, 3.4417724609375, 3.564727783203125, 3.68768310546875, 3.810638427734375, 3.93359375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 1.0, 5.0, 14.0, 6.0, 12.0, 15.0, 9.0, 27.0, 28.0, 25.0, 29.0, 34.0, 33.0, 42.0, 40.0, 38.0, 51.0, 57.0, 34.0, 41.0, 61.0, 54.0, 36.0, 45.0, 37.0, 36.0, 33.0, 30.0, 28.0, 16.0, 18.0, 15.0, 17.0, 7.0, 5.0, 5.0, 4.0, 2.0, 6.0, 2.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.21875, -3.1260986328125, -3.033447265625, -2.9407958984375, -2.84814453125, -2.7554931640625, -2.662841796875, -2.5701904296875, -2.4775390625, -2.3848876953125, -2.292236328125, -2.1995849609375, -2.10693359375, -2.0142822265625, -1.921630859375, -1.8289794921875, -1.736328125, -1.6436767578125, -1.551025390625, -1.4583740234375, -1.36572265625, -1.2730712890625, -1.180419921875, -1.0877685546875, -0.9951171875, -0.9024658203125, -0.809814453125, -0.7171630859375, -0.62451171875, -0.5318603515625, -0.439208984375, -0.3465576171875, -0.25390625, -0.1612548828125, -0.068603515625, 0.0240478515625, 0.11669921875, 0.2093505859375, 0.302001953125, 0.3946533203125, 0.4873046875, 0.5799560546875, 0.672607421875, 0.7652587890625, 0.85791015625, 0.9505615234375, 1.043212890625, 1.1358642578125, 1.228515625, 1.3211669921875, 1.413818359375, 1.5064697265625, 1.59912109375, 1.6917724609375, 1.784423828125, 1.8770751953125, 1.9697265625, 2.0623779296875, 2.155029296875, 2.2476806640625, 2.34033203125, 2.4329833984375, 2.525634765625, 2.6182861328125, 2.7109375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 7.0, 16.0, 15.0, 20.0, 42.0, 45.0, 69.0, 137.0, 194.0, 335.0, 499.0, 952.0, 2082.0, 6520.0, 39890.0, 671731.0, 293334.0, 24129.0, 4682.0, 1711.0, 866.0, 502.0, 290.0, 159.0, 93.0, 72.0, 51.0, 27.0, 25.0, 14.0, 14.0, 8.0, 8.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.7734375, -12.3311767578125, -11.888916015625, -11.4466552734375, -11.00439453125, -10.5621337890625, -10.119873046875, -9.6776123046875, -9.2353515625, -8.7930908203125, -8.350830078125, -7.9085693359375, -7.46630859375, -7.0240478515625, -6.581787109375, -6.1395263671875, -5.697265625, -5.2550048828125, -4.812744140625, -4.3704833984375, -3.92822265625, -3.4859619140625, -3.043701171875, -2.6014404296875, -2.1591796875, -1.7169189453125, -1.274658203125, -0.8323974609375, -0.39013671875, 0.0521240234375, 0.494384765625, 0.9366455078125, 1.37890625, 1.8211669921875, 2.263427734375, 2.7056884765625, 3.14794921875, 3.5902099609375, 4.032470703125, 4.4747314453125, 4.9169921875, 5.3592529296875, 5.801513671875, 6.2437744140625, 6.68603515625, 7.1282958984375, 7.570556640625, 8.0128173828125, 8.455078125, 8.8973388671875, 9.339599609375, 9.7818603515625, 10.22412109375, 10.6663818359375, 11.108642578125, 11.5509033203125, 11.9931640625, 12.4354248046875, 12.877685546875, 13.3199462890625, 13.76220703125, 14.2044677734375, 14.646728515625, 15.0889892578125, 15.53125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 3.0, 5.0, 6.0, 6.0, 17.0, 24.0, 14.0, 20.0, 17.0, 26.0, 27.0, 42.0, 36.0, 40.0, 47.0, 46.0, 48.0, 59.0, 63.0, 58.0, 44.0, 42.0, 43.0, 42.0, 38.0, 34.0, 33.0, 22.0, 25.0, 14.0, 11.0, 8.0, 9.0, 10.0, 3.0, 1.0, 4.0, 1.0, 2.0, 2.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.5, -11.1029052734375, -10.705810546875, -10.3087158203125, -9.91162109375, -9.5145263671875, -9.117431640625, -8.7203369140625, -8.3232421875, -7.9261474609375, -7.529052734375, -7.1319580078125, -6.73486328125, -6.3377685546875, -5.940673828125, -5.5435791015625, -5.146484375, -4.7493896484375, -4.352294921875, -3.9552001953125, -3.55810546875, -3.1610107421875, -2.763916015625, -2.3668212890625, -1.9697265625, -1.5726318359375, -1.175537109375, -0.7784423828125, -0.38134765625, 0.0157470703125, 0.412841796875, 0.8099365234375, 1.20703125, 1.6041259765625, 2.001220703125, 2.3983154296875, 2.79541015625, 3.1925048828125, 3.589599609375, 3.9866943359375, 4.3837890625, 4.7808837890625, 5.177978515625, 5.5750732421875, 5.97216796875, 6.3692626953125, 6.766357421875, 7.1634521484375, 7.560546875, 7.9576416015625, 8.354736328125, 8.7518310546875, 9.14892578125, 9.5460205078125, 9.943115234375, 10.3402099609375, 10.7373046875, 11.1343994140625, 11.531494140625, 11.9285888671875, 12.32568359375, 12.7227783203125, 13.119873046875, 13.5169677734375, 13.9140625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 5.0, 4.0, 7.0, 7.0, 8.0, 7.0, 16.0, 32.0, 34.0, 94.0, 192.0, 342.0, 951.0, 3825.0, 31869.0, 699691.0, 290166.0, 17367.0, 2608.0, 713.0, 277.0, 146.0, 71.0, 41.0, 29.0, 30.0, 5.0, 4.0, 5.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.7578125, -5.605804443359375, -5.45379638671875, -5.301788330078125, -5.1497802734375, -4.997772216796875, -4.84576416015625, -4.693756103515625, -4.541748046875, -4.389739990234375, -4.23773193359375, -4.085723876953125, -3.9337158203125, -3.781707763671875, -3.62969970703125, -3.477691650390625, -3.32568359375, -3.173675537109375, -3.02166748046875, -2.869659423828125, -2.7176513671875, -2.565643310546875, -2.41363525390625, -2.261627197265625, -2.109619140625, -1.957611083984375, -1.80560302734375, -1.653594970703125, -1.5015869140625, -1.349578857421875, -1.19757080078125, -1.045562744140625, -0.8935546875, -0.741546630859375, -0.58953857421875, -0.437530517578125, -0.2855224609375, -0.133514404296875, 0.01849365234375, 0.170501708984375, 0.322509765625, 0.474517822265625, 0.62652587890625, 0.778533935546875, 0.9305419921875, 1.082550048828125, 1.23455810546875, 1.386566162109375, 1.53857421875, 1.690582275390625, 1.84259033203125, 1.994598388671875, 2.1466064453125, 2.298614501953125, 2.45062255859375, 2.602630615234375, 2.754638671875, 2.906646728515625, 3.05865478515625, 3.210662841796875, 3.3626708984375, 3.514678955078125, 3.66668701171875, 3.818695068359375, 3.970703125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 6.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 2.0, 1.0, 4.0, 7.0, 5.0, 5.0, 10.0, 2.0, 17.0, 21.0, 15.0, 15.0, 32.0, 39.0, 43.0, 39.0, 84.0, 98.0, 99.0, 82.0, 88.0, 52.0, 43.0, 41.0, 21.0, 17.0, 14.0, 17.0, 7.0, 13.0, 14.0, 13.0, 13.0, 7.0, 1.0, 3.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0005254745483398438, -0.0005087852478027344, -0.000492095947265625, -0.0004754066467285156, -0.00045871734619140625, -0.0004420280456542969, -0.0004253387451171875, -0.0004086494445800781, -0.00039196014404296875, -0.0003752708435058594, -0.00035858154296875, -0.0003418922424316406, -0.00032520294189453125, -0.0003085136413574219, -0.0002918243408203125, -0.0002751350402832031, -0.00025844573974609375, -0.00024175643920898438, -0.000225067138671875, -0.00020837783813476562, -0.00019168853759765625, -0.00017499923706054688, -0.0001583099365234375, -0.00014162063598632812, -0.00012493133544921875, -0.00010824203491210938, -9.1552734375e-05, -7.486343383789062e-05, -5.817413330078125e-05, -4.1484832763671875e-05, -2.47955322265625e-05, -8.106231689453125e-06, 8.58306884765625e-06, 2.5272369384765625e-05, 4.1961669921875e-05, 5.8650970458984375e-05, 7.534027099609375e-05, 9.202957153320312e-05, 0.0001087188720703125, 0.00012540817260742188, 0.00014209747314453125, 0.00015878677368164062, 0.00017547607421875, 0.00019216537475585938, 0.00020885467529296875, 0.00022554397583007812, 0.0002422332763671875, 0.0002589225769042969, 0.00027561187744140625, 0.0002923011779785156, 0.000308990478515625, 0.0003256797790527344, 0.00034236907958984375, 0.0003590583801269531, 0.0003757476806640625, 0.0003924369812011719, 0.00040912628173828125, 0.0004258155822753906, 0.0004425048828125, 0.0004591941833496094, 0.00047588348388671875, 0.0004925727844238281, 0.0005092620849609375, 0.0005259513854980469, 0.0005426406860351562]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 5.0, 8.0, 10.0, 20.0, 31.0, 72.0, 105.0, 233.0, 479.0, 1221.0, 3815.0, 21768.0, 347527.0, 636687.0, 29586.0, 4544.0, 1369.0, 531.0, 265.0, 132.0, 65.0, 46.0, 23.0, 8.0, 4.0, 4.0, 1.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.609375, -4.46099853515625, -4.3126220703125, -4.16424560546875, -4.015869140625, -3.86749267578125, -3.7191162109375, -3.57073974609375, -3.42236328125, -3.27398681640625, -3.1256103515625, -2.97723388671875, -2.828857421875, -2.68048095703125, -2.5321044921875, -2.38372802734375, -2.2353515625, -2.08697509765625, -1.9385986328125, -1.79022216796875, -1.641845703125, -1.49346923828125, -1.3450927734375, -1.19671630859375, -1.04833984375, -0.89996337890625, -0.7515869140625, -0.60321044921875, -0.454833984375, -0.30645751953125, -0.1580810546875, -0.00970458984375, 0.138671875, 0.28704833984375, 0.4354248046875, 0.58380126953125, 0.732177734375, 0.88055419921875, 1.0289306640625, 1.17730712890625, 1.32568359375, 1.47406005859375, 1.6224365234375, 1.77081298828125, 1.919189453125, 2.06756591796875, 2.2159423828125, 2.36431884765625, 2.5126953125, 2.66107177734375, 2.8094482421875, 2.95782470703125, 3.106201171875, 3.25457763671875, 3.4029541015625, 3.55133056640625, 3.69970703125, 3.84808349609375, 3.9964599609375, 4.14483642578125, 4.293212890625, 4.44158935546875, 4.5899658203125, 4.73834228515625, 4.88671875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 0.0, 6.0, 3.0, 10.0, 3.0, 8.0, 11.0, 9.0, 13.0, 13.0, 22.0, 25.0, 31.0, 38.0, 34.0, 49.0, 50.0, 73.0, 61.0, 60.0, 69.0, 68.0, 56.0, 49.0, 51.0, 27.0, 24.0, 24.0, 21.0, 16.0, 11.0, 15.0, 5.0, 13.0, 2.0, 6.0, 8.0, 6.0, 5.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.0546875, -1.9857177734375, -1.916748046875, -1.8477783203125, -1.77880859375, -1.7098388671875, -1.640869140625, -1.5718994140625, -1.5029296875, -1.4339599609375, -1.364990234375, -1.2960205078125, -1.22705078125, -1.1580810546875, -1.089111328125, -1.0201416015625, -0.951171875, -0.8822021484375, -0.813232421875, -0.7442626953125, -0.67529296875, -0.6063232421875, -0.537353515625, -0.4683837890625, -0.3994140625, -0.3304443359375, -0.261474609375, -0.1925048828125, -0.12353515625, -0.0545654296875, 0.014404296875, 0.0833740234375, 0.15234375, 0.2213134765625, 0.290283203125, 0.3592529296875, 0.42822265625, 0.4971923828125, 0.566162109375, 0.6351318359375, 0.7041015625, 0.7730712890625, 0.842041015625, 0.9110107421875, 0.97998046875, 1.0489501953125, 1.117919921875, 1.1868896484375, 1.255859375, 1.3248291015625, 1.393798828125, 1.4627685546875, 1.53173828125, 1.6007080078125, 1.669677734375, 1.7386474609375, 1.8076171875, 1.8765869140625, 1.945556640625, 2.0145263671875, 2.08349609375, 2.1524658203125, 2.221435546875, 2.2904052734375, 2.359375]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 2.0, 3.0, 6.0, 11.0, 17.0, 27.0, 52.0, 135.0, 338.0, 242.0, 100.0, 44.0, 15.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-159.8489532470703, -156.28546142578125, -152.72195434570312, -149.15846252441406, -145.594970703125, -142.03146362304688, -138.4679718017578, -134.9044647216797, -131.34097290039062, -127.77747344970703, -124.21397399902344, -120.65048217773438, -117.08698272705078, -113.52348327636719, -109.95999145507812, -106.39649200439453, -102.83299255371094, -99.26949310302734, -95.70599365234375, -92.14250183105469, -88.5790023803711, -85.0155029296875, -81.45201110839844, -77.88851165771484, -74.32501220703125, -70.76151275634766, -67.19801330566406, -63.634521484375, -60.071022033691406, -56.50752258300781, -52.944026947021484, -49.380531311035156, -45.817039489746094, -42.2535400390625, -38.69004440307617, -35.126548767089844, -31.56304931640625, -27.99955177307129, -24.436054229736328, -20.872556686401367, -17.309059143066406, -13.745561599731445, -10.182064056396484, -6.618566513061523, -3.0550689697265625, 0.5084285736083984, 4.071926116943359, 7.63542366027832, 11.198921203613281, 14.762418746948242, 18.325916290283203, 21.889413833618164, 25.452911376953125, 29.016408920288086, 32.57990646362305, 36.143402099609375, 39.70690155029297, 43.27040100097656, 46.83389663696289, 50.39739227294922, 53.96089172363281, 57.524391174316406, 61.087886810302734, 64.65138244628906, 68.21488189697266]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 7.0, 5.0, 8.0, 6.0, 6.0, 7.0, 10.0, 8.0, 12.0, 6.0, 17.0, 19.0, 20.0, 17.0, 8.0, 19.0, 32.0, 24.0, 28.0, 26.0, 31.0, 41.0, 67.0, 68.0, 59.0, 51.0, 48.0, 41.0, 28.0, 21.0, 28.0, 21.0, 34.0, 19.0, 21.0, 22.0, 17.0, 19.0, 12.0, 13.0, 9.0, 10.0, 4.0, 6.0, 6.0, 5.0, 3.0, 5.0, 2.0, 4.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0], "bins": [-40.991546630859375, -39.713523864746094, -38.43549728393555, -37.157474517822266, -35.879451751708984, -34.60142517089844, -33.323402404785156, -32.045379638671875, -30.76735496520996, -29.489330291748047, -28.211307525634766, -26.93328285217285, -25.655258178710938, -24.377235412597656, -23.099210739135742, -21.821186065673828, -20.543163299560547, -19.265138626098633, -17.98711585998535, -16.709091186523438, -15.43106746673584, -14.153043746948242, -12.875019073486328, -11.59699535369873, -10.318971633911133, -9.040947914123535, -7.762923717498779, -6.484899520874023, -5.206875801086426, -3.928852081298828, -2.6508278846740723, -1.3728036880493164, -0.09477615356445312, 1.1832478046417236, 2.4612717628479004, 3.739295721054077, 5.017319679260254, 6.295343399047852, 7.573367595672607, 8.851391792297363, 10.129415512084961, 11.407439231872559, 12.685462951660156, 13.96348762512207, 15.241511344909668, 16.519535064697266, 17.79755973815918, 19.075584411621094, 20.353607177734375, 21.63163185119629, 22.90965461730957, 24.187679290771484, 25.465702056884766, 26.74372673034668, 28.021751403808594, 29.299774169921875, 30.57779884338379, 31.855823516845703, 33.133846282958984, 34.411869049072266, 35.68989562988281, 36.967918395996094, 38.245941162109375, 39.52396774291992, 40.8019905090332]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 4.0, 4.0, 2.0, 9.0, 9.0, 11.0, 17.0, 17.0, 17.0, 23.0, 49.0, 44.0, 64.0, 83.0, 144.0, 246.0, 419.0, 798.0, 1764.0, 4353.0, 14408.0, 84344.0, 1416460.0, 2479737.0, 160370.0, 20804.0, 5607.0, 2201.0, 954.0, 493.0, 307.0, 148.0, 100.0, 68.0, 54.0, 42.0, 30.0, 16.0, 19.0, 13.0, 8.0, 11.0, 5.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.609375, -4.45635986328125, -4.3033447265625, -4.15032958984375, -3.997314453125, -3.84429931640625, -3.6912841796875, -3.53826904296875, -3.38525390625, -3.23223876953125, -3.0792236328125, -2.92620849609375, -2.773193359375, -2.62017822265625, -2.4671630859375, -2.31414794921875, -2.1611328125, -2.00811767578125, -1.8551025390625, -1.70208740234375, -1.549072265625, -1.39605712890625, -1.2430419921875, -1.09002685546875, -0.93701171875, -0.78399658203125, -0.6309814453125, -0.47796630859375, -0.324951171875, -0.17193603515625, -0.0189208984375, 0.13409423828125, 0.287109375, 0.44012451171875, 0.5931396484375, 0.74615478515625, 0.899169921875, 1.05218505859375, 1.2052001953125, 1.35821533203125, 1.51123046875, 1.66424560546875, 1.8172607421875, 1.97027587890625, 2.123291015625, 2.27630615234375, 2.4293212890625, 2.58233642578125, 2.7353515625, 2.88836669921875, 3.0413818359375, 3.19439697265625, 3.347412109375, 3.50042724609375, 3.6534423828125, 3.80645751953125, 3.95947265625, 4.11248779296875, 4.2655029296875, 4.41851806640625, 4.571533203125, 4.72454833984375, 4.8775634765625, 5.03057861328125, 5.18359375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 9.0, 8.0, 8.0, 11.0, 16.0, 15.0, 24.0, 19.0, 21.0, 26.0, 32.0, 29.0, 43.0, 37.0, 38.0, 45.0, 42.0, 47.0, 52.0, 48.0, 34.0, 39.0, 46.0, 37.0, 32.0, 40.0, 37.0, 31.0, 26.0, 19.0, 24.0, 14.0, 16.0, 8.0, 9.0, 5.0, 7.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.97265625, -2.88629150390625, -2.7999267578125, -2.71356201171875, -2.627197265625, -2.54083251953125, -2.4544677734375, -2.36810302734375, -2.28173828125, -2.19537353515625, -2.1090087890625, -2.02264404296875, -1.936279296875, -1.84991455078125, -1.7635498046875, -1.67718505859375, -1.5908203125, -1.50445556640625, -1.4180908203125, -1.33172607421875, -1.245361328125, -1.15899658203125, -1.0726318359375, -0.98626708984375, -0.89990234375, -0.81353759765625, -0.7271728515625, -0.64080810546875, -0.554443359375, -0.46807861328125, -0.3817138671875, -0.29534912109375, -0.208984375, -0.12261962890625, -0.0362548828125, 0.05010986328125, 0.136474609375, 0.22283935546875, 0.3092041015625, 0.39556884765625, 0.48193359375, 0.56829833984375, 0.6546630859375, 0.74102783203125, 0.827392578125, 0.91375732421875, 1.0001220703125, 1.08648681640625, 1.1728515625, 1.25921630859375, 1.3455810546875, 1.43194580078125, 1.518310546875, 1.60467529296875, 1.6910400390625, 1.77740478515625, 1.86376953125, 1.95013427734375, 2.0364990234375, 2.12286376953125, 2.209228515625, 2.29559326171875, 2.3819580078125, 2.46832275390625, 2.5546875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 7.0, 11.0, 20.0, 29.0, 46.0, 84.0, 129.0, 265.0, 604.0, 1439.0, 3970.0, 14574.0, 90001.0, 2978742.0, 1033022.0, 53792.0, 11380.0, 3590.0, 1345.0, 599.0, 279.0, 141.0, 72.0, 57.0, 35.0, 20.0, 4.0, 9.0, 6.0, 7.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.57421875, -5.33038330078125, -5.0865478515625, -4.84271240234375, -4.598876953125, -4.35504150390625, -4.1112060546875, -3.86737060546875, -3.62353515625, -3.37969970703125, -3.1358642578125, -2.89202880859375, -2.648193359375, -2.40435791015625, -2.1605224609375, -1.91668701171875, -1.6728515625, -1.42901611328125, -1.1851806640625, -0.94134521484375, -0.697509765625, -0.45367431640625, -0.2098388671875, 0.03399658203125, 0.27783203125, 0.52166748046875, 0.7655029296875, 1.00933837890625, 1.253173828125, 1.49700927734375, 1.7408447265625, 1.98468017578125, 2.228515625, 2.47235107421875, 2.7161865234375, 2.96002197265625, 3.203857421875, 3.44769287109375, 3.6915283203125, 3.93536376953125, 4.17919921875, 4.42303466796875, 4.6668701171875, 4.91070556640625, 5.154541015625, 5.39837646484375, 5.6422119140625, 5.88604736328125, 6.1298828125, 6.37371826171875, 6.6175537109375, 6.86138916015625, 7.105224609375, 7.34906005859375, 7.5928955078125, 7.83673095703125, 8.08056640625, 8.32440185546875, 8.5682373046875, 8.81207275390625, 9.055908203125, 9.29974365234375, 9.5435791015625, 9.78741455078125, 10.03125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 7.0, 9.0, 8.0, 23.0, 29.0, 25.0, 56.0, 62.0, 143.0, 222.0, 401.0, 661.0, 884.0, 605.0, 370.0, 184.0, 113.0, 57.0, 43.0, 33.0, 30.0, 27.0, 14.0, 7.0, 10.0, 7.0, 5.0, 7.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.08984375, -5.889404296875, -5.68896484375, -5.488525390625, -5.2880859375, -5.087646484375, -4.88720703125, -4.686767578125, -4.486328125, -4.285888671875, -4.08544921875, -3.885009765625, -3.6845703125, -3.484130859375, -3.28369140625, -3.083251953125, -2.8828125, -2.682373046875, -2.48193359375, -2.281494140625, -2.0810546875, -1.880615234375, -1.68017578125, -1.479736328125, -1.279296875, -1.078857421875, -0.87841796875, -0.677978515625, -0.4775390625, -0.277099609375, -0.07666015625, 0.123779296875, 0.32421875, 0.524658203125, 0.72509765625, 0.925537109375, 1.1259765625, 1.326416015625, 1.52685546875, 1.727294921875, 1.927734375, 2.128173828125, 2.32861328125, 2.529052734375, 2.7294921875, 2.929931640625, 3.13037109375, 3.330810546875, 3.53125, 3.731689453125, 3.93212890625, 4.132568359375, 4.3330078125, 4.533447265625, 4.73388671875, 4.934326171875, 5.134765625, 5.335205078125, 5.53564453125, 5.736083984375, 5.9365234375, 6.136962890625, 6.33740234375, 6.537841796875, 6.73828125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 6.0, 6.0, 7.0, 14.0, 61.0, 142.0, 272.0, 241.0, 141.0, 52.0, 18.0, 15.0, 9.0, 8.0, 3.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.62208557128906, -73.77632904052734, -70.93058013916016, -68.08482360839844, -65.23906707763672, -62.393314361572266, -59.54756164550781, -56.701805114746094, -53.856048583984375, -51.01029586791992, -48.1645393371582, -45.31878662109375, -42.47303009033203, -39.62727737426758, -36.781524658203125, -33.935768127441406, -31.090015411376953, -28.244260787963867, -25.39850616455078, -22.552753448486328, -19.70699691772461, -16.861244201660156, -14.01548957824707, -11.169734954833984, -8.323980331420898, -5.4782257080078125, -2.6324715614318848, 0.21328258514404297, 3.059037208557129, 5.904791831970215, 8.750545501708984, 11.59630012512207, 14.442054748535156, 17.287809371948242, 20.133563995361328, 22.97931671142578, 25.8250732421875, 28.670825958251953, 31.51658058166504, 34.362335205078125, 37.208091735839844, 40.0538444519043, 42.899600982666016, 45.74535369873047, 48.59111022949219, 51.43686294555664, 54.282615661621094, 57.12837219238281, 59.974124908447266, 62.81987762451172, 65.66563415527344, 68.51139068603516, 71.35713958740234, 74.20289611816406, 77.04865264892578, 79.8944091796875, 82.74015808105469, 85.5859146118164, 88.4316635131836, 91.27742004394531, 94.12317657470703, 96.96893310546875, 99.81468200683594, 102.66043853759766, 105.50619506835938]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 6.0, 3.0, 5.0, 5.0, 10.0, 14.0, 17.0, 13.0, 20.0, 30.0, 28.0, 26.0, 38.0, 49.0, 32.0, 41.0, 42.0, 49.0, 43.0, 49.0, 40.0, 58.0, 42.0, 39.0, 47.0, 32.0, 31.0, 25.0, 32.0, 17.0, 20.0, 12.0, 24.0, 10.0, 14.0, 7.0, 15.0, 3.0, 5.0, 1.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-30.549673080444336, -29.599855422973633, -28.65003776550293, -27.70022201538086, -26.750404357910156, -25.800586700439453, -24.85076904296875, -23.900951385498047, -22.951133728027344, -22.00131607055664, -21.051498413085938, -20.101680755615234, -19.151865005493164, -18.20204734802246, -17.252229690551758, -16.302412033081055, -15.352596282958984, -14.402778625488281, -13.452961921691895, -12.503144264221191, -11.553327560424805, -10.603509902954102, -9.653692245483398, -8.703874588012695, -7.754057884216309, -6.804240703582764, -5.854423522949219, -4.904605865478516, -3.9547886848449707, -3.004971504211426, -2.0551538467407227, -1.1053366661071777, -0.155517578125, 0.7942997217178345, 1.744117021560669, 2.693934440612793, 3.643751621246338, 4.593568801879883, 5.543386459350586, 6.493203639984131, 7.443020820617676, 8.392838478088379, 9.342655181884766, 10.292472839355469, 11.242290496826172, 12.192107200622559, 13.141924858093262, 14.091741561889648, 15.041559219360352, 15.991376876831055, 16.941194534301758, 17.891010284423828, 18.84082794189453, 19.790645599365234, 20.740463256835938, 21.69028091430664, 22.640098571777344, 23.589916229248047, 24.53973388671875, 25.489551544189453, 26.439367294311523, 27.389184951782227, 28.33900260925293, 29.288820266723633, 30.238636016845703]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 8.0, 5.0, 5.0, 6.0, 20.0, 13.0, 33.0, 53.0, 70.0, 127.0, 254.0, 498.0, 920.0, 2102.0, 5388.0, 14556.0, 46237.0, 166431.0, 433583.0, 267140.0, 75277.0, 22489.0, 7745.0, 2916.0, 1317.0, 593.0, 304.0, 170.0, 109.0, 58.0, 34.0, 28.0, 21.0, 13.0, 11.0, 10.0, 5.0, 2.0, 3.0, 6.0, 1.0, 0.0, 1.0, 2.0], "bins": [-7.11328125, -6.929443359375, -6.74560546875, -6.561767578125, -6.3779296875, -6.194091796875, -6.01025390625, -5.826416015625, -5.642578125, -5.458740234375, -5.27490234375, -5.091064453125, -4.9072265625, -4.723388671875, -4.53955078125, -4.355712890625, -4.171875, -3.988037109375, -3.80419921875, -3.620361328125, -3.4365234375, -3.252685546875, -3.06884765625, -2.885009765625, -2.701171875, -2.517333984375, -2.33349609375, -2.149658203125, -1.9658203125, -1.781982421875, -1.59814453125, -1.414306640625, -1.23046875, -1.046630859375, -0.86279296875, -0.678955078125, -0.4951171875, -0.311279296875, -0.12744140625, 0.056396484375, 0.240234375, 0.424072265625, 0.60791015625, 0.791748046875, 0.9755859375, 1.159423828125, 1.34326171875, 1.527099609375, 1.7109375, 1.894775390625, 2.07861328125, 2.262451171875, 2.4462890625, 2.630126953125, 2.81396484375, 2.997802734375, 3.181640625, 3.365478515625, 3.54931640625, 3.733154296875, 3.9169921875, 4.100830078125, 4.28466796875, 4.468505859375, 4.65234375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 1.0, 3.0, 0.0, 2.0, 6.0, 5.0, 7.0, 5.0, 8.0, 12.0, 12.0, 12.0, 17.0, 21.0, 28.0, 30.0, 32.0, 26.0, 39.0, 37.0, 33.0, 42.0, 46.0, 34.0, 35.0, 33.0, 48.0, 41.0, 44.0, 41.0, 37.0, 35.0, 42.0, 34.0, 26.0, 14.0, 26.0, 17.0, 14.0, 19.0, 9.0, 10.0, 8.0, 4.0, 7.0, 3.0, 2.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.916015625, -2.8302001953125, -2.744384765625, -2.6585693359375, -2.57275390625, -2.4869384765625, -2.401123046875, -2.3153076171875, -2.2294921875, -2.1436767578125, -2.057861328125, -1.9720458984375, -1.88623046875, -1.8004150390625, -1.714599609375, -1.6287841796875, -1.54296875, -1.4571533203125, -1.371337890625, -1.2855224609375, -1.19970703125, -1.1138916015625, -1.028076171875, -0.9422607421875, -0.8564453125, -0.7706298828125, -0.684814453125, -0.5989990234375, -0.51318359375, -0.4273681640625, -0.341552734375, -0.2557373046875, -0.169921875, -0.0841064453125, 0.001708984375, 0.0875244140625, 0.17333984375, 0.2591552734375, 0.344970703125, 0.4307861328125, 0.5166015625, 0.6024169921875, 0.688232421875, 0.7740478515625, 0.85986328125, 0.9456787109375, 1.031494140625, 1.1173095703125, 1.203125, 1.2889404296875, 1.374755859375, 1.4605712890625, 1.54638671875, 1.6322021484375, 1.718017578125, 1.8038330078125, 1.8896484375, 1.9754638671875, 2.061279296875, 2.1470947265625, 2.23291015625, 2.3187255859375, 2.404541015625, 2.4903564453125, 2.576171875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 10.0, 4.0, 4.0, 9.0, 10.0, 19.0, 25.0, 28.0, 54.0, 89.0, 127.0, 245.0, 380.0, 826.0, 1682.0, 4134.0, 11829.0, 45658.0, 255715.0, 607474.0, 89386.0, 19967.0, 6184.0, 2278.0, 1102.0, 506.0, 320.0, 164.0, 95.0, 57.0, 53.0, 30.0, 22.0, 23.0, 12.0, 7.0, 7.0, 3.0, 7.0, 6.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-7.80078125, -7.56585693359375, -7.3309326171875, -7.09600830078125, -6.861083984375, -6.62615966796875, -6.3912353515625, -6.15631103515625, -5.92138671875, -5.68646240234375, -5.4515380859375, -5.21661376953125, -4.981689453125, -4.74676513671875, -4.5118408203125, -4.27691650390625, -4.0419921875, -3.80706787109375, -3.5721435546875, -3.33721923828125, -3.102294921875, -2.86737060546875, -2.6324462890625, -2.39752197265625, -2.16259765625, -1.92767333984375, -1.6927490234375, -1.45782470703125, -1.222900390625, -0.98797607421875, -0.7530517578125, -0.51812744140625, -0.283203125, -0.04827880859375, 0.1866455078125, 0.42156982421875, 0.656494140625, 0.89141845703125, 1.1263427734375, 1.36126708984375, 1.59619140625, 1.83111572265625, 2.0660400390625, 2.30096435546875, 2.535888671875, 2.77081298828125, 3.0057373046875, 3.24066162109375, 3.4755859375, 3.71051025390625, 3.9454345703125, 4.18035888671875, 4.415283203125, 4.65020751953125, 4.8851318359375, 5.12005615234375, 5.35498046875, 5.58990478515625, 5.8248291015625, 6.05975341796875, 6.294677734375, 6.52960205078125, 6.7645263671875, 6.99945068359375, 7.234375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 7.0, 8.0, 4.0, 8.0, 13.0, 12.0, 18.0, 12.0, 29.0, 33.0, 31.0, 41.0, 46.0, 56.0, 78.0, 58.0, 64.0, 53.0, 67.0, 54.0, 58.0, 39.0, 39.0, 33.0, 33.0, 19.0, 22.0, 23.0, 14.0, 6.0, 6.0, 5.0, 3.0, 0.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-13.640625, -13.233154296875, -12.82568359375, -12.418212890625, -12.0107421875, -11.603271484375, -11.19580078125, -10.788330078125, -10.380859375, -9.973388671875, -9.56591796875, -9.158447265625, -8.7509765625, -8.343505859375, -7.93603515625, -7.528564453125, -7.12109375, -6.713623046875, -6.30615234375, -5.898681640625, -5.4912109375, -5.083740234375, -4.67626953125, -4.268798828125, -3.861328125, -3.453857421875, -3.04638671875, -2.638916015625, -2.2314453125, -1.823974609375, -1.41650390625, -1.009033203125, -0.6015625, -0.194091796875, 0.21337890625, 0.620849609375, 1.0283203125, 1.435791015625, 1.84326171875, 2.250732421875, 2.658203125, 3.065673828125, 3.47314453125, 3.880615234375, 4.2880859375, 4.695556640625, 5.10302734375, 5.510498046875, 5.91796875, 6.325439453125, 6.73291015625, 7.140380859375, 7.5478515625, 7.955322265625, 8.36279296875, 8.770263671875, 9.177734375, 9.585205078125, 9.99267578125, 10.400146484375, 10.8076171875, 11.215087890625, 11.62255859375, 12.030029296875, 12.4375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 7.0, 7.0, 7.0, 16.0, 17.0, 24.0, 32.0, 35.0, 51.0, 79.0, 157.0, 252.0, 408.0, 783.0, 1776.0, 4514.0, 13955.0, 54259.0, 264603.0, 583692.0, 91250.0, 21564.0, 6398.0, 2390.0, 1030.0, 507.0, 277.0, 177.0, 81.0, 55.0, 44.0, 32.0, 22.0, 18.0, 9.0, 12.0, 8.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.326171875, -2.25604248046875, -2.1859130859375, -2.11578369140625, -2.045654296875, -1.97552490234375, -1.9053955078125, -1.83526611328125, -1.76513671875, -1.69500732421875, -1.6248779296875, -1.55474853515625, -1.484619140625, -1.41448974609375, -1.3443603515625, -1.27423095703125, -1.2041015625, -1.13397216796875, -1.0638427734375, -0.99371337890625, -0.923583984375, -0.85345458984375, -0.7833251953125, -0.71319580078125, -0.64306640625, -0.57293701171875, -0.5028076171875, -0.43267822265625, -0.362548828125, -0.29241943359375, -0.2222900390625, -0.15216064453125, -0.08203125, -0.01190185546875, 0.0582275390625, 0.12835693359375, 0.198486328125, 0.26861572265625, 0.3387451171875, 0.40887451171875, 0.47900390625, 0.54913330078125, 0.6192626953125, 0.68939208984375, 0.759521484375, 0.82965087890625, 0.8997802734375, 0.96990966796875, 1.0400390625, 1.11016845703125, 1.1802978515625, 1.25042724609375, 1.320556640625, 1.39068603515625, 1.4608154296875, 1.53094482421875, 1.60107421875, 1.67120361328125, 1.7413330078125, 1.81146240234375, 1.881591796875, 1.95172119140625, 2.0218505859375, 2.09197998046875, 2.162109375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 5.0, 1.0, 8.0, 17.0, 15.0, 26.0, 57.0, 76.0, 142.0, 190.0, 180.0, 132.0, 56.0, 39.0, 17.0, 14.0, 7.0, 8.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005517005920410156, -0.0005206689238548279, -0.0004896372556686401, -0.0004586055874824524, -0.00042757391929626465, -0.0003965422511100769, -0.00036551058292388916, -0.0003344789147377014, -0.00030344724655151367, -0.00027241557836532593, -0.00024138391017913818, -0.00021035224199295044, -0.0001793205738067627, -0.00014828890562057495, -0.00011725723743438721, -8.622556924819946e-05, -5.519390106201172e-05, -2.4162232875823975e-05, 6.8694353103637695e-06, 3.7901103496551514e-05, 6.893277168273926e-05, 9.9964439868927e-05, 0.00013099610805511475, 0.0001620277762413025, 0.00019305944442749023, 0.00022409111261367798, 0.0002551227807998657, 0.00028615444898605347, 0.0003171861171722412, 0.00034821778535842896, 0.0003792494535446167, 0.00041028112173080444, 0.0004413127899169922, 0.00047234445810317993, 0.0005033761262893677, 0.0005344077944755554, 0.0005654394626617432, 0.0005964711308479309, 0.0006275027990341187, 0.0006585344672203064, 0.0006895661354064941, 0.0007205978035926819, 0.0007516294717788696, 0.0007826611399650574, 0.0008136928081512451, 0.0008447244763374329, 0.0008757561445236206, 0.0009067878127098083, 0.0009378194808959961, 0.0009688511490821838, 0.0009998828172683716, 0.0010309144854545593, 0.001061946153640747, 0.0010929778218269348, 0.0011240094900131226, 0.0011550411581993103, 0.001186072826385498, 0.0012171044945716858, 0.0012481361627578735, 0.0012791678309440613, 0.001310199499130249, 0.0013412311673164368, 0.0013722628355026245, 0.0014032945036888123, 0.001434326171875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 4.0, 2.0, 4.0, 4.0, 8.0, 8.0, 9.0, 18.0, 27.0, 29.0, 65.0, 92.0, 122.0, 219.0, 357.0, 658.0, 1253.0, 2766.0, 7724.0, 28619.0, 156743.0, 663487.0, 146154.0, 27308.0, 7391.0, 2758.0, 1234.0, 636.0, 321.0, 211.0, 115.0, 72.0, 51.0, 37.0, 16.0, 14.0, 10.0, 2.0, 7.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.99609375, -1.91455078125, -1.8330078125, -1.75146484375, -1.669921875, -1.58837890625, -1.5068359375, -1.42529296875, -1.34375, -1.26220703125, -1.1806640625, -1.09912109375, -1.017578125, -0.93603515625, -0.8544921875, -0.77294921875, -0.69140625, -0.60986328125, -0.5283203125, -0.44677734375, -0.365234375, -0.28369140625, -0.2021484375, -0.12060546875, -0.0390625, 0.04248046875, 0.1240234375, 0.20556640625, 0.287109375, 0.36865234375, 0.4501953125, 0.53173828125, 0.61328125, 0.69482421875, 0.7763671875, 0.85791015625, 0.939453125, 1.02099609375, 1.1025390625, 1.18408203125, 1.265625, 1.34716796875, 1.4287109375, 1.51025390625, 1.591796875, 1.67333984375, 1.7548828125, 1.83642578125, 1.91796875, 1.99951171875, 2.0810546875, 2.16259765625, 2.244140625, 2.32568359375, 2.4072265625, 2.48876953125, 2.5703125, 2.65185546875, 2.7333984375, 2.81494140625, 2.896484375, 2.97802734375, 3.0595703125, 3.14111328125, 3.22265625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 2.0, 6.0, 17.0, 17.0, 29.0, 27.0, 30.0, 53.0, 83.0, 67.0, 88.0, 93.0, 93.0, 78.0, 71.0, 78.0, 37.0, 36.0, 28.0, 21.0, 6.0, 7.0, 4.0, 12.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-3.541015625, -3.454254150390625, -3.36749267578125, -3.280731201171875, -3.1939697265625, -3.107208251953125, -3.02044677734375, -2.933685302734375, -2.846923828125, -2.760162353515625, -2.67340087890625, -2.586639404296875, -2.4998779296875, -2.413116455078125, -2.32635498046875, -2.239593505859375, -2.15283203125, -2.066070556640625, -1.97930908203125, -1.892547607421875, -1.8057861328125, -1.719024658203125, -1.63226318359375, -1.545501708984375, -1.458740234375, -1.371978759765625, -1.28521728515625, -1.198455810546875, -1.1116943359375, -1.024932861328125, -0.93817138671875, -0.851409912109375, -0.7646484375, -0.677886962890625, -0.59112548828125, -0.504364013671875, -0.4176025390625, -0.330841064453125, -0.24407958984375, -0.157318115234375, -0.070556640625, 0.016204833984375, 0.10296630859375, 0.189727783203125, 0.2764892578125, 0.363250732421875, 0.45001220703125, 0.536773681640625, 0.62353515625, 0.710296630859375, 0.79705810546875, 0.883819580078125, 0.9705810546875, 1.057342529296875, 1.14410400390625, 1.230865478515625, 1.317626953125, 1.404388427734375, 1.49114990234375, 1.577911376953125, 1.6646728515625, 1.751434326171875, 1.83819580078125, 1.924957275390625, 2.01171875]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 8.0, 20.0, 51.0, 95.0, 170.0, 300.0, 175.0, 98.0, 38.0, 21.0, 11.0, 7.0, 4.0, 3.0, 1.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-67.49407958984375, -65.19925689697266, -62.9044303894043, -60.6096076965332, -58.31478500366211, -56.01995849609375, -53.725135803222656, -51.43031311035156, -49.13549041748047, -46.840667724609375, -44.545841217041016, -42.25101852416992, -39.95619583129883, -37.66136932373047, -35.366546630859375, -33.07172393798828, -30.776897430419922, -28.482072830200195, -26.1872501373291, -23.892425537109375, -21.59760284423828, -19.302778244018555, -17.007953643798828, -14.713130950927734, -12.418306350708008, -10.123482704162598, -7.828658580780029, -5.533834457397461, -3.239010810852051, -0.9441871643066406, 1.350637435913086, 3.6454601287841797, 5.940284729003906, 8.235108375549316, 10.529932022094727, 12.824756622314453, 15.119580268859863, 17.414403915405273, 19.709228515625, 22.004051208496094, 24.29887580871582, 26.593700408935547, 28.88852310180664, 31.183347702026367, 33.478172302246094, 35.77299499511719, 38.06781768798828, 40.362640380859375, 42.657466888427734, 44.95228958129883, 47.24711608886719, 49.54193878173828, 51.836761474609375, 54.13158416748047, 56.42641067504883, 58.72123336791992, 61.01605987548828, 63.310882568359375, 65.60570526123047, 67.90052795410156, 70.19535827636719, 72.49018096923828, 74.78500366210938, 77.07982635498047, 79.37464904785156]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 5.0, 8.0, 8.0, 7.0, 5.0, 11.0, 10.0, 17.0, 17.0, 19.0, 15.0, 19.0, 25.0, 33.0, 31.0, 30.0, 33.0, 50.0, 58.0, 57.0, 77.0, 67.0, 54.0, 33.0, 41.0, 37.0, 29.0, 26.0, 21.0, 23.0, 14.0, 15.0, 13.0, 17.0, 11.0, 11.0, 6.0, 14.0, 4.0, 5.0, 9.0, 2.0, 10.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-36.40778350830078, -35.24851989746094, -34.089256286621094, -32.929996490478516, -31.770732879638672, -30.611469268798828, -29.452205657958984, -28.29294204711914, -27.13368034362793, -25.974416732788086, -24.815155029296875, -23.65589141845703, -22.496627807617188, -21.337366104125977, -20.178102493286133, -19.018840789794922, -17.859577178955078, -16.700313568115234, -15.541051864624023, -14.38178825378418, -13.222525596618652, -12.063262939453125, -10.903999328613281, -9.744736671447754, -8.585474014282227, -7.426211357116699, -6.266948223114014, -5.107685089111328, -3.948422431945801, -2.7891597747802734, -1.629896640777588, -0.47063350677490234, 0.688629150390625, 1.8478920459747314, 3.007154941558838, 4.166418075561523, 5.325680732727051, 6.484943389892578, 7.644206523895264, 8.80346965789795, 9.962732315063477, 11.121994972229004, 12.281257629394531, 13.440521240234375, 14.599783897399902, 15.75904655456543, 16.918310165405273, 18.077571868896484, 19.236835479736328, 20.396099090576172, 21.555360794067383, 22.714624404907227, 23.873886108398438, 25.03314971923828, 26.192413330078125, 27.35167694091797, 28.51093864440918, 29.670202255249023, 30.829463958740234, 31.988727569580078, 33.14799118041992, 34.3072509765625, 35.466514587402344, 36.62577819824219, 37.78504180908203]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 4.0, 3.0, 5.0, 5.0, 5.0, 7.0, 11.0, 11.0, 24.0, 25.0, 26.0, 41.0, 50.0, 95.0, 111.0, 142.0, 258.0, 401.0, 648.0, 1135.0, 2100.0, 4486.0, 10839.0, 37503.0, 221877.0, 1679154.0, 1899777.0, 268757.0, 45001.0, 11770.0, 4762.0, 2235.0, 1143.0, 713.0, 396.0, 249.0, 161.0, 87.0, 60.0, 49.0, 45.0, 33.0, 22.0, 22.0, 12.0, 11.0, 8.0, 7.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.22265625, -3.115386962890625, -3.00811767578125, -2.900848388671875, -2.7935791015625, -2.686309814453125, -2.57904052734375, -2.471771240234375, -2.364501953125, -2.257232666015625, -2.14996337890625, -2.042694091796875, -1.9354248046875, -1.828155517578125, -1.72088623046875, -1.613616943359375, -1.50634765625, -1.399078369140625, -1.29180908203125, -1.184539794921875, -1.0772705078125, -0.970001220703125, -0.86273193359375, -0.755462646484375, -0.648193359375, -0.540924072265625, -0.43365478515625, -0.326385498046875, -0.2191162109375, -0.111846923828125, -0.00457763671875, 0.102691650390625, 0.2099609375, 0.317230224609375, 0.42449951171875, 0.531768798828125, 0.6390380859375, 0.746307373046875, 0.85357666015625, 0.960845947265625, 1.068115234375, 1.175384521484375, 1.28265380859375, 1.389923095703125, 1.4971923828125, 1.604461669921875, 1.71173095703125, 1.819000244140625, 1.92626953125, 2.033538818359375, 2.14080810546875, 2.248077392578125, 2.3553466796875, 2.462615966796875, 2.56988525390625, 2.677154541015625, 2.784423828125, 2.891693115234375, 2.99896240234375, 3.106231689453125, 3.2135009765625, 3.320770263671875, 3.42803955078125, 3.535308837890625, 3.642578125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 2.0, 1.0, 2.0, 2.0, 6.0, 1.0, 3.0, 6.0, 5.0, 8.0, 10.0, 11.0, 14.0, 9.0, 27.0, 21.0, 25.0, 26.0, 24.0, 31.0, 33.0, 31.0, 40.0, 52.0, 56.0, 46.0, 47.0, 50.0, 53.0, 40.0, 42.0, 35.0, 44.0, 39.0, 26.0, 26.0, 16.0, 18.0, 12.0, 13.0, 12.0, 11.0, 7.0, 8.0, 5.0, 4.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.837890625, -2.751800537109375, -2.66571044921875, -2.579620361328125, -2.4935302734375, -2.407440185546875, -2.32135009765625, -2.235260009765625, -2.149169921875, -2.063079833984375, -1.97698974609375, -1.890899658203125, -1.8048095703125, -1.718719482421875, -1.63262939453125, -1.546539306640625, -1.46044921875, -1.374359130859375, -1.28826904296875, -1.202178955078125, -1.1160888671875, -1.029998779296875, -0.94390869140625, -0.857818603515625, -0.771728515625, -0.685638427734375, -0.59954833984375, -0.513458251953125, -0.4273681640625, -0.341278076171875, -0.25518798828125, -0.169097900390625, -0.0830078125, 0.003082275390625, 0.08917236328125, 0.175262451171875, 0.2613525390625, 0.347442626953125, 0.43353271484375, 0.519622802734375, 0.605712890625, 0.691802978515625, 0.77789306640625, 0.863983154296875, 0.9500732421875, 1.036163330078125, 1.12225341796875, 1.208343505859375, 1.29443359375, 1.380523681640625, 1.46661376953125, 1.552703857421875, 1.6387939453125, 1.724884033203125, 1.81097412109375, 1.897064208984375, 1.983154296875, 2.069244384765625, 2.15533447265625, 2.241424560546875, 2.3275146484375, 2.413604736328125, 2.49969482421875, 2.585784912109375, 2.671875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 5.0, 7.0, 16.0, 15.0, 29.0, 66.0, 99.0, 150.0, 331.0, 697.0, 2041.0, 9936.0, 118702.0, 3909323.0, 138402.0, 10970.0, 2156.0, 697.0, 291.0, 170.0, 67.0, 40.0, 29.0, 15.0, 9.0, 10.0, 8.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.1796875, -9.8348388671875, -9.489990234375, -9.1451416015625, -8.80029296875, -8.4554443359375, -8.110595703125, -7.7657470703125, -7.4208984375, -7.0760498046875, -6.731201171875, -6.3863525390625, -6.04150390625, -5.6966552734375, -5.351806640625, -5.0069580078125, -4.662109375, -4.3172607421875, -3.972412109375, -3.6275634765625, -3.28271484375, -2.9378662109375, -2.593017578125, -2.2481689453125, -1.9033203125, -1.5584716796875, -1.213623046875, -0.8687744140625, -0.52392578125, -0.1790771484375, 0.165771484375, 0.5106201171875, 0.85546875, 1.2003173828125, 1.545166015625, 1.8900146484375, 2.23486328125, 2.5797119140625, 2.924560546875, 3.2694091796875, 3.6142578125, 3.9591064453125, 4.303955078125, 4.6488037109375, 4.99365234375, 5.3385009765625, 5.683349609375, 6.0281982421875, 6.373046875, 6.7178955078125, 7.062744140625, 7.4075927734375, 7.75244140625, 8.0972900390625, 8.442138671875, 8.7869873046875, 9.1318359375, 9.4766845703125, 9.821533203125, 10.1663818359375, 10.51123046875, 10.8560791015625, 11.200927734375, 11.5457763671875, 11.890625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 8.0, 8.0, 11.0, 11.0, 26.0, 37.0, 79.0, 130.0, 323.0, 768.0, 1145.0, 804.0, 357.0, 137.0, 82.0, 41.0, 26.0, 29.0, 27.0, 9.0, 6.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-12.375, -12.084228515625, -11.79345703125, -11.502685546875, -11.2119140625, -10.921142578125, -10.63037109375, -10.339599609375, -10.048828125, -9.758056640625, -9.46728515625, -9.176513671875, -8.8857421875, -8.594970703125, -8.30419921875, -8.013427734375, -7.72265625, -7.431884765625, -7.14111328125, -6.850341796875, -6.5595703125, -6.268798828125, -5.97802734375, -5.687255859375, -5.396484375, -5.105712890625, -4.81494140625, -4.524169921875, -4.2333984375, -3.942626953125, -3.65185546875, -3.361083984375, -3.0703125, -2.779541015625, -2.48876953125, -2.197998046875, -1.9072265625, -1.616455078125, -1.32568359375, -1.034912109375, -0.744140625, -0.453369140625, -0.16259765625, 0.128173828125, 0.4189453125, 0.709716796875, 1.00048828125, 1.291259765625, 1.58203125, 1.872802734375, 2.16357421875, 2.454345703125, 2.7451171875, 3.035888671875, 3.32666015625, 3.617431640625, 3.908203125, 4.198974609375, 4.48974609375, 4.780517578125, 5.0712890625, 5.362060546875, 5.65283203125, 5.943603515625, 6.234375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 1.0, 15.0, 44.0, 295.0, 458.0, 144.0, 31.0, 11.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.48411560058594, -83.87215423583984, -79.26019287109375, -74.64823150634766, -70.03627014160156, -65.42430877685547, -60.812347412109375, -56.20038604736328, -51.58842468261719, -46.976463317871094, -42.364501953125, -37.752540588378906, -33.14057922363281, -28.52861785888672, -23.916656494140625, -19.30469512939453, -14.692733764648438, -10.080772399902344, -5.46881103515625, -0.8568496704101562, 3.7551116943359375, 8.367073059082031, 12.979034423828125, 17.59099578857422, 22.202957153320312, 26.814918518066406, 31.4268798828125, 36.038841247558594, 40.65080261230469, 45.26276397705078, 49.874725341796875, 54.48668670654297, 59.0986328125, 63.710594177246094, 68.32255554199219, 72.93451690673828, 77.54647827148438, 82.15843963623047, 86.77040100097656, 91.38236236572266, 95.99432373046875, 100.60628509521484, 105.21824645996094, 109.83020782470703, 114.44216918945312, 119.05413055419922, 123.66609191894531, 128.27804565429688, 132.8900146484375, 137.50198364257812, 142.1139373779297, 146.72589111328125, 151.33786010742188, 155.9498291015625, 160.56178283691406, 165.17373657226562, 169.78570556640625, 174.39767456054688, 179.00962829589844, 183.62158203125, 188.23355102539062, 192.84552001953125, 197.4574737548828, 202.06942749023438, 206.681396484375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 3.0, 3.0, 8.0, 3.0, 8.0, 7.0, 10.0, 12.0, 17.0, 14.0, 25.0, 32.0, 29.0, 35.0, 25.0, 31.0, 43.0, 48.0, 50.0, 58.0, 50.0, 85.0, 57.0, 52.0, 37.0, 35.0, 43.0, 33.0, 42.0, 20.0, 17.0, 17.0, 18.0, 10.0, 7.0, 6.0, 4.0, 3.0, 5.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-30.300844192504883, -29.37302589416504, -28.445205688476562, -27.51738739013672, -26.589567184448242, -25.6617488861084, -24.733928680419922, -23.806110382080078, -22.878292083740234, -21.95047378540039, -21.022653579711914, -20.09483528137207, -19.167015075683594, -18.23919677734375, -17.311378479003906, -16.38355827331543, -15.45573902130127, -14.52791976928711, -13.60010051727295, -12.672281265258789, -11.744462966918945, -10.816643714904785, -9.888824462890625, -8.961006164550781, -8.033185958862305, -7.1053667068481445, -6.177547931671143, -5.249728679656982, -4.3219099044799805, -3.3940906524658203, -2.46627140045166, -1.5384526252746582, -0.6106338500976562, 0.3171852231025696, 1.2450042963027954, 2.172823429107666, 3.100642442703247, 4.028461456298828, 4.956280708312988, 5.88409948348999, 6.81191873550415, 7.7397379875183105, 8.667556762695312, 9.595376014709473, 10.523195266723633, 11.451013565063477, 12.378833770751953, 13.306652069091797, 14.234471321105957, 15.162290573120117, 16.09010887145996, 17.017929077148438, 17.94574737548828, 18.873565673828125, 19.8013858795166, 20.729204177856445, 21.657024383544922, 22.584842681884766, 23.512662887573242, 24.440481185913086, 25.368301391601562, 26.296119689941406, 27.22393798828125, 28.151758193969727, 29.07957649230957]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 3.0, 2.0, 4.0, 0.0, 10.0, 13.0, 18.0, 13.0, 22.0, 42.0, 48.0, 88.0, 133.0, 170.0, 276.0, 437.0, 655.0, 1140.0, 1799.0, 3201.0, 5759.0, 11099.0, 22619.0, 50154.0, 113378.0, 251480.0, 301169.0, 155330.0, 67682.0, 30304.0, 14580.0, 7125.0, 3926.0, 2197.0, 1357.0, 815.0, 530.0, 316.0, 207.0, 145.0, 90.0, 75.0, 41.0, 31.0, 27.0, 21.0, 11.0, 10.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.9375, -2.83685302734375, -2.7362060546875, -2.63555908203125, -2.534912109375, -2.43426513671875, -2.3336181640625, -2.23297119140625, -2.13232421875, -2.03167724609375, -1.9310302734375, -1.83038330078125, -1.729736328125, -1.62908935546875, -1.5284423828125, -1.42779541015625, -1.3271484375, -1.22650146484375, -1.1258544921875, -1.02520751953125, -0.924560546875, -0.82391357421875, -0.7232666015625, -0.62261962890625, -0.52197265625, -0.42132568359375, -0.3206787109375, -0.22003173828125, -0.119384765625, -0.01873779296875, 0.0819091796875, 0.18255615234375, 0.283203125, 0.38385009765625, 0.4844970703125, 0.58514404296875, 0.685791015625, 0.78643798828125, 0.8870849609375, 0.98773193359375, 1.08837890625, 1.18902587890625, 1.2896728515625, 1.39031982421875, 1.490966796875, 1.59161376953125, 1.6922607421875, 1.79290771484375, 1.8935546875, 1.99420166015625, 2.0948486328125, 2.19549560546875, 2.296142578125, 2.39678955078125, 2.4974365234375, 2.59808349609375, 2.69873046875, 2.79937744140625, 2.9000244140625, 3.00067138671875, 3.101318359375, 3.20196533203125, 3.3026123046875, 3.40325927734375, 3.50390625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 6.0, 3.0, 1.0, 4.0, 3.0, 3.0, 15.0, 8.0, 11.0, 14.0, 18.0, 15.0, 23.0, 21.0, 34.0, 26.0, 20.0, 39.0, 32.0, 46.0, 37.0, 46.0, 53.0, 51.0, 53.0, 43.0, 56.0, 35.0, 35.0, 30.0, 33.0, 32.0, 16.0, 25.0, 19.0, 9.0, 19.0, 10.0, 14.0, 14.0, 9.0, 6.0, 7.0, 6.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.740234375, -2.6551513671875, -2.570068359375, -2.4849853515625, -2.39990234375, -2.3148193359375, -2.229736328125, -2.1446533203125, -2.0595703125, -1.9744873046875, -1.889404296875, -1.8043212890625, -1.71923828125, -1.6341552734375, -1.549072265625, -1.4639892578125, -1.37890625, -1.2938232421875, -1.208740234375, -1.1236572265625, -1.03857421875, -0.9534912109375, -0.868408203125, -0.7833251953125, -0.6982421875, -0.6131591796875, -0.528076171875, -0.4429931640625, -0.35791015625, -0.2728271484375, -0.187744140625, -0.1026611328125, -0.017578125, 0.0675048828125, 0.152587890625, 0.2376708984375, 0.32275390625, 0.4078369140625, 0.492919921875, 0.5780029296875, 0.6630859375, 0.7481689453125, 0.833251953125, 0.9183349609375, 1.00341796875, 1.0885009765625, 1.173583984375, 1.2586669921875, 1.34375, 1.4288330078125, 1.513916015625, 1.5989990234375, 1.68408203125, 1.7691650390625, 1.854248046875, 1.9393310546875, 2.0244140625, 2.1094970703125, 2.194580078125, 2.2796630859375, 2.36474609375, 2.4498291015625, 2.534912109375, 2.6199951171875, 2.705078125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 3.0, 6.0, 4.0, 10.0, 6.0, 11.0, 19.0, 21.0, 23.0, 36.0, 70.0, 91.0, 107.0, 189.0, 241.0, 413.0, 750.0, 1505.0, 3858.0, 13536.0, 80965.0, 730193.0, 181746.0, 24300.0, 5863.0, 2074.0, 994.0, 499.0, 351.0, 205.0, 105.0, 97.0, 70.0, 46.0, 42.0, 28.0, 21.0, 16.0, 13.0, 4.0, 7.0, 3.0, 6.0, 4.0, 1.0, 6.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-8.6328125, -8.37652587890625, -8.1202392578125, -7.86395263671875, -7.607666015625, -7.35137939453125, -7.0950927734375, -6.83880615234375, -6.58251953125, -6.32623291015625, -6.0699462890625, -5.81365966796875, -5.557373046875, -5.30108642578125, -5.0447998046875, -4.78851318359375, -4.5322265625, -4.27593994140625, -4.0196533203125, -3.76336669921875, -3.507080078125, -3.25079345703125, -2.9945068359375, -2.73822021484375, -2.48193359375, -2.22564697265625, -1.9693603515625, -1.71307373046875, -1.456787109375, -1.20050048828125, -0.9442138671875, -0.68792724609375, -0.431640625, -0.17535400390625, 0.0809326171875, 0.33721923828125, 0.593505859375, 0.84979248046875, 1.1060791015625, 1.36236572265625, 1.61865234375, 1.87493896484375, 2.1312255859375, 2.38751220703125, 2.643798828125, 2.90008544921875, 3.1563720703125, 3.41265869140625, 3.6689453125, 3.92523193359375, 4.1815185546875, 4.43780517578125, 4.694091796875, 4.95037841796875, 5.2066650390625, 5.46295166015625, 5.71923828125, 5.97552490234375, 6.2318115234375, 6.48809814453125, 6.744384765625, 7.00067138671875, 7.2569580078125, 7.51324462890625, 7.76953125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 5.0, 5.0, 4.0, 6.0, 7.0, 18.0, 24.0, 21.0, 26.0, 37.0, 43.0, 47.0, 58.0, 65.0, 64.0, 63.0, 65.0, 76.0, 70.0, 61.0, 47.0, 35.0, 32.0, 28.0, 18.0, 22.0, 7.0, 10.0, 11.0, 12.0, 5.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-15.0078125, -14.5643310546875, -14.120849609375, -13.6773681640625, -13.23388671875, -12.7904052734375, -12.346923828125, -11.9034423828125, -11.4599609375, -11.0164794921875, -10.572998046875, -10.1295166015625, -9.68603515625, -9.2425537109375, -8.799072265625, -8.3555908203125, -7.912109375, -7.4686279296875, -7.025146484375, -6.5816650390625, -6.13818359375, -5.6947021484375, -5.251220703125, -4.8077392578125, -4.3642578125, -3.9207763671875, -3.477294921875, -3.0338134765625, -2.59033203125, -2.1468505859375, -1.703369140625, -1.2598876953125, -0.81640625, -0.3729248046875, 0.070556640625, 0.5140380859375, 0.95751953125, 1.4010009765625, 1.844482421875, 2.2879638671875, 2.7314453125, 3.1749267578125, 3.618408203125, 4.0618896484375, 4.50537109375, 4.9488525390625, 5.392333984375, 5.8358154296875, 6.279296875, 6.7227783203125, 7.166259765625, 7.6097412109375, 8.05322265625, 8.4967041015625, 8.940185546875, 9.3836669921875, 9.8271484375, 10.2706298828125, 10.714111328125, 11.1575927734375, 11.60107421875, 12.0445556640625, 12.488037109375, 12.9315185546875, 13.375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 1.0, 5.0, 9.0, 6.0, 7.0, 15.0, 20.0, 22.0, 46.0, 61.0, 66.0, 121.0, 199.0, 313.0, 551.0, 1030.0, 2255.0, 5446.0, 15510.0, 56273.0, 326836.0, 552083.0, 60590.0, 16531.0, 5757.0, 2300.0, 1121.0, 523.0, 281.0, 181.0, 109.0, 75.0, 64.0, 35.0, 30.0, 21.0, 16.0, 11.0, 5.0, 9.0, 4.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.75390625, -1.6934814453125, -1.633056640625, -1.5726318359375, -1.51220703125, -1.4517822265625, -1.391357421875, -1.3309326171875, -1.2705078125, -1.2100830078125, -1.149658203125, -1.0892333984375, -1.02880859375, -0.9683837890625, -0.907958984375, -0.8475341796875, -0.787109375, -0.7266845703125, -0.666259765625, -0.6058349609375, -0.54541015625, -0.4849853515625, -0.424560546875, -0.3641357421875, -0.3037109375, -0.2432861328125, -0.182861328125, -0.1224365234375, -0.06201171875, -0.0015869140625, 0.058837890625, 0.1192626953125, 0.1796875, 0.2401123046875, 0.300537109375, 0.3609619140625, 0.42138671875, 0.4818115234375, 0.542236328125, 0.6026611328125, 0.6630859375, 0.7235107421875, 0.783935546875, 0.8443603515625, 0.90478515625, 0.9652099609375, 1.025634765625, 1.0860595703125, 1.146484375, 1.2069091796875, 1.267333984375, 1.3277587890625, 1.38818359375, 1.4486083984375, 1.509033203125, 1.5694580078125, 1.6298828125, 1.6903076171875, 1.750732421875, 1.8111572265625, 1.87158203125, 1.9320068359375, 1.992431640625, 2.0528564453125, 2.11328125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 4.0, 5.0, 9.0, 6.0, 11.0, 17.0, 23.0, 31.0, 40.0, 46.0, 50.0, 94.0, 108.0, 123.0, 95.0, 72.0, 64.0, 39.0, 45.0, 23.0, 23.0, 22.0, 12.0, 8.0, 4.0, 6.0, 4.0, 5.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0004248619079589844, -0.0004113242030143738, -0.0003977864980697632, -0.0003842487931251526, -0.000370711088180542, -0.0003571733832359314, -0.0003436356782913208, -0.0003300979733467102, -0.0003165602684020996, -0.000303022563457489, -0.0002894848585128784, -0.0002759471535682678, -0.0002624094486236572, -0.00024887174367904663, -0.00023533403873443604, -0.00022179633378982544, -0.00020825862884521484, -0.00019472092390060425, -0.00018118321895599365, -0.00016764551401138306, -0.00015410780906677246, -0.00014057010412216187, -0.00012703239917755127, -0.00011349469423294067, -9.995698928833008e-05, -8.641928434371948e-05, -7.288157939910889e-05, -5.934387445449829e-05, -4.5806169509887695e-05, -3.22684645652771e-05, -1.8730759620666504e-05, -5.193054676055908e-06, 8.344650268554688e-06, 2.1882355213165283e-05, 3.542006015777588e-05, 4.8957765102386475e-05, 6.249547004699707e-05, 7.603317499160767e-05, 8.957087993621826e-05, 0.00010310858488082886, 0.00011664628982543945, 0.00013018399477005005, 0.00014372169971466064, 0.00015725940465927124, 0.00017079710960388184, 0.00018433481454849243, 0.00019787251949310303, 0.00021141022443771362, 0.00022494792938232422, 0.00023848563432693481, 0.0002520233392715454, 0.000265561044216156, 0.0002790987491607666, 0.0002926364541053772, 0.0003061741590499878, 0.0003197118639945984, 0.000333249568939209, 0.0003467872738838196, 0.0003603249788284302, 0.00037386268377304077, 0.00038740038871765137, 0.00040093809366226196, 0.00041447579860687256, 0.00042801350355148315, 0.00044155120849609375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 4.0, 5.0, 6.0, 5.0, 11.0, 22.0, 13.0, 22.0, 23.0, 32.0, 53.0, 77.0, 96.0, 132.0, 188.0, 277.0, 457.0, 712.0, 1236.0, 2307.0, 4639.0, 9930.0, 23690.0, 63981.0, 220097.0, 556929.0, 101938.0, 34486.0, 13645.0, 6188.0, 3030.0, 1570.0, 935.0, 577.0, 373.0, 269.0, 188.0, 111.0, 76.0, 53.0, 51.0, 29.0, 26.0, 12.0, 14.0, 8.0, 7.0, 9.0, 5.0, 2.0, 3.0, 4.0, 2.0, 4.0, 0.0, 4.0], "bins": [-1.443359375, -1.3998870849609375, -1.356414794921875, -1.3129425048828125, -1.26947021484375, -1.2259979248046875, -1.182525634765625, -1.1390533447265625, -1.0955810546875, -1.0521087646484375, -1.008636474609375, -0.9651641845703125, -0.92169189453125, -0.8782196044921875, -0.834747314453125, -0.7912750244140625, -0.747802734375, -0.7043304443359375, -0.660858154296875, -0.6173858642578125, -0.57391357421875, -0.5304412841796875, -0.486968994140625, -0.4434967041015625, -0.4000244140625, -0.3565521240234375, -0.313079833984375, -0.2696075439453125, -0.22613525390625, -0.1826629638671875, -0.139190673828125, -0.0957183837890625, -0.05224609375, -0.0087738037109375, 0.034698486328125, 0.0781707763671875, 0.12164306640625, 0.1651153564453125, 0.208587646484375, 0.2520599365234375, 0.2955322265625, 0.3390045166015625, 0.382476806640625, 0.4259490966796875, 0.46942138671875, 0.5128936767578125, 0.556365966796875, 0.5998382568359375, 0.643310546875, 0.6867828369140625, 0.730255126953125, 0.7737274169921875, 0.81719970703125, 0.8606719970703125, 0.904144287109375, 0.9476165771484375, 0.9910888671875, 1.0345611572265625, 1.078033447265625, 1.1215057373046875, 1.16497802734375, 1.2084503173828125, 1.251922607421875, 1.2953948974609375, 1.3388671875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 6.0, 2.0, 5.0, 4.0, 5.0, 4.0, 5.0, 17.0, 16.0, 13.0, 27.0, 34.0, 29.0, 48.0, 47.0, 62.0, 83.0, 110.0, 75.0, 89.0, 75.0, 52.0, 47.0, 24.0, 25.0, 21.0, 16.0, 11.0, 11.0, 8.0, 5.0, 5.0, 7.0, 4.0, 3.0, 3.0, 2.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.017578125, -1.95404052734375, -1.8905029296875, -1.82696533203125, -1.763427734375, -1.69989013671875, -1.6363525390625, -1.57281494140625, -1.50927734375, -1.44573974609375, -1.3822021484375, -1.31866455078125, -1.255126953125, -1.19158935546875, -1.1280517578125, -1.06451416015625, -1.0009765625, -0.93743896484375, -0.8739013671875, -0.81036376953125, -0.746826171875, -0.68328857421875, -0.6197509765625, -0.55621337890625, -0.49267578125, -0.42913818359375, -0.3656005859375, -0.30206298828125, -0.238525390625, -0.17498779296875, -0.1114501953125, -0.04791259765625, 0.015625, 0.07916259765625, 0.1427001953125, 0.20623779296875, 0.269775390625, 0.33331298828125, 0.3968505859375, 0.46038818359375, 0.52392578125, 0.58746337890625, 0.6510009765625, 0.71453857421875, 0.778076171875, 0.84161376953125, 0.9051513671875, 0.96868896484375, 1.0322265625, 1.09576416015625, 1.1593017578125, 1.22283935546875, 1.286376953125, 1.34991455078125, 1.4134521484375, 1.47698974609375, 1.54052734375, 1.60406494140625, 1.6676025390625, 1.73114013671875, 1.794677734375, 1.85821533203125, 1.9217529296875, 1.98529052734375, 2.048828125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 5.0, 4.0, 15.0, 29.0, 44.0, 93.0, 240.0, 300.0, 129.0, 67.0, 35.0, 17.0, 8.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-66.8045883178711, -64.78838348388672, -62.772186279296875, -60.7559814453125, -58.73978042602539, -56.72357940673828, -54.707374572753906, -52.6911735534668, -50.67497253417969, -48.65877151489258, -46.64257049560547, -44.626365661621094, -42.610164642333984, -40.593963623046875, -38.5777587890625, -36.56155776977539, -34.54535675048828, -32.52915573120117, -30.51295280456543, -28.496749877929688, -26.480548858642578, -24.46434783935547, -22.448144912719727, -20.431941986083984, -18.415740966796875, -16.399539947509766, -14.383337020874023, -12.367135047912598, -10.350933074951172, -8.334731101989746, -6.31852912902832, -4.3023271560668945, -2.2861175537109375, -0.2699155807495117, 1.746286392211914, 3.76248836517334, 5.778690338134766, 7.794892311096191, 9.811094284057617, 11.827296257019043, 13.843498229980469, 15.859700202941895, 17.87590217590332, 19.892105102539062, 21.908306121826172, 23.92450714111328, 25.940710067749023, 27.956912994384766, 29.973114013671875, 31.989315032958984, 34.005516052246094, 36.02172088623047, 38.03792190551758, 40.05412292480469, 42.07032775878906, 44.08652877807617, 46.10272979736328, 48.11893081665039, 50.1351318359375, 52.151336669921875, 54.167537689208984, 56.183738708496094, 58.19994354248047, 60.21614456176758, 62.23234558105469]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 5.0, 3.0, 2.0, 7.0, 8.0, 15.0, 6.0, 14.0, 10.0, 24.0, 17.0, 19.0, 29.0, 25.0, 28.0, 38.0, 44.0, 79.0, 100.0, 131.0, 74.0, 40.0, 38.0, 47.0, 30.0, 33.0, 21.0, 24.0, 15.0, 20.0, 13.0, 8.0, 11.0, 7.0, 6.0, 7.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.314613342285156, -41.775787353515625, -40.23696517944336, -38.69813919067383, -37.1593132019043, -35.620487213134766, -34.0816650390625, -32.54283905029297, -31.004013061523438, -29.46518898010254, -27.926362991333008, -26.38753890991211, -24.848712921142578, -23.30988883972168, -21.77106475830078, -20.23223876953125, -18.69341468811035, -17.154590606689453, -15.615764617919922, -14.076940536499023, -12.538114547729492, -10.999290466308594, -9.460465431213379, -7.921640396118164, -6.382815361022949, -4.843990325927734, -3.3051655292510986, -1.766340732574463, -0.22751569747924805, 1.3113093376159668, 2.8501338958740234, 4.388958930969238, 5.927783966064453, 7.466609001159668, 9.005434036254883, 10.544258117675781, 12.083084106445312, 13.621908187866211, 15.160733222961426, 16.69955825805664, 18.238384246826172, 19.77720832824707, 21.3160343170166, 22.8548583984375, 24.39368438720703, 25.93250846862793, 27.471332550048828, 29.01015853881836, 30.548982620239258, 32.087806701660156, 33.62663269042969, 35.16545867919922, 36.704280853271484, 38.243106842041016, 39.78193283081055, 41.32075500488281, 42.859580993652344, 44.398406982421875, 45.93722915649414, 47.47605514526367, 49.0148811340332, 50.553707122802734, 52.092529296875, 53.63135528564453, 55.17018127441406]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 4.0, 2.0, 15.0, 17.0, 15.0, 24.0, 30.0, 67.0, 78.0, 118.0, 209.0, 355.0, 553.0, 943.0, 1730.0, 3281.0, 6830.0, 15841.0, 47405.0, 187506.0, 830117.0, 1974901.0, 845839.0, 197394.0, 50325.0, 16421.0, 6854.0, 3186.0, 1742.0, 925.0, 602.0, 364.0, 209.0, 144.0, 80.0, 47.0, 26.0, 32.0, 18.0, 14.0, 10.0, 6.0, 0.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.298828125, -3.2059326171875, -3.113037109375, -3.0201416015625, -2.92724609375, -2.8343505859375, -2.741455078125, -2.6485595703125, -2.5556640625, -2.4627685546875, -2.369873046875, -2.2769775390625, -2.18408203125, -2.0911865234375, -1.998291015625, -1.9053955078125, -1.8125, -1.7196044921875, -1.626708984375, -1.5338134765625, -1.44091796875, -1.3480224609375, -1.255126953125, -1.1622314453125, -1.0693359375, -0.9764404296875, -0.883544921875, -0.7906494140625, -0.69775390625, -0.6048583984375, -0.511962890625, -0.4190673828125, -0.326171875, -0.2332763671875, -0.140380859375, -0.0474853515625, 0.04541015625, 0.1383056640625, 0.231201171875, 0.3240966796875, 0.4169921875, 0.5098876953125, 0.602783203125, 0.6956787109375, 0.78857421875, 0.8814697265625, 0.974365234375, 1.0672607421875, 1.16015625, 1.2530517578125, 1.345947265625, 1.4388427734375, 1.53173828125, 1.6246337890625, 1.717529296875, 1.8104248046875, 1.9033203125, 1.9962158203125, 2.089111328125, 2.1820068359375, 2.27490234375, 2.3677978515625, 2.460693359375, 2.5535888671875, 2.646484375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 0.0, 0.0, 2.0, 4.0, 8.0, 6.0, 10.0, 16.0, 9.0, 14.0, 15.0, 21.0, 18.0, 21.0, 30.0, 32.0, 25.0, 28.0, 45.0, 41.0, 35.0, 54.0, 45.0, 46.0, 34.0, 49.0, 41.0, 53.0, 36.0, 32.0, 33.0, 30.0, 35.0, 22.0, 18.0, 17.0, 13.0, 9.0, 7.0, 11.0, 10.0, 6.0, 5.0, 6.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.7265625, -2.644683837890625, -2.56280517578125, -2.480926513671875, -2.3990478515625, -2.317169189453125, -2.23529052734375, -2.153411865234375, -2.071533203125, -1.989654541015625, -1.90777587890625, -1.825897216796875, -1.7440185546875, -1.662139892578125, -1.58026123046875, -1.498382568359375, -1.41650390625, -1.334625244140625, -1.25274658203125, -1.170867919921875, -1.0889892578125, -1.007110595703125, -0.92523193359375, -0.843353271484375, -0.761474609375, -0.679595947265625, -0.59771728515625, -0.515838623046875, -0.4339599609375, -0.352081298828125, -0.27020263671875, -0.188323974609375, -0.1064453125, -0.024566650390625, 0.05731201171875, 0.139190673828125, 0.2210693359375, 0.302947998046875, 0.38482666015625, 0.466705322265625, 0.548583984375, 0.630462646484375, 0.71234130859375, 0.794219970703125, 0.8760986328125, 0.957977294921875, 1.03985595703125, 1.121734619140625, 1.20361328125, 1.285491943359375, 1.36737060546875, 1.449249267578125, 1.5311279296875, 1.613006591796875, 1.69488525390625, 1.776763916015625, 1.858642578125, 1.940521240234375, 2.02239990234375, 2.104278564453125, 2.1861572265625, 2.268035888671875, 2.34991455078125, 2.431793212890625, 2.513671875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 1.0, 4.0, 2.0, 6.0, 8.0, 7.0, 11.0, 16.0, 33.0, 22.0, 40.0, 71.0, 97.0, 171.0, 340.0, 801.0, 1961.0, 5445.0, 20490.0, 145008.0, 3192979.0, 760392.0, 50109.0, 10474.0, 3285.0, 1304.0, 506.0, 280.0, 140.0, 81.0, 52.0, 40.0, 25.0, 19.0, 15.0, 10.0, 6.0, 15.0, 8.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.6484375, -6.4322509765625, -6.216064453125, -5.9998779296875, -5.78369140625, -5.5675048828125, -5.351318359375, -5.1351318359375, -4.9189453125, -4.7027587890625, -4.486572265625, -4.2703857421875, -4.05419921875, -3.8380126953125, -3.621826171875, -3.4056396484375, -3.189453125, -2.9732666015625, -2.757080078125, -2.5408935546875, -2.32470703125, -2.1085205078125, -1.892333984375, -1.6761474609375, -1.4599609375, -1.2437744140625, -1.027587890625, -0.8114013671875, -0.59521484375, -0.3790283203125, -0.162841796875, 0.0533447265625, 0.26953125, 0.4857177734375, 0.701904296875, 0.9180908203125, 1.13427734375, 1.3504638671875, 1.566650390625, 1.7828369140625, 1.9990234375, 2.2152099609375, 2.431396484375, 2.6475830078125, 2.86376953125, 3.0799560546875, 3.296142578125, 3.5123291015625, 3.728515625, 3.9447021484375, 4.160888671875, 4.3770751953125, 4.59326171875, 4.8094482421875, 5.025634765625, 5.2418212890625, 5.4580078125, 5.6741943359375, 5.890380859375, 6.1065673828125, 6.32275390625, 6.5389404296875, 6.755126953125, 6.9713134765625, 7.1875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 5.0, 5.0, 11.0, 12.0, 18.0, 24.0, 22.0, 38.0, 66.0, 111.0, 145.0, 280.0, 482.0, 689.0, 721.0, 526.0, 318.0, 207.0, 116.0, 74.0, 59.0, 28.0, 25.0, 24.0, 19.0, 16.0, 4.0, 8.0, 6.0, 3.0, 2.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.1328125, -6.9105224609375, -6.688232421875, -6.4659423828125, -6.24365234375, -6.0213623046875, -5.799072265625, -5.5767822265625, -5.3544921875, -5.1322021484375, -4.909912109375, -4.6876220703125, -4.46533203125, -4.2430419921875, -4.020751953125, -3.7984619140625, -3.576171875, -3.3538818359375, -3.131591796875, -2.9093017578125, -2.68701171875, -2.4647216796875, -2.242431640625, -2.0201416015625, -1.7978515625, -1.5755615234375, -1.353271484375, -1.1309814453125, -0.90869140625, -0.6864013671875, -0.464111328125, -0.2418212890625, -0.01953125, 0.2027587890625, 0.425048828125, 0.6473388671875, 0.86962890625, 1.0919189453125, 1.314208984375, 1.5364990234375, 1.7587890625, 1.9810791015625, 2.203369140625, 2.4256591796875, 2.64794921875, 2.8702392578125, 3.092529296875, 3.3148193359375, 3.537109375, 3.7593994140625, 3.981689453125, 4.2039794921875, 4.42626953125, 4.6485595703125, 4.870849609375, 5.0931396484375, 5.3154296875, 5.5377197265625, 5.760009765625, 5.9822998046875, 6.20458984375, 6.4268798828125, 6.649169921875, 6.8714599609375, 7.09375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 8.0, 20.0, 88.0, 359.0, 380.0, 108.0, 30.0, 11.0, 5.0, 6.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.929710388183594, -33.081817626953125, -28.23392677307129, -23.386035919189453, -18.538143157958984, -13.690250396728516, -8.84235954284668, -3.9944686889648438, 0.853424072265625, 5.701315879821777, 10.54920768737793, 15.397099494934082, 20.244991302490234, 25.092884063720703, 29.94077491760254, 34.788665771484375, 39.636558532714844, 44.48445129394531, 49.33234405517578, 54.180233001708984, 59.02812576293945, 63.87601852416992, 68.72390747070312, 73.5718002319336, 78.41969299316406, 83.26758575439453, 88.115478515625, 92.96337127685547, 97.81126403808594, 102.65914916992188, 107.50704193115234, 112.35493469238281, 117.20281982421875, 122.05071258544922, 126.89860534667969, 131.74649047851562, 136.59439086914062, 141.44227600097656, 146.29017639160156, 151.1380615234375, 155.9859619140625, 160.83384704589844, 165.68174743652344, 170.52963256835938, 175.37753295898438, 180.2254180908203, 185.0733184814453, 189.92120361328125, 194.7690887451172, 199.61697387695312, 204.46487426757812, 209.31275939941406, 214.16065979003906, 219.008544921875, 223.8564453125, 228.70433044433594, 233.55221557617188, 238.4001007080078, 243.2480010986328, 248.09588623046875, 252.94378662109375, 257.79168701171875, 262.6395568847656, 267.4874572753906, 272.3353576660156]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 1.0, 1.0, 3.0, 5.0, 4.0, 9.0, 13.0, 10.0, 17.0, 17.0, 23.0, 31.0, 29.0, 39.0, 51.0, 31.0, 50.0, 41.0, 36.0, 47.0, 52.0, 47.0, 41.0, 41.0, 53.0, 46.0, 40.0, 27.0, 37.0, 26.0, 29.0, 24.0, 18.0, 19.0, 13.0, 8.0, 7.0, 9.0, 3.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.295001983642578, -27.263147354125977, -26.231292724609375, -25.199438095092773, -24.167583465576172, -23.13572883605957, -22.10387420654297, -21.072019577026367, -20.040164947509766, -19.008310317993164, -17.976455688476562, -16.94460105895996, -15.91274642944336, -14.880891799926758, -13.849037170410156, -12.817182540893555, -11.785327911376953, -10.753473281860352, -9.72161865234375, -8.689764022827148, -7.657909393310547, -6.626054763793945, -5.594200134277344, -4.562345504760742, -3.5304908752441406, -2.498636245727539, -1.4667816162109375, -0.43492698669433594, 0.5969276428222656, 1.6287822723388672, 2.6606369018554688, 3.6924915313720703, 4.7243499755859375, 5.756204605102539, 6.788059234619141, 7.819913864135742, 8.851768493652344, 9.883623123168945, 10.915477752685547, 11.947332382202148, 12.97918701171875, 14.011041641235352, 15.042896270751953, 16.074750900268555, 17.106605529785156, 18.138460159301758, 19.17031478881836, 20.20216941833496, 21.234024047851562, 22.265878677368164, 23.297733306884766, 24.329587936401367, 25.36144256591797, 26.39329719543457, 27.425151824951172, 28.457006454467773, 29.488861083984375, 30.520715713500977, 31.552570343017578, 32.58442687988281, 33.61627960205078, 34.64813232421875, 35.679988861083984, 36.71184539794922, 37.74369812011719]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 8.0, 7.0, 13.0, 16.0, 16.0, 27.0, 45.0, 61.0, 104.0, 154.0, 225.0, 327.0, 502.0, 810.0, 1229.0, 1913.0, 3277.0, 5790.0, 9851.0, 18017.0, 35778.0, 77726.0, 182094.0, 328513.0, 206749.0, 88458.0, 40174.0, 20334.0, 10750.0, 6134.0, 3485.0, 2108.0, 1344.0, 897.0, 576.0, 327.0, 229.0, 154.0, 116.0, 64.0, 42.0, 35.0, 20.0, 23.0, 11.0, 7.0, 9.0, 5.0, 1.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.107421875, -3.00579833984375, -2.9041748046875, -2.80255126953125, -2.700927734375, -2.59930419921875, -2.4976806640625, -2.39605712890625, -2.29443359375, -2.19281005859375, -2.0911865234375, -1.98956298828125, -1.887939453125, -1.78631591796875, -1.6846923828125, -1.58306884765625, -1.4814453125, -1.37982177734375, -1.2781982421875, -1.17657470703125, -1.074951171875, -0.97332763671875, -0.8717041015625, -0.77008056640625, -0.66845703125, -0.56683349609375, -0.4652099609375, -0.36358642578125, -0.261962890625, -0.16033935546875, -0.0587158203125, 0.04290771484375, 0.14453125, 0.24615478515625, 0.3477783203125, 0.44940185546875, 0.551025390625, 0.65264892578125, 0.7542724609375, 0.85589599609375, 0.95751953125, 1.05914306640625, 1.1607666015625, 1.26239013671875, 1.364013671875, 1.46563720703125, 1.5672607421875, 1.66888427734375, 1.7705078125, 1.87213134765625, 1.9737548828125, 2.07537841796875, 2.177001953125, 2.27862548828125, 2.3802490234375, 2.48187255859375, 2.58349609375, 2.68511962890625, 2.7867431640625, 2.88836669921875, 2.989990234375, 3.09161376953125, 3.1932373046875, 3.29486083984375, 3.396484375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 4.0, 7.0, 4.0, 6.0, 7.0, 8.0, 10.0, 11.0, 14.0, 16.0, 21.0, 29.0, 17.0, 20.0, 25.0, 33.0, 37.0, 35.0, 39.0, 50.0, 44.0, 44.0, 42.0, 39.0, 47.0, 50.0, 37.0, 38.0, 23.0, 28.0, 26.0, 27.0, 23.0, 25.0, 14.0, 19.0, 13.0, 11.0, 13.0, 9.0, 4.0, 10.0, 5.0, 3.0, 3.0, 1.0, 2.0, 4.0, 1.0, 0.0, 4.0], "bins": [-2.93359375, -2.85009765625, -2.7666015625, -2.68310546875, -2.599609375, -2.51611328125, -2.4326171875, -2.34912109375, -2.265625, -2.18212890625, -2.0986328125, -2.01513671875, -1.931640625, -1.84814453125, -1.7646484375, -1.68115234375, -1.59765625, -1.51416015625, -1.4306640625, -1.34716796875, -1.263671875, -1.18017578125, -1.0966796875, -1.01318359375, -0.9296875, -0.84619140625, -0.7626953125, -0.67919921875, -0.595703125, -0.51220703125, -0.4287109375, -0.34521484375, -0.26171875, -0.17822265625, -0.0947265625, -0.01123046875, 0.072265625, 0.15576171875, 0.2392578125, 0.32275390625, 0.40625, 0.48974609375, 0.5732421875, 0.65673828125, 0.740234375, 0.82373046875, 0.9072265625, 0.99072265625, 1.07421875, 1.15771484375, 1.2412109375, 1.32470703125, 1.408203125, 1.49169921875, 1.5751953125, 1.65869140625, 1.7421875, 1.82568359375, 1.9091796875, 1.99267578125, 2.076171875, 2.15966796875, 2.2431640625, 2.32666015625, 2.41015625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 6.0, 11.0, 13.0, 15.0, 21.0, 26.0, 35.0, 43.0, 59.0, 85.0, 97.0, 152.0, 229.0, 318.0, 494.0, 876.0, 1931.0, 6365.0, 49546.0, 840497.0, 130251.0, 11625.0, 2698.0, 1191.0, 638.0, 380.0, 272.0, 182.0, 130.0, 79.0, 85.0, 45.0, 40.0, 32.0, 29.0, 19.0, 9.0, 10.0, 11.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-10.6171875, -10.292236328125, -9.96728515625, -9.642333984375, -9.3173828125, -8.992431640625, -8.66748046875, -8.342529296875, -8.017578125, -7.692626953125, -7.36767578125, -7.042724609375, -6.7177734375, -6.392822265625, -6.06787109375, -5.742919921875, -5.41796875, -5.093017578125, -4.76806640625, -4.443115234375, -4.1181640625, -3.793212890625, -3.46826171875, -3.143310546875, -2.818359375, -2.493408203125, -2.16845703125, -1.843505859375, -1.5185546875, -1.193603515625, -0.86865234375, -0.543701171875, -0.21875, 0.106201171875, 0.43115234375, 0.756103515625, 1.0810546875, 1.406005859375, 1.73095703125, 2.055908203125, 2.380859375, 2.705810546875, 3.03076171875, 3.355712890625, 3.6806640625, 4.005615234375, 4.33056640625, 4.655517578125, 4.98046875, 5.305419921875, 5.63037109375, 5.955322265625, 6.2802734375, 6.605224609375, 6.93017578125, 7.255126953125, 7.580078125, 7.905029296875, 8.22998046875, 8.554931640625, 8.8798828125, 9.204833984375, 9.52978515625, 9.854736328125, 10.1796875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 5.0, 1.0, 8.0, 1.0, 8.0, 7.0, 6.0, 6.0, 14.0, 16.0, 18.0, 24.0, 20.0, 25.0, 30.0, 32.0, 52.0, 51.0, 46.0, 46.0, 71.0, 42.0, 49.0, 58.0, 46.0, 45.0, 52.0, 34.0, 28.0, 32.0, 25.0, 12.0, 19.0, 12.0, 14.0, 6.0, 14.0, 5.0, 7.0, 4.0, 8.0, 4.0, 1.0, 6.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.15625, -9.7828369140625, -9.409423828125, -9.0360107421875, -8.66259765625, -8.2891845703125, -7.915771484375, -7.5423583984375, -7.1689453125, -6.7955322265625, -6.422119140625, -6.0487060546875, -5.67529296875, -5.3018798828125, -4.928466796875, -4.5550537109375, -4.181640625, -3.8082275390625, -3.434814453125, -3.0614013671875, -2.68798828125, -2.3145751953125, -1.941162109375, -1.5677490234375, -1.1943359375, -0.8209228515625, -0.447509765625, -0.0740966796875, 0.29931640625, 0.6727294921875, 1.046142578125, 1.4195556640625, 1.79296875, 2.1663818359375, 2.539794921875, 2.9132080078125, 3.28662109375, 3.6600341796875, 4.033447265625, 4.4068603515625, 4.7802734375, 5.1536865234375, 5.527099609375, 5.9005126953125, 6.27392578125, 6.6473388671875, 7.020751953125, 7.3941650390625, 7.767578125, 8.1409912109375, 8.514404296875, 8.8878173828125, 9.26123046875, 9.6346435546875, 10.008056640625, 10.3814697265625, 10.7548828125, 11.1282958984375, 11.501708984375, 11.8751220703125, 12.24853515625, 12.6219482421875, 12.995361328125, 13.3687744140625, 13.7421875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 8.0, 4.0, 7.0, 13.0, 17.0, 30.0, 36.0, 50.0, 80.0, 150.0, 307.0, 850.0, 3222.0, 19543.0, 647822.0, 353192.0, 18633.0, 3069.0, 829.0, 311.0, 157.0, 87.0, 46.0, 28.0, 21.0, 20.0, 6.0, 5.0, 4.0, 4.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4140625, -3.319183349609375, -3.22430419921875, -3.129425048828125, -3.0345458984375, -2.939666748046875, -2.84478759765625, -2.749908447265625, -2.655029296875, -2.560150146484375, -2.46527099609375, -2.370391845703125, -2.2755126953125, -2.180633544921875, -2.08575439453125, -1.990875244140625, -1.89599609375, -1.801116943359375, -1.70623779296875, -1.611358642578125, -1.5164794921875, -1.421600341796875, -1.32672119140625, -1.231842041015625, -1.136962890625, -1.042083740234375, -0.94720458984375, -0.852325439453125, -0.7574462890625, -0.662567138671875, -0.56768798828125, -0.472808837890625, -0.3779296875, -0.283050537109375, -0.18817138671875, -0.093292236328125, 0.0015869140625, 0.096466064453125, 0.19134521484375, 0.286224365234375, 0.381103515625, 0.475982666015625, 0.57086181640625, 0.665740966796875, 0.7606201171875, 0.855499267578125, 0.95037841796875, 1.045257568359375, 1.14013671875, 1.235015869140625, 1.32989501953125, 1.424774169921875, 1.5196533203125, 1.614532470703125, 1.70941162109375, 1.804290771484375, 1.899169921875, 1.994049072265625, 2.08892822265625, 2.183807373046875, 2.2786865234375, 2.373565673828125, 2.46844482421875, 2.563323974609375, 2.658203125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 8.0, 2.0, 4.0, 3.0, 10.0, 7.0, 15.0, 17.0, 29.0, 42.0, 69.0, 78.0, 124.0, 174.0, 131.0, 78.0, 62.0, 40.0, 27.0, 14.0, 16.0, 5.0, 9.0, 8.0, 4.0, 5.0, 3.0, 4.0, 8.0, 1.0, 0.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0005474090576171875, -0.000531613826751709, -0.0005158185958862305, -0.000500023365020752, -0.00048422813415527344, -0.0004684329032897949, -0.0004526376724243164, -0.0004368424415588379, -0.0004210472106933594, -0.00040525197982788086, -0.00038945674896240234, -0.00037366151809692383, -0.0003578662872314453, -0.0003420710563659668, -0.0003262758255004883, -0.00031048059463500977, -0.00029468536376953125, -0.00027889013290405273, -0.0002630949020385742, -0.0002472996711730957, -0.0002315044403076172, -0.00021570920944213867, -0.00019991397857666016, -0.00018411874771118164, -0.00016832351684570312, -0.0001525282859802246, -0.0001367330551147461, -0.00012093782424926758, -0.00010514259338378906, -8.934736251831055e-05, -7.355213165283203e-05, -5.7756900787353516e-05, -4.1961669921875e-05, -2.6166439056396484e-05, -1.0371208190917969e-05, 5.424022674560547e-06, 2.1219253540039062e-05, 3.701448440551758e-05, 5.2809715270996094e-05, 6.860494613647461e-05, 8.440017700195312e-05, 0.00010019540786743164, 0.00011599063873291016, 0.00013178586959838867, 0.0001475811004638672, 0.0001633763313293457, 0.00017917156219482422, 0.00019496679306030273, 0.00021076202392578125, 0.00022655725479125977, 0.00024235248565673828, 0.0002581477165222168, 0.0002739429473876953, 0.00028973817825317383, 0.00030553340911865234, 0.00032132863998413086, 0.0003371238708496094, 0.0003529191017150879, 0.0003687143325805664, 0.0003845095634460449, 0.00040030479431152344, 0.00041610002517700195, 0.00043189525604248047, 0.000447690486907959, 0.0004634857177734375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 6.0, 5.0, 3.0, 10.0, 5.0, 19.0, 24.0, 43.0, 51.0, 75.0, 123.0, 171.0, 279.0, 548.0, 955.0, 1916.0, 4607.0, 14548.0, 62103.0, 648747.0, 253850.0, 42553.0, 10764.0, 3601.0, 1535.0, 846.0, 415.0, 265.0, 156.0, 92.0, 73.0, 63.0, 37.0, 22.0, 13.0, 12.0, 8.0, 8.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-1.7265625, -1.67706298828125, -1.6275634765625, -1.57806396484375, -1.528564453125, -1.47906494140625, -1.4295654296875, -1.38006591796875, -1.33056640625, -1.28106689453125, -1.2315673828125, -1.18206787109375, -1.132568359375, -1.08306884765625, -1.0335693359375, -0.98406982421875, -0.9345703125, -0.88507080078125, -0.8355712890625, -0.78607177734375, -0.736572265625, -0.68707275390625, -0.6375732421875, -0.58807373046875, -0.53857421875, -0.48907470703125, -0.4395751953125, -0.39007568359375, -0.340576171875, -0.29107666015625, -0.2415771484375, -0.19207763671875, -0.142578125, -0.09307861328125, -0.0435791015625, 0.00592041015625, 0.055419921875, 0.10491943359375, 0.1544189453125, 0.20391845703125, 0.25341796875, 0.30291748046875, 0.3524169921875, 0.40191650390625, 0.451416015625, 0.50091552734375, 0.5504150390625, 0.59991455078125, 0.6494140625, 0.69891357421875, 0.7484130859375, 0.79791259765625, 0.847412109375, 0.89691162109375, 0.9464111328125, 0.99591064453125, 1.04541015625, 1.09490966796875, 1.1444091796875, 1.19390869140625, 1.243408203125, 1.29290771484375, 1.3424072265625, 1.39190673828125, 1.44140625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 1.0, 7.0, 8.0, 6.0, 10.0, 12.0, 12.0, 26.0, 19.0, 23.0, 32.0, 35.0, 57.0, 65.0, 67.0, 84.0, 83.0, 77.0, 58.0, 58.0, 55.0, 49.0, 28.0, 34.0, 19.0, 18.0, 21.0, 11.0, 10.0, 2.0, 6.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.353515625, -1.3028717041015625, -1.252227783203125, -1.2015838623046875, -1.15093994140625, -1.1002960205078125, -1.049652099609375, -0.9990081787109375, -0.9483642578125, -0.8977203369140625, -0.847076416015625, -0.7964324951171875, -0.74578857421875, -0.6951446533203125, -0.644500732421875, -0.5938568115234375, -0.543212890625, -0.4925689697265625, -0.441925048828125, -0.3912811279296875, -0.34063720703125, -0.2899932861328125, -0.239349365234375, -0.1887054443359375, -0.1380615234375, -0.0874176025390625, -0.036773681640625, 0.0138702392578125, 0.06451416015625, 0.1151580810546875, 0.165802001953125, 0.2164459228515625, 0.26708984375, 0.3177337646484375, 0.368377685546875, 0.4190216064453125, 0.46966552734375, 0.5203094482421875, 0.570953369140625, 0.6215972900390625, 0.6722412109375, 0.7228851318359375, 0.773529052734375, 0.8241729736328125, 0.87481689453125, 0.9254608154296875, 0.976104736328125, 1.0267486572265625, 1.077392578125, 1.1280364990234375, 1.178680419921875, 1.2293243408203125, 1.27996826171875, 1.3306121826171875, 1.381256103515625, 1.4319000244140625, 1.4825439453125, 1.5331878662109375, 1.583831787109375, 1.6344757080078125, 1.68511962890625, 1.7357635498046875, 1.786407470703125, 1.8370513916015625, 1.8876953125]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 4.0, 11.0, 16.0, 26.0, 77.0, 123.0, 332.0, 197.0, 98.0, 55.0, 32.0, 11.0, 8.0, 7.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.86931228637695, -59.121334075927734, -57.373355865478516, -55.6253776550293, -53.87739944458008, -52.129417419433594, -50.381439208984375, -48.633460998535156, -46.88548278808594, -45.13750457763672, -43.3895263671875, -41.64154815673828, -39.89356994628906, -38.145591735839844, -36.397613525390625, -34.64963150024414, -32.90165710449219, -31.15367889404297, -29.40570068359375, -27.65772247314453, -25.90974235534668, -24.16176414489746, -22.413785934448242, -20.66580581665039, -18.917827606201172, -17.169849395751953, -15.421870231628418, -13.6738920211792, -11.925912857055664, -10.177934646606445, -8.429956436157227, -6.681977272033691, -4.933998107910156, -3.1860194206237793, -1.4380409717559814, 0.3099374771118164, 2.0579161643981934, 3.8058948516845703, 5.553873062133789, 7.301852226257324, 9.049830436706543, 10.797808647155762, 12.545787811279297, 14.293766021728516, 16.041744232177734, 17.789722442626953, 19.537700653076172, 21.285680770874023, 23.033658981323242, 24.78163719177246, 26.52961540222168, 28.27759552001953, 30.02557373046875, 31.77355194091797, 33.52153015136719, 35.269508361816406, 37.017486572265625, 38.765464782714844, 40.51344299316406, 42.26142120361328, 44.0093994140625, 45.75737762451172, 47.50535583496094, 49.25333786010742, 51.00131607055664]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 2.0, 6.0, 6.0, 7.0, 11.0, 12.0, 6.0, 11.0, 19.0, 17.0, 14.0, 21.0, 25.0, 28.0, 29.0, 28.0, 32.0, 32.0, 50.0, 143.0, 125.0, 62.0, 43.0, 33.0, 38.0, 37.0, 19.0, 21.0, 21.0, 15.0, 17.0, 12.0, 9.0, 9.0, 10.0, 10.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-41.57209396362305, -40.23313522338867, -38.89417266845703, -37.555213928222656, -36.21625518798828, -34.877296447753906, -33.53833770751953, -32.19937515258789, -30.860416412353516, -29.52145767211914, -28.182497024536133, -26.843536376953125, -25.50457763671875, -24.165618896484375, -22.826658248901367, -21.48769760131836, -20.148738861083984, -18.80978012084961, -17.4708194732666, -16.131858825683594, -14.792900085449219, -13.453940391540527, -12.114980697631836, -10.776021003723145, -9.437061309814453, -8.098101615905762, -6.75914192199707, -5.420182228088379, -4.0812225341796875, -2.742262840270996, -1.4033031463623047, -0.06434345245361328, 1.2746124267578125, 2.613572120666504, 3.9525318145751953, 5.291491508483887, 6.630451202392578, 7.9694108963012695, 9.308370590209961, 10.647330284118652, 11.986289978027344, 13.325249671936035, 14.664209365844727, 16.003170013427734, 17.34212875366211, 18.681087493896484, 20.020048141479492, 21.3590087890625, 22.697967529296875, 24.03692626953125, 25.375886917114258, 26.714847564697266, 28.05380630493164, 29.392765045166016, 30.731725692749023, 32.07068634033203, 33.409645080566406, 34.74860382080078, 36.087562561035156, 37.4265251159668, 38.76548385620117, 40.10444259643555, 41.44340515136719, 42.78236389160156, 44.12132263183594]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 7.0, 4.0, 13.0, 18.0, 32.0, 40.0, 58.0, 82.0, 127.0, 216.0, 300.0, 438.0, 756.0, 1190.0, 1908.0, 3372.0, 6614.0, 15829.0, 49246.0, 195105.0, 762361.0, 1707185.0, 1027549.0, 302005.0, 79000.0, 22232.0, 8517.0, 4217.0, 2290.0, 1326.0, 802.0, 508.0, 319.0, 207.0, 132.0, 93.0, 58.0, 33.0, 35.0, 19.0, 13.0, 5.0, 17.0, 5.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2890625, -3.178131103515625, -3.06719970703125, -2.956268310546875, -2.8453369140625, -2.734405517578125, -2.62347412109375, -2.512542724609375, -2.401611328125, -2.290679931640625, -2.17974853515625, -2.068817138671875, -1.9578857421875, -1.846954345703125, -1.73602294921875, -1.625091552734375, -1.51416015625, -1.403228759765625, -1.29229736328125, -1.181365966796875, -1.0704345703125, -0.959503173828125, -0.84857177734375, -0.737640380859375, -0.626708984375, -0.515777587890625, -0.40484619140625, -0.293914794921875, -0.1829833984375, -0.072052001953125, 0.03887939453125, 0.149810791015625, 0.2607421875, 0.371673583984375, 0.48260498046875, 0.593536376953125, 0.7044677734375, 0.815399169921875, 0.92633056640625, 1.037261962890625, 1.148193359375, 1.259124755859375, 1.37005615234375, 1.480987548828125, 1.5919189453125, 1.702850341796875, 1.81378173828125, 1.924713134765625, 2.03564453125, 2.146575927734375, 2.25750732421875, 2.368438720703125, 2.4793701171875, 2.590301513671875, 2.70123291015625, 2.812164306640625, 2.923095703125, 3.034027099609375, 3.14495849609375, 3.255889892578125, 3.3668212890625, 3.477752685546875, 3.58868408203125, 3.699615478515625, 3.810546875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 5.0, 4.0, 6.0, 2.0, 4.0, 6.0, 12.0, 10.0, 9.0, 13.0, 15.0, 23.0, 17.0, 19.0, 27.0, 28.0, 52.0, 42.0, 48.0, 51.0, 52.0, 37.0, 38.0, 44.0, 43.0, 60.0, 40.0, 37.0, 32.0, 31.0, 22.0, 37.0, 17.0, 27.0, 21.0, 15.0, 13.0, 9.0, 11.0, 6.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-2.9296875, -2.84210205078125, -2.7545166015625, -2.66693115234375, -2.579345703125, -2.49176025390625, -2.4041748046875, -2.31658935546875, -2.22900390625, -2.14141845703125, -2.0538330078125, -1.96624755859375, -1.878662109375, -1.79107666015625, -1.7034912109375, -1.61590576171875, -1.5283203125, -1.44073486328125, -1.3531494140625, -1.26556396484375, -1.177978515625, -1.09039306640625, -1.0028076171875, -0.91522216796875, -0.82763671875, -0.74005126953125, -0.6524658203125, -0.56488037109375, -0.477294921875, -0.38970947265625, -0.3021240234375, -0.21453857421875, -0.126953125, -0.03936767578125, 0.0482177734375, 0.13580322265625, 0.223388671875, 0.31097412109375, 0.3985595703125, 0.48614501953125, 0.57373046875, 0.66131591796875, 0.7489013671875, 0.83648681640625, 0.924072265625, 1.01165771484375, 1.0992431640625, 1.18682861328125, 1.2744140625, 1.36199951171875, 1.4495849609375, 1.53717041015625, 1.624755859375, 1.71234130859375, 1.7999267578125, 1.88751220703125, 1.97509765625, 2.06268310546875, 2.1502685546875, 2.23785400390625, 2.325439453125, 2.41302490234375, 2.5006103515625, 2.58819580078125, 2.67578125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 3.0, 7.0, 13.0, 13.0, 8.0, 26.0, 28.0, 37.0, 61.0, 91.0, 136.0, 179.0, 315.0, 490.0, 861.0, 1752.0, 4633.0, 21735.0, 328157.0, 3669564.0, 145257.0, 14042.0, 3467.0, 1407.0, 725.0, 448.0, 273.0, 184.0, 117.0, 76.0, 46.0, 38.0, 26.0, 19.0, 16.0, 8.0, 6.0, 5.0, 8.0, 2.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-11.03125, -10.71044921875, -10.3896484375, -10.06884765625, -9.748046875, -9.42724609375, -9.1064453125, -8.78564453125, -8.46484375, -8.14404296875, -7.8232421875, -7.50244140625, -7.181640625, -6.86083984375, -6.5400390625, -6.21923828125, -5.8984375, -5.57763671875, -5.2568359375, -4.93603515625, -4.615234375, -4.29443359375, -3.9736328125, -3.65283203125, -3.33203125, -3.01123046875, -2.6904296875, -2.36962890625, -2.048828125, -1.72802734375, -1.4072265625, -1.08642578125, -0.765625, -0.44482421875, -0.1240234375, 0.19677734375, 0.517578125, 0.83837890625, 1.1591796875, 1.47998046875, 1.80078125, 2.12158203125, 2.4423828125, 2.76318359375, 3.083984375, 3.40478515625, 3.7255859375, 4.04638671875, 4.3671875, 4.68798828125, 5.0087890625, 5.32958984375, 5.650390625, 5.97119140625, 6.2919921875, 6.61279296875, 6.93359375, 7.25439453125, 7.5751953125, 7.89599609375, 8.216796875, 8.53759765625, 8.8583984375, 9.17919921875, 9.5]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 8.0, 7.0, 6.0, 6.0, 13.0, 11.0, 22.0, 21.0, 37.0, 38.0, 55.0, 79.0, 96.0, 120.0, 166.0, 208.0, 263.0, 318.0, 402.0, 429.0, 374.0, 335.0, 256.0, 193.0, 132.0, 108.0, 76.0, 67.0, 37.0, 48.0, 37.0, 33.0, 25.0, 14.0, 5.0, 6.0, 7.0, 4.0, 4.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.296875, -6.09130859375, -5.8857421875, -5.68017578125, -5.474609375, -5.26904296875, -5.0634765625, -4.85791015625, -4.65234375, -4.44677734375, -4.2412109375, -4.03564453125, -3.830078125, -3.62451171875, -3.4189453125, -3.21337890625, -3.0078125, -2.80224609375, -2.5966796875, -2.39111328125, -2.185546875, -1.97998046875, -1.7744140625, -1.56884765625, -1.36328125, -1.15771484375, -0.9521484375, -0.74658203125, -0.541015625, -0.33544921875, -0.1298828125, 0.07568359375, 0.28125, 0.48681640625, 0.6923828125, 0.89794921875, 1.103515625, 1.30908203125, 1.5146484375, 1.72021484375, 1.92578125, 2.13134765625, 2.3369140625, 2.54248046875, 2.748046875, 2.95361328125, 3.1591796875, 3.36474609375, 3.5703125, 3.77587890625, 3.9814453125, 4.18701171875, 4.392578125, 4.59814453125, 4.8037109375, 5.00927734375, 5.21484375, 5.42041015625, 5.6259765625, 5.83154296875, 6.037109375, 6.24267578125, 6.4482421875, 6.65380859375, 6.859375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 11.0, 24.0, 46.0, 93.0, 163.0, 230.0, 205.0, 114.0, 58.0, 24.0, 14.0, 9.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-167.76553344726562, -163.6645050048828, -159.56349182128906, -155.46246337890625, -151.36143493652344, -147.26040649414062, -143.15939331054688, -139.05836486816406, -134.95733642578125, -130.85630798339844, -126.75528717041016, -122.65426635742188, -118.55323791503906, -114.45221710205078, -110.3511962890625, -106.25016784667969, -102.14915466308594, -98.04813385009766, -93.94710540771484, -89.84608459472656, -85.74505615234375, -81.64403533935547, -77.54301452636719, -73.44198608398438, -69.3409652709961, -65.23994445800781, -61.138916015625, -57.03789520263672, -52.93687057495117, -48.835845947265625, -44.734825134277344, -40.6338005065918, -36.53276824951172, -32.43174362182617, -28.330720901489258, -24.229698181152344, -20.128673553466797, -16.02764892578125, -11.926626205444336, -7.825603485107422, -3.724578857421875, 0.37644481658935547, 4.477468490600586, 8.578492164611816, 12.679515838623047, 16.780540466308594, 20.881563186645508, 24.982585906982422, 29.08361053466797, 33.184635162353516, 37.28565979003906, 41.386680603027344, 45.48770523071289, 49.58872985839844, 53.68975067138672, 57.790775299072266, 61.89179992675781, 65.9928207397461, 70.0938491821289, 74.19486999511719, 78.2958984375, 82.39691925048828, 86.49794006347656, 90.59896850585938, 94.69998931884766]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 9.0, 3.0, 6.0, 11.0, 25.0, 22.0, 27.0, 28.0, 42.0, 49.0, 47.0, 60.0, 83.0, 76.0, 67.0, 61.0, 75.0, 52.0, 50.0, 52.0, 31.0, 37.0, 36.0, 15.0, 13.0, 9.0, 7.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.98268127441406, -64.82744598388672, -62.672218322753906, -60.51698303222656, -58.361751556396484, -56.206520080566406, -54.05128479003906, -51.896053314208984, -49.740821838378906, -47.58559036254883, -45.43035888671875, -43.275123596191406, -41.11989212036133, -38.96466064453125, -36.809425354003906, -34.65419387817383, -32.49896240234375, -30.343730926513672, -28.18849754333496, -26.03326416015625, -23.878032684326172, -21.722801208496094, -19.567567825317383, -17.412334442138672, -15.257102966308594, -13.1018705368042, -10.946638107299805, -8.79140567779541, -6.636173248291016, -4.480940818786621, -2.3257083892822266, -0.17047595977783203, 1.9847564697265625, 4.139988899230957, 6.295221328735352, 8.450453758239746, 10.60568618774414, 12.760918617248535, 14.91615104675293, 17.07138442993164, 19.22661590576172, 21.381847381591797, 23.537080764770508, 25.69231414794922, 27.847545623779297, 30.002777099609375, 32.15801239013672, 34.3132438659668, 36.468475341796875, 38.62370681762695, 40.77893829345703, 42.934173583984375, 45.08940505981445, 47.24463653564453, 49.399871826171875, 51.55510330200195, 53.71033477783203, 55.86556625366211, 58.02079772949219, 60.17603302001953, 62.33126449584961, 64.48649597167969, 66.64173126220703, 68.79695892333984, 70.95219421386719]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 7.0, 3.0, 5.0, 11.0, 20.0, 24.0, 26.0, 54.0, 98.0, 173.0, 263.0, 480.0, 913.0, 1605.0, 3395.0, 8687.0, 25333.0, 96059.0, 584222.0, 248584.0, 52054.0, 15495.0, 5784.0, 2515.0, 1220.0, 672.0, 351.0, 190.0, 124.0, 68.0, 38.0, 22.0, 21.0, 12.0, 5.0, 4.0, 7.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.921875, -4.771728515625, -4.62158203125, -4.471435546875, -4.3212890625, -4.171142578125, -4.02099609375, -3.870849609375, -3.720703125, -3.570556640625, -3.42041015625, -3.270263671875, -3.1201171875, -2.969970703125, -2.81982421875, -2.669677734375, -2.51953125, -2.369384765625, -2.21923828125, -2.069091796875, -1.9189453125, -1.768798828125, -1.61865234375, -1.468505859375, -1.318359375, -1.168212890625, -1.01806640625, -0.867919921875, -0.7177734375, -0.567626953125, -0.41748046875, -0.267333984375, -0.1171875, 0.032958984375, 0.18310546875, 0.333251953125, 0.4833984375, 0.633544921875, 0.78369140625, 0.933837890625, 1.083984375, 1.234130859375, 1.38427734375, 1.534423828125, 1.6845703125, 1.834716796875, 1.98486328125, 2.135009765625, 2.28515625, 2.435302734375, 2.58544921875, 2.735595703125, 2.8857421875, 3.035888671875, 3.18603515625, 3.336181640625, 3.486328125, 3.636474609375, 3.78662109375, 3.936767578125, 4.0869140625, 4.237060546875, 4.38720703125, 4.537353515625, 4.6875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 0.0, 7.0, 5.0, 13.0, 18.0, 16.0, 21.0, 27.0, 42.0, 45.0, 39.0, 65.0, 71.0, 75.0, 90.0, 88.0, 77.0, 58.0, 66.0, 28.0, 43.0, 44.0, 24.0, 13.0, 16.0, 8.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0, -4.841064453125, -4.68212890625, -4.523193359375, -4.3642578125, -4.205322265625, -4.04638671875, -3.887451171875, -3.728515625, -3.569580078125, -3.41064453125, -3.251708984375, -3.0927734375, -2.933837890625, -2.77490234375, -2.615966796875, -2.45703125, -2.298095703125, -2.13916015625, -1.980224609375, -1.8212890625, -1.662353515625, -1.50341796875, -1.344482421875, -1.185546875, -1.026611328125, -0.86767578125, -0.708740234375, -0.5498046875, -0.390869140625, -0.23193359375, -0.072998046875, 0.0859375, 0.244873046875, 0.40380859375, 0.562744140625, 0.7216796875, 0.880615234375, 1.03955078125, 1.198486328125, 1.357421875, 1.516357421875, 1.67529296875, 1.834228515625, 1.9931640625, 2.152099609375, 2.31103515625, 2.469970703125, 2.62890625, 2.787841796875, 2.94677734375, 3.105712890625, 3.2646484375, 3.423583984375, 3.58251953125, 3.741455078125, 3.900390625, 4.059326171875, 4.21826171875, 4.377197265625, 4.5361328125, 4.695068359375, 4.85400390625, 5.012939453125, 5.171875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 10.0, 7.0, 19.0, 10.0, 16.0, 34.0, 40.0, 53.0, 65.0, 125.0, 179.0, 341.0, 622.0, 1718.0, 7822.0, 98020.0, 907861.0, 25738.0, 3546.0, 1150.0, 465.0, 228.0, 171.0, 100.0, 76.0, 43.0, 20.0, 25.0, 17.0, 11.0, 9.0, 3.0, 10.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.51953125, -7.26263427734375, -7.0057373046875, -6.74884033203125, -6.491943359375, -6.23504638671875, -5.9781494140625, -5.72125244140625, -5.46435546875, -5.20745849609375, -4.9505615234375, -4.69366455078125, -4.436767578125, -4.17987060546875, -3.9229736328125, -3.66607666015625, -3.4091796875, -3.15228271484375, -2.8953857421875, -2.63848876953125, -2.381591796875, -2.12469482421875, -1.8677978515625, -1.61090087890625, -1.35400390625, -1.09710693359375, -0.8402099609375, -0.58331298828125, -0.326416015625, -0.06951904296875, 0.1873779296875, 0.44427490234375, 0.701171875, 0.95806884765625, 1.2149658203125, 1.47186279296875, 1.728759765625, 1.98565673828125, 2.2425537109375, 2.49945068359375, 2.75634765625, 3.01324462890625, 3.2701416015625, 3.52703857421875, 3.783935546875, 4.04083251953125, 4.2977294921875, 4.55462646484375, 4.8115234375, 5.06842041015625, 5.3253173828125, 5.58221435546875, 5.839111328125, 6.09600830078125, 6.3529052734375, 6.60980224609375, 6.86669921875, 7.12359619140625, 7.3804931640625, 7.63739013671875, 7.894287109375, 8.15118408203125, 8.4080810546875, 8.66497802734375, 8.921875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 3.0, 4.0, 9.0, 7.0, 12.0, 6.0, 10.0, 15.0, 17.0, 28.0, 23.0, 29.0, 23.0, 27.0, 47.0, 47.0, 55.0, 73.0, 86.0, 72.0, 58.0, 65.0, 43.0, 27.0, 27.0, 29.0, 19.0, 21.0, 14.0, 18.0, 13.0, 17.0, 8.0, 15.0, 6.0, 3.0, 4.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-11.9609375, -11.5833740234375, -11.205810546875, -10.8282470703125, -10.45068359375, -10.0731201171875, -9.695556640625, -9.3179931640625, -8.9404296875, -8.5628662109375, -8.185302734375, -7.8077392578125, -7.43017578125, -7.0526123046875, -6.675048828125, -6.2974853515625, -5.919921875, -5.5423583984375, -5.164794921875, -4.7872314453125, -4.40966796875, -4.0321044921875, -3.654541015625, -3.2769775390625, -2.8994140625, -2.5218505859375, -2.144287109375, -1.7667236328125, -1.38916015625, -1.0115966796875, -0.634033203125, -0.2564697265625, 0.12109375, 0.4986572265625, 0.876220703125, 1.2537841796875, 1.63134765625, 2.0089111328125, 2.386474609375, 2.7640380859375, 3.1416015625, 3.5191650390625, 3.896728515625, 4.2742919921875, 4.65185546875, 5.0294189453125, 5.406982421875, 5.7845458984375, 6.162109375, 6.5396728515625, 6.917236328125, 7.2947998046875, 7.67236328125, 8.0499267578125, 8.427490234375, 8.8050537109375, 9.1826171875, 9.5601806640625, 9.937744140625, 10.3153076171875, 10.69287109375, 11.0704345703125, 11.447998046875, 11.8255615234375, 12.203125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 4.0, 7.0, 6.0, 2.0, 7.0, 10.0, 9.0, 12.0, 18.0, 23.0, 36.0, 61.0, 53.0, 94.0, 167.0, 285.0, 536.0, 1105.0, 2818.0, 8800.0, 36208.0, 790874.0, 173207.0, 23664.0, 6316.0, 2153.0, 921.0, 435.0, 237.0, 141.0, 91.0, 60.0, 46.0, 36.0, 22.0, 28.0, 14.0, 11.0, 7.0, 11.0, 4.0, 4.0, 4.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.92919921875, -0.9000396728515625, -0.870880126953125, -0.8417205810546875, -0.81256103515625, -0.7834014892578125, -0.754241943359375, -0.7250823974609375, -0.6959228515625, -0.6667633056640625, -0.637603759765625, -0.6084442138671875, -0.57928466796875, -0.5501251220703125, -0.520965576171875, -0.4918060302734375, -0.462646484375, -0.4334869384765625, -0.404327392578125, -0.3751678466796875, -0.34600830078125, -0.3168487548828125, -0.287689208984375, -0.2585296630859375, -0.2293701171875, -0.2002105712890625, -0.171051025390625, -0.1418914794921875, -0.11273193359375, -0.0835723876953125, -0.054412841796875, -0.0252532958984375, 0.00390625, 0.0330657958984375, 0.062225341796875, 0.0913848876953125, 0.12054443359375, 0.1497039794921875, 0.178863525390625, 0.2080230712890625, 0.2371826171875, 0.2663421630859375, 0.295501708984375, 0.3246612548828125, 0.35382080078125, 0.3829803466796875, 0.412139892578125, 0.4412994384765625, 0.470458984375, 0.4996185302734375, 0.528778076171875, 0.5579376220703125, 0.58709716796875, 0.6162567138671875, 0.645416259765625, 0.6745758056640625, 0.7037353515625, 0.7328948974609375, 0.762054443359375, 0.7912139892578125, 0.82037353515625, 0.8495330810546875, 0.878692626953125, 0.9078521728515625, 0.93701171875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 6.0, 1.0, 2.0, 4.0, 9.0, 9.0, 6.0, 6.0, 11.0, 14.0, 15.0, 23.0, 21.0, 43.0, 80.0, 87.0, 132.0, 139.0, 133.0, 59.0, 55.0, 28.0, 21.0, 15.0, 13.0, 12.0, 12.0, 10.0, 6.0, 4.0, 3.0, 5.0, 2.0, 4.0, 2.0, 5.0, 6.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00023698806762695312, -0.00023003295063972473, -0.00022307783365249634, -0.00021612271666526794, -0.00020916759967803955, -0.00020221248269081116, -0.00019525736570358276, -0.00018830224871635437, -0.00018134713172912598, -0.00017439201474189758, -0.0001674368977546692, -0.0001604817807674408, -0.0001535266637802124, -0.000146571546792984, -0.00013961642980575562, -0.00013266131281852722, -0.00012570619583129883, -0.00011875107884407043, -0.00011179596185684204, -0.00010484084486961365, -9.788572788238525e-05, -9.093061089515686e-05, -8.397549390792847e-05, -7.702037692070007e-05, -7.006525993347168e-05, -6.311014294624329e-05, -5.615502595901489e-05, -4.91999089717865e-05, -4.2244791984558105e-05, -3.528967499732971e-05, -2.833455801010132e-05, -2.1379441022872925e-05, -1.4424324035644531e-05, -7.469207048416138e-06, -5.140900611877441e-07, 6.441026926040649e-06, 1.3396143913269043e-05, 2.0351260900497437e-05, 2.730637788772583e-05, 3.4261494874954224e-05, 4.121661186218262e-05, 4.817172884941101e-05, 5.5126845836639404e-05, 6.20819628238678e-05, 6.903707981109619e-05, 7.599219679832458e-05, 8.294731378555298e-05, 8.990243077278137e-05, 9.685754776000977e-05, 0.00010381266474723816, 0.00011076778173446655, 0.00011772289872169495, 0.00012467801570892334, 0.00013163313269615173, 0.00013858824968338013, 0.00014554336667060852, 0.00015249848365783691, 0.0001594536006450653, 0.0001664087176322937, 0.0001733638346195221, 0.0001803189516067505, 0.00018727406859397888, 0.00019422918558120728, 0.00020118430256843567, 0.00020813941955566406]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 8.0, 3.0, 4.0, 7.0, 7.0, 13.0, 26.0, 25.0, 43.0, 84.0, 118.0, 182.0, 310.0, 577.0, 1197.0, 2713.0, 6756.0, 19802.0, 88340.0, 828801.0, 71168.0, 17448.0, 6084.0, 2431.0, 1099.0, 501.0, 299.0, 183.0, 97.0, 83.0, 48.0, 34.0, 23.0, 23.0, 9.0, 5.0, 5.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6923828125, -0.66619873046875, -0.6400146484375, -0.61383056640625, -0.587646484375, -0.56146240234375, -0.5352783203125, -0.50909423828125, -0.48291015625, -0.45672607421875, -0.4305419921875, -0.40435791015625, -0.378173828125, -0.35198974609375, -0.3258056640625, -0.29962158203125, -0.2734375, -0.24725341796875, -0.2210693359375, -0.19488525390625, -0.168701171875, -0.14251708984375, -0.1163330078125, -0.09014892578125, -0.06396484375, -0.03778076171875, -0.0115966796875, 0.01458740234375, 0.040771484375, 0.06695556640625, 0.0931396484375, 0.11932373046875, 0.1455078125, 0.17169189453125, 0.1978759765625, 0.22406005859375, 0.250244140625, 0.27642822265625, 0.3026123046875, 0.32879638671875, 0.35498046875, 0.38116455078125, 0.4073486328125, 0.43353271484375, 0.459716796875, 0.48590087890625, 0.5120849609375, 0.53826904296875, 0.564453125, 0.59063720703125, 0.6168212890625, 0.64300537109375, 0.669189453125, 0.69537353515625, 0.7215576171875, 0.74774169921875, 0.77392578125, 0.80010986328125, 0.8262939453125, 0.85247802734375, 0.878662109375, 0.90484619140625, 0.9310302734375, 0.95721435546875, 0.9833984375]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 5.0, 1.0, 3.0, 3.0, 9.0, 5.0, 5.0, 6.0, 5.0, 14.0, 18.0, 14.0, 17.0, 25.0, 28.0, 36.0, 43.0, 69.0, 100.0, 84.0, 94.0, 84.0, 74.0, 54.0, 44.0, 42.0, 24.0, 23.0, 14.0, 7.0, 13.0, 4.0, 3.0, 9.0, 1.0, 8.0, 4.0, 2.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.8134765625, -0.7845001220703125, -0.755523681640625, -0.7265472412109375, -0.69757080078125, -0.6685943603515625, -0.639617919921875, -0.6106414794921875, -0.5816650390625, -0.5526885986328125, -0.523712158203125, -0.4947357177734375, -0.46575927734375, -0.4367828369140625, -0.407806396484375, -0.3788299560546875, -0.349853515625, -0.3208770751953125, -0.291900634765625, -0.2629241943359375, -0.23394775390625, -0.2049713134765625, -0.175994873046875, -0.1470184326171875, -0.1180419921875, -0.0890655517578125, -0.060089111328125, -0.0311126708984375, -0.00213623046875, 0.0268402099609375, 0.055816650390625, 0.0847930908203125, 0.11376953125, 0.1427459716796875, 0.171722412109375, 0.2006988525390625, 0.22967529296875, 0.2586517333984375, 0.287628173828125, 0.3166046142578125, 0.3455810546875, 0.3745574951171875, 0.403533935546875, 0.4325103759765625, 0.46148681640625, 0.4904632568359375, 0.519439697265625, 0.5484161376953125, 0.577392578125, 0.6063690185546875, 0.635345458984375, 0.6643218994140625, 0.69329833984375, 0.7222747802734375, 0.751251220703125, 0.7802276611328125, 0.8092041015625, 0.8381805419921875, 0.867156982421875, 0.8961334228515625, 0.92510986328125, 0.9540863037109375, 0.983062744140625, 1.0120391845703125, 1.041015625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 1.0, 11.0, 8.0, 8.0, 25.0, 33.0, 75.0, 77.0, 470.0, 133.0, 68.0, 39.0, 20.0, 14.0, 12.0, 5.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-57.608524322509766, -56.29075622558594, -54.97298812866211, -53.65522003173828, -52.33745193481445, -51.019683837890625, -49.7019157409668, -48.38414764404297, -47.06637954711914, -45.74861145019531, -44.430843353271484, -43.113075256347656, -41.79530715942383, -40.4775390625, -39.15977096557617, -37.842002868652344, -36.524234771728516, -35.20646667480469, -33.88869857788086, -32.57093048095703, -31.253162384033203, -29.935394287109375, -28.617626190185547, -27.29985809326172, -25.98208999633789, -24.664321899414062, -23.346553802490234, -22.028785705566406, -20.711017608642578, -19.39324951171875, -18.075481414794922, -16.757713317871094, -15.439943313598633, -14.122175216674805, -12.804407119750977, -11.486639022827148, -10.16887092590332, -8.851102828979492, -7.533334732055664, -6.215566635131836, -4.897798538208008, -3.5800304412841797, -2.2622623443603516, -0.9444942474365234, 0.3732738494873047, 1.6910419464111328, 3.008810043334961, 4.326578140258789, 5.644346237182617, 6.962114334106445, 8.279882431030273, 9.597650527954102, 10.91541862487793, 12.233186721801758, 13.550954818725586, 14.868722915649414, 16.186491012573242, 17.50425910949707, 18.8220272064209, 20.139795303344727, 21.457563400268555, 22.775331497192383, 24.09309959411621, 25.41086769104004, 26.728635787963867]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 6.0, 8.0, 6.0, 9.0, 4.0, 8.0, 5.0, 12.0, 19.0, 12.0, 20.0, 17.0, 28.0, 25.0, 31.0, 53.0, 187.0, 245.0, 68.0, 34.0, 17.0, 28.0, 25.0, 19.0, 10.0, 18.0, 11.0, 12.0, 14.0, 10.0, 13.0, 8.0, 7.0, 8.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-39.02647399902344, -37.91628646850586, -36.80609893798828, -35.69590759277344, -34.58572006225586, -33.47553253173828, -32.3653450012207, -31.255157470703125, -30.144969940185547, -29.03478240966797, -27.924592971801758, -26.81440544128418, -25.7042179107666, -24.59402847290039, -23.483840942382812, -22.373653411865234, -21.263463973999023, -20.153276443481445, -19.043087005615234, -17.932899475097656, -16.822711944580078, -15.712523460388184, -14.602334976196289, -13.492147445678711, -12.381958961486816, -11.271770477294922, -10.161582946777344, -9.05139446258545, -7.941206455230713, -6.831018447875977, -5.720829963684082, -4.610641956329346, -3.5004539489746094, -2.390265941619873, -1.2800776958465576, -0.1698894500732422, 0.9402985572814941, 2.0504865646362305, 3.160675048828125, 4.270863056182861, 5.381051063537598, 6.491239070892334, 7.60142707824707, 8.711615562438965, 9.82180404663086, 10.931991577148438, 12.042180061340332, 13.152368545532227, 14.262556076049805, 15.3727445602417, 16.482933044433594, 17.593120574951172, 18.70330810546875, 19.813495635986328, 20.92368507385254, 22.033872604370117, 23.144062042236328, 24.254249572753906, 25.364439010620117, 26.474626541137695, 27.584814071655273, 28.695003509521484, 29.805191040039062, 30.91537857055664, 32.02556610107422]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 3.0, 5.0, 7.0, 8.0, 7.0, 7.0, 10.0, 10.0, 15.0, 13.0, 13.0, 27.0, 24.0, 27.0, 22.0, 33.0, 52.0, 133.0, 263.0, 51.0, 48.0, 30.0, 27.0, 26.0, 25.0, 16.0, 20.0, 12.0, 13.0, 8.0, 13.0, 8.0, 12.0, 5.0, 3.0, 3.0, 4.0, 2.0, 0.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.564453125, -2.4698486328125, -2.375244140625, -2.2806396484375, -2.18603515625, -2.0914306640625, -1.996826171875, -1.9022216796875, -1.8076171875, -1.7130126953125, -1.618408203125, -1.5238037109375, -1.42919921875, -1.3345947265625, -1.239990234375, -1.1453857421875, -1.05078125, -0.9561767578125, -0.861572265625, -0.7669677734375, -0.67236328125, -0.5777587890625, -0.483154296875, -0.3885498046875, -0.2939453125, -0.1993408203125, -0.104736328125, -0.0101318359375, 0.08447265625, 0.1790771484375, 0.273681640625, 0.3682861328125, 0.462890625, 0.5574951171875, 0.652099609375, 0.7467041015625, 0.84130859375, 0.9359130859375, 1.030517578125, 1.1251220703125, 1.2197265625, 1.3143310546875, 1.408935546875, 1.5035400390625, 1.59814453125, 1.6927490234375, 1.787353515625, 1.8819580078125, 1.9765625, 2.0711669921875, 2.165771484375, 2.2603759765625, 2.35498046875, 2.4495849609375, 2.544189453125, 2.6387939453125, 2.7333984375, 2.8280029296875, 2.922607421875, 3.0172119140625, 3.11181640625, 3.2064208984375, 3.301025390625, 3.3956298828125, 3.490234375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 2.0, 7.0, 7.0, 9.0, 6.0, 14.0, 24.0, 22.0, 20.0, 38.0, 76.0, 156.0, 304.0, 883.0, 3139.0, 18342.0, 8345895.0, 15550.0, 2710.0, 753.0, 286.0, 126.0, 68.0, 36.0, 39.0, 20.0, 9.0, 14.0, 7.0, 2.0, 3.0, 5.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.041444778442383, -30.08550453186035, -29.129562377929688, -28.173622131347656, -27.217681884765625, -26.26173973083496, -25.30579948425293, -24.349857330322266, -23.393917083740234, -22.437976837158203, -21.48203468322754, -20.526094436645508, -19.570152282714844, -18.614212036132812, -17.65827178955078, -16.70233154296875, -15.746389389038086, -14.790448188781738, -13.83450698852539, -12.87856674194336, -11.922625541687012, -10.966684341430664, -10.010744094848633, -9.054802894592285, -8.098861694335938, -7.14292049407959, -6.1869797706604, -5.231039047241211, -4.275097846984863, -3.3191566467285156, -2.363215923309326, -1.4072751998901367, -0.4513359069824219, 0.5046050548553467, 1.4605460166931152, 2.416486978530884, 3.3724279403686523, 4.328369140625, 5.2843098640441895, 6.240250587463379, 7.196191787719727, 8.152132987976074, 9.108074188232422, 10.064014434814453, 11.0199556350708, 11.975896835327148, 12.93183708190918, 13.887778282165527, 14.843719482421875, 15.799660682678223, 16.75560188293457, 17.7115421295166, 18.667484283447266, 19.623424530029297, 20.579364776611328, 21.53530502319336, 22.491247177124023, 23.447187423706055, 24.40312957763672, 25.35906982421875, 26.31501007080078, 27.270952224731445, 28.226892471313477, 29.18283462524414, 30.138774871826172]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 6.0, 2.0, 1.0, 2.0, 5.0, 4.0, 3.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 2.0, 1.0, 5.0, 3.0, 5.0, 4.0, 2.0, 2.0, 4.0, 5.0, 2.0, 1.0, 3.0, 1.0, 4.0, 1.0, 2.0, 1.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-21.394025802612305, -20.409008026123047, -19.423988342285156, -18.438968658447266, -17.453950881958008, -16.46893310546875, -15.48391342163086, -14.498894691467285, -13.513875961303711, -12.528857231140137, -11.543838500976562, -10.558819770812988, -9.573801040649414, -8.58878231048584, -7.603763580322266, -6.618744850158691, -5.633726119995117, -4.648707389831543, -3.6636886596679688, -2.6786699295043945, -1.6936511993408203, -0.7086324691772461, 0.2763862609863281, 1.2614049911499023, 2.2464237213134766, 3.231442451477051, 4.216461181640625, 5.201479911804199, 6.186498641967773, 7.171517372131348, 8.156536102294922, 9.141554832458496, 10.126571655273438, 11.111590385437012, 12.096609115600586, 13.08162784576416, 14.066646575927734, 15.051665306091309, 16.036684036254883, 17.02170181274414, 18.00672149658203, 18.991741180419922, 19.97675895690918, 20.961776733398438, 21.946796417236328, 22.93181610107422, 23.916833877563477, 24.901851654052734, 25.886871337890625, 26.871891021728516, 27.856908798217773, 28.84192657470703, 29.826946258544922, 30.811965942382812, 31.79698371887207, 32.78200149536133, 33.76702117919922, 34.75204086303711, 35.737060546875, 36.722076416015625, 37.707096099853516, 38.692115783691406, 39.67713165283203, 40.66215133666992, 41.64717102050781]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 3.0, 5.0, 5.0, 6.0, 6.0, 19.0, 18.0, 40.0, 47.0, 48.0, 92.0, 112.0, 196.0, 362.0, 758.0, 1829.0, 5762.0, 22359.0, 100170.0, 259073.0, 101110.0, 22860.0, 5921.0, 1782.0, 724.0, 341.0, 198.0, 131.0, 63.0, 52.0, 42.0, 36.0, 24.0, 18.0, 12.0, 12.0, 11.0, 8.0, 4.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.65625, -30.6513671875, -29.646484375, -28.6416015625, -27.63671875, -26.6318359375, -25.626953125, -24.6220703125, -23.6171875, -22.6123046875, -21.607421875, -20.6025390625, -19.59765625, -18.5927734375, -17.587890625, -16.5830078125, -15.578125, -14.5732421875, -13.568359375, -12.5634765625, -11.55859375, -10.5537109375, -9.548828125, -8.5439453125, -7.5390625, -6.5341796875, -5.529296875, -4.5244140625, -3.51953125, -2.5146484375, -1.509765625, -0.5048828125, 0.5, 1.5048828125, 2.509765625, 3.5146484375, 4.51953125, 5.5244140625, 6.529296875, 7.5341796875, 8.5390625, 9.5439453125, 10.548828125, 11.5537109375, 12.55859375, 13.5634765625, 14.568359375, 15.5732421875, 16.578125, 17.5830078125, 18.587890625, 19.5927734375, 20.59765625, 21.6025390625, 22.607421875, 23.6123046875, 24.6171875, 25.6220703125, 26.626953125, 27.6318359375, 28.63671875, 29.6416015625, 30.646484375, 31.6513671875, 32.65625]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 6.0, 2.0, 10.0, 9.0, 8.0, 14.0, 16.0, 42.0, 41.0, 72.0, 72.0, 94.0, 116.0, 98.0, 109.0, 71.0, 54.0, 59.0, 28.0, 27.0, 21.0, 13.0, 9.0, 6.0, 2.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.6484375, -5.47711181640625, -5.3057861328125, -5.13446044921875, -4.963134765625, -4.79180908203125, -4.6204833984375, -4.44915771484375, -4.27783203125, -4.10650634765625, -3.9351806640625, -3.76385498046875, -3.592529296875, -3.42120361328125, -3.2498779296875, -3.07855224609375, -2.9072265625, -2.73590087890625, -2.5645751953125, -2.39324951171875, -2.221923828125, -2.05059814453125, -1.8792724609375, -1.70794677734375, -1.53662109375, -1.36529541015625, -1.1939697265625, -1.02264404296875, -0.851318359375, -0.67999267578125, -0.5086669921875, -0.33734130859375, -0.166015625, 0.00531005859375, 0.1766357421875, 0.34796142578125, 0.519287109375, 0.69061279296875, 0.8619384765625, 1.03326416015625, 1.20458984375, 1.37591552734375, 1.5472412109375, 1.71856689453125, 1.889892578125, 2.06121826171875, 2.2325439453125, 2.40386962890625, 2.5751953125, 2.74652099609375, 2.9178466796875, 3.08917236328125, 3.260498046875, 3.43182373046875, 3.6031494140625, 3.77447509765625, 3.94580078125, 4.11712646484375, 4.2884521484375, 4.45977783203125, 4.631103515625, 4.80242919921875, 4.9737548828125, 5.14508056640625, 5.31640625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 3.0, 6.0, 3.0, 3.0, 5.0, 7.0, 16.0, 13.0, 51.0, 87.0, 81.0, 74.0, 57.0, 32.0, 11.0, 6.0, 7.0, 3.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.850107192993164, -29.01944351196289, -28.188779830932617, -27.358116149902344, -26.527454376220703, -25.696788787841797, -24.866127014160156, -24.035463333129883, -23.20479965209961, -22.374135971069336, -21.543472290039062, -20.71280860900879, -19.882144927978516, -19.051483154296875, -18.2208194732666, -17.390155792236328, -16.559492111206055, -15.728828430175781, -14.898164749145508, -14.06750202178955, -13.236838340759277, -12.406174659729004, -11.575511932373047, -10.744848251342773, -9.9141845703125, -9.083520889282227, -8.252857208251953, -7.422194480895996, -6.591530799865723, -5.760867118835449, -4.930203914642334, -4.099540710449219, -3.268878936767578, -2.438215494155884, -1.6075520515441895, -0.7768886089324951, 0.05377483367919922, 0.8844385147094727, 1.715101718902588, 2.545764923095703, 3.3764286041259766, 4.20709228515625, 5.037755489349365, 5.8684186935424805, 6.699082374572754, 7.529746055603027, 8.360408782958984, 9.191072463989258, 10.021736145019531, 10.852399826049805, 11.683063507080078, 12.513726234436035, 13.344389915466309, 14.175053596496582, 15.005716323852539, 15.836380004882812, 16.667043685913086, 17.49770736694336, 18.328371047973633, 19.159034729003906, 19.989696502685547, 20.820362091064453, 21.651023864746094, 22.481687545776367, 23.31235122680664]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 3.0, 8.0, 6.0, 3.0, 8.0, 10.0, 13.0, 34.0, 52.0, 106.0, 93.0, 53.0, 42.0, 12.0, 7.0, 6.0, 5.0, 7.0, 2.0, 7.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.420063018798828, -19.75213623046875, -19.084209442138672, -18.416282653808594, -17.748355865478516, -17.080429077148438, -16.41250228881836, -15.744576454162598, -15.07664966583252, -14.408722877502441, -13.740796089172363, -13.072870254516602, -12.404943466186523, -11.737016677856445, -11.069089889526367, -10.401163101196289, -9.733236312866211, -9.065309524536133, -8.397382736206055, -7.729456424713135, -7.061529636383057, -6.3936028480529785, -5.725676536560059, -5.0577497482299805, -4.389822959899902, -3.721896171569824, -3.053969621658325, -2.386043071746826, -1.718116283416748, -1.05018949508667, -0.38226318359375, 0.2856636047363281, 0.9535903930664062, 1.6215170621871948, 2.2894437313079834, 2.9573702812194824, 3.6252970695495605, 4.293223857879639, 4.961150169372559, 5.629076957702637, 6.297003746032715, 6.964930534362793, 7.632857322692871, 8.300783157348633, 8.968709945678711, 9.636636734008789, 10.304563522338867, 10.972490310668945, 11.640417098999023, 12.308343887329102, 12.97627067565918, 13.644197463989258, 14.312124252319336, 14.980051040649414, 15.647976875305176, 16.315902709960938, 16.983829498291016, 17.651756286621094, 18.319683074951172, 18.98760986328125, 19.655536651611328, 20.323463439941406, 20.991390228271484, 21.659317016601562, 22.32724380493164]}, "eval/loss": 5.716084003448486, "eval/wer": 1.322015073383578, "eval/runtime": 866.8999, "eval/samples_per_second": 3.048, "eval/steps_per_second": 0.382} \ No newline at end of file