diff --git "a/wandb/run-20220323_161301-3mj7aa54/files/wandb-summary.json" "b/wandb/run-20220323_161301-3mj7aa54/files/wandb-summary.json" new file mode 100644--- /dev/null +++ "b/wandb/run-20220323_161301-3mj7aa54/files/wandb-summary.json" @@ -0,0 +1 @@ +{"train/loss": 0.3634, "train/learning_rate": 7.776056338028169e-06, "train/epoch": 18.82, "train/global_step": 16787, "_runtime": 2686, "_timestamp": 1648054667, "_step": 286, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 2.0, 5.0, 9.0, 13.0, 9.0, 13.0, 15.0, 18.0, 20.0, 19.0, 20.0, 22.0, 28.0, 35.0, 25.0, 44.0, 38.0, 54.0, 42.0, 44.0, 40.0, 44.0, 54.0, 37.0, 39.0, 44.0, 36.0, 42.0, 24.0, 25.0, 27.0, 20.0, 17.0, 15.0, 8.0, 13.0, 10.0, 11.0, 2.0, 3.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.655754566192627, -5.5245280265808105, -5.393301486968994, -5.262075424194336, -5.1308488845825195, -4.999622344970703, -4.868395805358887, -4.73716926574707, -4.605942726135254, -4.4747161865234375, -4.343489646911621, -4.212263107299805, -4.0810370445251465, -3.94981050491333, -3.8185839653015137, -3.6873574256896973, -3.55613112449646, -3.4249045848846436, -3.2936782836914062, -3.16245174407959, -3.0312252044677734, -2.899998664855957, -2.7687723636627197, -2.6375458240509033, -2.506319522857666, -2.3750929832458496, -2.2438666820526123, -2.112640142440796, -1.9814136028289795, -1.8501871824264526, -1.7189607620239258, -1.5877342224121094, -1.456507921218872, -1.3252815008163452, -1.1940549612045288, -1.062828540802002, -0.9316020607948303, -0.8003755807876587, -0.6691491603851318, -0.5379226803779602, -0.4066962003707886, -0.27546972036361694, -0.1442432701587677, -0.013016819953918457, 0.11820966005325317, 0.2494361400604248, 0.38066256046295166, 0.5118890404701233, 0.6431155204772949, 0.7743420004844666, 0.9055684804916382, 1.036794900894165, 1.1680214405059814, 1.2992478609085083, 1.4304742813110352, 1.5617008209228516, 1.6929272413253784, 1.8241536617279053, 1.9553802013397217, 2.086606502532959, 2.2178330421447754, 2.349059581756592, 2.480286121368408, 2.6115124225616455, 2.742738962173462]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 8.0, 5.0, 10.0, 14.0, 16.0, 17.0, 17.0, 24.0, 27.0, 35.0, 29.0, 33.0, 32.0, 37.0, 38.0, 46.0, 34.0, 39.0, 38.0, 42.0, 41.0, 51.0, 51.0, 36.0, 34.0, 36.0, 40.0, 25.0, 27.0, 15.0, 16.0, 11.0, 18.0, 14.0, 11.0, 8.0, 8.0, 2.0, 4.0, 4.0, 1.0, 3.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.057716369628906, -3.9166476726531982, -3.7755789756774902, -3.6345102787017822, -3.493441581726074, -3.352372884750366, -3.211304187774658, -3.070235252380371, -2.929166793823242, -2.788098096847534, -2.647029399871826, -2.505960702896118, -2.36489200592041, -2.223823308944702, -2.082754611968994, -1.9416857957839966, -1.800616979598999, -1.659548282623291, -1.518479585647583, -1.377410888671875, -1.236342191696167, -1.095273494720459, -0.9542046785354614, -0.8131359815597534, -0.6720672845840454, -0.5309985876083374, -0.389929860830307, -0.2488611340522766, -0.1077924370765686, 0.033276259899139404, 0.1743450164794922, 0.3154137134552002, 0.4564824104309082, 0.5975511074066162, 0.7386198043823242, 0.879688560962677, 1.0207571983337402, 1.1618258953094482, 1.3028947114944458, 1.4439634084701538, 1.5850321054458618, 1.7261008024215698, 1.8671694993972778, 2.0082383155822754, 2.1493070125579834, 2.2903757095336914, 2.4314444065093994, 2.5725131034851074, 2.7135818004608154, 2.8546504974365234, 2.9957191944122314, 3.1367878913879395, 3.2778565883636475, 3.4189252853393555, 3.5599942207336426, 3.7010626792907715, 3.8421316146850586, 3.9832003116607666, 4.124269008636475, 4.265337944030762, 4.406406402587891, 4.547475337982178, 4.688543796539307, 4.829612731933594, 4.970681190490723]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 9.0, 11.0, 8.0, 37.0, 35.0, 47.0, 92.0, 112.0, 181.0, 290.0, 446.0, 683.0, 1119.0, 1806.0, 2827.0, 4758.0, 7913.0, 12625.0, 20931.0, 35301.0, 58179.0, 98564.0, 166089.0, 278674.0, 450927.0, 649480.0, 736007.0, 620385.0, 416763.0, 255713.0, 151498.0, 89635.0, 53836.0, 31428.0, 18807.0, 11288.0, 6900.0, 4206.0, 2522.0, 1566.0, 932.0, 585.0, 376.0, 222.0, 187.0, 84.0, 72.0, 52.0, 28.0, 20.0, 11.0, 3.0, 9.0, 8.0, 5.0, 2.0, 0.0, 2.0], "bins": [-6.0546875, -5.86785888671875, -5.6810302734375, -5.49420166015625, -5.307373046875, -5.12054443359375, -4.9337158203125, -4.74688720703125, -4.56005859375, -4.37322998046875, -4.1864013671875, -3.99957275390625, -3.812744140625, -3.62591552734375, -3.4390869140625, -3.25225830078125, -3.0654296875, -2.87860107421875, -2.6917724609375, -2.50494384765625, -2.318115234375, -2.13128662109375, -1.9444580078125, -1.75762939453125, -1.57080078125, -1.38397216796875, -1.1971435546875, -1.01031494140625, -0.823486328125, -0.63665771484375, -0.4498291015625, -0.26300048828125, -0.076171875, 0.11065673828125, 0.2974853515625, 0.48431396484375, 0.671142578125, 0.85797119140625, 1.0447998046875, 1.23162841796875, 1.41845703125, 1.60528564453125, 1.7921142578125, 1.97894287109375, 2.165771484375, 2.35260009765625, 2.5394287109375, 2.72625732421875, 2.9130859375, 3.09991455078125, 3.2867431640625, 3.47357177734375, 3.660400390625, 3.84722900390625, 4.0340576171875, 4.22088623046875, 4.40771484375, 4.59454345703125, 4.7813720703125, 4.96820068359375, 5.155029296875, 5.34185791015625, 5.5286865234375, 5.71551513671875, 5.90234375]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 7.0, 8.0, 10.0, 9.0, 13.0, 19.0, 18.0, 17.0, 12.0, 21.0, 24.0, 32.0, 36.0, 35.0, 28.0, 42.0, 33.0, 35.0, 47.0, 41.0, 42.0, 35.0, 47.0, 47.0, 40.0, 46.0, 30.0, 32.0, 27.0, 28.0, 22.0, 13.0, 20.0, 21.0, 6.0, 10.0, 13.0, 14.0, 5.0, 6.0, 6.0, 2.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.08203125, -3.94256591796875, -3.8031005859375, -3.66363525390625, -3.524169921875, -3.38470458984375, -3.2452392578125, -3.10577392578125, -2.96630859375, -2.82684326171875, -2.6873779296875, -2.54791259765625, -2.408447265625, -2.26898193359375, -2.1295166015625, -1.99005126953125, -1.8505859375, -1.71112060546875, -1.5716552734375, -1.43218994140625, -1.292724609375, -1.15325927734375, -1.0137939453125, -0.87432861328125, -0.73486328125, -0.59539794921875, -0.4559326171875, -0.31646728515625, -0.177001953125, -0.03753662109375, 0.1019287109375, 0.24139404296875, 0.380859375, 0.52032470703125, 0.6597900390625, 0.79925537109375, 0.938720703125, 1.07818603515625, 1.2176513671875, 1.35711669921875, 1.49658203125, 1.63604736328125, 1.7755126953125, 1.91497802734375, 2.054443359375, 2.19390869140625, 2.3333740234375, 2.47283935546875, 2.6123046875, 2.75177001953125, 2.8912353515625, 3.03070068359375, 3.170166015625, 3.30963134765625, 3.4490966796875, 3.58856201171875, 3.72802734375, 3.86749267578125, 4.0069580078125, 4.14642333984375, 4.285888671875, 4.42535400390625, 4.5648193359375, 4.70428466796875, 4.84375]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [4.0, 3.0, 3.0, 4.0, 4.0, 10.0, 13.0, 21.0, 31.0, 43.0, 96.0, 134.0, 181.0, 303.0, 483.0, 707.0, 1179.0, 1840.0, 2906.0, 4630.0, 7392.0, 11852.0, 18652.0, 29769.0, 47624.0, 74913.0, 117111.0, 178156.0, 266190.0, 375802.0, 492822.0, 565990.0, 549723.0, 452118.0, 335048.0, 231798.0, 154415.0, 99647.0, 63806.0, 40222.0, 25504.0, 16201.0, 9998.0, 6257.0, 3948.0, 2499.0, 1567.0, 980.0, 620.0, 435.0, 220.0, 143.0, 106.0, 79.0, 32.0, 22.0, 25.0, 9.0, 4.0, 4.0, 1.0, 1.0, 3.0, 1.0], "bins": [-4.1953125, -4.0634765625, -3.931640625, -3.7998046875, -3.66796875, -3.5361328125, -3.404296875, -3.2724609375, -3.140625, -3.0087890625, -2.876953125, -2.7451171875, -2.61328125, -2.4814453125, -2.349609375, -2.2177734375, -2.0859375, -1.9541015625, -1.822265625, -1.6904296875, -1.55859375, -1.4267578125, -1.294921875, -1.1630859375, -1.03125, -0.8994140625, -0.767578125, -0.6357421875, -0.50390625, -0.3720703125, -0.240234375, -0.1083984375, 0.0234375, 0.1552734375, 0.287109375, 0.4189453125, 0.55078125, 0.6826171875, 0.814453125, 0.9462890625, 1.078125, 1.2099609375, 1.341796875, 1.4736328125, 1.60546875, 1.7373046875, 1.869140625, 2.0009765625, 2.1328125, 2.2646484375, 2.396484375, 2.5283203125, 2.66015625, 2.7919921875, 2.923828125, 3.0556640625, 3.1875, 3.3193359375, 3.451171875, 3.5830078125, 3.71484375, 3.8466796875, 3.978515625, 4.1103515625, 4.2421875]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 4.0, 1.0, 3.0, 1.0, 3.0, 5.0, 3.0, 2.0, 8.0, 10.0, 7.0, 18.0, 9.0, 20.0, 19.0, 25.0, 47.0, 58.0, 65.0, 66.0, 86.0, 98.0, 116.0, 133.0, 163.0, 186.0, 190.0, 200.0, 219.0, 243.0, 201.0, 234.0, 249.0, 182.0, 187.0, 157.0, 142.0, 134.0, 108.0, 91.0, 75.0, 60.0, 45.0, 46.0, 39.0, 31.0, 33.0, 18.0, 17.0, 11.0, 9.0, 5.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.013671875, -1.95294189453125, -1.8922119140625, -1.83148193359375, -1.770751953125, -1.71002197265625, -1.6492919921875, -1.58856201171875, -1.52783203125, -1.46710205078125, -1.4063720703125, -1.34564208984375, -1.284912109375, -1.22418212890625, -1.1634521484375, -1.10272216796875, -1.0419921875, -0.98126220703125, -0.9205322265625, -0.85980224609375, -0.799072265625, -0.73834228515625, -0.6776123046875, -0.61688232421875, -0.55615234375, -0.49542236328125, -0.4346923828125, -0.37396240234375, -0.313232421875, -0.25250244140625, -0.1917724609375, -0.13104248046875, -0.0703125, -0.00958251953125, 0.0511474609375, 0.11187744140625, 0.172607421875, 0.23333740234375, 0.2940673828125, 0.35479736328125, 0.41552734375, 0.47625732421875, 0.5369873046875, 0.59771728515625, 0.658447265625, 0.71917724609375, 0.7799072265625, 0.84063720703125, 0.9013671875, 0.96209716796875, 1.0228271484375, 1.08355712890625, 1.144287109375, 1.20501708984375, 1.2657470703125, 1.32647705078125, 1.38720703125, 1.44793701171875, 1.5086669921875, 1.56939697265625, 1.630126953125, 1.69085693359375, 1.7515869140625, 1.81231689453125, 1.873046875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 6.0, 6.0, 6.0, 5.0, 9.0, 11.0, 11.0, 21.0, 13.0, 13.0, 31.0, 25.0, 27.0, 33.0, 29.0, 25.0, 34.0, 44.0, 47.0, 42.0, 37.0, 39.0, 40.0, 55.0, 45.0, 33.0, 33.0, 33.0, 35.0, 31.0, 34.0, 35.0, 10.0, 19.0, 17.0, 16.0, 12.0, 7.0, 8.0, 6.0, 6.0, 1.0, 8.0, 2.0, 1.0, 1.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.198858261108398, -4.0521440505981445, -3.9054298400878906, -3.7587156295776367, -3.612001419067383, -3.465287208557129, -3.318572998046875, -3.171858787536621, -3.025144577026367, -2.8784303665161133, -2.7317161560058594, -2.5850019454956055, -2.4382877349853516, -2.2915735244750977, -2.1448593139648438, -1.9981449842453003, -1.8514306545257568, -1.704716444015503, -1.558002233505249, -1.4112880229949951, -1.2645738124847412, -1.1178596019744873, -0.9711452722549438, -0.8244310617446899, -0.677716851234436, -0.5310026407241821, -0.38428840041160583, -0.23757416009902954, -0.09085994958877563, 0.05585426092147827, 0.20256853103637695, 0.34928274154663086, 0.49599695205688477, 0.6427111625671387, 0.7894253730773926, 0.9361396431922913, 1.0828537940979004, 1.2295680046081543, 1.3762823343276978, 1.5229965448379517, 1.6697107553482056, 1.8164249658584595, 1.9631391763687134, 2.109853506088257, 2.2565677165985107, 2.4032819271087646, 2.5499961376190186, 2.6967103481292725, 2.8434245586395264, 2.9901387691497803, 3.136852979660034, 3.283567190170288, 3.430281400680542, 3.576995611190796, 3.723710060119629, 3.870424270629883, 4.017138481140137, 4.163852691650391, 4.3105669021606445, 4.457281112670898, 4.603995323181152, 4.750709533691406, 4.89742374420166, 5.044137954711914, 5.190852165222168]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 5.0, 7.0, 7.0, 9.0, 10.0, 10.0, 18.0, 15.0, 19.0, 25.0, 23.0, 35.0, 31.0, 39.0, 25.0, 35.0, 30.0, 43.0, 53.0, 41.0, 41.0, 42.0, 42.0, 38.0, 43.0, 32.0, 37.0, 26.0, 34.0, 28.0, 23.0, 25.0, 21.0, 20.0, 17.0, 13.0, 10.0, 3.0, 8.0, 8.0, 5.0, 4.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.785914421081543, -4.6350555419921875, -4.484196662902832, -4.333337306976318, -4.182478427886963, -4.031619548797607, -3.880760669708252, -3.7299017906188965, -3.579042673110962, -3.4281837940216064, -3.277324676513672, -3.1264657974243164, -2.975606918334961, -2.8247478008270264, -2.673888921737671, -2.5230298042297363, -2.372170925140381, -2.2213120460510254, -2.070452928543091, -1.9195940494537354, -1.7687350511550903, -1.6178760528564453, -1.4670171737670898, -1.3161581754684448, -1.1652991771697998, -1.0144401788711548, -0.8635812401771545, -0.7127223014831543, -0.5618633031845093, -0.41100430488586426, -0.260145366191864, -0.10928642749786377, 0.04157304763793945, 0.19243201613426208, 0.3432909846305847, 0.49414995312690735, 0.64500892162323, 0.795867919921875, 0.9467268586158752, 1.0975857973098755, 1.2484447956085205, 1.3993037939071655, 1.5501627922058105, 1.701021671295166, 1.851880669593811, 2.002739667892456, 2.1535985469818115, 2.304457664489746, 2.4553165435791016, 2.606175422668457, 2.7570345401763916, 2.907893419265747, 3.0587525367736816, 3.209611415863037, 3.3604702949523926, 3.511329174041748, 3.6621882915496826, 3.813047170639038, 3.9639062881469727, 4.114765167236328, 4.265624046325684, 4.416482925415039, 4.567342281341553, 4.718201160430908, 4.869060039520264]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 5.0, 13.0, 7.0, 18.0, 30.0, 38.0, 64.0, 74.0, 115.0, 176.0, 260.0, 347.0, 568.0, 884.0, 1378.0, 1996.0, 3246.0, 5166.0, 8361.0, 13732.0, 22405.0, 36949.0, 60220.0, 94359.0, 136522.0, 165930.0, 159633.0, 122151.0, 81415.0, 51156.0, 30985.0, 19134.0, 11490.0, 7165.0, 4467.0, 2770.0, 1895.0, 1220.0, 701.0, 505.0, 336.0, 230.0, 147.0, 89.0, 73.0, 43.0, 34.0, 26.0, 11.0, 7.0, 8.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.71484375, -1.6626129150390625, -1.610382080078125, -1.5581512451171875, -1.50592041015625, -1.4536895751953125, -1.401458740234375, -1.3492279052734375, -1.2969970703125, -1.2447662353515625, -1.192535400390625, -1.1403045654296875, -1.08807373046875, -1.0358428955078125, -0.983612060546875, -0.9313812255859375, -0.879150390625, -0.8269195556640625, -0.774688720703125, -0.7224578857421875, -0.67022705078125, -0.6179962158203125, -0.565765380859375, -0.5135345458984375, -0.4613037109375, -0.4090728759765625, -0.356842041015625, -0.3046112060546875, -0.25238037109375, -0.2001495361328125, -0.147918701171875, -0.0956878662109375, -0.04345703125, 0.0087738037109375, 0.061004638671875, 0.1132354736328125, 0.16546630859375, 0.2176971435546875, 0.269927978515625, 0.3221588134765625, 0.3743896484375, 0.4266204833984375, 0.478851318359375, 0.5310821533203125, 0.58331298828125, 0.6355438232421875, 0.687774658203125, 0.7400054931640625, 0.792236328125, 0.8444671630859375, 0.896697998046875, 0.9489288330078125, 1.00115966796875, 1.0533905029296875, 1.105621337890625, 1.1578521728515625, 1.2100830078125, 1.2623138427734375, 1.314544677734375, 1.3667755126953125, 1.41900634765625, 1.4712371826171875, 1.523468017578125, 1.5756988525390625, 1.6279296875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 0.0, 4.0, 5.0, 7.0, 4.0, 6.0, 7.0, 14.0, 10.0, 9.0, 13.0, 12.0, 16.0, 24.0, 14.0, 30.0, 34.0, 39.0, 28.0, 25.0, 36.0, 32.0, 42.0, 39.0, 42.0, 46.0, 39.0, 25.0, 51.0, 28.0, 36.0, 34.0, 30.0, 18.0, 21.0, 27.0, 30.0, 24.0, 22.0, 12.0, 14.0, 5.0, 8.0, 9.0, 8.0, 5.0, 5.0, 7.0, 2.0, 4.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1015625, -3.9619140625, -3.822265625, -3.6826171875, -3.54296875, -3.4033203125, -3.263671875, -3.1240234375, -2.984375, -2.8447265625, -2.705078125, -2.5654296875, -2.42578125, -2.2861328125, -2.146484375, -2.0068359375, -1.8671875, -1.7275390625, -1.587890625, -1.4482421875, -1.30859375, -1.1689453125, -1.029296875, -0.8896484375, -0.75, -0.6103515625, -0.470703125, -0.3310546875, -0.19140625, -0.0517578125, 0.087890625, 0.2275390625, 0.3671875, 0.5068359375, 0.646484375, 0.7861328125, 0.92578125, 1.0654296875, 1.205078125, 1.3447265625, 1.484375, 1.6240234375, 1.763671875, 1.9033203125, 2.04296875, 2.1826171875, 2.322265625, 2.4619140625, 2.6015625, 2.7412109375, 2.880859375, 3.0205078125, 3.16015625, 3.2998046875, 3.439453125, 3.5791015625, 3.71875, 3.8583984375, 3.998046875, 4.1376953125, 4.27734375, 4.4169921875, 4.556640625, 4.6962890625, 4.8359375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 6.0, 5.0, 4.0, 5.0, 3.0, 12.0, 11.0, 18.0, 25.0, 33.0, 44.0, 60.0, 108.0, 149.0, 290.0, 505.0, 1353.0, 3788.0, 12124.0, 47543.0, 906851.0, 55210.0, 13434.0, 4149.0, 1401.0, 632.0, 277.0, 178.0, 102.0, 75.0, 40.0, 32.0, 21.0, 23.0, 16.0, 4.0, 3.0, 4.0, 6.0, 7.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.76171875, -6.56011962890625, -6.3585205078125, -6.15692138671875, -5.955322265625, -5.75372314453125, -5.5521240234375, -5.35052490234375, -5.14892578125, -4.94732666015625, -4.7457275390625, -4.54412841796875, -4.342529296875, -4.14093017578125, -3.9393310546875, -3.73773193359375, -3.5361328125, -3.33453369140625, -3.1329345703125, -2.93133544921875, -2.729736328125, -2.52813720703125, -2.3265380859375, -2.12493896484375, -1.92333984375, -1.72174072265625, -1.5201416015625, -1.31854248046875, -1.116943359375, -0.91534423828125, -0.7137451171875, -0.51214599609375, -0.310546875, -0.10894775390625, 0.0926513671875, 0.29425048828125, 0.495849609375, 0.69744873046875, 0.8990478515625, 1.10064697265625, 1.30224609375, 1.50384521484375, 1.7054443359375, 1.90704345703125, 2.108642578125, 2.31024169921875, 2.5118408203125, 2.71343994140625, 2.9150390625, 3.11663818359375, 3.3182373046875, 3.51983642578125, 3.721435546875, 3.92303466796875, 4.1246337890625, 4.32623291015625, 4.52783203125, 4.72943115234375, 4.9310302734375, 5.13262939453125, 5.334228515625, 5.53582763671875, 5.7374267578125, 5.93902587890625, 6.140625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [4.0, 4.0, 1.0, 2.0, 4.0, 4.0, 4.0, 6.0, 2.0, 14.0, 9.0, 17.0, 13.0, 12.0, 17.0, 24.0, 24.0, 31.0, 20.0, 24.0, 32.0, 43.0, 42.0, 30.0, 35.0, 36.0, 42.0, 44.0, 26.0, 33.0, 36.0, 33.0, 34.0, 43.0, 27.0, 22.0, 31.0, 30.0, 25.0, 22.0, 22.0, 16.0, 11.0, 11.0, 12.0, 9.0, 2.0, 5.0, 7.0, 5.0, 2.0, 1.0, 3.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.7734375, -2.6728515625, -2.572265625, -2.4716796875, -2.37109375, -2.2705078125, -2.169921875, -2.0693359375, -1.96875, -1.8681640625, -1.767578125, -1.6669921875, -1.56640625, -1.4658203125, -1.365234375, -1.2646484375, -1.1640625, -1.0634765625, -0.962890625, -0.8623046875, -0.76171875, -0.6611328125, -0.560546875, -0.4599609375, -0.359375, -0.2587890625, -0.158203125, -0.0576171875, 0.04296875, 0.1435546875, 0.244140625, 0.3447265625, 0.4453125, 0.5458984375, 0.646484375, 0.7470703125, 0.84765625, 0.9482421875, 1.048828125, 1.1494140625, 1.25, 1.3505859375, 1.451171875, 1.5517578125, 1.65234375, 1.7529296875, 1.853515625, 1.9541015625, 2.0546875, 2.1552734375, 2.255859375, 2.3564453125, 2.45703125, 2.5576171875, 2.658203125, 2.7587890625, 2.859375, 2.9599609375, 3.060546875, 3.1611328125, 3.26171875, 3.3623046875, 3.462890625, 3.5634765625, 3.6640625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 5.0, 8.0, 11.0, 10.0, 9.0, 12.0, 11.0, 26.0, 51.0, 60.0, 92.0, 136.0, 213.0, 389.0, 660.0, 1300.0, 2649.0, 5561.0, 12723.0, 33236.0, 693507.0, 250922.0, 26676.0, 10805.0, 4719.0, 2212.0, 1092.0, 557.0, 344.0, 202.0, 112.0, 70.0, 55.0, 31.0, 23.0, 18.0, 13.0, 13.0, 7.0, 8.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75, -0.7257232666015625, -0.701446533203125, -0.6771697998046875, -0.65289306640625, -0.6286163330078125, -0.604339599609375, -0.5800628662109375, -0.5557861328125, -0.5315093994140625, -0.507232666015625, -0.4829559326171875, -0.45867919921875, -0.4344024658203125, -0.410125732421875, -0.3858489990234375, -0.361572265625, -0.3372955322265625, -0.313018798828125, -0.2887420654296875, -0.26446533203125, -0.2401885986328125, -0.215911865234375, -0.1916351318359375, -0.1673583984375, -0.1430816650390625, -0.118804931640625, -0.0945281982421875, -0.07025146484375, -0.0459747314453125, -0.021697998046875, 0.0025787353515625, 0.02685546875, 0.0511322021484375, 0.075408935546875, 0.0996856689453125, 0.12396240234375, 0.1482391357421875, 0.172515869140625, 0.1967926025390625, 0.2210693359375, 0.2453460693359375, 0.269622802734375, 0.2938995361328125, 0.31817626953125, 0.3424530029296875, 0.366729736328125, 0.3910064697265625, 0.415283203125, 0.4395599365234375, 0.463836669921875, 0.4881134033203125, 0.51239013671875, 0.5366668701171875, 0.560943603515625, 0.5852203369140625, 0.6094970703125, 0.6337738037109375, 0.658050537109375, 0.6823272705078125, 0.70660400390625, 0.7308807373046875, 0.755157470703125, 0.7794342041015625, 0.8037109375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 3.0, 8.0, 8.0, 15.0, 12.0, 14.0, 14.0, 11.0, 33.0, 40.0, 34.0, 51.0, 36.0, 53.0, 75.0, 78.0, 69.0, 66.0, 56.0, 48.0, 42.0, 40.0, 27.0, 26.0, 20.0, 22.0, 23.0, 16.0, 12.0, 7.0, 9.0, 7.0, 5.0, 4.0, 3.0, 3.0, 5.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5822391510009766e-05, -3.4634023904800415e-05, -3.3445656299591064e-05, -3.2257288694381714e-05, -3.106892108917236e-05, -2.9880553483963013e-05, -2.8692185878753662e-05, -2.750381827354431e-05, -2.631545066833496e-05, -2.512708306312561e-05, -2.393871545791626e-05, -2.275034785270691e-05, -2.156198024749756e-05, -2.0373612642288208e-05, -1.9185245037078857e-05, -1.7996877431869507e-05, -1.6808509826660156e-05, -1.5620142221450806e-05, -1.4431774616241455e-05, -1.3243407011032104e-05, -1.2055039405822754e-05, -1.0866671800613403e-05, -9.678304195404053e-06, -8.489936590194702e-06, -7.3015689849853516e-06, -6.113201379776001e-06, -4.92483377456665e-06, -3.7364661693573e-06, -2.5480985641479492e-06, -1.3597309589385986e-06, -1.7136335372924805e-07, 1.0170042514801025e-06, 2.205371856689453e-06, 3.3937394618988037e-06, 4.582107067108154e-06, 5.770474672317505e-06, 6.9588422775268555e-06, 8.147209882736206e-06, 9.335577487945557e-06, 1.0523945093154907e-05, 1.1712312698364258e-05, 1.2900680303573608e-05, 1.4089047908782959e-05, 1.527741551399231e-05, 1.646578311920166e-05, 1.765415072441101e-05, 1.884251832962036e-05, 2.0030885934829712e-05, 2.1219253540039062e-05, 2.2407621145248413e-05, 2.3595988750457764e-05, 2.4784356355667114e-05, 2.5972723960876465e-05, 2.7161091566085815e-05, 2.8349459171295166e-05, 2.9537826776504517e-05, 3.072619438171387e-05, 3.191456198692322e-05, 3.310292959213257e-05, 3.429129719734192e-05, 3.547966480255127e-05, 3.666803240776062e-05, 3.785640001296997e-05, 3.904476761817932e-05, 4.023313522338867e-05]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 5.0, 9.0, 5.0, 14.0, 16.0, 24.0, 46.0, 54.0, 67.0, 89.0, 107.0, 153.0, 210.0, 243.0, 315.0, 514.0, 667.0, 879.0, 1328.0, 1789.0, 2712.0, 4411.0, 7240.0, 12425.0, 22225.0, 40065.0, 72405.0, 125998.0, 194253.0, 209185.0, 149294.0, 87435.0, 48352.0, 26670.0, 14760.0, 8594.0, 5180.0, 3314.0, 2086.0, 1465.0, 1019.0, 781.0, 560.0, 409.0, 291.0, 233.0, 198.0, 138.0, 106.0, 77.0, 54.0, 38.0, 25.0, 13.0, 12.0, 2.0, 6.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.71435546875, -0.6921463012695312, -0.6699371337890625, -0.6477279663085938, -0.625518798828125, -0.6033096313476562, -0.5811004638671875, -0.5588912963867188, -0.53668212890625, -0.5144729614257812, -0.4922637939453125, -0.47005462646484375, -0.447845458984375, -0.42563629150390625, -0.4034271240234375, -0.38121795654296875, -0.3590087890625, -0.33679962158203125, -0.3145904541015625, -0.29238128662109375, -0.270172119140625, -0.24796295166015625, -0.2257537841796875, -0.20354461669921875, -0.18133544921875, -0.15912628173828125, -0.1369171142578125, -0.11470794677734375, -0.092498779296875, -0.07028961181640625, -0.0480804443359375, -0.02587127685546875, -0.003662109375, 0.01854705810546875, 0.0407562255859375, 0.06296539306640625, 0.085174560546875, 0.10738372802734375, 0.1295928955078125, 0.15180206298828125, 0.17401123046875, 0.19622039794921875, 0.2184295654296875, 0.24063873291015625, 0.262847900390625, 0.28505706787109375, 0.3072662353515625, 0.32947540283203125, 0.3516845703125, 0.37389373779296875, 0.3961029052734375, 0.41831207275390625, 0.440521240234375, 0.46273040771484375, 0.4849395751953125, 0.5071487426757812, 0.52935791015625, 0.5515670776367188, 0.5737762451171875, 0.5959854125976562, 0.618194580078125, 0.6404037475585938, 0.6626129150390625, 0.6848220825195312, 0.70703125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 4.0, 2.0, 7.0, 7.0, 7.0, 13.0, 20.0, 37.0, 52.0, 46.0, 57.0, 92.0, 81.0, 82.0, 101.0, 87.0, 66.0, 56.0, 38.0, 32.0, 25.0, 17.0, 20.0, 16.0, 10.0, 5.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.335205078125, -0.3249855041503906, -0.31476593017578125, -0.3045463562011719, -0.2943267822265625, -0.2841072082519531, -0.27388763427734375, -0.2636680603027344, -0.253448486328125, -0.24322891235351562, -0.23300933837890625, -0.22278976440429688, -0.2125701904296875, -0.20235061645507812, -0.19213104248046875, -0.18191146850585938, -0.17169189453125, -0.16147232055664062, -0.15125274658203125, -0.14103317260742188, -0.1308135986328125, -0.12059402465820312, -0.11037445068359375, -0.10015487670898438, -0.089935302734375, -0.07971572875976562, -0.06949615478515625, -0.059276580810546875, -0.0490570068359375, -0.038837432861328125, -0.02861785888671875, -0.018398284912109375, -0.0081787109375, 0.002040863037109375, 0.01226043701171875, 0.022480010986328125, 0.0326995849609375, 0.042919158935546875, 0.05313873291015625, 0.06335830688476562, 0.073577880859375, 0.08379745483398438, 0.09401702880859375, 0.10423660278320312, 0.1144561767578125, 0.12467575073242188, 0.13489532470703125, 0.14511489868164062, 0.15533447265625, 0.16555404663085938, 0.17577362060546875, 0.18599319458007812, 0.1962127685546875, 0.20643234252929688, 0.21665191650390625, 0.22687149047851562, 0.237091064453125, 0.24731063842773438, 0.25753021240234375, 0.2677497863769531, 0.2779693603515625, 0.2881889343261719, 0.29840850830078125, 0.3086280822753906, 0.31884765625]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 6.0, 7.0, 3.0, 6.0, 9.0, 11.0, 10.0, 19.0, 18.0, 16.0, 22.0, 37.0, 36.0, 29.0, 26.0, 36.0, 29.0, 43.0, 46.0, 48.0, 46.0, 36.0, 54.0, 51.0, 40.0, 37.0, 31.0, 34.0, 36.0, 31.0, 33.0, 18.0, 18.0, 12.0, 16.0, 15.0, 9.0, 7.0, 5.0, 3.0, 1.0, 7.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.499025344848633, -4.348140716552734, -4.197255611419678, -4.046370506286621, -3.8954858779907227, -3.744601011276245, -3.5937161445617676, -3.44283127784729, -3.2919464111328125, -3.141061544418335, -2.9901766777038574, -2.83929181098938, -2.6884069442749023, -2.537522077560425, -2.3866372108459473, -2.2357523441314697, -2.084867477416992, -1.9339826107025146, -1.783097743988037, -1.6322128772735596, -1.481328010559082, -1.3304431438446045, -1.179558277130127, -1.0286734104156494, -0.8777885437011719, -0.7269036769866943, -0.5760188102722168, -0.42513394355773926, -0.2742490768432617, -0.12336421012878418, 0.02752065658569336, 0.1784055233001709, 0.32928991317749023, 0.4801747798919678, 0.6310596466064453, 0.7819445133209229, 0.9328293800354004, 1.083714246749878, 1.2345991134643555, 1.385483980178833, 1.5363688468933105, 1.687253713607788, 1.8381385803222656, 1.9890234470367432, 2.1399083137512207, 2.2907931804656982, 2.441678047180176, 2.5925629138946533, 2.743447780609131, 2.8943326473236084, 3.045217514038086, 3.1961023807525635, 3.346987247467041, 3.4978721141815186, 3.648756980895996, 3.7996418476104736, 3.950526714324951, 4.101411819458008, 4.252296447753906, 4.403181076049805, 4.554066181182861, 4.704951286315918, 4.855835914611816, 5.006720542907715, 5.1576056480407715]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 4.0, 11.0, 7.0, 12.0, 13.0, 14.0, 20.0, 21.0, 22.0, 20.0, 46.0, 37.0, 30.0, 31.0, 36.0, 38.0, 54.0, 34.0, 50.0, 45.0, 42.0, 40.0, 36.0, 46.0, 34.0, 36.0, 28.0, 23.0, 32.0, 29.0, 21.0, 17.0, 13.0, 16.0, 10.0, 5.0, 7.0, 9.0, 2.0, 4.0, 2.0, 2.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.934784412384033, -4.780898094177246, -4.627011299133301, -4.473124980926514, -4.319238662719727, -4.1653523445129395, -4.011466026306152, -3.857579231262207, -3.70369291305542, -3.549806594848633, -3.3959200382232666, -3.2420334815979004, -3.0881471633911133, -2.934260845184326, -2.78037428855896, -2.6264877319335938, -2.4726014137268066, -2.3187150955200195, -2.1648285388946533, -2.010941982269287, -1.8570556640625, -1.7031692266464233, -1.5492827892303467, -1.39539635181427, -1.2415099143981934, -1.0876234769821167, -0.93373703956604, -0.7798506021499634, -0.6259641647338867, -0.47207772731781006, -0.3181912899017334, -0.16430485248565674, -0.010417938232421875, 0.14346849918365479, 0.29735493659973145, 0.4512413740158081, 0.6051278114318848, 0.7590142488479614, 0.9129006862640381, 1.0667871236801147, 1.2206735610961914, 1.374559998512268, 1.5284464359283447, 1.6823328733444214, 1.836219310760498, 1.9901057481765747, 2.1439921855926514, 2.2978787422180176, 2.4517650604248047, 2.605651378631592, 2.759537935256958, 2.913424491882324, 3.0673108100891113, 3.2211971282958984, 3.3750836849212646, 3.528970241546631, 3.682856559753418, 3.836742877960205, 3.9906294345855713, 4.1445159912109375, 4.298402309417725, 4.452288627624512, 4.606175422668457, 4.760061740875244, 4.913948059082031]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [5.0, 3.0, 3.0, 8.0, 6.0, 13.0, 26.0, 41.0, 69.0, 99.0, 147.0, 240.0, 324.0, 470.0, 824.0, 1209.0, 1780.0, 2669.0, 4155.0, 6169.0, 9208.0, 13745.0, 19962.0, 28103.0, 38199.0, 50839.0, 64784.0, 78505.0, 89840.0, 97509.0, 98458.0, 92629.0, 82597.0, 69210.0, 55169.0, 42079.0, 30842.0, 21781.0, 15532.0, 10502.0, 7110.0, 4683.0, 3113.0, 2050.0, 1338.0, 846.0, 535.0, 391.0, 249.0, 188.0, 115.0, 65.0, 47.0, 32.0, 27.0, 11.0, 8.0, 5.0, 1.0, 5.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.30078125, -3.191314697265625, -3.08184814453125, -2.972381591796875, -2.8629150390625, -2.753448486328125, -2.64398193359375, -2.534515380859375, -2.425048828125, -2.315582275390625, -2.20611572265625, -2.096649169921875, -1.9871826171875, -1.877716064453125, -1.76824951171875, -1.658782958984375, -1.54931640625, -1.439849853515625, -1.33038330078125, -1.220916748046875, -1.1114501953125, -1.001983642578125, -0.89251708984375, -0.783050537109375, -0.673583984375, -0.564117431640625, -0.45465087890625, -0.345184326171875, -0.2357177734375, -0.126251220703125, -0.01678466796875, 0.092681884765625, 0.2021484375, 0.311614990234375, 0.42108154296875, 0.530548095703125, 0.6400146484375, 0.749481201171875, 0.85894775390625, 0.968414306640625, 1.077880859375, 1.187347412109375, 1.29681396484375, 1.406280517578125, 1.5157470703125, 1.625213623046875, 1.73468017578125, 1.844146728515625, 1.95361328125, 2.063079833984375, 2.17254638671875, 2.282012939453125, 2.3914794921875, 2.500946044921875, 2.61041259765625, 2.719879150390625, 2.829345703125, 2.938812255859375, 3.04827880859375, 3.157745361328125, 3.2672119140625, 3.376678466796875, 3.48614501953125, 3.595611572265625, 3.705078125]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 8.0, 5.0, 7.0, 3.0, 7.0, 13.0, 9.0, 12.0, 14.0, 24.0, 19.0, 23.0, 29.0, 28.0, 19.0, 38.0, 34.0, 30.0, 36.0, 35.0, 49.0, 32.0, 37.0, 44.0, 35.0, 30.0, 46.0, 33.0, 28.0, 31.0, 26.0, 25.0, 30.0, 27.0, 18.0, 17.0, 20.0, 13.0, 9.0, 11.0, 14.0, 5.0, 6.0, 6.0, 5.0, 7.0, 3.0, 1.0, 1.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.03125, -3.89593505859375, -3.7606201171875, -3.62530517578125, -3.489990234375, -3.35467529296875, -3.2193603515625, -3.08404541015625, -2.94873046875, -2.81341552734375, -2.6781005859375, -2.54278564453125, -2.407470703125, -2.27215576171875, -2.1368408203125, -2.00152587890625, -1.8662109375, -1.73089599609375, -1.5955810546875, -1.46026611328125, -1.324951171875, -1.18963623046875, -1.0543212890625, -0.91900634765625, -0.78369140625, -0.64837646484375, -0.5130615234375, -0.37774658203125, -0.242431640625, -0.10711669921875, 0.0281982421875, 0.16351318359375, 0.298828125, 0.43414306640625, 0.5694580078125, 0.70477294921875, 0.840087890625, 0.97540283203125, 1.1107177734375, 1.24603271484375, 1.38134765625, 1.51666259765625, 1.6519775390625, 1.78729248046875, 1.922607421875, 2.05792236328125, 2.1932373046875, 2.32855224609375, 2.4638671875, 2.59918212890625, 2.7344970703125, 2.86981201171875, 3.005126953125, 3.14044189453125, 3.2757568359375, 3.41107177734375, 3.54638671875, 3.68170166015625, 3.8170166015625, 3.95233154296875, 4.087646484375, 4.22296142578125, 4.3582763671875, 4.49359130859375, 4.62890625]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 6.0, 4.0, 6.0, 10.0, 15.0, 28.0, 60.0, 86.0, 144.0, 225.0, 327.0, 529.0, 861.0, 1378.0, 2155.0, 3484.0, 5249.0, 8097.0, 12227.0, 18469.0, 26473.0, 37155.0, 50223.0, 65950.0, 81770.0, 94424.0, 102324.0, 103834.0, 96900.0, 84872.0, 69475.0, 54221.0, 40451.0, 28828.0, 19782.0, 13336.0, 9053.0, 5913.0, 3745.0, 2382.0, 1439.0, 1000.0, 622.0, 404.0, 231.0, 160.0, 96.0, 57.0, 33.0, 21.0, 13.0, 10.0, 3.0, 4.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.33984375, -4.20037841796875, -4.0609130859375, -3.92144775390625, -3.781982421875, -3.64251708984375, -3.5030517578125, -3.36358642578125, -3.22412109375, -3.08465576171875, -2.9451904296875, -2.80572509765625, -2.666259765625, -2.52679443359375, -2.3873291015625, -2.24786376953125, -2.1083984375, -1.96893310546875, -1.8294677734375, -1.69000244140625, -1.550537109375, -1.41107177734375, -1.2716064453125, -1.13214111328125, -0.99267578125, -0.85321044921875, -0.7137451171875, -0.57427978515625, -0.434814453125, -0.29534912109375, -0.1558837890625, -0.01641845703125, 0.123046875, 0.26251220703125, 0.4019775390625, 0.54144287109375, 0.680908203125, 0.82037353515625, 0.9598388671875, 1.09930419921875, 1.23876953125, 1.37823486328125, 1.5177001953125, 1.65716552734375, 1.796630859375, 1.93609619140625, 2.0755615234375, 2.21502685546875, 2.3544921875, 2.49395751953125, 2.6334228515625, 2.77288818359375, 2.912353515625, 3.05181884765625, 3.1912841796875, 3.33074951171875, 3.47021484375, 3.60968017578125, 3.7491455078125, 3.88861083984375, 4.028076171875, 4.16754150390625, 4.3070068359375, 4.44647216796875, 4.5859375]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 5.0, 5.0, 4.0, 6.0, 5.0, 9.0, 9.0, 19.0, 16.0, 12.0, 13.0, 28.0, 21.0, 28.0, 20.0, 22.0, 31.0, 36.0, 27.0, 39.0, 30.0, 38.0, 31.0, 50.0, 28.0, 37.0, 44.0, 49.0, 31.0, 30.0, 29.0, 30.0, 29.0, 22.0, 20.0, 24.0, 19.0, 17.0, 11.0, 11.0, 12.0, 10.0, 13.0, 8.0, 8.0, 3.0, 3.0, 4.0, 3.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.724609375, -2.63995361328125, -2.5552978515625, -2.47064208984375, -2.385986328125, -2.30133056640625, -2.2166748046875, -2.13201904296875, -2.04736328125, -1.96270751953125, -1.8780517578125, -1.79339599609375, -1.708740234375, -1.62408447265625, -1.5394287109375, -1.45477294921875, -1.3701171875, -1.28546142578125, -1.2008056640625, -1.11614990234375, -1.031494140625, -0.94683837890625, -0.8621826171875, -0.77752685546875, -0.69287109375, -0.60821533203125, -0.5235595703125, -0.43890380859375, -0.354248046875, -0.26959228515625, -0.1849365234375, -0.10028076171875, -0.015625, 0.06903076171875, 0.1536865234375, 0.23834228515625, 0.322998046875, 0.40765380859375, 0.4923095703125, 0.57696533203125, 0.66162109375, 0.74627685546875, 0.8309326171875, 0.91558837890625, 1.000244140625, 1.08489990234375, 1.1695556640625, 1.25421142578125, 1.3388671875, 1.42352294921875, 1.5081787109375, 1.59283447265625, 1.677490234375, 1.76214599609375, 1.8468017578125, 1.93145751953125, 2.01611328125, 2.10076904296875, 2.1854248046875, 2.27008056640625, 2.354736328125, 2.43939208984375, 2.5240478515625, 2.60870361328125, 2.693359375]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 6.0, 8.0, 22.0, 19.0, 17.0, 40.0, 47.0, 82.0, 108.0, 177.0, 241.0, 389.0, 585.0, 1003.0, 1543.0, 2496.0, 3786.0, 6104.0, 9616.0, 15325.0, 23690.0, 36496.0, 53990.0, 75523.0, 98762.0, 117852.0, 126705.0, 120659.0, 103616.0, 80476.0, 58169.0, 39909.0, 26187.0, 16331.0, 10370.0, 6704.0, 4171.0, 2720.0, 1676.0, 1113.0, 655.0, 425.0, 282.0, 178.0, 108.0, 62.0, 39.0, 29.0, 16.0, 17.0, 7.0, 4.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1943359375, -1.15106201171875, -1.1077880859375, -1.06451416015625, -1.021240234375, -0.97796630859375, -0.9346923828125, -0.89141845703125, -0.84814453125, -0.80487060546875, -0.7615966796875, -0.71832275390625, -0.675048828125, -0.63177490234375, -0.5885009765625, -0.54522705078125, -0.501953125, -0.45867919921875, -0.4154052734375, -0.37213134765625, -0.328857421875, -0.28558349609375, -0.2423095703125, -0.19903564453125, -0.15576171875, -0.11248779296875, -0.0692138671875, -0.02593994140625, 0.017333984375, 0.06060791015625, 0.1038818359375, 0.14715576171875, 0.1904296875, 0.23370361328125, 0.2769775390625, 0.32025146484375, 0.363525390625, 0.40679931640625, 0.4500732421875, 0.49334716796875, 0.53662109375, 0.57989501953125, 0.6231689453125, 0.66644287109375, 0.709716796875, 0.75299072265625, 0.7962646484375, 0.83953857421875, 0.8828125, 0.92608642578125, 0.9693603515625, 1.01263427734375, 1.055908203125, 1.09918212890625, 1.1424560546875, 1.18572998046875, 1.22900390625, 1.27227783203125, 1.3155517578125, 1.35882568359375, 1.402099609375, 1.44537353515625, 1.4886474609375, 1.53192138671875, 1.5751953125]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0, 5.0, 12.0, 6.0, 5.0, 10.0, 19.0, 25.0, 25.0, 22.0, 19.0, 29.0, 38.0, 54.0, 39.0, 54.0, 46.0, 51.0, 50.0, 63.0, 50.0, 55.0, 42.0, 43.0, 38.0, 29.0, 30.0, 28.0, 15.0, 30.0, 10.0, 14.0, 13.0, 8.0, 5.0, 3.0, 5.0, 1.0, 2.0, 7.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000171661376953125, -0.0001658555120229721, -0.00016004964709281921, -0.00015424378216266632, -0.00014843791723251343, -0.00014263205230236053, -0.00013682618737220764, -0.00013102032244205475, -0.00012521445751190186, -0.00011940859258174896, -0.00011360272765159607, -0.00010779686272144318, -0.00010199099779129028, -9.618513286113739e-05, -9.03792679309845e-05, -8.45734030008316e-05, -7.876753807067871e-05, -7.296167314052582e-05, -6.715580821037292e-05, -6.134994328022003e-05, -5.554407835006714e-05, -4.9738213419914246e-05, -4.393234848976135e-05, -3.812648355960846e-05, -3.2320618629455566e-05, -2.6514753699302673e-05, -2.070888876914978e-05, -1.4903023838996887e-05, -9.097158908843994e-06, -3.291293978691101e-06, 2.514570951461792e-06, 8.320435881614685e-06, 1.4126300811767578e-05, 1.993216574192047e-05, 2.5738030672073364e-05, 3.154389560222626e-05, 3.734976053237915e-05, 4.3155625462532043e-05, 4.8961490392684937e-05, 5.476735532283783e-05, 6.057322025299072e-05, 6.637908518314362e-05, 7.218495011329651e-05, 7.79908150434494e-05, 8.37966799736023e-05, 8.960254490375519e-05, 9.540840983390808e-05, 0.00010121427476406097, 0.00010702013969421387, 0.00011282600462436676, 0.00011863186955451965, 0.00012443773448467255, 0.00013024359941482544, 0.00013604946434497833, 0.00014185532927513123, 0.00014766119420528412, 0.000153467059135437, 0.0001592729240655899, 0.0001650787889957428, 0.0001708846539258957, 0.00017669051885604858, 0.00018249638378620148, 0.00018830224871635437, 0.00019410811364650726, 0.00019991397857666016]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 3.0, 9.0, 7.0, 15.0, 15.0, 32.0, 43.0, 54.0, 76.0, 140.0, 233.0, 352.0, 585.0, 1031.0, 1691.0, 3099.0, 5632.0, 10394.0, 19276.0, 34204.0, 59277.0, 94118.0, 133693.0, 162395.0, 161114.0, 133596.0, 93487.0, 58358.0, 33771.0, 18732.0, 10207.0, 5672.0, 3054.0, 1723.0, 958.0, 548.0, 338.0, 206.0, 124.0, 94.0, 68.0, 53.0, 31.0, 17.0, 10.0, 7.0, 8.0, 6.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.8603515625, -1.803955078125, -1.74755859375, -1.691162109375, -1.634765625, -1.578369140625, -1.52197265625, -1.465576171875, -1.4091796875, -1.352783203125, -1.29638671875, -1.239990234375, -1.18359375, -1.127197265625, -1.07080078125, -1.014404296875, -0.9580078125, -0.901611328125, -0.84521484375, -0.788818359375, -0.732421875, -0.676025390625, -0.61962890625, -0.563232421875, -0.5068359375, -0.450439453125, -0.39404296875, -0.337646484375, -0.28125, -0.224853515625, -0.16845703125, -0.112060546875, -0.0556640625, 0.000732421875, 0.05712890625, 0.113525390625, 0.169921875, 0.226318359375, 0.28271484375, 0.339111328125, 0.3955078125, 0.451904296875, 0.50830078125, 0.564697265625, 0.62109375, 0.677490234375, 0.73388671875, 0.790283203125, 0.8466796875, 0.903076171875, 0.95947265625, 1.015869140625, 1.072265625, 1.128662109375, 1.18505859375, 1.241455078125, 1.2978515625, 1.354248046875, 1.41064453125, 1.467041015625, 1.5234375, 1.579833984375, 1.63623046875, 1.692626953125, 1.7490234375]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 6.0, 1.0, 3.0, 5.0, 7.0, 10.0, 12.0, 13.0, 16.0, 18.0, 19.0, 32.0, 36.0, 28.0, 39.0, 42.0, 55.0, 57.0, 60.0, 58.0, 65.0, 64.0, 51.0, 57.0, 40.0, 42.0, 27.0, 29.0, 21.0, 26.0, 21.0, 10.0, 16.0, 6.0, 2.0, 2.0, 6.0, 4.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.83349609375, -0.810516357421875, -0.78753662109375, -0.764556884765625, -0.7415771484375, -0.718597412109375, -0.69561767578125, -0.672637939453125, -0.649658203125, -0.626678466796875, -0.60369873046875, -0.580718994140625, -0.5577392578125, -0.534759521484375, -0.51177978515625, -0.488800048828125, -0.4658203125, -0.442840576171875, -0.41986083984375, -0.396881103515625, -0.3739013671875, -0.350921630859375, -0.32794189453125, -0.304962158203125, -0.281982421875, -0.259002685546875, -0.23602294921875, -0.213043212890625, -0.1900634765625, -0.167083740234375, -0.14410400390625, -0.121124267578125, -0.09814453125, -0.075164794921875, -0.05218505859375, -0.029205322265625, -0.0062255859375, 0.016754150390625, 0.03973388671875, 0.062713623046875, 0.085693359375, 0.108673095703125, 0.13165283203125, 0.154632568359375, 0.1776123046875, 0.200592041015625, 0.22357177734375, 0.246551513671875, 0.26953125, 0.292510986328125, 0.31549072265625, 0.338470458984375, 0.3614501953125, 0.384429931640625, 0.40740966796875, 0.430389404296875, 0.453369140625, 0.476348876953125, 0.49932861328125, 0.522308349609375, 0.5452880859375, 0.568267822265625, 0.59124755859375, 0.614227294921875, 0.63720703125]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 7.0, 4.0, 6.0, 7.0, 9.0, 11.0, 15.0, 17.0, 14.0, 19.0, 25.0, 22.0, 25.0, 34.0, 36.0, 35.0, 36.0, 42.0, 42.0, 37.0, 35.0, 42.0, 38.0, 46.0, 47.0, 32.0, 52.0, 33.0, 25.0, 31.0, 27.0, 17.0, 27.0, 23.0, 16.0, 19.0, 13.0, 12.0, 3.0, 3.0, 8.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.585928440093994, -4.439441680908203, -4.292954921722412, -4.146468162536621, -3.99998140335083, -3.853494644165039, -3.707007646560669, -3.560520887374878, -3.414034128189087, -3.267547369003296, -3.121060609817505, -2.974573850631714, -2.8280868530273438, -2.6816000938415527, -2.5351133346557617, -2.3886265754699707, -2.2421398162841797, -2.0956530570983887, -1.9491662979125977, -1.802679419517517, -1.656192660331726, -1.509705901145935, -1.3632190227508545, -1.2167322635650635, -1.0702455043792725, -0.9237587451934814, -0.7772719264030457, -0.6307851076126099, -0.48429834842681885, -0.33781158924102783, -0.19132477045059204, -0.04483795166015625, 0.10164928436279297, 0.24813607335090637, 0.3946228623390198, 0.5411096811294556, 0.6875964403152466, 0.8340831995010376, 0.9805700182914734, 1.1270568370819092, 1.2735435962677002, 1.4200303554534912, 1.5665171146392822, 1.7130039930343628, 1.8594907522201538, 2.0059776306152344, 2.1524643898010254, 2.2989511489868164, 2.4454379081726074, 2.5919246673583984, 2.7384114265441895, 2.8848981857299805, 3.0313849449157715, 3.1778717041015625, 3.3243587017059326, 3.4708454608917236, 3.6173322200775146, 3.7638189792633057, 3.9103057384490967, 4.056792736053467, 4.203279495239258, 4.349766254425049, 4.49625301361084, 4.642739772796631, 4.789226531982422]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 4.0, 5.0, 11.0, 13.0, 12.0, 11.0, 20.0, 14.0, 27.0, 20.0, 28.0, 38.0, 40.0, 38.0, 28.0, 39.0, 44.0, 41.0, 48.0, 45.0, 40.0, 47.0, 41.0, 41.0, 32.0, 34.0, 35.0, 31.0, 31.0, 27.0, 15.0, 24.0, 18.0, 15.0, 11.0, 11.0, 3.0, 7.0, 8.0, 4.0, 1.0, 1.0, 2.0, 1.0, 4.0], "bins": [-6.228497505187988, -6.06591272354126, -5.903327465057373, -5.7407426834106445, -5.578157901763916, -5.4155731201171875, -5.252987861633301, -5.090403079986572, -4.927818298339844, -4.765233516693115, -4.6026482582092285, -4.4400634765625, -4.2774786949157715, -4.114893913269043, -3.9523086547851562, -3.7897238731384277, -3.627138614654541, -3.4645535945892334, -3.301968812942505, -3.1393837928771973, -2.9767990112304688, -2.814213991165161, -2.6516289710998535, -2.489044189453125, -2.3264591693878174, -2.1638741493225098, -2.0012893676757812, -1.8387043476104736, -1.6761194467544556, -1.5135345458984375, -1.3509495258331299, -1.1883646249771118, -1.025780200958252, -0.8631953001022339, -0.700610339641571, -0.5380253791809082, -0.37544047832489014, -0.21285557746887207, -0.05027061700820923, 0.11231434345245361, 0.2748992443084717, 0.43748417496681213, 0.6000691056251526, 0.7626540660858154, 0.9252389669418335, 1.0878238677978516, 1.2504088878631592, 1.4129937887191772, 1.5755786895751953, 1.7381635904312134, 1.9007484912872314, 2.063333511352539, 2.2259182929992676, 2.388503313064575, 2.551088333129883, 2.7136731147766113, 2.876258134841919, 3.0388431549072266, 3.201427936553955, 3.3640129566192627, 3.5265979766845703, 3.689182758331299, 3.8517677783966064, 4.014352798461914, 4.176937580108643]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 3.0, 10.0, 18.0, 29.0, 51.0, 76.0, 122.0, 202.0, 289.0, 465.0, 737.0, 1211.0, 1816.0, 2897.0, 4923.0, 7740.0, 12982.0, 21259.0, 36373.0, 60698.0, 103486.0, 176725.0, 297002.0, 472494.0, 651641.0, 715696.0, 600615.0, 411371.0, 251415.0, 147258.0, 87628.0, 50689.0, 30037.0, 17853.0, 10800.0, 6585.0, 4052.0, 2570.0, 1594.0, 1012.0, 680.0, 404.0, 272.0, 158.0, 121.0, 87.0, 47.0, 34.0, 22.0, 10.0, 9.0, 10.0, 6.0, 1.0, 5.0, 0.0, 0.0, 1.0], "bins": [-4.61328125, -4.466064453125, -4.31884765625, -4.171630859375, -4.0244140625, -3.877197265625, -3.72998046875, -3.582763671875, -3.435546875, -3.288330078125, -3.14111328125, -2.993896484375, -2.8466796875, -2.699462890625, -2.55224609375, -2.405029296875, -2.2578125, -2.110595703125, -1.96337890625, -1.816162109375, -1.6689453125, -1.521728515625, -1.37451171875, -1.227294921875, -1.080078125, -0.932861328125, -0.78564453125, -0.638427734375, -0.4912109375, -0.343994140625, -0.19677734375, -0.049560546875, 0.09765625, 0.244873046875, 0.39208984375, 0.539306640625, 0.6865234375, 0.833740234375, 0.98095703125, 1.128173828125, 1.275390625, 1.422607421875, 1.56982421875, 1.717041015625, 1.8642578125, 2.011474609375, 2.15869140625, 2.305908203125, 2.453125, 2.600341796875, 2.74755859375, 2.894775390625, 3.0419921875, 3.189208984375, 3.33642578125, 3.483642578125, 3.630859375, 3.778076171875, 3.92529296875, 4.072509765625, 4.2197265625, 4.366943359375, 4.51416015625, 4.661376953125, 4.80859375]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 13.0, 15.0, 12.0, 22.0, 21.0, 24.0, 30.0, 41.0, 34.0, 30.0, 42.0, 44.0, 47.0, 44.0, 54.0, 56.0, 47.0, 42.0, 50.0, 41.0, 36.0, 33.0, 42.0, 31.0, 29.0, 22.0, 23.0, 18.0, 14.0, 5.0, 11.0, 6.0, 7.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.15625, -5.00628662109375, -4.8563232421875, -4.70635986328125, -4.556396484375, -4.40643310546875, -4.2564697265625, -4.10650634765625, -3.95654296875, -3.80657958984375, -3.6566162109375, -3.50665283203125, -3.356689453125, -3.20672607421875, -3.0567626953125, -2.90679931640625, -2.7568359375, -2.60687255859375, -2.4569091796875, -2.30694580078125, -2.156982421875, -2.00701904296875, -1.8570556640625, -1.70709228515625, -1.55712890625, -1.40716552734375, -1.2572021484375, -1.10723876953125, -0.957275390625, -0.80731201171875, -0.6573486328125, -0.50738525390625, -0.357421875, -0.20745849609375, -0.0574951171875, 0.09246826171875, 0.242431640625, 0.39239501953125, 0.5423583984375, 0.69232177734375, 0.84228515625, 0.99224853515625, 1.1422119140625, 1.29217529296875, 1.442138671875, 1.59210205078125, 1.7420654296875, 1.89202880859375, 2.0419921875, 2.19195556640625, 2.3419189453125, 2.49188232421875, 2.641845703125, 2.79180908203125, 2.9417724609375, 3.09173583984375, 3.24169921875, 3.39166259765625, 3.5416259765625, 3.69158935546875, 3.841552734375, 3.99151611328125, 4.1414794921875, 4.29144287109375, 4.44140625]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 6.0, 5.0, 11.0, 20.0, 35.0, 42.0, 70.0, 117.0, 153.0, 277.0, 403.0, 600.0, 909.0, 1368.0, 2220.0, 3179.0, 4936.0, 7835.0, 12323.0, 19109.0, 29352.0, 45525.0, 69871.0, 106476.0, 160081.0, 233046.0, 326343.0, 426143.0, 506204.0, 528882.0, 474496.0, 379113.0, 279103.0, 195483.0, 131852.0, 87784.0, 56564.0, 36985.0, 23971.0, 15183.0, 9949.0, 6408.0, 4167.0, 2649.0, 1750.0, 1169.0, 708.0, 490.0, 313.0, 224.0, 145.0, 89.0, 54.0, 30.0, 26.0, 14.0, 16.0, 6.0, 8.0, 5.0, 2.0], "bins": [-3.49609375, -3.387725830078125, -3.27935791015625, -3.170989990234375, -3.0626220703125, -2.954254150390625, -2.84588623046875, -2.737518310546875, -2.629150390625, -2.520782470703125, -2.41241455078125, -2.304046630859375, -2.1956787109375, -2.087310791015625, -1.97894287109375, -1.870574951171875, -1.76220703125, -1.653839111328125, -1.54547119140625, -1.437103271484375, -1.3287353515625, -1.220367431640625, -1.11199951171875, -1.003631591796875, -0.895263671875, -0.786895751953125, -0.67852783203125, -0.570159912109375, -0.4617919921875, -0.353424072265625, -0.24505615234375, -0.136688232421875, -0.0283203125, 0.080047607421875, 0.18841552734375, 0.296783447265625, 0.4051513671875, 0.513519287109375, 0.62188720703125, 0.730255126953125, 0.838623046875, 0.946990966796875, 1.05535888671875, 1.163726806640625, 1.2720947265625, 1.380462646484375, 1.48883056640625, 1.597198486328125, 1.70556640625, 1.813934326171875, 1.92230224609375, 2.030670166015625, 2.1390380859375, 2.247406005859375, 2.35577392578125, 2.464141845703125, 2.572509765625, 2.680877685546875, 2.78924560546875, 2.897613525390625, 3.0059814453125, 3.114349365234375, 3.22271728515625, 3.331085205078125, 3.439453125]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 7.0, 5.0, 10.0, 15.0, 11.0, 18.0, 27.0, 29.0, 27.0, 42.0, 55.0, 68.0, 78.0, 87.0, 127.0, 119.0, 158.0, 167.0, 184.0, 209.0, 242.0, 248.0, 238.0, 209.0, 231.0, 216.0, 175.0, 191.0, 139.0, 144.0, 120.0, 90.0, 90.0, 70.0, 53.0, 38.0, 36.0, 18.0, 22.0, 20.0, 21.0, 10.0, 6.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.869140625, -1.8144378662109375, -1.759735107421875, -1.7050323486328125, -1.65032958984375, -1.5956268310546875, -1.540924072265625, -1.4862213134765625, -1.4315185546875, -1.3768157958984375, -1.322113037109375, -1.2674102783203125, -1.21270751953125, -1.1580047607421875, -1.103302001953125, -1.0485992431640625, -0.993896484375, -0.9391937255859375, -0.884490966796875, -0.8297882080078125, -0.77508544921875, -0.7203826904296875, -0.665679931640625, -0.6109771728515625, -0.5562744140625, -0.5015716552734375, -0.446868896484375, -0.3921661376953125, -0.33746337890625, -0.2827606201171875, -0.228057861328125, -0.1733551025390625, -0.11865234375, -0.0639495849609375, -0.009246826171875, 0.0454559326171875, 0.10015869140625, 0.1548614501953125, 0.209564208984375, 0.2642669677734375, 0.3189697265625, 0.3736724853515625, 0.428375244140625, 0.4830780029296875, 0.53778076171875, 0.5924835205078125, 0.647186279296875, 0.7018890380859375, 0.756591796875, 0.8112945556640625, 0.865997314453125, 0.9207000732421875, 0.97540283203125, 1.0301055908203125, 1.084808349609375, 1.1395111083984375, 1.1942138671875, 1.2489166259765625, 1.303619384765625, 1.3583221435546875, 1.41302490234375, 1.4677276611328125, 1.522430419921875, 1.5771331787109375, 1.6318359375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 4.0, 6.0, 4.0, 5.0, 9.0, 8.0, 22.0, 16.0, 19.0, 23.0, 39.0, 34.0, 39.0, 41.0, 50.0, 39.0, 50.0, 56.0, 56.0, 47.0, 41.0, 47.0, 48.0, 38.0, 35.0, 40.0, 42.0, 33.0, 20.0, 17.0, 21.0, 12.0, 10.0, 8.0, 10.0, 6.0, 6.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.699108600616455, -5.535609722137451, -5.372110843658447, -5.208612442016602, -5.045113563537598, -4.881614685058594, -4.71811580657959, -4.554616928100586, -4.391118049621582, -4.227619171142578, -4.064120292663574, -3.9006216526031494, -3.7371230125427246, -3.5736241340637207, -3.410125255584717, -3.246626377105713, -3.083127975463867, -2.9196290969848633, -2.7561304569244385, -2.5926315784454346, -2.4291329383850098, -2.265634059906006, -2.102135181427002, -1.9386364221572876, -1.7751376628875732, -1.6116389036178589, -1.4481401443481445, -1.2846412658691406, -1.1211425065994263, -0.9576437473297119, -0.7941449284553528, -0.6306461095809937, -0.4671468734741211, -0.30364808440208435, -0.1401492953300476, 0.023349493741989136, 0.18684828281402588, 0.35034704208374023, 0.5138458609580994, 0.6773446798324585, 0.8408434391021729, 1.0043421983718872, 1.1678409576416016, 1.3313398361206055, 1.4948385953903198, 1.6583373546600342, 1.821836233139038, 1.9853349924087524, 2.148833751678467, 2.3123326301574707, 2.4758312702178955, 2.6393301486968994, 2.802828788757324, 2.966327667236328, 3.129826545715332, 3.293325424194336, 3.4568240642547607, 3.6203229427337646, 3.7838215827941895, 3.9473204612731934, 4.110819339752197, 4.274317741394043, 4.437816619873047, 4.601315498352051, 4.764814376831055]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 8.0, 4.0, 9.0, 12.0, 15.0, 11.0, 20.0, 17.0, 24.0, 20.0, 16.0, 25.0, 23.0, 34.0, 39.0, 42.0, 41.0, 37.0, 34.0, 46.0, 41.0, 32.0, 56.0, 44.0, 38.0, 37.0, 35.0, 30.0, 25.0, 27.0, 24.0, 23.0, 20.0, 19.0, 14.0, 14.0, 9.0, 8.0, 8.0, 6.0, 2.0, 4.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-5.018582820892334, -4.880659103393555, -4.742735862731934, -4.6048126220703125, -4.466888904571533, -4.328965187072754, -4.191041946411133, -4.053118705749512, -3.9151949882507324, -3.7772715091705322, -3.639348030090332, -3.501424551010132, -3.3635010719299316, -3.2255775928497314, -3.0876541137695312, -2.949730634689331, -2.811807155609131, -2.6738836765289307, -2.5359601974487305, -2.3980367183685303, -2.26011323928833, -2.12218976020813, -1.9842662811279297, -1.8463428020477295, -1.7084193229675293, -1.570495843887329, -1.432572364807129, -1.2946488857269287, -1.1567254066467285, -1.0188019275665283, -0.8808784484863281, -0.7429549694061279, -0.6050319671630859, -0.46710848808288574, -0.32918500900268555, -0.19126152992248535, -0.053338050842285156, 0.08458542823791504, 0.22250890731811523, 0.36043238639831543, 0.4983558654785156, 0.6362793445587158, 0.774202823638916, 0.9121263027191162, 1.0500497817993164, 1.1879732608795166, 1.3258967399597168, 1.463820219039917, 1.6017436981201172, 1.7396671772003174, 1.8775906562805176, 2.0155141353607178, 2.153437614440918, 2.291361093521118, 2.4292845726013184, 2.5672080516815186, 2.7051315307617188, 2.843055009841919, 2.980978488922119, 3.1189019680023193, 3.2568254470825195, 3.3947489261627197, 3.53267240524292, 3.67059588432312, 3.8085193634033203]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 5.0, 8.0, 10.0, 11.0, 28.0, 49.0, 64.0, 125.0, 170.0, 264.0, 376.0, 680.0, 993.0, 1583.0, 2457.0, 3673.0, 5450.0, 7876.0, 11737.0, 16123.0, 22600.0, 30698.0, 40183.0, 50987.0, 62335.0, 75065.0, 84515.0, 90965.0, 92108.0, 87200.0, 77635.0, 66523.0, 55081.0, 43619.0, 33946.0, 25064.0, 18146.0, 13004.0, 9073.0, 6220.0, 4154.0, 2818.0, 1725.0, 1126.0, 773.0, 510.0, 313.0, 194.0, 106.0, 76.0, 46.0, 31.0, 20.0, 10.0, 6.0, 5.0, 4.0, 2.0, 1.0, 2.0], "bins": [-1.59765625, -1.5479888916015625, -1.498321533203125, -1.4486541748046875, -1.39898681640625, -1.3493194580078125, -1.299652099609375, -1.2499847412109375, -1.2003173828125, -1.1506500244140625, -1.100982666015625, -1.0513153076171875, -1.00164794921875, -0.9519805908203125, -0.902313232421875, -0.8526458740234375, -0.802978515625, -0.7533111572265625, -0.703643798828125, -0.6539764404296875, -0.60430908203125, -0.5546417236328125, -0.504974365234375, -0.4553070068359375, -0.4056396484375, -0.3559722900390625, -0.306304931640625, -0.2566375732421875, -0.20697021484375, -0.1573028564453125, -0.107635498046875, -0.0579681396484375, -0.00830078125, 0.0413665771484375, 0.091033935546875, 0.1407012939453125, 0.19036865234375, 0.2400360107421875, 0.289703369140625, 0.3393707275390625, 0.3890380859375, 0.4387054443359375, 0.488372802734375, 0.5380401611328125, 0.58770751953125, 0.6373748779296875, 0.687042236328125, 0.7367095947265625, 0.786376953125, 0.8360443115234375, 0.885711669921875, 0.9353790283203125, 0.98504638671875, 1.0347137451171875, 1.084381103515625, 1.1340484619140625, 1.1837158203125, 1.2333831787109375, 1.283050537109375, 1.3327178955078125, 1.38238525390625, 1.4320526123046875, 1.481719970703125, 1.5313873291015625, 1.5810546875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 1.0, 6.0, 7.0, 7.0, 5.0, 13.0, 17.0, 14.0, 18.0, 22.0, 12.0, 17.0, 20.0, 21.0, 24.0, 26.0, 25.0, 36.0, 37.0, 26.0, 34.0, 23.0, 47.0, 29.0, 55.0, 41.0, 35.0, 33.0, 42.0, 37.0, 25.0, 35.0, 17.0, 21.0, 26.0, 16.0, 18.0, 22.0, 11.0, 16.0, 10.0, 11.0, 6.0, 13.0, 7.0, 6.0, 1.0, 4.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-3.482421875, -3.373016357421875, -3.26361083984375, -3.154205322265625, -3.0447998046875, -2.935394287109375, -2.82598876953125, -2.716583251953125, -2.607177734375, -2.497772216796875, -2.38836669921875, -2.278961181640625, -2.1695556640625, -2.060150146484375, -1.95074462890625, -1.841339111328125, -1.73193359375, -1.622528076171875, -1.51312255859375, -1.403717041015625, -1.2943115234375, -1.184906005859375, -1.07550048828125, -0.966094970703125, -0.856689453125, -0.747283935546875, -0.63787841796875, -0.528472900390625, -0.4190673828125, -0.309661865234375, -0.20025634765625, -0.090850830078125, 0.0185546875, 0.127960205078125, 0.23736572265625, 0.346771240234375, 0.4561767578125, 0.565582275390625, 0.67498779296875, 0.784393310546875, 0.893798828125, 1.003204345703125, 1.11260986328125, 1.222015380859375, 1.3314208984375, 1.440826416015625, 1.55023193359375, 1.659637451171875, 1.76904296875, 1.878448486328125, 1.98785400390625, 2.097259521484375, 2.2066650390625, 2.316070556640625, 2.42547607421875, 2.534881591796875, 2.644287109375, 2.753692626953125, 2.86309814453125, 2.972503662109375, 3.0819091796875, 3.191314697265625, 3.30072021484375, 3.410125732421875, 3.51953125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 7.0, 6.0, 4.0, 8.0, 14.0, 14.0, 30.0, 32.0, 58.0, 65.0, 130.0, 236.0, 338.0, 535.0, 934.0, 1585.0, 2822.0, 4925.0, 8592.0, 15557.0, 28796.0, 166900.0, 718089.0, 49932.0, 21399.0, 11995.0, 6634.0, 3789.0, 2108.0, 1213.0, 671.0, 450.0, 246.0, 146.0, 100.0, 74.0, 40.0, 20.0, 15.0, 13.0, 8.0, 11.0, 6.0, 2.0, 1.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1796875, -5.00860595703125, -4.8375244140625, -4.66644287109375, -4.495361328125, -4.32427978515625, -4.1531982421875, -3.98211669921875, -3.81103515625, -3.63995361328125, -3.4688720703125, -3.29779052734375, -3.126708984375, -2.95562744140625, -2.7845458984375, -2.61346435546875, -2.4423828125, -2.27130126953125, -2.1002197265625, -1.92913818359375, -1.758056640625, -1.58697509765625, -1.4158935546875, -1.24481201171875, -1.07373046875, -0.90264892578125, -0.7315673828125, -0.56048583984375, -0.389404296875, -0.21832275390625, -0.0472412109375, 0.12384033203125, 0.294921875, 0.46600341796875, 0.6370849609375, 0.80816650390625, 0.979248046875, 1.15032958984375, 1.3214111328125, 1.49249267578125, 1.66357421875, 1.83465576171875, 2.0057373046875, 2.17681884765625, 2.347900390625, 2.51898193359375, 2.6900634765625, 2.86114501953125, 3.0322265625, 3.20330810546875, 3.3743896484375, 3.54547119140625, 3.716552734375, 3.88763427734375, 4.0587158203125, 4.22979736328125, 4.40087890625, 4.57196044921875, 4.7430419921875, 4.91412353515625, 5.085205078125, 5.25628662109375, 5.4273681640625, 5.59844970703125, 5.76953125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 1.0, 2.0, 4.0, 4.0, 7.0, 9.0, 8.0, 14.0, 15.0, 18.0, 12.0, 16.0, 19.0, 24.0, 22.0, 34.0, 32.0, 34.0, 49.0, 39.0, 43.0, 38.0, 36.0, 48.0, 47.0, 43.0, 45.0, 43.0, 35.0, 31.0, 26.0, 24.0, 25.0, 28.0, 16.0, 28.0, 14.0, 8.0, 17.0, 6.0, 8.0, 10.0, 8.0, 4.0, 6.0, 3.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.765625, -3.648223876953125, -3.53082275390625, -3.413421630859375, -3.2960205078125, -3.178619384765625, -3.06121826171875, -2.943817138671875, -2.826416015625, -2.709014892578125, -2.59161376953125, -2.474212646484375, -2.3568115234375, -2.239410400390625, -2.12200927734375, -2.004608154296875, -1.88720703125, -1.769805908203125, -1.65240478515625, -1.535003662109375, -1.4176025390625, -1.300201416015625, -1.18280029296875, -1.065399169921875, -0.947998046875, -0.830596923828125, -0.71319580078125, -0.595794677734375, -0.4783935546875, -0.360992431640625, -0.24359130859375, -0.126190185546875, -0.0087890625, 0.108612060546875, 0.22601318359375, 0.343414306640625, 0.4608154296875, 0.578216552734375, 0.69561767578125, 0.813018798828125, 0.930419921875, 1.047821044921875, 1.16522216796875, 1.282623291015625, 1.4000244140625, 1.517425537109375, 1.63482666015625, 1.752227783203125, 1.86962890625, 1.987030029296875, 2.10443115234375, 2.221832275390625, 2.3392333984375, 2.456634521484375, 2.57403564453125, 2.691436767578125, 2.808837890625, 2.926239013671875, 3.04364013671875, 3.161041259765625, 3.2784423828125, 3.395843505859375, 3.51324462890625, 3.630645751953125, 3.748046875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 8.0, 5.0, 10.0, 14.0, 24.0, 25.0, 40.0, 52.0, 72.0, 147.0, 220.0, 362.0, 669.0, 1260.0, 2472.0, 4770.0, 9571.0, 20949.0, 67349.0, 772730.0, 119221.0, 25444.0, 11497.0, 5501.0, 2759.0, 1490.0, 781.0, 426.0, 256.0, 148.0, 103.0, 51.0, 38.0, 27.0, 17.0, 16.0, 6.0, 7.0, 3.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.087890625, -1.0534820556640625, -1.019073486328125, -0.9846649169921875, -0.95025634765625, -0.9158477783203125, -0.881439208984375, -0.8470306396484375, -0.8126220703125, -0.7782135009765625, -0.743804931640625, -0.7093963623046875, -0.67498779296875, -0.6405792236328125, -0.606170654296875, -0.5717620849609375, -0.537353515625, -0.5029449462890625, -0.468536376953125, -0.4341278076171875, -0.39971923828125, -0.3653106689453125, -0.330902099609375, -0.2964935302734375, -0.2620849609375, -0.2276763916015625, -0.193267822265625, -0.1588592529296875, -0.12445068359375, -0.0900421142578125, -0.055633544921875, -0.0212249755859375, 0.01318359375, 0.0475921630859375, 0.082000732421875, 0.1164093017578125, 0.15081787109375, 0.1852264404296875, 0.219635009765625, 0.2540435791015625, 0.2884521484375, 0.3228607177734375, 0.357269287109375, 0.3916778564453125, 0.42608642578125, 0.4604949951171875, 0.494903564453125, 0.5293121337890625, 0.563720703125, 0.5981292724609375, 0.632537841796875, 0.6669464111328125, 0.70135498046875, 0.7357635498046875, 0.770172119140625, 0.8045806884765625, 0.8389892578125, 0.8733978271484375, 0.907806396484375, 0.9422149658203125, 0.97662353515625, 1.0110321044921875, 1.045440673828125, 1.0798492431640625, 1.1142578125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 7.0, 6.0, 7.0, 12.0, 18.0, 15.0, 17.0, 23.0, 39.0, 51.0, 54.0, 51.0, 77.0, 109.0, 86.0, 85.0, 69.0, 42.0, 51.0, 45.0, 28.0, 19.0, 17.0, 12.0, 13.0, 7.0, 9.0, 7.0, 6.0, 7.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0003199577331542969, -0.0003108382225036621, -0.00030171871185302734, -0.0002925992012023926, -0.0002834796905517578, -0.00027436017990112305, -0.0002652406692504883, -0.0002561211585998535, -0.00024700164794921875, -0.00023788213729858398, -0.00022876262664794922, -0.00021964311599731445, -0.0002105236053466797, -0.00020140409469604492, -0.00019228458404541016, -0.0001831650733947754, -0.00017404556274414062, -0.00016492605209350586, -0.0001558065414428711, -0.00014668703079223633, -0.00013756752014160156, -0.0001284480094909668, -0.00011932849884033203, -0.00011020898818969727, -0.0001010894775390625, -9.196996688842773e-05, -8.285045623779297e-05, -7.37309455871582e-05, -6.461143493652344e-05, -5.549192428588867e-05, -4.6372413635253906e-05, -3.725290298461914e-05, -2.8133392333984375e-05, -1.901388168334961e-05, -9.894371032714844e-06, -7.748603820800781e-07, 8.344650268554688e-06, 1.7464160919189453e-05, 2.658367156982422e-05, 3.5703182220458984e-05, 4.482269287109375e-05, 5.3942203521728516e-05, 6.306171417236328e-05, 7.218122482299805e-05, 8.130073547363281e-05, 9.042024612426758e-05, 9.953975677490234e-05, 0.00010865926742553711, 0.00011777877807617188, 0.00012689828872680664, 0.0001360177993774414, 0.00014513731002807617, 0.00015425682067871094, 0.0001633763313293457, 0.00017249584197998047, 0.00018161535263061523, 0.00019073486328125, 0.00019985437393188477, 0.00020897388458251953, 0.0002180933952331543, 0.00022721290588378906, 0.00023633241653442383, 0.0002454519271850586, 0.00025457143783569336, 0.0002636909484863281]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 12.0, 10.0, 17.0, 20.0, 41.0, 57.0, 71.0, 121.0, 192.0, 298.0, 451.0, 587.0, 946.0, 1400.0, 2180.0, 3214.0, 5123.0, 7954.0, 12580.0, 19785.0, 31119.0, 48913.0, 76528.0, 110780.0, 142800.0, 154205.0, 136191.0, 102050.0, 68922.0, 44459.0, 27903.0, 17852.0, 11374.0, 7155.0, 4451.0, 3074.0, 1902.0, 1297.0, 817.0, 533.0, 337.0, 280.0, 182.0, 121.0, 82.0, 41.0, 43.0, 31.0, 16.0, 13.0, 13.0, 8.0, 5.0, 1.0, 3.0, 1.0, 1.0, 3.0], "bins": [-0.3662109375, -0.3545417785644531, -0.34287261962890625, -0.3312034606933594, -0.3195343017578125, -0.3078651428222656, -0.29619598388671875, -0.2845268249511719, -0.272857666015625, -0.2611885070800781, -0.24951934814453125, -0.23785018920898438, -0.2261810302734375, -0.21451187133789062, -0.20284271240234375, -0.19117355346679688, -0.17950439453125, -0.16783523559570312, -0.15616607666015625, -0.14449691772460938, -0.1328277587890625, -0.12115859985351562, -0.10948944091796875, -0.09782028198242188, -0.086151123046875, -0.07448196411132812, -0.06281280517578125, -0.051143646240234375, -0.0394744873046875, -0.027805328369140625, -0.01613616943359375, -0.004467010498046875, 0.0072021484375, 0.018871307373046875, 0.03054046630859375, 0.042209625244140625, 0.0538787841796875, 0.06554794311523438, 0.07721710205078125, 0.08888626098632812, 0.100555419921875, 0.11222457885742188, 0.12389373779296875, 0.13556289672851562, 0.1472320556640625, 0.15890121459960938, 0.17057037353515625, 0.18223953247070312, 0.19390869140625, 0.20557785034179688, 0.21724700927734375, 0.22891616821289062, 0.2405853271484375, 0.2522544860839844, 0.26392364501953125, 0.2755928039550781, 0.287261962890625, 0.2989311218261719, 0.31060028076171875, 0.3222694396972656, 0.3339385986328125, 0.3456077575683594, 0.35727691650390625, 0.3689460754394531, 0.380615234375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 6.0, 4.0, 3.0, 7.0, 6.0, 11.0, 7.0, 14.0, 15.0, 16.0, 22.0, 24.0, 23.0, 36.0, 53.0, 47.0, 37.0, 39.0, 50.0, 57.0, 64.0, 56.0, 52.0, 54.0, 54.0, 43.0, 32.0, 34.0, 25.0, 20.0, 16.0, 17.0, 15.0, 12.0, 10.0, 2.0, 5.0, 5.0, 4.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1439208984375, -0.13921356201171875, -0.1345062255859375, -0.12979888916015625, -0.125091552734375, -0.12038421630859375, -0.1156768798828125, -0.11096954345703125, -0.10626220703125, -0.10155487060546875, -0.0968475341796875, -0.09214019775390625, -0.087432861328125, -0.08272552490234375, -0.0780181884765625, -0.07331085205078125, -0.068603515625, -0.06389617919921875, -0.0591888427734375, -0.05448150634765625, -0.049774169921875, -0.04506683349609375, -0.0403594970703125, -0.03565216064453125, -0.03094482421875, -0.02623748779296875, -0.0215301513671875, -0.01682281494140625, -0.012115478515625, -0.00740814208984375, -0.0027008056640625, 0.00200653076171875, 0.0067138671875, 0.01142120361328125, 0.0161285400390625, 0.02083587646484375, 0.025543212890625, 0.03025054931640625, 0.0349578857421875, 0.03966522216796875, 0.04437255859375, 0.04907989501953125, 0.0537872314453125, 0.05849456787109375, 0.063201904296875, 0.06790924072265625, 0.0726165771484375, 0.07732391357421875, 0.08203125, 0.08673858642578125, 0.0914459228515625, 0.09615325927734375, 0.100860595703125, 0.10556793212890625, 0.1102752685546875, 0.11498260498046875, 0.11968994140625, 0.12439727783203125, 0.1291046142578125, 0.13381195068359375, 0.138519287109375, 0.14322662353515625, 0.1479339599609375, 0.15264129638671875, 0.1573486328125]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 5.0, 0.0, 5.0, 6.0, 7.0, 15.0, 12.0, 20.0, 20.0, 27.0, 30.0, 34.0, 36.0, 50.0, 40.0, 46.0, 41.0, 52.0, 41.0, 73.0, 46.0, 37.0, 42.0, 51.0, 49.0, 31.0, 42.0, 35.0, 24.0, 24.0, 13.0, 12.0, 5.0, 13.0, 7.0, 7.0, 4.0, 2.0, 2.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.585474491119385, -4.447064399719238, -4.30865478515625, -4.1702446937561035, -4.031834602355957, -3.8934247493743896, -3.7550148963928223, -3.616604804992676, -3.4781949520111084, -3.339785099029541, -3.2013750076293945, -3.062965154647827, -2.9245553016662598, -2.7861452102661133, -2.647735357284546, -2.5093255043029785, -2.370915412902832, -2.2325055599212646, -2.094095468521118, -1.9556856155395508, -1.8172756433486938, -1.678865671157837, -1.5404558181762695, -1.4020458459854126, -1.2636358737945557, -1.1252259016036987, -0.9868159890174866, -0.8484060764312744, -0.7099961042404175, -0.5715861320495605, -0.4331762194633484, -0.29476630687713623, -0.1563563346862793, -0.01794639229774475, 0.1204635500907898, 0.25887349247932434, 0.3972834348678589, 0.5356934070587158, 0.674103319644928, 0.8125132322311401, 0.9509232044219971, 1.089333176612854, 1.227743148803711, 1.3661530017852783, 1.5045629739761353, 1.6429729461669922, 1.7813827991485596, 1.9197927713394165, 2.0582027435302734, 2.196612596511841, 2.3350226879119873, 2.4734325408935547, 2.611842632293701, 2.7502524852752686, 2.888662338256836, 3.0270724296569824, 3.16548228263855, 3.303892135620117, 3.4423022270202637, 3.580712080001831, 3.7191219329833984, 3.857532024383545, 3.9959418773651123, 4.13435173034668, 4.272761821746826]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 3.0, 3.0, 5.0, 10.0, 5.0, 16.0, 12.0, 14.0, 18.0, 21.0, 17.0, 19.0, 22.0, 26.0, 23.0, 34.0, 41.0, 38.0, 41.0, 37.0, 36.0, 42.0, 38.0, 38.0, 45.0, 50.0, 33.0, 45.0, 27.0, 35.0, 24.0, 31.0, 22.0, 17.0, 25.0, 18.0, 18.0, 14.0, 9.0, 8.0, 5.0, 5.0, 3.0, 4.0, 3.0, 5.0, 1.0, 5.0, 2.0], "bins": [-4.284055233001709, -4.169294834136963, -4.054533958435059, -3.9397735595703125, -3.8250129222869873, -3.710252285003662, -3.595491647720337, -3.4807310104370117, -3.3659706115722656, -3.2512099742889404, -3.1364493370056152, -3.021688938140869, -2.906928300857544, -2.7921676635742188, -2.6774070262908936, -2.5626463890075684, -2.447885751724243, -2.333125114440918, -2.2183644771575928, -2.1036038398742676, -1.9888434410095215, -1.8740828037261963, -1.759322166442871, -1.644561529159546, -1.5298010110855103, -1.415040373802185, -1.3002798557281494, -1.1855192184448242, -1.070758581161499, -0.9559980630874634, -0.8412374258041382, -0.7264768481254578, -0.6117160320281982, -0.4969554543495178, -0.382194846868515, -0.2674342393875122, -0.1526736617088318, -0.03791308403015137, 0.07684755325317383, 0.19160813093185425, 0.30636870861053467, 0.4211292862892151, 0.5358898639678955, 0.6506505012512207, 0.7654110789299011, 0.8801716566085815, 0.9949322938919067, 1.1096928119659424, 1.2244534492492676, 1.3392140865325928, 1.4539746046066284, 1.5687352418899536, 1.6834957599639893, 1.7982563972473145, 1.9130170345306396, 2.027777671813965, 2.142538070678711, 2.257298707962036, 2.3720593452453613, 2.4868197441101074, 2.6015803813934326, 2.716341018676758, 2.831101655960083, 2.945862293243408, 3.0606229305267334]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 2.0, 9.0, 10.0, 24.0, 41.0, 65.0, 78.0, 113.0, 190.0, 304.0, 404.0, 693.0, 1067.0, 1445.0, 2286.0, 3406.0, 5282.0, 7484.0, 11075.0, 16016.0, 23005.0, 31838.0, 43081.0, 55914.0, 69429.0, 82205.0, 91988.0, 96886.0, 95798.0, 88327.0, 77719.0, 63570.0, 50346.0, 37673.0, 27971.0, 19686.0, 13912.0, 9562.0, 6454.0, 4377.0, 3038.0, 1991.0, 1290.0, 847.0, 582.0, 365.0, 253.0, 151.0, 111.0, 68.0, 48.0, 41.0, 24.0, 13.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0], "bins": [-2.111328125, -2.044921875, -1.978515625, -1.912109375, -1.845703125, -1.779296875, -1.712890625, -1.646484375, -1.580078125, -1.513671875, -1.447265625, -1.380859375, -1.314453125, -1.248046875, -1.181640625, -1.115234375, -1.048828125, -0.982421875, -0.916015625, -0.849609375, -0.783203125, -0.716796875, -0.650390625, -0.583984375, -0.517578125, -0.451171875, -0.384765625, -0.318359375, -0.251953125, -0.185546875, -0.119140625, -0.052734375, 0.013671875, 0.080078125, 0.146484375, 0.212890625, 0.279296875, 0.345703125, 0.412109375, 0.478515625, 0.544921875, 0.611328125, 0.677734375, 0.744140625, 0.810546875, 0.876953125, 0.943359375, 1.009765625, 1.076171875, 1.142578125, 1.208984375, 1.275390625, 1.341796875, 1.408203125, 1.474609375, 1.541015625, 1.607421875, 1.673828125, 1.740234375, 1.806640625, 1.873046875, 1.939453125, 2.005859375, 2.072265625, 2.138671875]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 6.0, 9.0, 15.0, 9.0, 6.0, 13.0, 20.0, 14.0, 14.0, 21.0, 26.0, 17.0, 38.0, 25.0, 40.0, 37.0, 39.0, 39.0, 40.0, 36.0, 28.0, 42.0, 40.0, 38.0, 39.0, 39.0, 43.0, 39.0, 24.0, 31.0, 18.0, 17.0, 18.0, 20.0, 19.0, 13.0, 17.0, 8.0, 16.0, 10.0, 5.0, 4.0, 4.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.390625, -3.281005859375, -3.17138671875, -3.061767578125, -2.9521484375, -2.842529296875, -2.73291015625, -2.623291015625, -2.513671875, -2.404052734375, -2.29443359375, -2.184814453125, -2.0751953125, -1.965576171875, -1.85595703125, -1.746337890625, -1.63671875, -1.527099609375, -1.41748046875, -1.307861328125, -1.1982421875, -1.088623046875, -0.97900390625, -0.869384765625, -0.759765625, -0.650146484375, -0.54052734375, -0.430908203125, -0.3212890625, -0.211669921875, -0.10205078125, 0.007568359375, 0.1171875, 0.226806640625, 0.33642578125, 0.446044921875, 0.5556640625, 0.665283203125, 0.77490234375, 0.884521484375, 0.994140625, 1.103759765625, 1.21337890625, 1.322998046875, 1.4326171875, 1.542236328125, 1.65185546875, 1.761474609375, 1.87109375, 1.980712890625, 2.09033203125, 2.199951171875, 2.3095703125, 2.419189453125, 2.52880859375, 2.638427734375, 2.748046875, 2.857666015625, 2.96728515625, 3.076904296875, 3.1865234375, 3.296142578125, 3.40576171875, 3.515380859375, 3.625]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 5.0, 4.0, 10.0, 14.0, 21.0, 30.0, 57.0, 71.0, 104.0, 161.0, 243.0, 405.0, 534.0, 820.0, 1299.0, 1807.0, 2788.0, 4205.0, 6244.0, 9726.0, 14302.0, 20955.0, 29786.0, 41241.0, 55288.0, 70345.0, 84689.0, 96402.0, 102329.0, 101184.0, 92803.0, 79105.0, 64187.0, 49661.0, 36579.0, 25915.0, 18157.0, 12353.0, 8427.0, 5561.0, 3563.0, 2406.0, 1650.0, 1062.0, 681.0, 417.0, 309.0, 228.0, 144.0, 96.0, 63.0, 47.0, 35.0, 19.0, 12.0, 5.0, 11.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.77734375, -2.690032958984375, -2.60272216796875, -2.515411376953125, -2.4281005859375, -2.340789794921875, -2.25347900390625, -2.166168212890625, -2.078857421875, -1.991546630859375, -1.90423583984375, -1.816925048828125, -1.7296142578125, -1.642303466796875, -1.55499267578125, -1.467681884765625, -1.38037109375, -1.293060302734375, -1.20574951171875, -1.118438720703125, -1.0311279296875, -0.943817138671875, -0.85650634765625, -0.769195556640625, -0.681884765625, -0.594573974609375, -0.50726318359375, -0.419952392578125, -0.3326416015625, -0.245330810546875, -0.15802001953125, -0.070709228515625, 0.0166015625, 0.103912353515625, 0.19122314453125, 0.278533935546875, 0.3658447265625, 0.453155517578125, 0.54046630859375, 0.627777099609375, 0.715087890625, 0.802398681640625, 0.88970947265625, 0.977020263671875, 1.0643310546875, 1.151641845703125, 1.23895263671875, 1.326263427734375, 1.41357421875, 1.500885009765625, 1.58819580078125, 1.675506591796875, 1.7628173828125, 1.850128173828125, 1.93743896484375, 2.024749755859375, 2.112060546875, 2.199371337890625, 2.28668212890625, 2.373992919921875, 2.4613037109375, 2.548614501953125, 2.63592529296875, 2.723236083984375, 2.810546875]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 4.0, 8.0, 5.0, 3.0, 8.0, 11.0, 11.0, 17.0, 16.0, 20.0, 18.0, 33.0, 13.0, 34.0, 32.0, 27.0, 36.0, 38.0, 39.0, 26.0, 41.0, 35.0, 39.0, 31.0, 42.0, 52.0, 33.0, 41.0, 37.0, 27.0, 25.0, 31.0, 21.0, 22.0, 33.0, 18.0, 15.0, 12.0, 17.0, 11.0, 11.0, 4.0, 2.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.208984375, -2.13726806640625, -2.0655517578125, -1.99383544921875, -1.922119140625, -1.85040283203125, -1.7786865234375, -1.70697021484375, -1.63525390625, -1.56353759765625, -1.4918212890625, -1.42010498046875, -1.348388671875, -1.27667236328125, -1.2049560546875, -1.13323974609375, -1.0615234375, -0.98980712890625, -0.9180908203125, -0.84637451171875, -0.774658203125, -0.70294189453125, -0.6312255859375, -0.55950927734375, -0.48779296875, -0.41607666015625, -0.3443603515625, -0.27264404296875, -0.200927734375, -0.12921142578125, -0.0574951171875, 0.01422119140625, 0.0859375, 0.15765380859375, 0.2293701171875, 0.30108642578125, 0.372802734375, 0.44451904296875, 0.5162353515625, 0.58795166015625, 0.65966796875, 0.73138427734375, 0.8031005859375, 0.87481689453125, 0.946533203125, 1.01824951171875, 1.0899658203125, 1.16168212890625, 1.2333984375, 1.30511474609375, 1.3768310546875, 1.44854736328125, 1.520263671875, 1.59197998046875, 1.6636962890625, 1.73541259765625, 1.80712890625, 1.87884521484375, 1.9505615234375, 2.02227783203125, 2.093994140625, 2.16571044921875, 2.2374267578125, 2.30914306640625, 2.380859375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 4.0, 7.0, 8.0, 14.0, 22.0, 25.0, 37.0, 70.0, 109.0, 181.0, 216.0, 317.0, 554.0, 802.0, 1201.0, 2079.0, 3295.0, 5229.0, 8487.0, 13804.0, 22641.0, 36247.0, 55820.0, 81522.0, 108930.0, 130795.0, 137116.0, 126353.0, 102357.0, 74838.0, 50158.0, 32912.0, 20100.0, 12335.0, 7345.0, 4580.0, 2883.0, 1809.0, 1130.0, 787.0, 488.0, 327.0, 222.0, 128.0, 94.0, 69.0, 35.0, 22.0, 16.0, 19.0, 8.0, 4.0, 10.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.044921875, -1.0093536376953125, -0.973785400390625, -0.9382171630859375, -0.90264892578125, -0.8670806884765625, -0.831512451171875, -0.7959442138671875, -0.7603759765625, -0.7248077392578125, -0.689239501953125, -0.6536712646484375, -0.61810302734375, -0.5825347900390625, -0.546966552734375, -0.5113983154296875, -0.475830078125, -0.4402618408203125, -0.404693603515625, -0.3691253662109375, -0.33355712890625, -0.2979888916015625, -0.262420654296875, -0.2268524169921875, -0.1912841796875, -0.1557159423828125, -0.120147705078125, -0.0845794677734375, -0.04901123046875, -0.0134429931640625, 0.022125244140625, 0.0576934814453125, 0.09326171875, 0.1288299560546875, 0.164398193359375, 0.1999664306640625, 0.23553466796875, 0.2711029052734375, 0.306671142578125, 0.3422393798828125, 0.3778076171875, 0.4133758544921875, 0.448944091796875, 0.4845123291015625, 0.52008056640625, 0.5556488037109375, 0.591217041015625, 0.6267852783203125, 0.662353515625, 0.6979217529296875, 0.733489990234375, 0.7690582275390625, 0.80462646484375, 0.8401947021484375, 0.875762939453125, 0.9113311767578125, 0.9468994140625, 0.9824676513671875, 1.018035888671875, 1.0536041259765625, 1.08917236328125, 1.1247406005859375, 1.160308837890625, 1.1958770751953125, 1.2314453125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 11.0, 4.0, 6.0, 6.0, 4.0, 9.0, 11.0, 24.0, 15.0, 12.0, 28.0, 22.0, 29.0, 26.0, 29.0, 45.0, 42.0, 50.0, 51.0, 42.0, 45.0, 38.0, 48.0, 36.0, 50.0, 43.0, 31.0, 31.0, 39.0, 23.0, 33.0, 18.0, 12.0, 12.0, 13.0, 7.0, 11.0, 11.0, 11.0, 7.0, 2.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00012373924255371094, -0.00011986494064331055, -0.00011599063873291016, -0.00011211633682250977, -0.00010824203491210938, -0.00010436773300170898, -0.0001004934310913086, -9.66191291809082e-05, -9.274482727050781e-05, -8.887052536010742e-05, -8.499622344970703e-05, -8.112192153930664e-05, -7.724761962890625e-05, -7.337331771850586e-05, -6.949901580810547e-05, -6.562471389770508e-05, -6.175041198730469e-05, -5.78761100769043e-05, -5.4001808166503906e-05, -5.0127506256103516e-05, -4.6253204345703125e-05, -4.2378902435302734e-05, -3.8504600524902344e-05, -3.463029861450195e-05, -3.075599670410156e-05, -2.6881694793701172e-05, -2.300739288330078e-05, -1.913309097290039e-05, -1.52587890625e-05, -1.138448715209961e-05, -7.510185241699219e-06, -3.635883331298828e-06, 2.384185791015625e-07, 4.112720489501953e-06, 7.987022399902344e-06, 1.1861324310302734e-05, 1.5735626220703125e-05, 1.9609928131103516e-05, 2.3484230041503906e-05, 2.7358531951904297e-05, 3.123283386230469e-05, 3.510713577270508e-05, 3.898143768310547e-05, 4.285573959350586e-05, 4.673004150390625e-05, 5.060434341430664e-05, 5.447864532470703e-05, 5.835294723510742e-05, 6.222724914550781e-05, 6.61015510559082e-05, 6.99758529663086e-05, 7.385015487670898e-05, 7.772445678710938e-05, 8.159875869750977e-05, 8.547306060791016e-05, 8.934736251831055e-05, 9.322166442871094e-05, 9.709596633911133e-05, 0.00010097026824951172, 0.00010484457015991211, 0.0001087188720703125, 0.00011259317398071289, 0.00011646747589111328, 0.00012034177780151367, 0.00012421607971191406]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 4.0, 4.0, 6.0, 11.0, 8.0, 22.0, 24.0, 41.0, 49.0, 77.0, 123.0, 169.0, 244.0, 375.0, 605.0, 889.0, 1473.0, 2360.0, 3694.0, 5997.0, 9819.0, 15616.0, 24898.0, 37983.0, 55904.0, 78320.0, 101755.0, 120016.0, 126474.0, 119612.0, 102371.0, 78997.0, 56290.0, 38059.0, 24657.0, 15479.0, 9867.0, 5970.0, 3861.0, 2314.0, 1433.0, 916.0, 621.0, 399.0, 258.0, 178.0, 109.0, 60.0, 54.0, 29.0, 29.0, 18.0, 12.0, 4.0, 6.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.041015625, -1.0089874267578125, -0.976959228515625, -0.9449310302734375, -0.91290283203125, -0.8808746337890625, -0.848846435546875, -0.8168182373046875, -0.7847900390625, -0.7527618408203125, -0.720733642578125, -0.6887054443359375, -0.65667724609375, -0.6246490478515625, -0.592620849609375, -0.5605926513671875, -0.528564453125, -0.4965362548828125, -0.464508056640625, -0.4324798583984375, -0.40045166015625, -0.3684234619140625, -0.336395263671875, -0.3043670654296875, -0.2723388671875, -0.2403106689453125, -0.208282470703125, -0.1762542724609375, -0.14422607421875, -0.1121978759765625, -0.080169677734375, -0.0481414794921875, -0.01611328125, 0.0159149169921875, 0.047943115234375, 0.0799713134765625, 0.11199951171875, 0.1440277099609375, 0.176055908203125, 0.2080841064453125, 0.2401123046875, 0.2721405029296875, 0.304168701171875, 0.3361968994140625, 0.36822509765625, 0.4002532958984375, 0.432281494140625, 0.4643096923828125, 0.496337890625, 0.5283660888671875, 0.560394287109375, 0.5924224853515625, 0.62445068359375, 0.6564788818359375, 0.688507080078125, 0.7205352783203125, 0.7525634765625, 0.7845916748046875, 0.816619873046875, 0.8486480712890625, 0.88067626953125, 0.9127044677734375, 0.944732666015625, 0.9767608642578125, 1.0087890625]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 3.0, 5.0, 9.0, 2.0, 16.0, 19.0, 17.0, 20.0, 40.0, 27.0, 42.0, 48.0, 41.0, 38.0, 54.0, 66.0, 64.0, 53.0, 55.0, 44.0, 40.0, 53.0, 40.0, 35.0, 21.0, 26.0, 23.0, 23.0, 20.0, 7.0, 12.0, 6.0, 10.0, 4.0, 5.0, 3.0, 7.0, 3.0, 1.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.51123046875, -0.49663543701171875, -0.4820404052734375, -0.46744537353515625, -0.452850341796875, -0.43825531005859375, -0.4236602783203125, -0.40906524658203125, -0.39447021484375, -0.37987518310546875, -0.3652801513671875, -0.35068511962890625, -0.336090087890625, -0.32149505615234375, -0.3069000244140625, -0.29230499267578125, -0.2777099609375, -0.26311492919921875, -0.2485198974609375, -0.23392486572265625, -0.219329833984375, -0.20473480224609375, -0.1901397705078125, -0.17554473876953125, -0.16094970703125, -0.14635467529296875, -0.1317596435546875, -0.11716461181640625, -0.102569580078125, -0.08797454833984375, -0.0733795166015625, -0.05878448486328125, -0.044189453125, -0.02959442138671875, -0.0149993896484375, -0.00040435791015625, 0.014190673828125, 0.02878570556640625, 0.0433807373046875, 0.05797576904296875, 0.07257080078125, 0.08716583251953125, 0.1017608642578125, 0.11635589599609375, 0.130950927734375, 0.14554595947265625, 0.1601409912109375, 0.17473602294921875, 0.1893310546875, 0.20392608642578125, 0.2185211181640625, 0.23311614990234375, 0.247711181640625, 0.26230621337890625, 0.2769012451171875, 0.29149627685546875, 0.30609130859375, 0.32068634033203125, 0.3352813720703125, 0.34987640380859375, 0.364471435546875, 0.37906646728515625, 0.3936614990234375, 0.40825653076171875, 0.4228515625]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 1.0, 5.0, 8.0, 22.0, 16.0, 15.0, 20.0, 25.0, 24.0, 27.0, 39.0, 37.0, 44.0, 39.0, 64.0, 58.0, 43.0, 47.0, 49.0, 49.0, 46.0, 51.0, 40.0, 34.0, 42.0, 30.0, 26.0, 19.0, 27.0, 15.0, 9.0, 4.0, 7.0, 3.0, 7.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.41330099105835, -4.277430057525635, -4.14155912399292, -4.005688190460205, -3.8698172569274902, -3.7339463233947754, -3.5980753898620605, -3.4622044563293457, -3.326333522796631, -3.190462589263916, -3.054591655731201, -2.9187207221984863, -2.7828497886657715, -2.6469788551330566, -2.511107921600342, -2.375236988067627, -2.239366292953491, -2.1034953594207764, -1.9676244258880615, -1.8317534923553467, -1.6958825588226318, -1.560011625289917, -1.4241408109664917, -1.2882698774337769, -1.152398943901062, -1.0165280103683472, -0.8806570768356323, -0.7447862029075623, -0.6089152693748474, -0.47304433584213257, -0.3371734619140625, -0.20130252838134766, -0.06543159484863281, 0.07043932378292084, 0.2063102424144745, 0.34218114614486694, 0.4780520796775818, 0.6139230132102966, 0.7497938871383667, 0.8856648206710815, 1.0215357542037964, 1.1574066877365112, 1.293277621269226, 1.4291484355926514, 1.5650193691253662, 1.700890302658081, 1.836761236190796, 1.9726321697235107, 2.1085031032562256, 2.2443740367889404, 2.3802449703216553, 2.51611590385437, 2.651986837387085, 2.7878577709198, 2.9237284660339355, 3.0595993995666504, 3.1954703330993652, 3.33134126663208, 3.467212200164795, 3.6030831336975098, 3.7389540672302246, 3.8748250007629395, 4.010695934295654, 4.146566867828369, 4.282437801361084]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 6.0, 7.0, 10.0, 10.0, 12.0, 12.0, 8.0, 17.0, 14.0, 24.0, 33.0, 31.0, 29.0, 33.0, 45.0, 45.0, 35.0, 47.0, 36.0, 35.0, 40.0, 39.0, 47.0, 56.0, 38.0, 31.0, 38.0, 34.0, 28.0, 34.0, 15.0, 20.0, 17.0, 15.0, 12.0, 11.0, 7.0, 5.0, 10.0, 10.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.605142116546631, -4.480573654174805, -4.3560051918029785, -4.231436252593994, -4.106867790222168, -3.982299327850342, -3.8577308654785156, -3.7331621646881104, -3.608593463897705, -3.484025001525879, -3.3594563007354736, -3.2348878383636475, -3.110319137573242, -2.985750675201416, -2.86118221282959, -2.7366135120391846, -2.6120450496673584, -2.4874765872955322, -2.362907886505127, -2.238339424133301, -2.1137707233428955, -1.9892022609710693, -1.8646336793899536, -1.740065097808838, -1.6154965162277222, -1.4909279346466064, -1.3663593530654907, -1.241790771484375, -1.1172223091125488, -0.9926536679267883, -0.8680851459503174, -0.7435165643692017, -0.6189479827880859, -0.4943794012069702, -0.3698108494281769, -0.24524229764938354, -0.12067371606826782, 0.0038948655128479004, 0.12846338748931885, 0.25303196907043457, 0.3776005506515503, 0.502169132232666, 0.6267377138137817, 0.7513062357902527, 0.8758748173713684, 1.000443458557129, 1.125011920928955, 1.2495805025100708, 1.3741490840911865, 1.4987176656723022, 1.623286247253418, 1.7478547096252441, 1.8724234104156494, 1.9969918727874756, 2.121560573577881, 2.246129035949707, 2.370697498321533, 2.4952659606933594, 2.6198346614837646, 2.744403123855591, 2.868971824645996, 2.9935402870178223, 3.1181087493896484, 3.2426774501800537, 3.367246150970459]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 1.0, 3.0, 14.0, 19.0, 28.0, 35.0, 86.0, 138.0, 207.0, 346.0, 564.0, 995.0, 1727.0, 2757.0, 4694.0, 8011.0, 13618.0, 23881.0, 41072.0, 70457.0, 119475.0, 201475.0, 324154.0, 477159.0, 611759.0, 649123.0, 565913.0, 415479.0, 268210.0, 163312.0, 96446.0, 55846.0, 32204.0, 18612.0, 11061.0, 6294.0, 3723.0, 2154.0, 1275.0, 757.0, 492.0, 291.0, 165.0, 94.0, 58.0, 34.0, 28.0, 16.0, 16.0, 11.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.958984375, -2.86737060546875, -2.7757568359375, -2.68414306640625, -2.592529296875, -2.50091552734375, -2.4093017578125, -2.31768798828125, -2.22607421875, -2.13446044921875, -2.0428466796875, -1.95123291015625, -1.859619140625, -1.76800537109375, -1.6763916015625, -1.58477783203125, -1.4931640625, -1.40155029296875, -1.3099365234375, -1.21832275390625, -1.126708984375, -1.03509521484375, -0.9434814453125, -0.85186767578125, -0.76025390625, -0.66864013671875, -0.5770263671875, -0.48541259765625, -0.393798828125, -0.30218505859375, -0.2105712890625, -0.11895751953125, -0.02734375, 0.06427001953125, 0.1558837890625, 0.24749755859375, 0.339111328125, 0.43072509765625, 0.5223388671875, 0.61395263671875, 0.70556640625, 0.79718017578125, 0.8887939453125, 0.98040771484375, 1.072021484375, 1.16363525390625, 1.2552490234375, 1.34686279296875, 1.4384765625, 1.53009033203125, 1.6217041015625, 1.71331787109375, 1.804931640625, 1.89654541015625, 1.9881591796875, 2.07977294921875, 2.17138671875, 2.26300048828125, 2.3546142578125, 2.44622802734375, 2.537841796875, 2.62945556640625, 2.7210693359375, 2.81268310546875, 2.904296875]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 11.0, 4.0, 7.0, 7.0, 11.0, 17.0, 11.0, 14.0, 13.0, 30.0, 23.0, 33.0, 36.0, 28.0, 44.0, 37.0, 39.0, 42.0, 43.0, 54.0, 45.0, 45.0, 36.0, 37.0, 46.0, 41.0, 34.0, 33.0, 25.0, 28.0, 37.0, 17.0, 10.0, 8.0, 15.0, 10.0, 11.0, 6.0, 5.0, 4.0, 3.0, 4.0, 4.0, 0.0, 1.0, 3.0], "bins": [-4.0078125, -3.90252685546875, -3.7972412109375, -3.69195556640625, -3.586669921875, -3.48138427734375, -3.3760986328125, -3.27081298828125, -3.16552734375, -3.06024169921875, -2.9549560546875, -2.84967041015625, -2.744384765625, -2.63909912109375, -2.5338134765625, -2.42852783203125, -2.3232421875, -2.21795654296875, -2.1126708984375, -2.00738525390625, -1.902099609375, -1.79681396484375, -1.6915283203125, -1.58624267578125, -1.48095703125, -1.37567138671875, -1.2703857421875, -1.16510009765625, -1.059814453125, -0.95452880859375, -0.8492431640625, -0.74395751953125, -0.638671875, -0.53338623046875, -0.4281005859375, -0.32281494140625, -0.217529296875, -0.11224365234375, -0.0069580078125, 0.09832763671875, 0.20361328125, 0.30889892578125, 0.4141845703125, 0.51947021484375, 0.624755859375, 0.73004150390625, 0.8353271484375, 0.94061279296875, 1.0458984375, 1.15118408203125, 1.2564697265625, 1.36175537109375, 1.467041015625, 1.57232666015625, 1.6776123046875, 1.78289794921875, 1.88818359375, 1.99346923828125, 2.0987548828125, 2.20404052734375, 2.309326171875, 2.41461181640625, 2.5198974609375, 2.62518310546875, 2.73046875]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 3.0, 6.0, 14.0, 19.0, 28.0, 29.0, 48.0, 78.0, 133.0, 215.0, 367.0, 597.0, 1021.0, 1925.0, 3350.0, 6204.0, 11542.0, 21456.0, 38976.0, 71030.0, 127430.0, 218537.0, 353668.0, 521909.0, 655748.0, 667768.0, 551932.0, 384505.0, 239892.0, 140036.0, 79532.0, 43608.0, 23593.0, 13023.0, 7211.0, 3892.0, 2127.0, 1182.0, 712.0, 401.0, 223.0, 123.0, 72.0, 41.0, 25.0, 20.0, 15.0, 10.0, 4.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.640625, -3.530609130859375, -3.42059326171875, -3.310577392578125, -3.2005615234375, -3.090545654296875, -2.98052978515625, -2.870513916015625, -2.760498046875, -2.650482177734375, -2.54046630859375, -2.430450439453125, -2.3204345703125, -2.210418701171875, -2.10040283203125, -1.990386962890625, -1.88037109375, -1.770355224609375, -1.66033935546875, -1.550323486328125, -1.4403076171875, -1.330291748046875, -1.22027587890625, -1.110260009765625, -1.000244140625, -0.890228271484375, -0.78021240234375, -0.670196533203125, -0.5601806640625, -0.450164794921875, -0.34014892578125, -0.230133056640625, -0.1201171875, -0.010101318359375, 0.09991455078125, 0.209930419921875, 0.3199462890625, 0.429962158203125, 0.53997802734375, 0.649993896484375, 0.760009765625, 0.870025634765625, 0.98004150390625, 1.090057373046875, 1.2000732421875, 1.310089111328125, 1.42010498046875, 1.530120849609375, 1.64013671875, 1.750152587890625, 1.86016845703125, 1.970184326171875, 2.0802001953125, 2.190216064453125, 2.30023193359375, 2.410247802734375, 2.520263671875, 2.630279541015625, 2.74029541015625, 2.850311279296875, 2.9603271484375, 3.070343017578125, 3.18035888671875, 3.290374755859375, 3.400390625]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 7.0, 4.0, 3.0, 3.0, 6.0, 17.0, 24.0, 19.0, 34.0, 49.0, 44.0, 62.0, 79.0, 87.0, 107.0, 115.0, 168.0, 165.0, 184.0, 193.0, 228.0, 222.0, 231.0, 236.0, 228.0, 227.0, 204.0, 182.0, 172.0, 154.0, 127.0, 98.0, 86.0, 74.0, 57.0, 49.0, 37.0, 25.0, 24.0, 12.0, 11.0, 12.0, 9.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.4609375, -1.4179840087890625, -1.375030517578125, -1.3320770263671875, -1.28912353515625, -1.2461700439453125, -1.203216552734375, -1.1602630615234375, -1.1173095703125, -1.0743560791015625, -1.031402587890625, -0.9884490966796875, -0.94549560546875, -0.9025421142578125, -0.859588623046875, -0.8166351318359375, -0.773681640625, -0.7307281494140625, -0.687774658203125, -0.6448211669921875, -0.60186767578125, -0.5589141845703125, -0.515960693359375, -0.4730072021484375, -0.4300537109375, -0.3871002197265625, -0.344146728515625, -0.3011932373046875, -0.25823974609375, -0.2152862548828125, -0.172332763671875, -0.1293792724609375, -0.08642578125, -0.0434722900390625, -0.000518798828125, 0.0424346923828125, 0.08538818359375, 0.1283416748046875, 0.171295166015625, 0.2142486572265625, 0.2572021484375, 0.3001556396484375, 0.343109130859375, 0.3860626220703125, 0.42901611328125, 0.4719696044921875, 0.514923095703125, 0.5578765869140625, 0.600830078125, 0.6437835693359375, 0.686737060546875, 0.7296905517578125, 0.77264404296875, 0.8155975341796875, 0.858551025390625, 0.9015045166015625, 0.9444580078125, 0.9874114990234375, 1.030364990234375, 1.0733184814453125, 1.11627197265625, 1.1592254638671875, 1.202178955078125, 1.2451324462890625, 1.2880859375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 8.0, 11.0, 8.0, 11.0, 16.0, 21.0, 23.0, 20.0, 26.0, 32.0, 25.0, 52.0, 37.0, 43.0, 43.0, 47.0, 44.0, 42.0, 53.0, 46.0, 38.0, 51.0, 36.0, 37.0, 35.0, 35.0, 31.0, 20.0, 25.0, 12.0, 9.0, 16.0, 5.0, 15.0, 6.0, 7.0, 7.0, 4.0, 3.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.4774107933044434, -3.358022451400757, -3.2386341094970703, -3.119245767593384, -2.9998574256896973, -2.8804690837860107, -2.761080741882324, -2.6416923999786377, -2.522304058074951, -2.4029157161712646, -2.283527374267578, -2.1641390323638916, -2.044750690460205, -1.9253623485565186, -1.805974006652832, -1.6865856647491455, -1.5671974420547485, -1.447809100151062, -1.3284207582473755, -1.209032416343689, -1.0896440744400024, -0.9702557921409607, -0.8508674502372742, -0.7314791083335876, -0.6120907664299011, -0.4927024245262146, -0.3733140826225281, -0.25392577052116394, -0.13453742861747742, -0.015149116516113281, 0.10423922538757324, 0.22362756729125977, 0.3430159091949463, 0.4624042510986328, 0.5817925930023193, 0.7011809349060059, 0.8205692768096924, 0.9399575591087341, 1.0593459606170654, 1.178734302520752, 1.2981226444244385, 1.417510986328125, 1.5368993282318115, 1.656287670135498, 1.7756760120391846, 1.895064353942871, 2.0144526958465576, 2.133841037750244, 2.2532291412353516, 2.372617483139038, 2.4920058250427246, 2.611394166946411, 2.7307825088500977, 2.850170850753784, 2.9695591926574707, 3.0889475345611572, 3.2083358764648438, 3.3277242183685303, 3.447112560272217, 3.5665009021759033, 3.68588924407959, 3.8052775859832764, 3.924665927886963, 4.04405403137207, 4.163442611694336]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 9.0, 5.0, 4.0, 14.0, 8.0, 7.0, 11.0, 14.0, 17.0, 23.0, 18.0, 24.0, 24.0, 31.0, 30.0, 28.0, 33.0, 44.0, 39.0, 36.0, 36.0, 36.0, 39.0, 40.0, 35.0, 33.0, 31.0, 33.0, 37.0, 38.0, 30.0, 24.0, 25.0, 25.0, 17.0, 15.0, 14.0, 13.0, 9.0, 9.0, 7.0, 12.0, 10.0, 3.0, 6.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0], "bins": [-3.250214099884033, -3.1495373249053955, -3.048860788345337, -2.948184013366699, -2.8475072383880615, -2.746830463409424, -2.6461539268493652, -2.5454771518707275, -2.44480037689209, -2.344123601913452, -2.2434470653533936, -2.142770290374756, -2.042093515396118, -1.94141685962677, -1.8407402038574219, -1.7400634288787842, -1.6393868923187256, -1.5387102365493774, -1.4380334615707397, -1.3373568058013916, -1.236680030822754, -1.1360033750534058, -1.0353267192840576, -0.9346500039100647, -0.8339732885360718, -0.7332965731620789, -0.6326198577880859, -0.5319432020187378, -0.4312664866447449, -0.33058977127075195, -0.2299131155014038, -0.1292364001274109, -0.02855992317199707, 0.07211677730083466, 0.17279347777366638, 0.2734701633453369, 0.37414687871932983, 0.47482359409332275, 0.5755002498626709, 0.6761769652366638, 0.7768536806106567, 0.8775303959846497, 0.9782071113586426, 1.0788837671279907, 1.1795604228973389, 1.2802371978759766, 1.3809138536453247, 1.4815905094146729, 1.5822672843933105, 1.6829439401626587, 1.7836207151412964, 1.8842973709106445, 1.9849741458892822, 2.08565092086792, 2.1863274574279785, 2.287004232406616, 2.387681007385254, 2.4883577823638916, 2.58903431892395, 2.689711093902588, 2.7903878688812256, 2.8910646438598633, 2.991741180419922, 3.0924179553985596, 3.193094491958618]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 6.0, 4.0, 3.0, 21.0, 21.0, 36.0, 71.0, 88.0, 148.0, 227.0, 347.0, 556.0, 996.0, 1485.0, 2399.0, 3713.0, 5850.0, 8791.0, 12987.0, 18740.0, 26211.0, 35760.0, 47088.0, 58943.0, 71792.0, 82753.0, 90206.0, 93339.0, 91098.0, 83967.0, 73343.0, 61742.0, 49505.0, 37690.0, 28176.0, 19734.0, 13814.0, 9520.0, 6233.0, 4152.0, 2599.0, 1693.0, 1001.0, 649.0, 426.0, 250.0, 152.0, 96.0, 51.0, 41.0, 21.0, 18.0, 7.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3076171875, -1.263427734375, -1.21923828125, -1.175048828125, -1.130859375, -1.086669921875, -1.04248046875, -0.998291015625, -0.9541015625, -0.909912109375, -0.86572265625, -0.821533203125, -0.77734375, -0.733154296875, -0.68896484375, -0.644775390625, -0.6005859375, -0.556396484375, -0.51220703125, -0.468017578125, -0.423828125, -0.379638671875, -0.33544921875, -0.291259765625, -0.2470703125, -0.202880859375, -0.15869140625, -0.114501953125, -0.0703125, -0.026123046875, 0.01806640625, 0.062255859375, 0.1064453125, 0.150634765625, 0.19482421875, 0.239013671875, 0.283203125, 0.327392578125, 0.37158203125, 0.415771484375, 0.4599609375, 0.504150390625, 0.54833984375, 0.592529296875, 0.63671875, 0.680908203125, 0.72509765625, 0.769287109375, 0.8134765625, 0.857666015625, 0.90185546875, 0.946044921875, 0.990234375, 1.034423828125, 1.07861328125, 1.122802734375, 1.1669921875, 1.211181640625, 1.25537109375, 1.299560546875, 1.34375, 1.387939453125, 1.43212890625, 1.476318359375, 1.5205078125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 8.0, 9.0, 5.0, 8.0, 7.0, 8.0, 9.0, 11.0, 18.0, 15.0, 19.0, 25.0, 28.0, 24.0, 37.0, 26.0, 44.0, 44.0, 32.0, 33.0, 42.0, 39.0, 34.0, 38.0, 38.0, 37.0, 36.0, 28.0, 33.0, 32.0, 39.0, 30.0, 22.0, 22.0, 21.0, 9.0, 16.0, 14.0, 15.0, 8.0, 15.0, 7.0, 1.0, 5.0, 3.0, 3.0, 3.0, 3.0, 1.0, 3.0, 0.0, 3.0, 3.0], "bins": [-3.095703125, -3.003814697265625, -2.91192626953125, -2.820037841796875, -2.7281494140625, -2.636260986328125, -2.54437255859375, -2.452484130859375, -2.360595703125, -2.268707275390625, -2.17681884765625, -2.084930419921875, -1.9930419921875, -1.901153564453125, -1.80926513671875, -1.717376708984375, -1.62548828125, -1.533599853515625, -1.44171142578125, -1.349822998046875, -1.2579345703125, -1.166046142578125, -1.07415771484375, -0.982269287109375, -0.890380859375, -0.798492431640625, -0.70660400390625, -0.614715576171875, -0.5228271484375, -0.430938720703125, -0.33905029296875, -0.247161865234375, -0.1552734375, -0.063385009765625, 0.02850341796875, 0.120391845703125, 0.2122802734375, 0.304168701171875, 0.39605712890625, 0.487945556640625, 0.579833984375, 0.671722412109375, 0.76361083984375, 0.855499267578125, 0.9473876953125, 1.039276123046875, 1.13116455078125, 1.223052978515625, 1.31494140625, 1.406829833984375, 1.49871826171875, 1.590606689453125, 1.6824951171875, 1.774383544921875, 1.86627197265625, 1.958160400390625, 2.050048828125, 2.141937255859375, 2.23382568359375, 2.325714111328125, 2.4176025390625, 2.509490966796875, 2.60137939453125, 2.693267822265625, 2.78515625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 13.0, 13.0, 8.0, 24.0, 39.0, 62.0, 74.0, 148.0, 233.0, 381.0, 664.0, 1187.0, 2204.0, 4102.0, 7663.0, 13709.0, 25383.0, 84230.0, 789362.0, 65993.0, 24344.0, 13024.0, 7103.0, 3880.0, 2040.0, 1125.0, 629.0, 388.0, 217.0, 117.0, 75.0, 39.0, 31.0, 22.0, 12.0, 11.0, 4.0, 7.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.6953125, -5.501953125, -5.30859375, -5.115234375, -4.921875, -4.728515625, -4.53515625, -4.341796875, -4.1484375, -3.955078125, -3.76171875, -3.568359375, -3.375, -3.181640625, -2.98828125, -2.794921875, -2.6015625, -2.408203125, -2.21484375, -2.021484375, -1.828125, -1.634765625, -1.44140625, -1.248046875, -1.0546875, -0.861328125, -0.66796875, -0.474609375, -0.28125, -0.087890625, 0.10546875, 0.298828125, 0.4921875, 0.685546875, 0.87890625, 1.072265625, 1.265625, 1.458984375, 1.65234375, 1.845703125, 2.0390625, 2.232421875, 2.42578125, 2.619140625, 2.8125, 3.005859375, 3.19921875, 3.392578125, 3.5859375, 3.779296875, 3.97265625, 4.166015625, 4.359375, 4.552734375, 4.74609375, 4.939453125, 5.1328125, 5.326171875, 5.51953125, 5.712890625, 5.90625, 6.099609375, 6.29296875, 6.486328125, 6.6796875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 4.0, 3.0, 4.0, 1.0, 3.0, 6.0, 10.0, 4.0, 16.0, 7.0, 11.0, 16.0, 15.0, 26.0, 21.0, 21.0, 22.0, 24.0, 39.0, 24.0, 34.0, 52.0, 45.0, 47.0, 52.0, 36.0, 42.0, 52.0, 39.0, 28.0, 32.0, 36.0, 33.0, 24.0, 24.0, 25.0, 20.0, 17.0, 16.0, 19.0, 7.0, 9.0, 15.0, 11.0, 4.0, 5.0, 4.0, 5.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.8046875, -3.682373046875, -3.56005859375, -3.437744140625, -3.3154296875, -3.193115234375, -3.07080078125, -2.948486328125, -2.826171875, -2.703857421875, -2.58154296875, -2.459228515625, -2.3369140625, -2.214599609375, -2.09228515625, -1.969970703125, -1.84765625, -1.725341796875, -1.60302734375, -1.480712890625, -1.3583984375, -1.236083984375, -1.11376953125, -0.991455078125, -0.869140625, -0.746826171875, -0.62451171875, -0.502197265625, -0.3798828125, -0.257568359375, -0.13525390625, -0.012939453125, 0.109375, 0.231689453125, 0.35400390625, 0.476318359375, 0.5986328125, 0.720947265625, 0.84326171875, 0.965576171875, 1.087890625, 1.210205078125, 1.33251953125, 1.454833984375, 1.5771484375, 1.699462890625, 1.82177734375, 1.944091796875, 2.06640625, 2.188720703125, 2.31103515625, 2.433349609375, 2.5556640625, 2.677978515625, 2.80029296875, 2.922607421875, 3.044921875, 3.167236328125, 3.28955078125, 3.411865234375, 3.5341796875, 3.656494140625, 3.77880859375, 3.901123046875, 4.0234375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 8.0, 6.0, 4.0, 7.0, 12.0, 20.0, 24.0, 31.0, 43.0, 56.0, 97.0, 153.0, 203.0, 383.0, 571.0, 1008.0, 1764.0, 3151.0, 5674.0, 10004.0, 18316.0, 38807.0, 340058.0, 531710.0, 49853.0, 20641.0, 11099.0, 6274.0, 3533.0, 2052.0, 1142.0, 712.0, 380.0, 265.0, 139.0, 113.0, 76.0, 59.0, 28.0, 22.0, 24.0, 11.0, 14.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.14453125, -1.10772705078125, -1.0709228515625, -1.03411865234375, -0.997314453125, -0.96051025390625, -0.9237060546875, -0.88690185546875, -0.85009765625, -0.81329345703125, -0.7764892578125, -0.73968505859375, -0.702880859375, -0.66607666015625, -0.6292724609375, -0.59246826171875, -0.5556640625, -0.51885986328125, -0.4820556640625, -0.44525146484375, -0.408447265625, -0.37164306640625, -0.3348388671875, -0.29803466796875, -0.26123046875, -0.22442626953125, -0.1876220703125, -0.15081787109375, -0.114013671875, -0.07720947265625, -0.0404052734375, -0.00360107421875, 0.033203125, 0.07000732421875, 0.1068115234375, 0.14361572265625, 0.180419921875, 0.21722412109375, 0.2540283203125, 0.29083251953125, 0.32763671875, 0.36444091796875, 0.4012451171875, 0.43804931640625, 0.474853515625, 0.51165771484375, 0.5484619140625, 0.58526611328125, 0.6220703125, 0.65887451171875, 0.6956787109375, 0.73248291015625, 0.769287109375, 0.80609130859375, 0.8428955078125, 0.87969970703125, 0.91650390625, 0.95330810546875, 0.9901123046875, 1.02691650390625, 1.063720703125, 1.10052490234375, 1.1373291015625, 1.17413330078125, 1.2109375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 9.0, 10.0, 14.0, 15.0, 30.0, 28.0, 57.0, 72.0, 69.0, 86.0, 84.0, 96.0, 91.0, 71.0, 61.0, 51.0, 45.0, 26.0, 24.0, 29.0, 13.0, 7.0, 3.0, 6.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000446319580078125, -0.0004305988550186157, -0.00041487812995910645, -0.00039915740489959717, -0.0003834366798400879, -0.0003677159547805786, -0.00035199522972106934, -0.00033627450466156006, -0.0003205537796020508, -0.0003048330545425415, -0.0002891123294830322, -0.00027339160442352295, -0.00025767087936401367, -0.0002419501543045044, -0.00022622942924499512, -0.00021050870418548584, -0.00019478797912597656, -0.00017906725406646729, -0.000163346529006958, -0.00014762580394744873, -0.00013190507888793945, -0.00011618435382843018, -0.0001004636287689209, -8.474290370941162e-05, -6.902217864990234e-05, -5.3301453590393066e-05, -3.758072853088379e-05, -2.1860003471374512e-05, -6.139278411865234e-06, 9.581446647644043e-06, 2.530217170715332e-05, 4.10228967666626e-05, 5.6743621826171875e-05, 7.246434688568115e-05, 8.818507194519043e-05, 0.00010390579700469971, 0.00011962652206420898, 0.00013534724712371826, 0.00015106797218322754, 0.00016678869724273682, 0.0001825094223022461, 0.00019823014736175537, 0.00021395087242126465, 0.00022967159748077393, 0.0002453923225402832, 0.0002611130475997925, 0.00027683377265930176, 0.00029255449771881104, 0.0003082752227783203, 0.0003239959478378296, 0.00033971667289733887, 0.00035543739795684814, 0.0003711581230163574, 0.0003868788480758667, 0.000402599573135376, 0.00041832029819488525, 0.00043404102325439453, 0.0004497617483139038, 0.0004654824733734131, 0.00048120319843292236, 0.0004969239234924316, 0.0005126446485519409, 0.0005283653736114502, 0.0005440860986709595, 0.0005598068237304688]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 8.0, 9.0, 13.0, 24.0, 27.0, 34.0, 52.0, 86.0, 103.0, 173.0, 234.0, 323.0, 460.0, 705.0, 1006.0, 1348.0, 2055.0, 3015.0, 4725.0, 7026.0, 10811.0, 16528.0, 24956.0, 38381.0, 57806.0, 84677.0, 116189.0, 140697.0, 142915.0, 121232.0, 90354.0, 62358.0, 41414.0, 27011.0, 17228.0, 11538.0, 7576.0, 5020.0, 3255.0, 2241.0, 1522.0, 1069.0, 701.0, 543.0, 333.0, 232.0, 158.0, 117.0, 94.0, 55.0, 31.0, 31.0, 17.0, 13.0, 12.0, 11.0, 6.0, 5.0, 1.0, 1.0, 4.0], "bins": [-0.328125, -0.3175697326660156, -0.30701446533203125, -0.2964591979980469, -0.2859039306640625, -0.2753486633300781, -0.26479339599609375, -0.2542381286621094, -0.243682861328125, -0.23312759399414062, -0.22257232666015625, -0.21201705932617188, -0.2014617919921875, -0.19090652465820312, -0.18035125732421875, -0.16979598999023438, -0.15924072265625, -0.14868545532226562, -0.13813018798828125, -0.12757492065429688, -0.1170196533203125, -0.10646438598632812, -0.09590911865234375, -0.08535385131835938, -0.074798583984375, -0.06424331665039062, -0.05368804931640625, -0.043132781982421875, -0.0325775146484375, -0.022022247314453125, -0.01146697998046875, -0.000911712646484375, 0.0096435546875, 0.020198822021484375, 0.03075408935546875, 0.041309356689453125, 0.0518646240234375, 0.062419891357421875, 0.07297515869140625, 0.08353042602539062, 0.094085693359375, 0.10464096069335938, 0.11519622802734375, 0.12575149536132812, 0.1363067626953125, 0.14686203002929688, 0.15741729736328125, 0.16797256469726562, 0.17852783203125, 0.18908309936523438, 0.19963836669921875, 0.21019363403320312, 0.2207489013671875, 0.23130416870117188, 0.24185943603515625, 0.2524147033691406, 0.262969970703125, 0.2735252380371094, 0.28408050537109375, 0.2946357727050781, 0.3051910400390625, 0.3157463073730469, 0.32630157470703125, 0.3368568420410156, 0.347412109375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 7.0, 3.0, 4.0, 8.0, 9.0, 8.0, 9.0, 16.0, 20.0, 18.0, 24.0, 27.0, 38.0, 32.0, 51.0, 47.0, 51.0, 39.0, 50.0, 46.0, 57.0, 54.0, 44.0, 37.0, 42.0, 39.0, 40.0, 32.0, 29.0, 24.0, 15.0, 20.0, 8.0, 8.0, 13.0, 2.0, 5.0, 8.0, 4.0, 5.0, 4.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1434326171875, -0.138946533203125, -0.13446044921875, -0.129974365234375, -0.12548828125, -0.121002197265625, -0.11651611328125, -0.112030029296875, -0.1075439453125, -0.103057861328125, -0.09857177734375, -0.094085693359375, -0.089599609375, -0.085113525390625, -0.08062744140625, -0.076141357421875, -0.0716552734375, -0.067169189453125, -0.06268310546875, -0.058197021484375, -0.0537109375, -0.049224853515625, -0.04473876953125, -0.040252685546875, -0.0357666015625, -0.031280517578125, -0.02679443359375, -0.022308349609375, -0.017822265625, -0.013336181640625, -0.00885009765625, -0.004364013671875, 0.0001220703125, 0.004608154296875, 0.00909423828125, 0.013580322265625, 0.01806640625, 0.022552490234375, 0.02703857421875, 0.031524658203125, 0.0360107421875, 0.040496826171875, 0.04498291015625, 0.049468994140625, 0.053955078125, 0.058441162109375, 0.06292724609375, 0.067413330078125, 0.0718994140625, 0.076385498046875, 0.08087158203125, 0.085357666015625, 0.08984375, 0.094329833984375, 0.09881591796875, 0.103302001953125, 0.1077880859375, 0.112274169921875, 0.11676025390625, 0.121246337890625, 0.125732421875, 0.130218505859375, 0.13470458984375, 0.139190673828125, 0.1436767578125]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 8.0, 5.0, 6.0, 9.0, 12.0, 16.0, 10.0, 10.0, 23.0, 18.0, 30.0, 41.0, 41.0, 34.0, 47.0, 47.0, 44.0, 32.0, 47.0, 48.0, 53.0, 40.0, 48.0, 34.0, 49.0, 36.0, 42.0, 30.0, 32.0, 16.0, 16.0, 15.0, 14.0, 14.0, 16.0, 6.0, 7.0, 8.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6977133750915527, -2.592954397201538, -2.4881954193115234, -2.3834362030029297, -2.278677225112915, -2.1739182472229004, -2.0691592693328857, -1.964400291442871, -1.859641194343567, -1.7548822164535522, -1.650123119354248, -1.5453641414642334, -1.4406051635742188, -1.3358460664749146, -1.2310870885849, -1.1263279914855957, -1.021569013595581, -0.9168099761009216, -0.8120509386062622, -0.7072919607162476, -0.6025329232215881, -0.4977738857269287, -0.39301490783691406, -0.28825587034225464, -0.18349683284759521, -0.07873781025409698, 0.026021212339401245, 0.13078022003173828, 0.2355392575263977, 0.34029829502105713, 0.4450572729110718, 0.5498163104057312, 0.6545753479003906, 0.75933438539505, 0.8640934228897095, 0.9688524007797241, 1.0736114978790283, 1.178370475769043, 1.2831294536590576, 1.3878884315490723, 1.4926475286483765, 1.5974065065383911, 1.7021656036376953, 1.80692458152771, 1.9116835594177246, 2.0164427757263184, 2.121201515197754, 2.2259607315063477, 2.3307197093963623, 2.435478687286377, 2.5402376651763916, 2.6449966430664062, 2.749755859375, 2.8545148372650146, 2.9592738151550293, 3.064032793045044, 3.1687917709350586, 3.2735507488250732, 3.378309726715088, 3.4830689430236816, 3.5878279209136963, 3.692586898803711, 3.7973458766937256, 3.9021048545837402, 4.006864070892334]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 3.0, 2.0, 6.0, 6.0, 15.0, 11.0, 11.0, 17.0, 14.0, 28.0, 20.0, 21.0, 28.0, 35.0, 31.0, 31.0, 41.0, 45.0, 42.0, 32.0, 43.0, 46.0, 37.0, 37.0, 34.0, 44.0, 34.0, 50.0, 36.0, 24.0, 26.0, 19.0, 24.0, 17.0, 16.0, 14.0, 11.0, 14.0, 7.0, 11.0, 2.0, 5.0, 3.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.018164873123169, -2.924908399581909, -2.8316516876220703, -2.7383952140808105, -2.645138740539551, -2.551882266998291, -2.4586257934570312, -2.3653690814971924, -2.2721126079559326, -2.178856134414673, -2.085599422454834, -1.9923429489135742, -1.8990864753723145, -1.8058300018310547, -1.7125734090805054, -1.619316816329956, -1.5260603427886963, -1.4328038692474365, -1.3395472764968872, -1.246290683746338, -1.1530342102050781, -1.0597777366638184, -0.966521143913269, -0.8732646107673645, -0.78000807762146, -0.6867515444755554, -0.5934950113296509, -0.5002384781837463, -0.4069819450378418, -0.31372541189193726, -0.22046887874603271, -0.12721234560012817, -0.03395557403564453, 0.05930095911026001, 0.15255749225616455, 0.2458140254020691, 0.33907055854797363, 0.4323270916938782, 0.5255836248397827, 0.6188401579856873, 0.7120966911315918, 0.8053532242774963, 0.8986097574234009, 0.9918662905693054, 1.08512282371521, 1.1783792972564697, 1.271635890007019, 1.3648924827575684, 1.4581489562988281, 1.551405429840088, 1.6446620225906372, 1.7379186153411865, 1.8311750888824463, 1.924431562423706, 2.017688274383545, 2.1109447479248047, 2.2042012214660645, 2.297457695007324, 2.390714168548584, 2.483970880508423, 2.5772273540496826, 2.6704838275909424, 2.7637405395507812, 2.856997013092041, 2.950253486633301]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 7.0, 13.0, 21.0, 28.0, 49.0, 91.0, 166.0, 254.0, 413.0, 663.0, 1164.0, 1878.0, 3325.0, 5722.0, 9408.0, 15568.0, 25194.0, 39705.0, 59550.0, 83580.0, 107728.0, 125075.0, 130737.0, 120984.0, 100506.0, 75447.0, 52359.0, 34426.0, 21673.0, 13240.0, 7957.0, 4682.0, 2723.0, 1682.0, 1024.0, 569.0, 363.0, 222.0, 159.0, 72.0, 42.0, 37.0, 18.0, 13.0, 11.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.05078125, -1.983184814453125, -1.91558837890625, -1.847991943359375, -1.7803955078125, -1.712799072265625, -1.64520263671875, -1.577606201171875, -1.510009765625, -1.442413330078125, -1.37481689453125, -1.307220458984375, -1.2396240234375, -1.172027587890625, -1.10443115234375, -1.036834716796875, -0.96923828125, -0.901641845703125, -0.83404541015625, -0.766448974609375, -0.6988525390625, -0.631256103515625, -0.56365966796875, -0.496063232421875, -0.428466796875, -0.360870361328125, -0.29327392578125, -0.225677490234375, -0.1580810546875, -0.090484619140625, -0.02288818359375, 0.044708251953125, 0.1123046875, 0.179901123046875, 0.24749755859375, 0.315093994140625, 0.3826904296875, 0.450286865234375, 0.51788330078125, 0.585479736328125, 0.653076171875, 0.720672607421875, 0.78826904296875, 0.855865478515625, 0.9234619140625, 0.991058349609375, 1.05865478515625, 1.126251220703125, 1.19384765625, 1.261444091796875, 1.32904052734375, 1.396636962890625, 1.4642333984375, 1.531829833984375, 1.59942626953125, 1.667022705078125, 1.734619140625, 1.802215576171875, 1.86981201171875, 1.937408447265625, 2.0050048828125, 2.072601318359375, 2.14019775390625, 2.207794189453125, 2.275390625]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 4.0, 8.0, 6.0, 6.0, 11.0, 13.0, 28.0, 17.0, 19.0, 21.0, 20.0, 28.0, 28.0, 33.0, 33.0, 36.0, 37.0, 35.0, 28.0, 54.0, 42.0, 41.0, 39.0, 38.0, 42.0, 42.0, 38.0, 33.0, 30.0, 27.0, 30.0, 18.0, 15.0, 12.0, 24.0, 12.0, 7.0, 10.0, 14.0, 7.0, 3.0, 2.0, 6.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.71875, -2.63006591796875, -2.5413818359375, -2.45269775390625, -2.364013671875, -2.27532958984375, -2.1866455078125, -2.09796142578125, -2.00927734375, -1.92059326171875, -1.8319091796875, -1.74322509765625, -1.654541015625, -1.56585693359375, -1.4771728515625, -1.38848876953125, -1.2998046875, -1.21112060546875, -1.1224365234375, -1.03375244140625, -0.945068359375, -0.85638427734375, -0.7677001953125, -0.67901611328125, -0.59033203125, -0.50164794921875, -0.4129638671875, -0.32427978515625, -0.235595703125, -0.14691162109375, -0.0582275390625, 0.03045654296875, 0.119140625, 0.20782470703125, 0.2965087890625, 0.38519287109375, 0.473876953125, 0.56256103515625, 0.6512451171875, 0.73992919921875, 0.82861328125, 0.91729736328125, 1.0059814453125, 1.09466552734375, 1.183349609375, 1.27203369140625, 1.3607177734375, 1.44940185546875, 1.5380859375, 1.62677001953125, 1.7154541015625, 1.80413818359375, 1.892822265625, 1.98150634765625, 2.0701904296875, 2.15887451171875, 2.24755859375, 2.33624267578125, 2.4249267578125, 2.51361083984375, 2.602294921875, 2.69097900390625, 2.7796630859375, 2.86834716796875, 2.95703125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 1.0, 3.0, 7.0, 13.0, 17.0, 22.0, 37.0, 48.0, 87.0, 136.0, 185.0, 300.0, 513.0, 810.0, 1286.0, 2147.0, 3473.0, 5592.0, 9229.0, 15007.0, 23915.0, 37529.0, 56579.0, 80312.0, 104797.0, 125658.0, 131731.0, 123305.0, 102360.0, 76339.0, 53479.0, 35094.0, 22396.0, 13924.0, 8537.0, 5201.0, 3308.0, 2050.0, 1163.0, 727.0, 481.0, 263.0, 163.0, 114.0, 85.0, 50.0, 33.0, 20.0, 12.0, 11.0, 9.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.341796875, -2.26483154296875, -2.1878662109375, -2.11090087890625, -2.033935546875, -1.95697021484375, -1.8800048828125, -1.80303955078125, -1.72607421875, -1.64910888671875, -1.5721435546875, -1.49517822265625, -1.418212890625, -1.34124755859375, -1.2642822265625, -1.18731689453125, -1.1103515625, -1.03338623046875, -0.9564208984375, -0.87945556640625, -0.802490234375, -0.72552490234375, -0.6485595703125, -0.57159423828125, -0.49462890625, -0.41766357421875, -0.3406982421875, -0.26373291015625, -0.186767578125, -0.10980224609375, -0.0328369140625, 0.04412841796875, 0.12109375, 0.19805908203125, 0.2750244140625, 0.35198974609375, 0.428955078125, 0.50592041015625, 0.5828857421875, 0.65985107421875, 0.73681640625, 0.81378173828125, 0.8907470703125, 0.96771240234375, 1.044677734375, 1.12164306640625, 1.1986083984375, 1.27557373046875, 1.3525390625, 1.42950439453125, 1.5064697265625, 1.58343505859375, 1.660400390625, 1.73736572265625, 1.8143310546875, 1.89129638671875, 1.96826171875, 2.04522705078125, 2.1221923828125, 2.19915771484375, 2.276123046875, 2.35308837890625, 2.4300537109375, 2.50701904296875, 2.583984375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 7.0, 7.0, 6.0, 7.0, 16.0, 11.0, 12.0, 18.0, 15.0, 24.0, 25.0, 23.0, 31.0, 24.0, 29.0, 34.0, 36.0, 36.0, 45.0, 25.0, 44.0, 41.0, 35.0, 37.0, 44.0, 37.0, 30.0, 36.0, 27.0, 38.0, 28.0, 32.0, 19.0, 16.0, 18.0, 23.0, 8.0, 14.0, 6.0, 6.0, 10.0, 6.0, 4.0, 10.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.76171875, -1.7088165283203125, -1.655914306640625, -1.6030120849609375, -1.55010986328125, -1.4972076416015625, -1.444305419921875, -1.3914031982421875, -1.3385009765625, -1.2855987548828125, -1.232696533203125, -1.1797943115234375, -1.12689208984375, -1.0739898681640625, -1.021087646484375, -0.9681854248046875, -0.915283203125, -0.8623809814453125, -0.809478759765625, -0.7565765380859375, -0.70367431640625, -0.6507720947265625, -0.597869873046875, -0.5449676513671875, -0.4920654296875, -0.4391632080078125, -0.386260986328125, -0.3333587646484375, -0.28045654296875, -0.2275543212890625, -0.174652099609375, -0.1217498779296875, -0.06884765625, -0.0159454345703125, 0.036956787109375, 0.0898590087890625, 0.14276123046875, 0.1956634521484375, 0.248565673828125, 0.3014678955078125, 0.3543701171875, 0.4072723388671875, 0.460174560546875, 0.5130767822265625, 0.56597900390625, 0.6188812255859375, 0.671783447265625, 0.7246856689453125, 0.777587890625, 0.8304901123046875, 0.883392333984375, 0.9362945556640625, 0.98919677734375, 1.0420989990234375, 1.095001220703125, 1.1479034423828125, 1.2008056640625, 1.2537078857421875, 1.306610107421875, 1.3595123291015625, 1.41241455078125, 1.4653167724609375, 1.518218994140625, 1.5711212158203125, 1.6240234375]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 3.0, 5.0, 8.0, 13.0, 21.0, 35.0, 59.0, 86.0, 138.0, 207.0, 369.0, 580.0, 1073.0, 1959.0, 3791.0, 6741.0, 13178.0, 25053.0, 46389.0, 82389.0, 131557.0, 175201.0, 183356.0, 150281.0, 99993.0, 58563.0, 31659.0, 16790.0, 8721.0, 4647.0, 2432.0, 1357.0, 755.0, 439.0, 268.0, 145.0, 105.0, 65.0, 44.0, 20.0, 15.0, 21.0, 10.0, 6.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3486328125, -1.3079986572265625, -1.267364501953125, -1.2267303466796875, -1.18609619140625, -1.1454620361328125, -1.104827880859375, -1.0641937255859375, -1.0235595703125, -0.9829254150390625, -0.942291259765625, -0.9016571044921875, -0.86102294921875, -0.8203887939453125, -0.779754638671875, -0.7391204833984375, -0.698486328125, -0.6578521728515625, -0.617218017578125, -0.5765838623046875, -0.53594970703125, -0.4953155517578125, -0.454681396484375, -0.4140472412109375, -0.3734130859375, -0.3327789306640625, -0.292144775390625, -0.2515106201171875, -0.21087646484375, -0.1702423095703125, -0.129608154296875, -0.0889739990234375, -0.04833984375, -0.0077056884765625, 0.032928466796875, 0.0735626220703125, 0.11419677734375, 0.1548309326171875, 0.195465087890625, 0.2360992431640625, 0.2767333984375, 0.3173675537109375, 0.358001708984375, 0.3986358642578125, 0.43927001953125, 0.4799041748046875, 0.520538330078125, 0.5611724853515625, 0.601806640625, 0.6424407958984375, 0.683074951171875, 0.7237091064453125, 0.76434326171875, 0.8049774169921875, 0.845611572265625, 0.8862457275390625, 0.9268798828125, 0.9675140380859375, 1.008148193359375, 1.0487823486328125, 1.08941650390625, 1.1300506591796875, 1.170684814453125, 1.2113189697265625, 1.251953125]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 1.0, 7.0, 2.0, 7.0, 6.0, 16.0, 19.0, 18.0, 29.0, 36.0, 46.0, 40.0, 45.0, 71.0, 69.0, 60.0, 64.0, 63.0, 75.0, 57.0, 51.0, 47.0, 40.0, 25.0, 18.0, 23.0, 21.0, 12.0, 6.0, 6.0, 3.0, 7.0, 5.0, 4.0, 4.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010186433792114258, -9.767618030309677e-05, -9.348802268505096e-05, -8.929986506700516e-05, -8.511170744895935e-05, -8.092354983091354e-05, -7.673539221286774e-05, -7.254723459482193e-05, -6.835907697677612e-05, -6.417091935873032e-05, -5.998276174068451e-05, -5.57946041226387e-05, -5.1606446504592896e-05, -4.741828888654709e-05, -4.323013126850128e-05, -3.9041973650455475e-05, -3.485381603240967e-05, -3.066565841436386e-05, -2.6477500796318054e-05, -2.2289343178272247e-05, -1.810118556022644e-05, -1.3913027942180634e-05, -9.724870324134827e-06, -5.53671270608902e-06, -1.3485550880432129e-06, 2.839602530002594e-06, 7.027760148048401e-06, 1.1215917766094208e-05, 1.5404075384140015e-05, 1.959223300218582e-05, 2.378039062023163e-05, 2.7968548238277435e-05, 3.215670585632324e-05, 3.634486347436905e-05, 4.0533021092414856e-05, 4.472117871046066e-05, 4.890933632850647e-05, 5.3097493946552277e-05, 5.7285651564598083e-05, 6.147380918264389e-05, 6.56619668006897e-05, 6.98501244187355e-05, 7.403828203678131e-05, 7.822643965482712e-05, 8.241459727287292e-05, 8.660275489091873e-05, 9.079091250896454e-05, 9.497907012701035e-05, 9.916722774505615e-05, 0.00010335538536310196, 0.00010754354298114777, 0.00011173170059919357, 0.00011591985821723938, 0.00012010801583528519, 0.000124296173453331, 0.0001284843310713768, 0.0001326724886894226, 0.00013686064630746841, 0.00014104880392551422, 0.00014523696154356003, 0.00014942511916160583, 0.00015361327677965164, 0.00015780143439769745, 0.00016198959201574326, 0.00016617774963378906]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 6.0, 3.0, 5.0, 5.0, 10.0, 15.0, 28.0, 44.0, 62.0, 89.0, 137.0, 182.0, 321.0, 493.0, 810.0, 1286.0, 2030.0, 3254.0, 5384.0, 8711.0, 14122.0, 22819.0, 35669.0, 54036.0, 77804.0, 103815.0, 124550.0, 133783.0, 125318.0, 105024.0, 77898.0, 54574.0, 35974.0, 22970.0, 14241.0, 8905.0, 5390.0, 3345.0, 1991.0, 1211.0, 808.0, 528.0, 316.0, 190.0, 136.0, 88.0, 54.0, 47.0, 30.0, 18.0, 13.0, 10.0, 7.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.89990234375, -0.8704071044921875, -0.840911865234375, -0.8114166259765625, -0.78192138671875, -0.7524261474609375, -0.722930908203125, -0.6934356689453125, -0.6639404296875, -0.6344451904296875, -0.604949951171875, -0.5754547119140625, -0.54595947265625, -0.5164642333984375, -0.486968994140625, -0.4574737548828125, -0.427978515625, -0.3984832763671875, -0.368988037109375, -0.3394927978515625, -0.30999755859375, -0.2805023193359375, -0.251007080078125, -0.2215118408203125, -0.1920166015625, -0.1625213623046875, -0.133026123046875, -0.1035308837890625, -0.07403564453125, -0.0445404052734375, -0.015045166015625, 0.0144500732421875, 0.0439453125, 0.0734405517578125, 0.102935791015625, 0.1324310302734375, 0.16192626953125, 0.1914215087890625, 0.220916748046875, 0.2504119873046875, 0.2799072265625, 0.3094024658203125, 0.338897705078125, 0.3683929443359375, 0.39788818359375, 0.4273834228515625, 0.456878662109375, 0.4863739013671875, 0.515869140625, 0.5453643798828125, 0.574859619140625, 0.6043548583984375, 0.63385009765625, 0.6633453369140625, 0.692840576171875, 0.7223358154296875, 0.7518310546875, 0.7813262939453125, 0.810821533203125, 0.8403167724609375, 0.86981201171875, 0.8993072509765625, 0.928802490234375, 0.9582977294921875, 0.98779296875]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 4.0, 3.0, 3.0, 7.0, 11.0, 13.0, 16.0, 16.0, 10.0, 16.0, 17.0, 23.0, 26.0, 31.0, 25.0, 38.0, 38.0, 31.0, 24.0, 38.0, 41.0, 47.0, 41.0, 37.0, 42.0, 42.0, 22.0, 36.0, 43.0, 43.0, 31.0, 22.0, 26.0, 23.0, 16.0, 15.0, 14.0, 10.0, 13.0, 8.0, 8.0, 3.0, 8.0, 10.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.290771484375, -0.282012939453125, -0.27325439453125, -0.264495849609375, -0.2557373046875, -0.246978759765625, -0.23822021484375, -0.229461669921875, -0.220703125, -0.211944580078125, -0.20318603515625, -0.194427490234375, -0.1856689453125, -0.176910400390625, -0.16815185546875, -0.159393310546875, -0.150634765625, -0.141876220703125, -0.13311767578125, -0.124359130859375, -0.1156005859375, -0.106842041015625, -0.09808349609375, -0.089324951171875, -0.08056640625, -0.071807861328125, -0.06304931640625, -0.054290771484375, -0.0455322265625, -0.036773681640625, -0.02801513671875, -0.019256591796875, -0.010498046875, -0.001739501953125, 0.00701904296875, 0.015777587890625, 0.0245361328125, 0.033294677734375, 0.04205322265625, 0.050811767578125, 0.0595703125, 0.068328857421875, 0.07708740234375, 0.085845947265625, 0.0946044921875, 0.103363037109375, 0.11212158203125, 0.120880126953125, 0.129638671875, 0.138397216796875, 0.14715576171875, 0.155914306640625, 0.1646728515625, 0.173431396484375, 0.18218994140625, 0.190948486328125, 0.19970703125, 0.208465576171875, 0.21722412109375, 0.225982666015625, 0.2347412109375, 0.243499755859375, 0.25225830078125, 0.261016845703125, 0.269775390625]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 16.0, 7.0, 11.0, 18.0, 14.0, 16.0, 18.0, 24.0, 34.0, 41.0, 50.0, 50.0, 66.0, 41.0, 54.0, 52.0, 66.0, 50.0, 46.0, 51.0, 45.0, 32.0, 40.0, 36.0, 29.0, 13.0, 16.0, 17.0, 11.0, 9.0, 10.0, 4.0, 6.0, 6.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.868220329284668, -2.757042407989502, -2.645864725112915, -2.534686803817749, -2.423509120941162, -2.312331199645996, -2.20115327835083, -2.089975595474243, -1.9787976741790771, -1.8676198720932007, -1.7564420700073242, -1.6452641487121582, -1.5340863466262817, -1.4229085445404053, -1.3117307424545288, -1.2005529403686523, -1.0893751382827759, -0.9781973361968994, -0.8670194745063782, -0.7558416724205017, -0.6446638107299805, -0.533486008644104, -0.42230820655822754, -0.3111303448677063, -0.19995254278182983, -0.08877471834421158, 0.022403106093406677, 0.13358092308044434, 0.2447587549686432, 0.35593658685684204, 0.4671143889427185, 0.5782922506332397, 0.6894700527191162, 0.8006478548049927, 0.9118257164955139, 1.0230035781860352, 1.1341813802719116, 1.245359182357788, 1.3565369844436646, 1.467714786529541, 1.578892707824707, 1.6900705099105835, 1.80124831199646, 1.912426233291626, 2.023603916168213, 2.134781837463379, 2.245959758758545, 2.357137441635132, 2.4683151245117188, 2.5794930458068848, 2.6906707286834717, 2.8018486499786377, 2.9130263328552246, 3.0242042541503906, 3.1353821754455566, 3.2465598583221436, 3.3577377796173096, 3.4689157009124756, 3.5800933837890625, 3.6912713050842285, 3.8024489879608154, 3.9136269092559814, 4.024804592132568, 4.135982513427734, 4.2471604347229]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 2.0, 3.0, 2.0, 6.0, 6.0, 10.0, 9.0, 12.0, 14.0, 13.0, 12.0, 20.0, 17.0, 23.0, 31.0, 30.0, 30.0, 38.0, 33.0, 31.0, 39.0, 41.0, 40.0, 38.0, 54.0, 46.0, 37.0, 35.0, 39.0, 26.0, 45.0, 36.0, 25.0, 24.0, 22.0, 30.0, 18.0, 16.0, 7.0, 12.0, 9.0, 7.0, 6.0, 5.0, 5.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.749818801879883, -2.657663106918335, -2.565507411956787, -2.4733517169952393, -2.3811960220336914, -2.2890403270721436, -2.1968846321105957, -2.104728937149048, -2.0125732421875, -1.9204175472259521, -1.8282618522644043, -1.7361061573028564, -1.6439504623413086, -1.5517947673797607, -1.459639072418213, -1.367483377456665, -1.2753275632858276, -1.1831718683242798, -1.091016173362732, -0.9988604784011841, -0.9067047834396362, -0.8145490884780884, -0.7223933339118958, -0.6302376389503479, -0.5380819439888, -0.4459262490272522, -0.35377055406570435, -0.2616148293018341, -0.16945913434028625, -0.0773034393787384, 0.014852285385131836, 0.10700798034667969, 0.19916367530822754, 0.2913193702697754, 0.38347506523132324, 0.4756307899951935, 0.567786455154419, 0.6599421501159668, 0.7520979046821594, 0.8442535996437073, 0.9364092946052551, 1.0285650491714478, 1.1207207441329956, 1.2128764390945435, 1.3050321340560913, 1.3971878290176392, 1.489343523979187, 1.5814992189407349, 1.6736549139022827, 1.7658106088638306, 1.8579663038253784, 1.9501219987869263, 2.0422778129577637, 2.1344335079193115, 2.2265892028808594, 2.3187448978424072, 2.410900592803955, 2.503056287765503, 2.595211982727051, 2.6873676776885986, 2.7795233726501465, 2.8716790676116943, 2.963834762573242, 3.05599045753479, 3.148146152496338]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [2.0, 3.0, 5.0, 4.0, 16.0, 13.0, 27.0, 34.0, 43.0, 69.0, 105.0, 138.0, 218.0, 329.0, 467.0, 698.0, 1013.0, 1457.0, 2430.0, 3629.0, 5582.0, 8544.0, 13560.0, 21329.0, 33652.0, 53205.0, 84139.0, 131488.0, 203245.0, 294972.0, 403130.0, 495333.0, 539320.0, 515488.0, 430907.0, 323041.0, 223951.0, 147091.0, 93866.0, 59396.0, 37383.0, 23548.0, 14740.0, 9479.0, 6077.0, 3853.0, 2504.0, 1644.0, 1046.0, 737.0, 436.0, 292.0, 209.0, 119.0, 99.0, 62.0, 54.0, 38.0, 18.0, 11.0, 6.0, 4.0, 3.0, 3.0], "bins": [-1.8486328125, -1.791961669921875, -1.73529052734375, -1.678619384765625, -1.6219482421875, -1.565277099609375, -1.50860595703125, -1.451934814453125, -1.395263671875, -1.338592529296875, -1.28192138671875, -1.225250244140625, -1.1685791015625, -1.111907958984375, -1.05523681640625, -0.998565673828125, -0.94189453125, -0.885223388671875, -0.82855224609375, -0.771881103515625, -0.7152099609375, -0.658538818359375, -0.60186767578125, -0.545196533203125, -0.488525390625, -0.431854248046875, -0.37518310546875, -0.318511962890625, -0.2618408203125, -0.205169677734375, -0.14849853515625, -0.091827392578125, -0.03515625, 0.021514892578125, 0.07818603515625, 0.134857177734375, 0.1915283203125, 0.248199462890625, 0.30487060546875, 0.361541748046875, 0.418212890625, 0.474884033203125, 0.53155517578125, 0.588226318359375, 0.6448974609375, 0.701568603515625, 0.75823974609375, 0.814910888671875, 0.87158203125, 0.928253173828125, 0.98492431640625, 1.041595458984375, 1.0982666015625, 1.154937744140625, 1.21160888671875, 1.268280029296875, 1.324951171875, 1.381622314453125, 1.43829345703125, 1.494964599609375, 1.5516357421875, 1.608306884765625, 1.66497802734375, 1.721649169921875, 1.7783203125]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 7.0, 5.0, 10.0, 6.0, 4.0, 10.0, 18.0, 20.0, 24.0, 21.0, 17.0, 20.0, 22.0, 22.0, 40.0, 49.0, 34.0, 42.0, 28.0, 33.0, 47.0, 46.0, 58.0, 33.0, 46.0, 19.0, 28.0, 30.0, 37.0, 38.0, 26.0, 25.0, 22.0, 15.0, 20.0, 21.0, 15.0, 9.0, 6.0, 3.0, 9.0, 4.0, 7.0, 3.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.333984375, -2.25714111328125, -2.1802978515625, -2.10345458984375, -2.026611328125, -1.94976806640625, -1.8729248046875, -1.79608154296875, -1.71923828125, -1.64239501953125, -1.5655517578125, -1.48870849609375, -1.411865234375, -1.33502197265625, -1.2581787109375, -1.18133544921875, -1.1044921875, -1.02764892578125, -0.9508056640625, -0.87396240234375, -0.797119140625, -0.72027587890625, -0.6434326171875, -0.56658935546875, -0.48974609375, -0.41290283203125, -0.3360595703125, -0.25921630859375, -0.182373046875, -0.10552978515625, -0.0286865234375, 0.04815673828125, 0.125, 0.20184326171875, 0.2786865234375, 0.35552978515625, 0.432373046875, 0.50921630859375, 0.5860595703125, 0.66290283203125, 0.73974609375, 0.81658935546875, 0.8934326171875, 0.97027587890625, 1.047119140625, 1.12396240234375, 1.2008056640625, 1.27764892578125, 1.3544921875, 1.43133544921875, 1.5081787109375, 1.58502197265625, 1.661865234375, 1.73870849609375, 1.8155517578125, 1.89239501953125, 1.96923828125, 2.04608154296875, 2.1229248046875, 2.19976806640625, 2.276611328125, 2.35345458984375, 2.4302978515625, 2.50714111328125, 2.583984375]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [4.0, 3.0, 3.0, 4.0, 9.0, 19.0, 23.0, 35.0, 54.0, 64.0, 162.0, 194.0, 313.0, 456.0, 804.0, 1189.0, 1938.0, 2919.0, 4939.0, 7783.0, 12691.0, 20247.0, 31984.0, 50632.0, 79260.0, 121799.0, 183511.0, 264562.0, 360850.0, 458521.0, 517468.0, 513281.0, 448743.0, 352579.0, 255666.0, 177207.0, 117799.0, 76272.0, 48431.0, 30431.0, 19250.0, 12140.0, 7489.0, 4633.0, 2934.0, 1867.0, 1167.0, 716.0, 471.0, 282.0, 191.0, 95.0, 74.0, 65.0, 20.0, 21.0, 18.0, 12.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0], "bins": [-2.078125, -2.010986328125, -1.94384765625, -1.876708984375, -1.8095703125, -1.742431640625, -1.67529296875, -1.608154296875, -1.541015625, -1.473876953125, -1.40673828125, -1.339599609375, -1.2724609375, -1.205322265625, -1.13818359375, -1.071044921875, -1.00390625, -0.936767578125, -0.86962890625, -0.802490234375, -0.7353515625, -0.668212890625, -0.60107421875, -0.533935546875, -0.466796875, -0.399658203125, -0.33251953125, -0.265380859375, -0.1982421875, -0.131103515625, -0.06396484375, 0.003173828125, 0.0703125, 0.137451171875, 0.20458984375, 0.271728515625, 0.3388671875, 0.406005859375, 0.47314453125, 0.540283203125, 0.607421875, 0.674560546875, 0.74169921875, 0.808837890625, 0.8759765625, 0.943115234375, 1.01025390625, 1.077392578125, 1.14453125, 1.211669921875, 1.27880859375, 1.345947265625, 1.4130859375, 1.480224609375, 1.54736328125, 1.614501953125, 1.681640625, 1.748779296875, 1.81591796875, 1.883056640625, 1.9501953125, 2.017333984375, 2.08447265625, 2.151611328125, 2.21875]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 4.0, 3.0, 7.0, 9.0, 10.0, 12.0, 24.0, 30.0, 41.0, 39.0, 47.0, 76.0, 83.0, 95.0, 106.0, 125.0, 118.0, 156.0, 134.0, 213.0, 198.0, 235.0, 209.0, 216.0, 223.0, 198.0, 189.0, 208.0, 145.0, 158.0, 118.0, 115.0, 117.0, 72.0, 75.0, 71.0, 37.0, 40.0, 39.0, 17.0, 19.0, 13.0, 11.0, 12.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.0732421875, -1.0420379638671875, -1.010833740234375, -0.9796295166015625, -0.94842529296875, -0.9172210693359375, -0.886016845703125, -0.8548126220703125, -0.8236083984375, -0.7924041748046875, -0.761199951171875, -0.7299957275390625, -0.69879150390625, -0.6675872802734375, -0.636383056640625, -0.6051788330078125, -0.573974609375, -0.5427703857421875, -0.511566162109375, -0.4803619384765625, -0.44915771484375, -0.4179534912109375, -0.386749267578125, -0.3555450439453125, -0.3243408203125, -0.2931365966796875, -0.261932373046875, -0.2307281494140625, -0.19952392578125, -0.1683197021484375, -0.137115478515625, -0.1059112548828125, -0.07470703125, -0.0435028076171875, -0.012298583984375, 0.0189056396484375, 0.05010986328125, 0.0813140869140625, 0.112518310546875, 0.1437225341796875, 0.1749267578125, 0.2061309814453125, 0.237335205078125, 0.2685394287109375, 0.29974365234375, 0.3309478759765625, 0.362152099609375, 0.3933563232421875, 0.424560546875, 0.4557647705078125, 0.486968994140625, 0.5181732177734375, 0.54937744140625, 0.5805816650390625, 0.611785888671875, 0.6429901123046875, 0.6741943359375, 0.7053985595703125, 0.736602783203125, 0.7678070068359375, 0.79901123046875, 0.8302154541015625, 0.861419677734375, 0.8926239013671875, 0.923828125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 3.0, 9.0, 14.0, 11.0, 7.0, 12.0, 19.0, 17.0, 20.0, 45.0, 35.0, 32.0, 40.0, 48.0, 47.0, 37.0, 62.0, 51.0, 45.0, 47.0, 42.0, 49.0, 51.0, 37.0, 29.0, 37.0, 28.0, 33.0, 13.0, 17.0, 10.0, 9.0, 10.0, 11.0, 9.0, 6.0, 2.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.664024591445923, -2.5656075477600098, -2.467190742492676, -2.3687736988067627, -2.2703568935394287, -2.1719398498535156, -2.0735230445861816, -1.9751060009002686, -1.876689076423645, -1.7782721519470215, -1.679855227470398, -1.5814383029937744, -1.4830212593078613, -1.3846044540405273, -1.2861874103546143, -1.1877704858779907, -1.0893535614013672, -0.9909366369247437, -0.8925197124481201, -0.7941027283668518, -0.6956858038902283, -0.5972688794136047, -0.4988518953323364, -0.4004349708557129, -0.30201804637908936, -0.20360110700130463, -0.1051841676235199, -0.006767213344573975, 0.09164971113204956, 0.1900666356086731, 0.2884836196899414, 0.38690054416656494, 0.4853177070617676, 0.5837346315383911, 0.6821515560150146, 0.780568540096283, 0.8789854645729065, 0.97740238904953, 1.0758193731307983, 1.1742362976074219, 1.2726532220840454, 1.371070146560669, 1.4694870710372925, 1.567903995513916, 1.666321039199829, 1.764737844467163, 1.8631548881530762, 1.9615718126296997, 2.0599887371063232, 2.1584057807922363, 2.2568225860595703, 2.3552396297454834, 2.4536564350128174, 2.5520734786987305, 2.6504902839660645, 2.7489073276519775, 2.8473243713378906, 2.9457414150238037, 3.0441582202911377, 3.142575263977051, 3.2409920692443848, 3.339409112930298, 3.437826156616211, 3.536242961883545, 3.634659767150879]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 3.0, 5.0, 6.0, 8.0, 9.0, 5.0, 10.0, 19.0, 12.0, 14.0, 16.0, 10.0, 25.0, 36.0, 23.0, 23.0, 38.0, 33.0, 38.0, 41.0, 41.0, 32.0, 42.0, 54.0, 39.0, 36.0, 35.0, 36.0, 34.0, 38.0, 30.0, 17.0, 28.0, 23.0, 22.0, 20.0, 23.0, 14.0, 18.0, 11.0, 5.0, 8.0, 4.0, 2.0, 3.0, 5.0, 1.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.6012017726898193, -2.5200769901275635, -2.4389522075653076, -2.3578274250030518, -2.276702880859375, -2.195578098297119, -2.1144533157348633, -2.0333285331726074, -1.9522037506103516, -1.8710789680480957, -1.7899541854858398, -1.7088295221328735, -1.6277047395706177, -1.5465799570083618, -1.4654552936553955, -1.3843305110931396, -1.3032057285308838, -1.222080945968628, -1.140956163406372, -1.0598315000534058, -0.9787067174911499, -0.897581934928894, -0.816457211971283, -0.7353324890136719, -0.654207706451416, -0.5730829238891602, -0.4919582009315491, -0.4108334481716156, -0.32970869541168213, -0.24858394265174866, -0.16745918989181519, -0.0863344669342041, -0.005209445953369141, 0.07591530680656433, 0.1570400595664978, 0.23816481232643127, 0.31928956508636475, 0.4004143178462982, 0.4815390706062317, 0.5626637935638428, 0.6437885761260986, 0.7249133586883545, 0.8060380816459656, 0.8871628046035767, 0.9682875871658325, 1.0494123697280884, 1.1305370330810547, 1.2116618156433105, 1.2927865982055664, 1.3739113807678223, 1.4550361633300781, 1.5361608266830444, 1.6172856092453003, 1.6984103918075562, 1.7795350551605225, 1.8606598377227783, 1.9417846202850342, 2.02290940284729, 2.104034185409546, 2.1851589679718018, 2.2662835121154785, 2.3474082946777344, 2.4285330772399902, 2.509657859802246, 2.590782642364502]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 14.0, 21.0, 29.0, 38.0, 67.0, 100.0, 154.0, 255.0, 393.0, 639.0, 1051.0, 1699.0, 2771.0, 4690.0, 7899.0, 12962.0, 21179.0, 34224.0, 53433.0, 78896.0, 106696.0, 131259.0, 140739.0, 129899.0, 105442.0, 76638.0, 51675.0, 33274.0, 20464.0, 12655.0, 7654.0, 4593.0, 2733.0, 1676.0, 997.0, 609.0, 370.0, 257.0, 144.0, 97.0, 65.0, 39.0, 24.0, 15.0, 15.0, 3.0, 2.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0], "bins": [-1.662109375, -1.6109161376953125, -1.559722900390625, -1.5085296630859375, -1.45733642578125, -1.4061431884765625, -1.354949951171875, -1.3037567138671875, -1.2525634765625, -1.2013702392578125, -1.150177001953125, -1.0989837646484375, -1.04779052734375, -0.9965972900390625, -0.945404052734375, -0.8942108154296875, -0.843017578125, -0.7918243408203125, -0.740631103515625, -0.6894378662109375, -0.63824462890625, -0.5870513916015625, -0.535858154296875, -0.4846649169921875, -0.4334716796875, -0.3822784423828125, -0.331085205078125, -0.2798919677734375, -0.22869873046875, -0.1775054931640625, -0.126312255859375, -0.0751190185546875, -0.02392578125, 0.0272674560546875, 0.078460693359375, 0.1296539306640625, 0.18084716796875, 0.2320404052734375, 0.283233642578125, 0.3344268798828125, 0.3856201171875, 0.4368133544921875, 0.488006591796875, 0.5391998291015625, 0.59039306640625, 0.6415863037109375, 0.692779541015625, 0.7439727783203125, 0.795166015625, 0.8463592529296875, 0.897552490234375, 0.9487457275390625, 0.99993896484375, 1.0511322021484375, 1.102325439453125, 1.1535186767578125, 1.2047119140625, 1.2559051513671875, 1.307098388671875, 1.3582916259765625, 1.40948486328125, 1.4606781005859375, 1.511871337890625, 1.5630645751953125, 1.6142578125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 2.0, 4.0, 4.0, 5.0, 7.0, 9.0, 12.0, 8.0, 17.0, 13.0, 23.0, 24.0, 15.0, 25.0, 32.0, 26.0, 40.0, 34.0, 42.0, 30.0, 36.0, 44.0, 47.0, 40.0, 41.0, 46.0, 41.0, 34.0, 37.0, 42.0, 24.0, 26.0, 23.0, 25.0, 18.0, 18.0, 13.0, 25.0, 9.0, 10.0, 12.0, 5.0, 3.0, 5.0, 0.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.779296875, -2.694732666015625, -2.61016845703125, -2.525604248046875, -2.4410400390625, -2.356475830078125, -2.27191162109375, -2.187347412109375, -2.102783203125, -2.018218994140625, -1.93365478515625, -1.849090576171875, -1.7645263671875, -1.679962158203125, -1.59539794921875, -1.510833740234375, -1.42626953125, -1.341705322265625, -1.25714111328125, -1.172576904296875, -1.0880126953125, -1.003448486328125, -0.91888427734375, -0.834320068359375, -0.749755859375, -0.665191650390625, -0.58062744140625, -0.496063232421875, -0.4114990234375, -0.326934814453125, -0.24237060546875, -0.157806396484375, -0.0732421875, 0.011322021484375, 0.09588623046875, 0.180450439453125, 0.2650146484375, 0.349578857421875, 0.43414306640625, 0.518707275390625, 0.603271484375, 0.687835693359375, 0.77239990234375, 0.856964111328125, 0.9415283203125, 1.026092529296875, 1.11065673828125, 1.195220947265625, 1.27978515625, 1.364349365234375, 1.44891357421875, 1.533477783203125, 1.6180419921875, 1.702606201171875, 1.78717041015625, 1.871734619140625, 1.956298828125, 2.040863037109375, 2.12542724609375, 2.209991455078125, 2.2945556640625, 2.379119873046875, 2.46368408203125, 2.548248291015625, 2.6328125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 5.0, 9.0, 9.0, 14.0, 18.0, 28.0, 35.0, 75.0, 101.0, 173.0, 213.0, 342.0, 528.0, 863.0, 1423.0, 2243.0, 3723.0, 6071.0, 9627.0, 16172.0, 27953.0, 136660.0, 715666.0, 66095.0, 23832.0, 14245.0, 8415.0, 5351.0, 3326.0, 1939.0, 1254.0, 730.0, 494.0, 296.0, 214.0, 144.0, 100.0, 46.0, 41.0, 22.0, 18.0, 8.0, 11.0, 9.0, 4.0, 5.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.0859375, -2.98431396484375, -2.8826904296875, -2.78106689453125, -2.679443359375, -2.57781982421875, -2.4761962890625, -2.37457275390625, -2.27294921875, -2.17132568359375, -2.0697021484375, -1.96807861328125, -1.866455078125, -1.76483154296875, -1.6632080078125, -1.56158447265625, -1.4599609375, -1.35833740234375, -1.2567138671875, -1.15509033203125, -1.053466796875, -0.95184326171875, -0.8502197265625, -0.74859619140625, -0.64697265625, -0.54534912109375, -0.4437255859375, -0.34210205078125, -0.240478515625, -0.13885498046875, -0.0372314453125, 0.06439208984375, 0.166015625, 0.26763916015625, 0.3692626953125, 0.47088623046875, 0.572509765625, 0.67413330078125, 0.7757568359375, 0.87738037109375, 0.97900390625, 1.08062744140625, 1.1822509765625, 1.28387451171875, 1.385498046875, 1.48712158203125, 1.5887451171875, 1.69036865234375, 1.7919921875, 1.89361572265625, 1.9952392578125, 2.09686279296875, 2.198486328125, 2.30010986328125, 2.4017333984375, 2.50335693359375, 2.60498046875, 2.70660400390625, 2.8082275390625, 2.90985107421875, 3.011474609375, 3.11309814453125, 3.2147216796875, 3.31634521484375, 3.41796875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 7.0, 4.0, 6.0, 7.0, 10.0, 8.0, 11.0, 15.0, 9.0, 12.0, 20.0, 29.0, 17.0, 27.0, 26.0, 24.0, 34.0, 38.0, 42.0, 40.0, 32.0, 37.0, 37.0, 42.0, 41.0, 27.0, 33.0, 47.0, 40.0, 31.0, 33.0, 32.0, 31.0, 21.0, 20.0, 25.0, 16.0, 12.0, 14.0, 16.0, 8.0, 7.0, 6.0, 8.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-2.564453125, -2.494293212890625, -2.42413330078125, -2.353973388671875, -2.2838134765625, -2.213653564453125, -2.14349365234375, -2.073333740234375, -2.003173828125, -1.933013916015625, -1.86285400390625, -1.792694091796875, -1.7225341796875, -1.652374267578125, -1.58221435546875, -1.512054443359375, -1.44189453125, -1.371734619140625, -1.30157470703125, -1.231414794921875, -1.1612548828125, -1.091094970703125, -1.02093505859375, -0.950775146484375, -0.880615234375, -0.810455322265625, -0.74029541015625, -0.670135498046875, -0.5999755859375, -0.529815673828125, -0.45965576171875, -0.389495849609375, -0.3193359375, -0.249176025390625, -0.17901611328125, -0.108856201171875, -0.0386962890625, 0.031463623046875, 0.10162353515625, 0.171783447265625, 0.241943359375, 0.312103271484375, 0.38226318359375, 0.452423095703125, 0.5225830078125, 0.592742919921875, 0.66290283203125, 0.733062744140625, 0.80322265625, 0.873382568359375, 0.94354248046875, 1.013702392578125, 1.0838623046875, 1.154022216796875, 1.22418212890625, 1.294342041015625, 1.364501953125, 1.434661865234375, 1.50482177734375, 1.574981689453125, 1.6451416015625, 1.715301513671875, 1.78546142578125, 1.855621337890625, 1.92578125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 6.0, 3.0, 13.0, 10.0, 22.0, 31.0, 48.0, 52.0, 90.0, 148.0, 243.0, 381.0, 650.0, 1146.0, 2214.0, 4771.0, 11488.0, 36349.0, 700783.0, 246956.0, 25857.0, 9019.0, 3951.0, 1914.0, 953.0, 545.0, 331.0, 194.0, 110.0, 94.0, 66.0, 45.0, 18.0, 15.0, 11.0, 5.0, 9.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.90869140625, -0.8772201538085938, -0.8457489013671875, -0.8142776489257812, -0.782806396484375, -0.7513351440429688, -0.7198638916015625, -0.6883926391601562, -0.65692138671875, -0.6254501342773438, -0.5939788818359375, -0.5625076293945312, -0.531036376953125, -0.49956512451171875, -0.4680938720703125, -0.43662261962890625, -0.4051513671875, -0.37368011474609375, -0.3422088623046875, -0.31073760986328125, -0.279266357421875, -0.24779510498046875, -0.2163238525390625, -0.18485260009765625, -0.15338134765625, -0.12191009521484375, -0.0904388427734375, -0.05896759033203125, -0.027496337890625, 0.00397491455078125, 0.0354461669921875, 0.06691741943359375, 0.098388671875, 0.12985992431640625, 0.1613311767578125, 0.19280242919921875, 0.224273681640625, 0.25574493408203125, 0.2872161865234375, 0.31868743896484375, 0.35015869140625, 0.38162994384765625, 0.4131011962890625, 0.44457244873046875, 0.476043701171875, 0.5075149536132812, 0.5389862060546875, 0.5704574584960938, 0.6019287109375, 0.6333999633789062, 0.6648712158203125, 0.6963424682617188, 0.727813720703125, 0.7592849731445312, 0.7907562255859375, 0.8222274780273438, 0.85369873046875, 0.8851699829101562, 0.9166412353515625, 0.9481124877929688, 0.979583740234375, 1.0110549926757812, 1.0425262451171875, 1.0739974975585938, 1.10546875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 1.0, 5.0, 8.0, 8.0, 24.0, 18.0, 18.0, 15.0, 33.0, 32.0, 37.0, 79.0, 78.0, 77.0, 113.0, 84.0, 77.0, 59.0, 46.0, 43.0, 33.0, 23.0, 22.0, 16.0, 8.0, 14.0, 6.0, 1.0, 7.0, 4.0, 2.0, 5.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020599365234375, -0.00019984692335128784, -0.00019370019435882568, -0.00018755346536636353, -0.00018140673637390137, -0.0001752600073814392, -0.00016911327838897705, -0.0001629665493965149, -0.00015681982040405273, -0.00015067309141159058, -0.00014452636241912842, -0.00013837963342666626, -0.0001322329044342041, -0.00012608617544174194, -0.00011993944644927979, -0.00011379271745681763, -0.00010764598846435547, -0.00010149925947189331, -9.535253047943115e-05, -8.9205801486969e-05, -8.305907249450684e-05, -7.691234350204468e-05, -7.076561450958252e-05, -6.461888551712036e-05, -5.84721565246582e-05, -5.2325427532196045e-05, -4.617869853973389e-05, -4.003196954727173e-05, -3.388524055480957e-05, -2.7738511562347412e-05, -2.1591782569885254e-05, -1.5445053577423096e-05, -9.298324584960938e-06, -3.1515955924987793e-06, 2.995133399963379e-06, 9.141862392425537e-06, 1.5288591384887695e-05, 2.1435320377349854e-05, 2.7582049369812012e-05, 3.372877836227417e-05, 3.987550735473633e-05, 4.6022236347198486e-05, 5.2168965339660645e-05, 5.83156943321228e-05, 6.446242332458496e-05, 7.060915231704712e-05, 7.675588130950928e-05, 8.290261030197144e-05, 8.90493392944336e-05, 9.519606828689575e-05, 0.00010134279727935791, 0.00010748952627182007, 0.00011363625526428223, 0.00011978298425674438, 0.00012592971324920654, 0.0001320764422416687, 0.00013822317123413086, 0.00014436990022659302, 0.00015051662921905518, 0.00015666335821151733, 0.0001628100872039795, 0.00016895681619644165, 0.0001751035451889038, 0.00018125027418136597, 0.00018739700317382812]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 1.0, 3.0, 4.0, 12.0, 18.0, 19.0, 28.0, 39.0, 50.0, 78.0, 103.0, 154.0, 242.0, 336.0, 484.0, 677.0, 1007.0, 1548.0, 2530.0, 4189.0, 7722.0, 15387.0, 30741.0, 63469.0, 129999.0, 227671.0, 248436.0, 156210.0, 78369.0, 37633.0, 18595.0, 9358.0, 5080.0, 2949.0, 1747.0, 1159.0, 769.0, 504.0, 376.0, 258.0, 192.0, 115.0, 99.0, 63.0, 39.0, 30.0, 22.0, 11.0, 10.0, 10.0, 6.0, 6.0, 2.0, 4.0, 3.0, 1.0], "bins": [-0.383056640625, -0.3718376159667969, -0.36061859130859375, -0.3493995666503906, -0.3381805419921875, -0.3269615173339844, -0.31574249267578125, -0.3045234680175781, -0.293304443359375, -0.2820854187011719, -0.27086639404296875, -0.2596473693847656, -0.2484283447265625, -0.23720932006835938, -0.22599029541015625, -0.21477127075195312, -0.20355224609375, -0.19233322143554688, -0.18111419677734375, -0.16989517211914062, -0.1586761474609375, -0.14745712280273438, -0.13623809814453125, -0.12501907348632812, -0.113800048828125, -0.10258102416992188, -0.09136199951171875, -0.08014297485351562, -0.0689239501953125, -0.057704925537109375, -0.04648590087890625, -0.035266876220703125, -0.0240478515625, -0.012828826904296875, -0.00160980224609375, 0.009609222412109375, 0.0208282470703125, 0.032047271728515625, 0.04326629638671875, 0.054485321044921875, 0.065704345703125, 0.07692337036132812, 0.08814239501953125, 0.09936141967773438, 0.1105804443359375, 0.12179946899414062, 0.13301849365234375, 0.14423751831054688, 0.15545654296875, 0.16667556762695312, 0.17789459228515625, 0.18911361694335938, 0.2003326416015625, 0.21155166625976562, 0.22277069091796875, 0.23398971557617188, 0.245208740234375, 0.2564277648925781, 0.26764678955078125, 0.2788658142089844, 0.2900848388671875, 0.3013038635253906, 0.31252288818359375, 0.3237419128417969, 0.3349609375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 6.0, 10.0, 9.0, 9.0, 12.0, 17.0, 31.0, 25.0, 30.0, 36.0, 47.0, 56.0, 59.0, 58.0, 52.0, 66.0, 71.0, 48.0, 53.0, 57.0, 42.0, 41.0, 36.0, 27.0, 23.0, 18.0, 16.0, 12.0, 10.0, 7.0, 3.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11468505859375, -0.1114511489868164, -0.10821723937988281, -0.10498332977294922, -0.10174942016601562, -0.09851551055908203, -0.09528160095214844, -0.09204769134521484, -0.08881378173828125, -0.08557987213134766, -0.08234596252441406, -0.07911205291748047, -0.07587814331054688, -0.07264423370361328, -0.06941032409667969, -0.0661764144897461, -0.0629425048828125, -0.059708595275878906, -0.05647468566894531, -0.05324077606201172, -0.050006866455078125, -0.04677295684814453, -0.04353904724121094, -0.040305137634277344, -0.03707122802734375, -0.033837318420410156, -0.030603408813476562, -0.02736949920654297, -0.024135589599609375, -0.02090167999267578, -0.017667770385742188, -0.014433860778808594, -0.011199951171875, -0.007966041564941406, -0.0047321319580078125, -0.0014982223510742188, 0.001735687255859375, 0.004969596862792969, 0.008203506469726562, 0.011437416076660156, 0.01467132568359375, 0.017905235290527344, 0.021139144897460938, 0.02437305450439453, 0.027606964111328125, 0.03084087371826172, 0.03407478332519531, 0.037308692932128906, 0.0405426025390625, 0.043776512145996094, 0.04701042175292969, 0.05024433135986328, 0.053478240966796875, 0.05671215057373047, 0.05994606018066406, 0.06317996978759766, 0.06641387939453125, 0.06964778900146484, 0.07288169860839844, 0.07611560821533203, 0.07934951782226562, 0.08258342742919922, 0.08581733703613281, 0.0890512466430664, 0.09228515625]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 8.0, 6.0, 13.0, 14.0, 14.0, 18.0, 27.0, 26.0, 25.0, 45.0, 40.0, 37.0, 66.0, 38.0, 48.0, 44.0, 67.0, 45.0, 60.0, 49.0, 50.0, 38.0, 35.0, 35.0, 33.0, 14.0, 24.0, 20.0, 5.0, 14.0, 10.0, 13.0, 6.0, 6.0, 2.0, 3.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.709514856338501, -2.607354164123535, -2.5051937103271484, -2.4030330181121826, -2.300872325897217, -2.19871187210083, -2.0965511798858643, -1.994390606880188, -1.8922300338745117, -1.7900694608688354, -1.6879088878631592, -1.5857481956481934, -1.483587622642517, -1.3814270496368408, -1.279266357421875, -1.1771057844161987, -1.0749452114105225, -0.9727846384048462, -0.8706240057945251, -0.7684633731842041, -0.6663028001785278, -0.5641422271728516, -0.4619815945625305, -0.3598209619522095, -0.2576603889465332, -0.15549978613853455, -0.05333918333053589, 0.04882141947746277, 0.15098202228546143, 0.2531425952911377, 0.35530322790145874, 0.4574638605117798, 0.559624433517456, 0.6617850065231323, 0.7639456391334534, 0.8661062717437744, 0.9682668447494507, 1.070427417755127, 1.1725881099700928, 1.274748682975769, 1.3769092559814453, 1.4790698289871216, 1.5812304019927979, 1.6833910942077637, 1.78555166721344, 1.8877122402191162, 1.989872932434082, 2.0920333862304688, 2.1941940784454346, 2.2963547706604004, 2.398515224456787, 2.500675916671753, 2.6028366088867188, 2.7049970626831055, 2.8071577548980713, 2.909318447113037, 3.011478900909424, 3.1136395931243896, 3.2158000469207764, 3.317960739135742, 3.420121192932129, 3.5222818851470947, 3.6244425773620605, 3.7266030311584473, 3.828763723373413]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 7.0, 1.0, 4.0, 7.0, 13.0, 6.0, 5.0, 18.0, 13.0, 15.0, 17.0, 17.0, 13.0, 29.0, 28.0, 32.0, 36.0, 38.0, 32.0, 46.0, 29.0, 38.0, 36.0, 50.0, 46.0, 25.0, 53.0, 33.0, 43.0, 38.0, 26.0, 19.0, 24.0, 28.0, 30.0, 17.0, 13.0, 12.0, 20.0, 11.0, 9.0, 7.0, 5.0, 3.0, 2.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4528353214263916, -2.3742663860321045, -2.2956972122192383, -2.217128276824951, -2.138559103012085, -2.059990167617798, -1.9814211130142212, -1.9028520584106445, -1.8242831230163574, -1.7457140684127808, -1.667145013809204, -1.588576078414917, -1.5100070238113403, -1.4314379692077637, -1.352868914604187, -1.2742998600006104, -1.1957308053970337, -1.117161750793457, -1.0385926961898804, -0.9600237011909485, -0.8814547061920166, -0.8028856515884399, -0.7243165969848633, -0.6457476019859314, -0.5671785473823547, -0.48860952258110046, -0.4100404977798462, -0.33147144317626953, -0.25290241837501526, -0.174333393573761, -0.09576433897018433, -0.01719534397125244, 0.06137371063232422, 0.1399427354335785, 0.21851177513599396, 0.2970808148384094, 0.3756498396396637, 0.45421886444091797, 0.5327879190444946, 0.6113569140434265, 0.6899259686470032, 0.7684950232505798, 0.8470640182495117, 0.9256330728530884, 1.004202127456665, 1.0827710628509521, 1.1613402366638184, 1.2399091720581055, 1.3184782266616821, 1.3970472812652588, 1.4756163358688354, 1.554185390472412, 1.6327543258666992, 1.7113233804702759, 1.7898924350738525, 1.8684613704681396, 1.9470305442810059, 2.025599479675293, 2.104168653488159, 2.1827375888824463, 2.2613067626953125, 2.3398756980895996, 2.4184446334838867, 2.497013807296753, 2.57558274269104]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 4.0, 5.0, 9.0, 11.0, 14.0, 21.0, 39.0, 45.0, 78.0, 114.0, 170.0, 252.0, 388.0, 665.0, 995.0, 1565.0, 2538.0, 4027.0, 6392.0, 9816.0, 15708.0, 24071.0, 35947.0, 51975.0, 70477.0, 90996.0, 107519.0, 116933.0, 115593.0, 103983.0, 85526.0, 65043.0, 47005.0, 32347.0, 21019.0, 13813.0, 8683.0, 5500.0, 3409.0, 2080.0, 1356.0, 899.0, 568.0, 318.0, 224.0, 165.0, 81.0, 68.0, 41.0, 31.0, 16.0, 11.0, 6.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.798828125, -1.7405242919921875, -1.682220458984375, -1.6239166259765625, -1.56561279296875, -1.5073089599609375, -1.449005126953125, -1.3907012939453125, -1.3323974609375, -1.2740936279296875, -1.215789794921875, -1.1574859619140625, -1.09918212890625, -1.0408782958984375, -0.982574462890625, -0.9242706298828125, -0.865966796875, -0.8076629638671875, -0.749359130859375, -0.6910552978515625, -0.63275146484375, -0.5744476318359375, -0.516143798828125, -0.4578399658203125, -0.3995361328125, -0.3412322998046875, -0.282928466796875, -0.2246246337890625, -0.16632080078125, -0.1080169677734375, -0.049713134765625, 0.0085906982421875, 0.06689453125, 0.1251983642578125, 0.183502197265625, 0.2418060302734375, 0.30010986328125, 0.3584136962890625, 0.416717529296875, 0.4750213623046875, 0.5333251953125, 0.5916290283203125, 0.649932861328125, 0.7082366943359375, 0.76654052734375, 0.8248443603515625, 0.883148193359375, 0.9414520263671875, 0.999755859375, 1.0580596923828125, 1.116363525390625, 1.1746673583984375, 1.23297119140625, 1.2912750244140625, 1.349578857421875, 1.4078826904296875, 1.4661865234375, 1.5244903564453125, 1.582794189453125, 1.6410980224609375, 1.69940185546875, 1.7577056884765625, 1.816009521484375, 1.8743133544921875, 1.9326171875]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 6.0, 2.0, 10.0, 10.0, 12.0, 12.0, 10.0, 14.0, 12.0, 13.0, 23.0, 16.0, 23.0, 26.0, 25.0, 35.0, 45.0, 36.0, 42.0, 30.0, 46.0, 48.0, 39.0, 37.0, 39.0, 38.0, 39.0, 39.0, 37.0, 26.0, 30.0, 21.0, 23.0, 24.0, 19.0, 14.0, 14.0, 21.0, 8.0, 12.0, 9.0, 5.0, 4.0, 3.0, 1.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.251953125, -2.17486572265625, -2.0977783203125, -2.02069091796875, -1.943603515625, -1.86651611328125, -1.7894287109375, -1.71234130859375, -1.63525390625, -1.55816650390625, -1.4810791015625, -1.40399169921875, -1.326904296875, -1.24981689453125, -1.1727294921875, -1.09564208984375, -1.0185546875, -0.94146728515625, -0.8643798828125, -0.78729248046875, -0.710205078125, -0.63311767578125, -0.5560302734375, -0.47894287109375, -0.40185546875, -0.32476806640625, -0.2476806640625, -0.17059326171875, -0.093505859375, -0.01641845703125, 0.0606689453125, 0.13775634765625, 0.21484375, 0.29193115234375, 0.3690185546875, 0.44610595703125, 0.523193359375, 0.60028076171875, 0.6773681640625, 0.75445556640625, 0.83154296875, 0.90863037109375, 0.9857177734375, 1.06280517578125, 1.139892578125, 1.21697998046875, 1.2940673828125, 1.37115478515625, 1.4482421875, 1.52532958984375, 1.6024169921875, 1.67950439453125, 1.756591796875, 1.83367919921875, 1.9107666015625, 1.98785400390625, 2.06494140625, 2.14202880859375, 2.2191162109375, 2.29620361328125, 2.373291015625, 2.45037841796875, 2.5274658203125, 2.60455322265625, 2.681640625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 4.0, 2.0, 8.0, 6.0, 13.0, 20.0, 35.0, 57.0, 68.0, 125.0, 178.0, 284.0, 447.0, 667.0, 1092.0, 1730.0, 2875.0, 4467.0, 7310.0, 11710.0, 18338.0, 28906.0, 43168.0, 62807.0, 83964.0, 105708.0, 120704.0, 123959.0, 114374.0, 95060.0, 72495.0, 51678.0, 35001.0, 22786.0, 14358.0, 9192.0, 5574.0, 3543.0, 2200.0, 1348.0, 841.0, 564.0, 323.0, 189.0, 143.0, 90.0, 64.0, 36.0, 18.0, 17.0, 9.0, 3.0, 0.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.1875, -2.117462158203125, -2.04742431640625, -1.977386474609375, -1.9073486328125, -1.837310791015625, -1.76727294921875, -1.697235107421875, -1.627197265625, -1.557159423828125, -1.48712158203125, -1.417083740234375, -1.3470458984375, -1.277008056640625, -1.20697021484375, -1.136932373046875, -1.06689453125, -0.996856689453125, -0.92681884765625, -0.856781005859375, -0.7867431640625, -0.716705322265625, -0.64666748046875, -0.576629638671875, -0.506591796875, -0.436553955078125, -0.36651611328125, -0.296478271484375, -0.2264404296875, -0.156402587890625, -0.08636474609375, -0.016326904296875, 0.0537109375, 0.123748779296875, 0.19378662109375, 0.263824462890625, 0.3338623046875, 0.403900146484375, 0.47393798828125, 0.543975830078125, 0.614013671875, 0.684051513671875, 0.75408935546875, 0.824127197265625, 0.8941650390625, 0.964202880859375, 1.03424072265625, 1.104278564453125, 1.17431640625, 1.244354248046875, 1.31439208984375, 1.384429931640625, 1.4544677734375, 1.524505615234375, 1.59454345703125, 1.664581298828125, 1.734619140625, 1.804656982421875, 1.87469482421875, 1.944732666015625, 2.0147705078125, 2.084808349609375, 2.15484619140625, 2.224884033203125, 2.294921875]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 5.0, 5.0, 10.0, 8.0, 6.0, 17.0, 18.0, 24.0, 18.0, 17.0, 23.0, 32.0, 42.0, 33.0, 36.0, 33.0, 40.0, 43.0, 38.0, 38.0, 42.0, 46.0, 45.0, 30.0, 39.0, 27.0, 34.0, 37.0, 35.0, 19.0, 22.0, 23.0, 26.0, 14.0, 15.0, 8.0, 9.0, 16.0, 7.0, 8.0, 6.0, 2.0, 4.0, 3.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0], "bins": [-1.8037109375, -1.7514495849609375, -1.699188232421875, -1.6469268798828125, -1.59466552734375, -1.5424041748046875, -1.490142822265625, -1.4378814697265625, -1.3856201171875, -1.3333587646484375, -1.281097412109375, -1.2288360595703125, -1.17657470703125, -1.1243133544921875, -1.072052001953125, -1.0197906494140625, -0.967529296875, -0.9152679443359375, -0.863006591796875, -0.8107452392578125, -0.75848388671875, -0.7062225341796875, -0.653961181640625, -0.6016998291015625, -0.5494384765625, -0.4971771240234375, -0.444915771484375, -0.3926544189453125, -0.34039306640625, -0.2881317138671875, -0.235870361328125, -0.1836090087890625, -0.13134765625, -0.0790863037109375, -0.026824951171875, 0.0254364013671875, 0.07769775390625, 0.1299591064453125, 0.182220458984375, 0.2344818115234375, 0.2867431640625, 0.3390045166015625, 0.391265869140625, 0.4435272216796875, 0.49578857421875, 0.5480499267578125, 0.600311279296875, 0.6525726318359375, 0.704833984375, 0.7570953369140625, 0.809356689453125, 0.8616180419921875, 0.91387939453125, 0.9661407470703125, 1.018402099609375, 1.0706634521484375, 1.1229248046875, 1.1751861572265625, 1.227447509765625, 1.2797088623046875, 1.33197021484375, 1.3842315673828125, 1.436492919921875, 1.4887542724609375, 1.541015625]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 2.0, 4.0, 3.0, 8.0, 9.0, 21.0, 23.0, 35.0, 49.0, 49.0, 101.0, 128.0, 176.0, 273.0, 341.0, 489.0, 735.0, 1059.0, 1571.0, 2354.0, 3719.0, 6067.0, 10635.0, 20968.0, 45712.0, 103213.0, 205709.0, 270866.0, 193687.0, 93847.0, 41232.0, 19201.0, 9954.0, 5709.0, 3422.0, 2305.0, 1516.0, 1026.0, 635.0, 466.0, 349.0, 264.0, 164.0, 123.0, 84.0, 86.0, 62.0, 32.0, 27.0, 19.0, 9.0, 7.0, 9.0, 5.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.15625, -2.085418701171875, -2.01458740234375, -1.943756103515625, -1.8729248046875, -1.802093505859375, -1.73126220703125, -1.660430908203125, -1.589599609375, -1.518768310546875, -1.44793701171875, -1.377105712890625, -1.3062744140625, -1.235443115234375, -1.16461181640625, -1.093780517578125, -1.02294921875, -0.952117919921875, -0.88128662109375, -0.810455322265625, -0.7396240234375, -0.668792724609375, -0.59796142578125, -0.527130126953125, -0.456298828125, -0.385467529296875, -0.31463623046875, -0.243804931640625, -0.1729736328125, -0.102142333984375, -0.03131103515625, 0.039520263671875, 0.1103515625, 0.181182861328125, 0.25201416015625, 0.322845458984375, 0.3936767578125, 0.464508056640625, 0.53533935546875, 0.606170654296875, 0.677001953125, 0.747833251953125, 0.81866455078125, 0.889495849609375, 0.9603271484375, 1.031158447265625, 1.10198974609375, 1.172821044921875, 1.24365234375, 1.314483642578125, 1.38531494140625, 1.456146240234375, 1.5269775390625, 1.597808837890625, 1.66864013671875, 1.739471435546875, 1.810302734375, 1.881134033203125, 1.95196533203125, 2.022796630859375, 2.0936279296875, 2.164459228515625, 2.23529052734375, 2.306121826171875, 2.376953125]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 4.0, 3.0, 6.0, 3.0, 3.0, 5.0, 15.0, 11.0, 32.0, 44.0, 87.0, 108.0, 145.0, 165.0, 139.0, 85.0, 49.0, 32.0, 16.0, 15.0, 16.0, 8.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00042819976806640625, -0.000415705144405365, -0.00040321052074432373, -0.00039071589708328247, -0.0003782212734222412, -0.00036572664976119995, -0.0003532320261001587, -0.00034073740243911743, -0.00032824277877807617, -0.0003157481551170349, -0.00030325353145599365, -0.0002907589077949524, -0.00027826428413391113, -0.0002657696604728699, -0.0002532750368118286, -0.00024078041315078735, -0.0002282857894897461, -0.00021579116582870483, -0.00020329654216766357, -0.00019080191850662231, -0.00017830729484558105, -0.0001658126711845398, -0.00015331804752349854, -0.00014082342386245728, -0.00012832880020141602, -0.00011583417654037476, -0.0001033395528793335, -9.084492921829224e-05, -7.835030555725098e-05, -6.585568189620972e-05, -5.336105823516846e-05, -4.08664345741272e-05, -2.8371810913085938e-05, -1.5877187252044678e-05, -3.382563591003418e-06, 9.112060070037842e-06, 2.16066837310791e-05, 3.410130739212036e-05, 4.659593105316162e-05, 5.909055471420288e-05, 7.158517837524414e-05, 8.40798020362854e-05, 9.657442569732666e-05, 0.00010906904935836792, 0.00012156367301940918, 0.00013405829668045044, 0.0001465529203414917, 0.00015904754400253296, 0.00017154216766357422, 0.00018403679132461548, 0.00019653141498565674, 0.000209026038646698, 0.00022152066230773926, 0.00023401528596878052, 0.0002465099096298218, 0.00025900453329086304, 0.0002714991569519043, 0.00028399378061294556, 0.0002964884042739868, 0.0003089830279350281, 0.00032147765159606934, 0.0003339722752571106, 0.00034646689891815186, 0.0003589615225791931, 0.0003714561462402344]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 7.0, 11.0, 11.0, 13.0, 21.0, 31.0, 33.0, 46.0, 74.0, 127.0, 167.0, 218.0, 342.0, 500.0, 738.0, 1129.0, 1608.0, 2654.0, 4433.0, 7427.0, 13638.0, 25339.0, 48009.0, 89531.0, 148939.0, 196797.0, 191368.0, 137361.0, 81881.0, 43102.0, 22525.0, 12260.0, 6902.0, 4102.0, 2420.0, 1515.0, 1035.0, 700.0, 471.0, 326.0, 211.0, 155.0, 105.0, 86.0, 61.0, 39.0, 28.0, 18.0, 14.0, 10.0, 9.0, 3.0, 1.0, 5.0, 3.0, 5.0, 1.0], "bins": [-1.68359375, -1.6324462890625, -1.581298828125, -1.5301513671875, -1.47900390625, -1.4278564453125, -1.376708984375, -1.3255615234375, -1.2744140625, -1.2232666015625, -1.172119140625, -1.1209716796875, -1.06982421875, -1.0186767578125, -0.967529296875, -0.9163818359375, -0.865234375, -0.8140869140625, -0.762939453125, -0.7117919921875, -0.66064453125, -0.6094970703125, -0.558349609375, -0.5072021484375, -0.4560546875, -0.4049072265625, -0.353759765625, -0.3026123046875, -0.25146484375, -0.2003173828125, -0.149169921875, -0.0980224609375, -0.046875, 0.0042724609375, 0.055419921875, 0.1065673828125, 0.15771484375, 0.2088623046875, 0.260009765625, 0.3111572265625, 0.3623046875, 0.4134521484375, 0.464599609375, 0.5157470703125, 0.56689453125, 0.6180419921875, 0.669189453125, 0.7203369140625, 0.771484375, 0.8226318359375, 0.873779296875, 0.9249267578125, 0.97607421875, 1.0272216796875, 1.078369140625, 1.1295166015625, 1.1806640625, 1.2318115234375, 1.282958984375, 1.3341064453125, 1.38525390625, 1.4364013671875, 1.487548828125, 1.5386962890625, 1.58984375]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 7.0, 3.0, 6.0, 4.0, 7.0, 11.0, 10.0, 19.0, 21.0, 20.0, 28.0, 22.0, 37.0, 51.0, 55.0, 58.0, 71.0, 58.0, 52.0, 68.0, 53.0, 58.0, 53.0, 40.0, 36.0, 26.0, 25.0, 25.0, 17.0, 13.0, 9.0, 10.0, 10.0, 2.0, 8.0, 4.0, 5.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52978515625, -0.5139656066894531, -0.49814605712890625, -0.4823265075683594, -0.4665069580078125, -0.4506874084472656, -0.43486785888671875, -0.4190483093261719, -0.403228759765625, -0.3874092102050781, -0.37158966064453125, -0.3557701110839844, -0.3399505615234375, -0.3241310119628906, -0.30831146240234375, -0.2924919128417969, -0.27667236328125, -0.2608528137207031, -0.24503326416015625, -0.22921371459960938, -0.2133941650390625, -0.19757461547851562, -0.18175506591796875, -0.16593551635742188, -0.150115966796875, -0.13429641723632812, -0.11847686767578125, -0.10265731811523438, -0.0868377685546875, -0.07101821899414062, -0.05519866943359375, -0.039379119873046875, -0.0235595703125, -0.007740020751953125, 0.00807952880859375, 0.023899078369140625, 0.0397186279296875, 0.055538177490234375, 0.07135772705078125, 0.08717727661132812, 0.102996826171875, 0.11881637573242188, 0.13463592529296875, 0.15045547485351562, 0.1662750244140625, 0.18209457397460938, 0.19791412353515625, 0.21373367309570312, 0.22955322265625, 0.24537277221679688, 0.26119232177734375, 0.2770118713378906, 0.2928314208984375, 0.3086509704589844, 0.32447052001953125, 0.3402900695800781, 0.356109619140625, 0.3719291687011719, 0.38774871826171875, 0.4035682678222656, 0.4193878173828125, 0.4352073669433594, 0.45102691650390625, 0.4668464660644531, 0.482666015625]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 4.0, 10.0, 5.0, 9.0, 10.0, 15.0, 22.0, 29.0, 28.0, 17.0, 30.0, 38.0, 40.0, 33.0, 52.0, 37.0, 54.0, 49.0, 52.0, 44.0, 48.0, 54.0, 60.0, 33.0, 40.0, 27.0, 32.0, 24.0, 25.0, 17.0, 11.0, 5.0, 12.0, 14.0, 4.0, 6.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6937949657440186, -2.598236322402954, -2.5026776790618896, -2.4071192741394043, -2.31156063079834, -2.2160019874572754, -2.120443344116211, -2.0248847007751465, -1.9293262958526611, -1.8337676525115967, -1.7382091283798218, -1.6426504850387573, -1.5470919609069824, -1.451533317565918, -1.3559746742248535, -1.2604161500930786, -1.1648575067520142, -1.0692988634109497, -0.9737403392791748, -0.8781816959381104, -0.7826231718063354, -0.687064528465271, -0.5915059447288513, -0.49594736099243164, -0.40038877725601196, -0.3048301935195923, -0.2092715948820114, -0.11371299624443054, -0.018154412508010864, 0.07740417122840881, 0.17296278476715088, 0.26852136850357056, 0.36407995223999023, 0.4596385359764099, 0.5551971197128296, 0.650755763053894, 0.746314287185669, 0.8418729305267334, 0.9374315142631531, 1.0329900979995728, 1.1285486221313477, 1.224107265472412, 1.319665789604187, 1.4152244329452515, 1.5107829570770264, 1.6063416004180908, 1.7019002437591553, 1.7974587678909302, 1.8930174112319946, 1.988576054573059, 2.084134578704834, 2.1796932220458984, 2.275251865386963, 2.3708102703094482, 2.4663689136505127, 2.561927556991577, 2.6574862003326416, 2.753044843673706, 2.8486034870147705, 2.944161891937256, 3.0397205352783203, 3.1352791786193848, 3.230837821960449, 3.3263964653015137, 3.421954870223999]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 0.0, 2.0, 6.0, 4.0, 7.0, 5.0, 14.0, 11.0, 12.0, 14.0, 12.0, 15.0, 24.0, 18.0, 26.0, 22.0, 19.0, 31.0, 31.0, 33.0, 26.0, 42.0, 33.0, 33.0, 44.0, 36.0, 38.0, 34.0, 33.0, 32.0, 36.0, 31.0, 22.0, 40.0, 34.0, 19.0, 24.0, 16.0, 14.0, 17.0, 11.0, 21.0, 14.0, 10.0, 3.0, 14.0, 2.0, 5.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 0.0, 3.0, 0.0, 2.0], "bins": [-2.268397569656372, -2.196098804473877, -2.123800039291382, -2.0515012741088867, -1.979202389717102, -1.906903624534607, -1.8346048593521118, -1.7623059749603271, -1.690007209777832, -1.617708444595337, -1.5454096794128418, -1.4731109142303467, -1.400812029838562, -1.328513264656067, -1.2562144994735718, -1.183915615081787, -1.1116169691085815, -1.0393182039260864, -0.9670193791389465, -0.8947206139564514, -0.8224217891693115, -0.7501230239868164, -0.6778242588043213, -0.6055254340171814, -0.5332266688346863, -0.4609278738498688, -0.38862907886505127, -0.31633031368255615, -0.24403151869773865, -0.17173272371292114, -0.09943395853042603, -0.027135133743286133, 0.045163631439208984, 0.11746241897344589, 0.1897612065076828, 0.2620599865913391, 0.3343587815761566, 0.4066575765609741, 0.47895634174346924, 0.5512551665306091, 0.6235539317131042, 0.6958526968955994, 0.7681515216827393, 0.8404502868652344, 0.9127490520477295, 0.9850478768348694, 1.0573465824127197, 1.1296454668045044, 1.2019442319869995, 1.2742429971694946, 1.3465417623519897, 1.4188406467437744, 1.4911394119262695, 1.5634381771087646, 1.6357369422912598, 1.7080357074737549, 1.78033447265625, 1.8526332378387451, 1.9249320030212402, 1.9972307682037354, 2.0695295333862305, 2.1418285369873047, 2.2141270637512207, 2.286426067352295, 2.35872483253479]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 3.0, 5.0, 4.0, 12.0, 12.0, 17.0, 39.0, 45.0, 81.0, 134.0, 207.0, 309.0, 484.0, 727.0, 1224.0, 1858.0, 2994.0, 5006.0, 8374.0, 13558.0, 22812.0, 38546.0, 65538.0, 110302.0, 182528.0, 290698.0, 427353.0, 554892.0, 615087.0, 575506.0, 455307.0, 317672.0, 200909.0, 123019.0, 72984.0, 42933.0, 25100.0, 15016.0, 8906.0, 5469.0, 3225.0, 2038.0, 1226.0, 747.0, 494.0, 326.0, 211.0, 117.0, 78.0, 55.0, 43.0, 19.0, 24.0, 9.0, 2.0, 3.0, 4.0, 0.0, 3.0, 0.0, 3.0], "bins": [-1.8837890625, -1.8241729736328125, -1.764556884765625, -1.7049407958984375, -1.64532470703125, -1.5857086181640625, -1.526092529296875, -1.4664764404296875, -1.4068603515625, -1.3472442626953125, -1.287628173828125, -1.2280120849609375, -1.16839599609375, -1.1087799072265625, -1.049163818359375, -0.9895477294921875, -0.929931640625, -0.8703155517578125, -0.810699462890625, -0.7510833740234375, -0.69146728515625, -0.6318511962890625, -0.572235107421875, -0.5126190185546875, -0.4530029296875, -0.3933868408203125, -0.333770751953125, -0.2741546630859375, -0.21453857421875, -0.1549224853515625, -0.095306396484375, -0.0356903076171875, 0.02392578125, 0.0835418701171875, 0.143157958984375, 0.2027740478515625, 0.26239013671875, 0.3220062255859375, 0.381622314453125, 0.4412384033203125, 0.5008544921875, 0.5604705810546875, 0.620086669921875, 0.6797027587890625, 0.73931884765625, 0.7989349365234375, 0.858551025390625, 0.9181671142578125, 0.977783203125, 1.0373992919921875, 1.097015380859375, 1.1566314697265625, 1.21624755859375, 1.2758636474609375, 1.335479736328125, 1.3950958251953125, 1.4547119140625, 1.5143280029296875, 1.573944091796875, 1.6335601806640625, 1.69317626953125, 1.7527923583984375, 1.812408447265625, 1.8720245361328125, 1.931640625]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 5.0, 5.0, 8.0, 10.0, 10.0, 14.0, 15.0, 15.0, 20.0, 27.0, 26.0, 26.0, 27.0, 31.0, 25.0, 26.0, 36.0, 40.0, 44.0, 31.0, 32.0, 47.0, 34.0, 50.0, 39.0, 28.0, 37.0, 41.0, 38.0, 24.0, 23.0, 15.0, 25.0, 19.0, 20.0, 17.0, 15.0, 10.0, 12.0, 12.0, 5.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.15234375, -2.0853271484375, -2.018310546875, -1.9512939453125, -1.88427734375, -1.8172607421875, -1.750244140625, -1.6832275390625, -1.6162109375, -1.5491943359375, -1.482177734375, -1.4151611328125, -1.34814453125, -1.2811279296875, -1.214111328125, -1.1470947265625, -1.080078125, -1.0130615234375, -0.946044921875, -0.8790283203125, -0.81201171875, -0.7449951171875, -0.677978515625, -0.6109619140625, -0.5439453125, -0.4769287109375, -0.409912109375, -0.3428955078125, -0.27587890625, -0.2088623046875, -0.141845703125, -0.0748291015625, -0.0078125, 0.0592041015625, 0.126220703125, 0.1932373046875, 0.26025390625, 0.3272705078125, 0.394287109375, 0.4613037109375, 0.5283203125, 0.5953369140625, 0.662353515625, 0.7293701171875, 0.79638671875, 0.8634033203125, 0.930419921875, 0.9974365234375, 1.064453125, 1.1314697265625, 1.198486328125, 1.2655029296875, 1.33251953125, 1.3995361328125, 1.466552734375, 1.5335693359375, 1.6005859375, 1.6676025390625, 1.734619140625, 1.8016357421875, 1.86865234375, 1.9356689453125, 2.002685546875, 2.0697021484375, 2.13671875]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 3.0, 11.0, 11.0, 9.0, 29.0, 35.0, 52.0, 82.0, 140.0, 224.0, 323.0, 449.0, 772.0, 1215.0, 1922.0, 2995.0, 4653.0, 7514.0, 11979.0, 18781.0, 29793.0, 46388.0, 72367.0, 111323.0, 166797.0, 243737.0, 337285.0, 435464.0, 509235.0, 520404.0, 466632.0, 373524.0, 274991.0, 192821.0, 129334.0, 84608.0, 54374.0, 34384.0, 21889.0, 13933.0, 8640.0, 5537.0, 3575.0, 2192.0, 1406.0, 851.0, 553.0, 377.0, 232.0, 163.0, 103.0, 56.0, 58.0, 31.0, 13.0, 11.0, 5.0, 4.0, 4.0, 3.0, 1.0], "bins": [-1.9638671875, -1.90283203125, -1.841796875, -1.78076171875, -1.7197265625, -1.65869140625, -1.59765625, -1.53662109375, -1.4755859375, -1.41455078125, -1.353515625, -1.29248046875, -1.2314453125, -1.17041015625, -1.109375, -1.04833984375, -0.9873046875, -0.92626953125, -0.865234375, -0.80419921875, -0.7431640625, -0.68212890625, -0.62109375, -0.56005859375, -0.4990234375, -0.43798828125, -0.376953125, -0.31591796875, -0.2548828125, -0.19384765625, -0.1328125, -0.07177734375, -0.0107421875, 0.05029296875, 0.111328125, 0.17236328125, 0.2333984375, 0.29443359375, 0.35546875, 0.41650390625, 0.4775390625, 0.53857421875, 0.599609375, 0.66064453125, 0.7216796875, 0.78271484375, 0.84375, 0.90478515625, 0.9658203125, 1.02685546875, 1.087890625, 1.14892578125, 1.2099609375, 1.27099609375, 1.33203125, 1.39306640625, 1.4541015625, 1.51513671875, 1.576171875, 1.63720703125, 1.6982421875, 1.75927734375, 1.8203125, 1.88134765625, 1.9423828125]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 5.0, 4.0, 7.0, 4.0, 11.0, 10.0, 16.0, 17.0, 19.0, 26.0, 41.0, 46.0, 57.0, 65.0, 76.0, 93.0, 113.0, 127.0, 146.0, 159.0, 171.0, 181.0, 219.0, 248.0, 191.0, 241.0, 231.0, 210.0, 190.0, 188.0, 152.0, 147.0, 121.0, 91.0, 93.0, 92.0, 59.0, 54.0, 32.0, 40.0, 22.0, 16.0, 13.0, 3.0, 12.0, 8.0, 7.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.86865234375, -0.8389816284179688, -0.8093109130859375, -0.7796401977539062, -0.749969482421875, -0.7202987670898438, -0.6906280517578125, -0.6609573364257812, -0.63128662109375, -0.6016159057617188, -0.5719451904296875, -0.5422744750976562, -0.512603759765625, -0.48293304443359375, -0.4532623291015625, -0.42359161376953125, -0.3939208984375, -0.36425018310546875, -0.3345794677734375, -0.30490875244140625, -0.275238037109375, -0.24556732177734375, -0.2158966064453125, -0.18622589111328125, -0.15655517578125, -0.12688446044921875, -0.0972137451171875, -0.06754302978515625, -0.037872314453125, -0.00820159912109375, 0.0214691162109375, 0.05113983154296875, 0.080810546875, 0.11048126220703125, 0.1401519775390625, 0.16982269287109375, 0.199493408203125, 0.22916412353515625, 0.2588348388671875, 0.28850555419921875, 0.31817626953125, 0.34784698486328125, 0.3775177001953125, 0.40718841552734375, 0.436859130859375, 0.46652984619140625, 0.4962005615234375, 0.5258712768554688, 0.5555419921875, 0.5852127075195312, 0.6148834228515625, 0.6445541381835938, 0.674224853515625, 0.7038955688476562, 0.7335662841796875, 0.7632369995117188, 0.79290771484375, 0.8225784301757812, 0.8522491455078125, 0.8819198608398438, 0.911590576171875, 0.9412612915039062, 0.9709320068359375, 1.0006027221679688, 1.0302734375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 6.0, 5.0, 8.0, 13.0, 12.0, 14.0, 15.0, 17.0, 29.0, 22.0, 35.0, 34.0, 34.0, 34.0, 34.0, 41.0, 39.0, 59.0, 43.0, 52.0, 62.0, 52.0, 51.0, 39.0, 35.0, 44.0, 23.0, 26.0, 26.0, 19.0, 10.0, 9.0, 19.0, 7.0, 7.0, 10.0, 6.0, 7.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3728184700012207, -2.28498911857605, -2.197160005569458, -2.109330654144287, -2.021501302719116, -1.9336721897125244, -1.8458428382873535, -1.7580136060714722, -1.6701843738555908, -1.5823551416397095, -1.4945257902145386, -1.4066965579986572, -1.3188673257827759, -1.2310380935668945, -1.1432087421417236, -1.0553795099258423, -0.9675501585006714, -0.8797208666801453, -0.7918916344642639, -0.7040623426437378, -0.6162331104278564, -0.5284038186073303, -0.4405745267868042, -0.35274529457092285, -0.26491600275039673, -0.177086740732193, -0.08925746381282806, -0.0014281868934631348, 0.0864010751247406, 0.17423033714294434, 0.26205962896347046, 0.3498888611793518, 0.43771815299987793, 0.525547444820404, 0.6133766770362854, 0.7012059688568115, 0.7890352010726929, 0.876864492893219, 0.9646937847137451, 1.0525230169296265, 1.1403522491455078, 1.2281814813613892, 1.31601083278656, 1.4038400650024414, 1.4916692972183228, 1.579498529434204, 1.667327880859375, 1.7551571130752563, 1.8429864645004272, 1.9308156967163086, 2.0186450481414795, 2.1064743995666504, 2.194303512573242, 2.282132863998413, 2.369962215423584, 2.457791328430176, 2.5456206798553467, 2.6334500312805176, 2.7212791442871094, 2.8091084957122803, 2.896937847137451, 2.984766960144043, 3.072596311569214, 3.1604256629943848, 3.2482547760009766]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 2.0, 4.0, 3.0, 8.0, 8.0, 16.0, 9.0, 17.0, 10.0, 14.0, 27.0, 27.0, 22.0, 28.0, 17.0, 27.0, 40.0, 32.0, 43.0, 38.0, 34.0, 33.0, 41.0, 39.0, 50.0, 40.0, 32.0, 49.0, 27.0, 26.0, 32.0, 25.0, 30.0, 29.0, 19.0, 11.0, 23.0, 16.0, 6.0, 7.0, 8.0, 11.0, 4.0, 5.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.2009451389312744, -2.12716007232666, -2.053374767303467, -1.9795897006988525, -1.9058046340942383, -1.8320194482803345, -1.7582342624664307, -1.6844491958618164, -1.6106640100479126, -1.5368788242340088, -1.4630937576293945, -1.3893085718154907, -1.315523386001587, -1.2417383193969727, -1.1679531335830688, -1.094167947769165, -1.0203828811645508, -0.9465977549552917, -0.8728126287460327, -0.7990274429321289, -0.7252423167228699, -0.6514571905136108, -0.577672004699707, -0.503886878490448, -0.43010175228118896, -0.35631662607192993, -0.2825314700603485, -0.20874632894992828, -0.13496118783950806, -0.06117606163024902, 0.012609094381332397, 0.08639425039291382, 0.16017913818359375, 0.23396427929401398, 0.3077494204044342, 0.3815345764160156, 0.45531970262527466, 0.5291048288345337, 0.6028900146484375, 0.6766751408576965, 0.7504602670669556, 0.8242453932762146, 0.8980305194854736, 0.9718157052993774, 1.0456008911132812, 1.1193859577178955, 1.1931711435317993, 1.2669563293457031, 1.3407413959503174, 1.4145265817642212, 1.4883116483688354, 1.5620968341827393, 1.6358819007873535, 1.7096670866012573, 1.7834522724151611, 1.8572373390197754, 1.9310225248336792, 2.004807710647583, 2.0785927772521973, 2.1523778438568115, 2.226163148880005, 2.299948215484619, 2.3737332820892334, 2.4475185871124268, 2.521303653717041]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 0.0, 3.0, 14.0, 11.0, 17.0, 19.0, 45.0, 97.0, 101.0, 143.0, 222.0, 365.0, 610.0, 950.0, 1474.0, 2428.0, 3720.0, 6000.0, 9357.0, 14792.0, 23541.0, 37408.0, 56433.0, 82515.0, 113413.0, 137156.0, 142677.0, 126260.0, 96561.0, 68464.0, 44781.0, 29114.0, 18496.0, 11563.0, 7307.0, 4697.0, 2872.0, 1758.0, 1157.0, 710.0, 471.0, 323.0, 169.0, 139.0, 73.0, 54.0, 27.0, 26.0, 12.0, 11.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.208984375, -1.1689910888671875, -1.128997802734375, -1.0890045166015625, -1.04901123046875, -1.0090179443359375, -0.969024658203125, -0.9290313720703125, -0.8890380859375, -0.8490447998046875, -0.809051513671875, -0.7690582275390625, -0.72906494140625, -0.6890716552734375, -0.649078369140625, -0.6090850830078125, -0.569091796875, -0.5290985107421875, -0.489105224609375, -0.4491119384765625, -0.40911865234375, -0.3691253662109375, -0.329132080078125, -0.2891387939453125, -0.2491455078125, -0.2091522216796875, -0.169158935546875, -0.1291656494140625, -0.08917236328125, -0.0491790771484375, -0.009185791015625, 0.0308074951171875, 0.07080078125, 0.1107940673828125, 0.150787353515625, 0.1907806396484375, 0.23077392578125, 0.2707672119140625, 0.310760498046875, 0.3507537841796875, 0.3907470703125, 0.4307403564453125, 0.470733642578125, 0.5107269287109375, 0.55072021484375, 0.5907135009765625, 0.630706787109375, 0.6707000732421875, 0.710693359375, 0.7506866455078125, 0.790679931640625, 0.8306732177734375, 0.87066650390625, 0.9106597900390625, 0.950653076171875, 0.9906463623046875, 1.0306396484375, 1.0706329345703125, 1.110626220703125, 1.1506195068359375, 1.19061279296875, 1.2306060791015625, 1.270599365234375, 1.3105926513671875, 1.3505859375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 13.0, 14.0, 9.0, 8.0, 14.0, 10.0, 9.0, 25.0, 17.0, 17.0, 24.0, 30.0, 35.0, 31.0, 42.0, 30.0, 28.0, 42.0, 31.0, 28.0, 34.0, 48.0, 38.0, 32.0, 43.0, 34.0, 40.0, 29.0, 34.0, 27.0, 26.0, 18.0, 24.0, 12.0, 16.0, 10.0, 13.0, 11.0, 5.0, 11.0, 6.0, 8.0, 4.0, 6.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-2.37890625, -2.30535888671875, -2.2318115234375, -2.15826416015625, -2.084716796875, -2.01116943359375, -1.9376220703125, -1.86407470703125, -1.79052734375, -1.71697998046875, -1.6434326171875, -1.56988525390625, -1.496337890625, -1.42279052734375, -1.3492431640625, -1.27569580078125, -1.2021484375, -1.12860107421875, -1.0550537109375, -0.98150634765625, -0.907958984375, -0.83441162109375, -0.7608642578125, -0.68731689453125, -0.61376953125, -0.54022216796875, -0.4666748046875, -0.39312744140625, -0.319580078125, -0.24603271484375, -0.1724853515625, -0.09893798828125, -0.025390625, 0.04815673828125, 0.1217041015625, 0.19525146484375, 0.268798828125, 0.34234619140625, 0.4158935546875, 0.48944091796875, 0.56298828125, 0.63653564453125, 0.7100830078125, 0.78363037109375, 0.857177734375, 0.93072509765625, 1.0042724609375, 1.07781982421875, 1.1513671875, 1.22491455078125, 1.2984619140625, 1.37200927734375, 1.445556640625, 1.51910400390625, 1.5926513671875, 1.66619873046875, 1.73974609375, 1.81329345703125, 1.8868408203125, 1.96038818359375, 2.033935546875, 2.10748291015625, 2.1810302734375, 2.25457763671875, 2.328125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 4.0, 13.0, 11.0, 13.0, 17.0, 26.0, 57.0, 78.0, 121.0, 196.0, 336.0, 639.0, 1143.0, 2220.0, 4220.0, 8313.0, 15981.0, 30571.0, 243570.0, 660255.0, 39952.0, 19483.0, 10050.0, 5294.0, 2817.0, 1381.0, 778.0, 438.0, 217.0, 143.0, 67.0, 57.0, 33.0, 19.0, 14.0, 10.0, 8.0, 6.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.419921875, -3.3167724609375, -3.213623046875, -3.1104736328125, -3.00732421875, -2.9041748046875, -2.801025390625, -2.6978759765625, -2.5947265625, -2.4915771484375, -2.388427734375, -2.2852783203125, -2.18212890625, -2.0789794921875, -1.975830078125, -1.8726806640625, -1.76953125, -1.6663818359375, -1.563232421875, -1.4600830078125, -1.35693359375, -1.2537841796875, -1.150634765625, -1.0474853515625, -0.9443359375, -0.8411865234375, -0.738037109375, -0.6348876953125, -0.53173828125, -0.4285888671875, -0.325439453125, -0.2222900390625, -0.119140625, -0.0159912109375, 0.087158203125, 0.1903076171875, 0.29345703125, 0.3966064453125, 0.499755859375, 0.6029052734375, 0.7060546875, 0.8092041015625, 0.912353515625, 1.0155029296875, 1.11865234375, 1.2218017578125, 1.324951171875, 1.4281005859375, 1.53125, 1.6343994140625, 1.737548828125, 1.8406982421875, 1.94384765625, 2.0469970703125, 2.150146484375, 2.2532958984375, 2.3564453125, 2.4595947265625, 2.562744140625, 2.6658935546875, 2.76904296875, 2.8721923828125, 2.975341796875, 3.0784912109375, 3.181640625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 6.0, 2.0, 6.0, 6.0, 3.0, 10.0, 6.0, 15.0, 12.0, 15.0, 13.0, 11.0, 21.0, 24.0, 29.0, 33.0, 38.0, 35.0, 26.0, 30.0, 40.0, 44.0, 36.0, 39.0, 37.0, 46.0, 27.0, 34.0, 22.0, 38.0, 30.0, 42.0, 29.0, 20.0, 30.0, 24.0, 18.0, 22.0, 12.0, 14.0, 12.0, 10.0, 14.0, 7.0, 7.0, 4.0, 5.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.779296875, -1.7242279052734375, -1.669158935546875, -1.6140899658203125, -1.55902099609375, -1.5039520263671875, -1.448883056640625, -1.3938140869140625, -1.3387451171875, -1.2836761474609375, -1.228607177734375, -1.1735382080078125, -1.11846923828125, -1.0634002685546875, -1.008331298828125, -0.9532623291015625, -0.898193359375, -0.8431243896484375, -0.788055419921875, -0.7329864501953125, -0.67791748046875, -0.6228485107421875, -0.567779541015625, -0.5127105712890625, -0.4576416015625, -0.4025726318359375, -0.347503662109375, -0.2924346923828125, -0.23736572265625, -0.1822967529296875, -0.127227783203125, -0.0721588134765625, -0.01708984375, 0.0379791259765625, 0.093048095703125, 0.1481170654296875, 0.20318603515625, 0.2582550048828125, 0.313323974609375, 0.3683929443359375, 0.4234619140625, 0.4785308837890625, 0.533599853515625, 0.5886688232421875, 0.64373779296875, 0.6988067626953125, 0.753875732421875, 0.8089447021484375, 0.864013671875, 0.9190826416015625, 0.974151611328125, 1.0292205810546875, 1.08428955078125, 1.1393585205078125, 1.194427490234375, 1.2494964599609375, 1.3045654296875, 1.3596343994140625, 1.414703369140625, 1.4697723388671875, 1.52484130859375, 1.5799102783203125, 1.634979248046875, 1.6900482177734375, 1.7451171875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 3.0, 8.0, 12.0, 14.0, 17.0, 26.0, 43.0, 65.0, 95.0, 162.0, 206.0, 381.0, 567.0, 959.0, 1751.0, 3187.0, 6182.0, 13233.0, 32778.0, 345480.0, 574562.0, 38795.0, 15134.0, 6875.0, 3459.0, 1880.0, 1021.0, 594.0, 363.0, 251.0, 162.0, 101.0, 52.0, 40.0, 18.0, 17.0, 18.0, 12.0, 8.0, 5.0, 2.0, 7.0, 2.0, 4.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.55029296875, -0.5336532592773438, -0.5170135498046875, -0.5003738403320312, -0.483734130859375, -0.46709442138671875, -0.4504547119140625, -0.43381500244140625, -0.41717529296875, -0.40053558349609375, -0.3838958740234375, -0.36725616455078125, -0.350616455078125, -0.33397674560546875, -0.3173370361328125, -0.30069732666015625, -0.2840576171875, -0.26741790771484375, -0.2507781982421875, -0.23413848876953125, -0.217498779296875, -0.20085906982421875, -0.1842193603515625, -0.16757965087890625, -0.15093994140625, -0.13430023193359375, -0.1176605224609375, -0.10102081298828125, -0.084381103515625, -0.06774139404296875, -0.0511016845703125, -0.03446197509765625, -0.017822265625, -0.00118255615234375, 0.0154571533203125, 0.03209686279296875, 0.048736572265625, 0.06537628173828125, 0.0820159912109375, 0.09865570068359375, 0.11529541015625, 0.13193511962890625, 0.1485748291015625, 0.16521453857421875, 0.181854248046875, 0.19849395751953125, 0.2151336669921875, 0.23177337646484375, 0.2484130859375, 0.26505279541015625, 0.2816925048828125, 0.29833221435546875, 0.314971923828125, 0.33161163330078125, 0.3482513427734375, 0.36489105224609375, 0.38153076171875, 0.39817047119140625, 0.4148101806640625, 0.43144989013671875, 0.448089599609375, 0.46472930908203125, 0.4813690185546875, 0.49800872802734375, 0.5146484375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 1.0, 4.0, 9.0, 3.0, 11.0, 5.0, 16.0, 14.0, 17.0, 15.0, 27.0, 37.0, 45.0, 61.0, 55.0, 72.0, 73.0, 87.0, 72.0, 75.0, 54.0, 48.0, 45.0, 23.0, 22.0, 21.0, 13.0, 21.0, 11.0, 10.0, 9.0, 8.0, 4.0, 5.0, 0.0, 0.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.539987564086914e-05, -7.241964340209961e-05, -6.943941116333008e-05, -6.645917892456055e-05, -6.347894668579102e-05, -6.0498714447021484e-05, -5.751848220825195e-05, -5.453824996948242e-05, -5.155801773071289e-05, -4.857778549194336e-05, -4.559755325317383e-05, -4.26173210144043e-05, -3.9637088775634766e-05, -3.6656856536865234e-05, -3.36766242980957e-05, -3.069639205932617e-05, -2.771615982055664e-05, -2.473592758178711e-05, -2.1755695343017578e-05, -1.8775463104248047e-05, -1.5795230865478516e-05, -1.2814998626708984e-05, -9.834766387939453e-06, -6.854534149169922e-06, -3.874301910400391e-06, -8.940696716308594e-07, 2.086162567138672e-06, 5.066394805908203e-06, 8.046627044677734e-06, 1.1026859283447266e-05, 1.4007091522216797e-05, 1.6987323760986328e-05, 1.996755599975586e-05, 2.294778823852539e-05, 2.5928020477294922e-05, 2.8908252716064453e-05, 3.1888484954833984e-05, 3.4868717193603516e-05, 3.784894943237305e-05, 4.082918167114258e-05, 4.380941390991211e-05, 4.678964614868164e-05, 4.976987838745117e-05, 5.27501106262207e-05, 5.5730342864990234e-05, 5.8710575103759766e-05, 6.16908073425293e-05, 6.467103958129883e-05, 6.765127182006836e-05, 7.063150405883789e-05, 7.361173629760742e-05, 7.659196853637695e-05, 7.957220077514648e-05, 8.255243301391602e-05, 8.553266525268555e-05, 8.851289749145508e-05, 9.149312973022461e-05, 9.447336196899414e-05, 9.745359420776367e-05, 0.0001004338264465332, 0.00010341405868530273, 0.00010639429092407227, 0.0001093745231628418, 0.00011235475540161133, 0.00011533498764038086]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 7.0, 9.0, 8.0, 20.0, 33.0, 35.0, 51.0, 71.0, 99.0, 157.0, 223.0, 313.0, 447.0, 598.0, 859.0, 1263.0, 1875.0, 2818.0, 4768.0, 8053.0, 14842.0, 29025.0, 60264.0, 122558.0, 212258.0, 241606.0, 167259.0, 87474.0, 42794.0, 20823.0, 10840.0, 6174.0, 3706.0, 2315.0, 1483.0, 989.0, 721.0, 527.0, 370.0, 246.0, 161.0, 140.0, 93.0, 57.0, 32.0, 27.0, 20.0, 15.0, 10.0, 14.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0], "bins": [-0.310302734375, -0.30097198486328125, -0.2916412353515625, -0.28231048583984375, -0.272979736328125, -0.26364898681640625, -0.2543182373046875, -0.24498748779296875, -0.23565673828125, -0.22632598876953125, -0.2169952392578125, -0.20766448974609375, -0.198333740234375, -0.18900299072265625, -0.1796722412109375, -0.17034149169921875, -0.1610107421875, -0.15167999267578125, -0.1423492431640625, -0.13301849365234375, -0.123687744140625, -0.11435699462890625, -0.1050262451171875, -0.09569549560546875, -0.08636474609375, -0.07703399658203125, -0.0677032470703125, -0.05837249755859375, -0.049041748046875, -0.03971099853515625, -0.0303802490234375, -0.02104949951171875, -0.01171875, -0.00238800048828125, 0.0069427490234375, 0.01627349853515625, 0.025604248046875, 0.03493499755859375, 0.0442657470703125, 0.05359649658203125, 0.06292724609375, 0.07225799560546875, 0.0815887451171875, 0.09091949462890625, 0.100250244140625, 0.10958099365234375, 0.1189117431640625, 0.12824249267578125, 0.1375732421875, 0.14690399169921875, 0.1562347412109375, 0.16556549072265625, 0.174896240234375, 0.18422698974609375, 0.1935577392578125, 0.20288848876953125, 0.21221923828125, 0.22154998779296875, 0.2308807373046875, 0.24021148681640625, 0.249542236328125, 0.25887298583984375, 0.2682037353515625, 0.27753448486328125, 0.286865234375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 5.0, 6.0, 10.0, 2.0, 10.0, 6.0, 16.0, 20.0, 12.0, 27.0, 21.0, 27.0, 40.0, 59.0, 58.0, 62.0, 62.0, 75.0, 74.0, 83.0, 57.0, 42.0, 50.0, 29.0, 20.0, 26.0, 16.0, 16.0, 12.0, 9.0, 12.0, 9.0, 4.0, 3.0, 1.0, 5.0, 4.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0], "bins": [-0.10791015625, -0.10469341278076172, -0.10147666931152344, -0.09825992584228516, -0.09504318237304688, -0.0918264389038086, -0.08860969543457031, -0.08539295196533203, -0.08217620849609375, -0.07895946502685547, -0.07574272155761719, -0.0725259780883789, -0.06930923461914062, -0.06609249114990234, -0.06287574768066406, -0.05965900421142578, -0.0564422607421875, -0.05322551727294922, -0.05000877380371094, -0.046792030334472656, -0.043575286865234375, -0.040358543395996094, -0.03714179992675781, -0.03392505645751953, -0.03070831298828125, -0.02749156951904297, -0.024274826049804688, -0.021058082580566406, -0.017841339111328125, -0.014624595642089844, -0.011407852172851562, -0.008191108703613281, -0.004974365234375, -0.0017576217651367188, 0.0014591217041015625, 0.004675865173339844, 0.007892608642578125, 0.011109352111816406, 0.014326095581054688, 0.01754283905029297, 0.02075958251953125, 0.02397632598876953, 0.027193069458007812, 0.030409812927246094, 0.033626556396484375, 0.036843299865722656, 0.04006004333496094, 0.04327678680419922, 0.0464935302734375, 0.04971027374267578, 0.05292701721191406, 0.056143760681152344, 0.059360504150390625, 0.0625772476196289, 0.06579399108886719, 0.06901073455810547, 0.07222747802734375, 0.07544422149658203, 0.07866096496582031, 0.0818777084350586, 0.08509445190429688, 0.08831119537353516, 0.09152793884277344, 0.09474468231201172, 0.09796142578125]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 10.0, 14.0, 7.0, 16.0, 23.0, 17.0, 30.0, 35.0, 16.0, 33.0, 34.0, 38.0, 43.0, 39.0, 59.0, 56.0, 52.0, 66.0, 60.0, 33.0, 47.0, 45.0, 32.0, 30.0, 31.0, 25.0, 18.0, 17.0, 14.0, 10.0, 10.0, 9.0, 7.0, 8.0, 6.0, 1.0, 5.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4706783294677734, -2.3802058696746826, -2.2897331714630127, -2.199260711669922, -2.108788013458252, -2.018315553665161, -1.9278430938720703, -1.83737051486969, -1.7468979358673096, -1.6564253568649292, -1.5659527778625488, -1.475480318069458, -1.3850077390670776, -1.2945351600646973, -1.2040627002716064, -1.113590121269226, -1.0231175422668457, -0.9326449632644653, -0.8421724438667297, -0.7516999244689941, -0.6612273454666138, -0.5707547664642334, -0.4802822470664978, -0.3898097276687622, -0.29933714866638184, -0.20886459946632385, -0.11839205026626587, -0.027919501066207886, 0.0625530481338501, 0.15302559733390808, 0.24349814653396606, 0.33397066593170166, 0.42444300651550293, 0.5149155855178833, 0.6053881049156189, 0.6958606243133545, 0.7863332033157349, 0.8768057823181152, 0.9672783017158508, 1.0577508211135864, 1.1482234001159668, 1.2386959791183472, 1.3291685581207275, 1.4196410179138184, 1.5101135969161987, 1.600586175918579, 1.69105863571167, 1.7815312147140503, 1.8720037937164307, 1.962476372718811, 2.0529489517211914, 2.1434214115142822, 2.233893871307373, 2.324366569519043, 2.414839029312134, 2.5053114891052246, 2.5957841873168945, 2.6862566471099854, 2.7767293453216553, 2.867201805114746, 2.957674503326416, 3.048146963119507, 3.1386194229125977, 3.2290921211242676, 3.3195645809173584]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 7.0, 5.0, 3.0, 5.0, 12.0, 11.0, 6.0, 12.0, 16.0, 13.0, 21.0, 18.0, 37.0, 24.0, 22.0, 28.0, 35.0, 39.0, 38.0, 32.0, 35.0, 44.0, 38.0, 43.0, 46.0, 44.0, 47.0, 34.0, 33.0, 35.0, 25.0, 28.0, 26.0, 27.0, 24.0, 9.0, 15.0, 18.0, 11.0, 8.0, 7.0, 9.0, 5.0, 3.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2393386363983154, -2.1643495559692383, -2.089360237121582, -2.014371156692505, -1.9393818378448486, -1.864392638206482, -1.7894034385681152, -1.714414358139038, -1.6394250392913818, -1.5644358396530151, -1.4894466400146484, -1.4144574403762817, -1.339468240737915, -1.2644790410995483, -1.1894898414611816, -1.1145007610321045, -1.0395115613937378, -0.9645223617553711, -0.8895331621170044, -0.8145439624786377, -0.739554762840271, -0.6645655632019043, -0.5895764231681824, -0.5145872235298157, -0.439598023891449, -0.3646088242530823, -0.2896196246147156, -0.21463045477867126, -0.13964125514030457, -0.06465205550193787, 0.010337114334106445, 0.08532631397247314, 0.16031551361083984, 0.23530471324920654, 0.31029391288757324, 0.38528308272361755, 0.46027228236198425, 0.5352615118026733, 0.6102506518363953, 0.685239851474762, 0.7602290511131287, 0.8352182507514954, 0.9102074503898621, 0.985196590423584, 1.0601857900619507, 1.1351749897003174, 1.210164189338684, 1.2851533889770508, 1.3601425886154175, 1.4351317882537842, 1.5101209878921509, 1.5851101875305176, 1.6600993871688843, 1.735088586807251, 1.8100776672363281, 1.8850669860839844, 1.9600560665130615, 2.0350451469421387, 2.110034465789795, 2.185023546218872, 2.2600128650665283, 2.3350019454956055, 2.4099912643432617, 2.484980344772339, 2.559969663619995]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 7.0, 13.0, 25.0, 32.0, 63.0, 87.0, 134.0, 199.0, 345.0, 626.0, 1032.0, 1656.0, 2698.0, 4259.0, 6770.0, 10569.0, 16292.0, 24591.0, 35260.0, 49496.0, 65902.0, 84133.0, 99252.0, 108351.0, 109827.0, 101910.0, 87578.0, 70241.0, 53225.0, 38364.0, 26306.0, 17680.0, 11598.0, 7640.0, 4656.0, 2916.0, 1847.0, 1127.0, 665.0, 466.0, 291.0, 159.0, 104.0, 70.0, 46.0, 23.0, 10.0, 10.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6416015625, -1.588836669921875, -1.53607177734375, -1.483306884765625, -1.4305419921875, -1.377777099609375, -1.32501220703125, -1.272247314453125, -1.219482421875, -1.166717529296875, -1.11395263671875, -1.061187744140625, -1.0084228515625, -0.955657958984375, -0.90289306640625, -0.850128173828125, -0.79736328125, -0.744598388671875, -0.69183349609375, -0.639068603515625, -0.5863037109375, -0.533538818359375, -0.48077392578125, -0.428009033203125, -0.375244140625, -0.322479248046875, -0.26971435546875, -0.216949462890625, -0.1641845703125, -0.111419677734375, -0.05865478515625, -0.005889892578125, 0.046875, 0.099639892578125, 0.15240478515625, 0.205169677734375, 0.2579345703125, 0.310699462890625, 0.36346435546875, 0.416229248046875, 0.468994140625, 0.521759033203125, 0.57452392578125, 0.627288818359375, 0.6800537109375, 0.732818603515625, 0.78558349609375, 0.838348388671875, 0.89111328125, 0.943878173828125, 0.99664306640625, 1.049407958984375, 1.1021728515625, 1.154937744140625, 1.20770263671875, 1.260467529296875, 1.313232421875, 1.365997314453125, 1.41876220703125, 1.471527099609375, 1.5242919921875, 1.577056884765625, 1.62982177734375, 1.682586669921875, 1.7353515625]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 5.0, 2.0, 2.0, 3.0, 6.0, 4.0, 6.0, 6.0, 10.0, 11.0, 25.0, 9.0, 18.0, 20.0, 24.0, 21.0, 25.0, 23.0, 31.0, 39.0, 34.0, 29.0, 32.0, 31.0, 34.0, 30.0, 44.0, 34.0, 45.0, 29.0, 44.0, 35.0, 31.0, 33.0, 25.0, 30.0, 22.0, 19.0, 15.0, 19.0, 16.0, 15.0, 13.0, 11.0, 8.0, 5.0, 10.0, 5.0, 5.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 3.0, 0.0, 3.0], "bins": [-2.146484375, -2.07965087890625, -2.0128173828125, -1.94598388671875, -1.879150390625, -1.81231689453125, -1.7454833984375, -1.67864990234375, -1.61181640625, -1.54498291015625, -1.4781494140625, -1.41131591796875, -1.344482421875, -1.27764892578125, -1.2108154296875, -1.14398193359375, -1.0771484375, -1.01031494140625, -0.9434814453125, -0.87664794921875, -0.809814453125, -0.74298095703125, -0.6761474609375, -0.60931396484375, -0.54248046875, -0.47564697265625, -0.4088134765625, -0.34197998046875, -0.275146484375, -0.20831298828125, -0.1414794921875, -0.07464599609375, -0.0078125, 0.05902099609375, 0.1258544921875, 0.19268798828125, 0.259521484375, 0.32635498046875, 0.3931884765625, 0.46002197265625, 0.52685546875, 0.59368896484375, 0.6605224609375, 0.72735595703125, 0.794189453125, 0.86102294921875, 0.9278564453125, 0.99468994140625, 1.0615234375, 1.12835693359375, 1.1951904296875, 1.26202392578125, 1.328857421875, 1.39569091796875, 1.4625244140625, 1.52935791015625, 1.59619140625, 1.66302490234375, 1.7298583984375, 1.79669189453125, 1.863525390625, 1.93035888671875, 1.9971923828125, 2.06402587890625, 2.130859375]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 6.0, 7.0, 13.0, 17.0, 38.0, 56.0, 94.0, 166.0, 256.0, 489.0, 889.0, 1697.0, 3277.0, 6005.0, 11253.0, 21050.0, 37901.0, 64301.0, 99361.0, 135983.0, 159275.0, 156254.0, 129407.0, 90725.0, 57384.0, 33194.0, 18563.0, 9771.0, 5194.0, 2707.0, 1464.0, 772.0, 422.0, 220.0, 130.0, 83.0, 50.0, 30.0, 18.0, 10.0, 7.0, 8.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4921875, -2.405914306640625, -2.31964111328125, -2.233367919921875, -2.1470947265625, -2.060821533203125, -1.97454833984375, -1.888275146484375, -1.802001953125, -1.715728759765625, -1.62945556640625, -1.543182373046875, -1.4569091796875, -1.370635986328125, -1.28436279296875, -1.198089599609375, -1.11181640625, -1.025543212890625, -0.93927001953125, -0.852996826171875, -0.7667236328125, -0.680450439453125, -0.59417724609375, -0.507904052734375, -0.421630859375, -0.335357666015625, -0.24908447265625, -0.162811279296875, -0.0765380859375, 0.009735107421875, 0.09600830078125, 0.182281494140625, 0.2685546875, 0.354827880859375, 0.44110107421875, 0.527374267578125, 0.6136474609375, 0.699920654296875, 0.78619384765625, 0.872467041015625, 0.958740234375, 1.045013427734375, 1.13128662109375, 1.217559814453125, 1.3038330078125, 1.390106201171875, 1.47637939453125, 1.562652587890625, 1.64892578125, 1.735198974609375, 1.82147216796875, 1.907745361328125, 1.9940185546875, 2.080291748046875, 2.16656494140625, 2.252838134765625, 2.339111328125, 2.425384521484375, 2.51165771484375, 2.597930908203125, 2.6842041015625, 2.770477294921875, 2.85675048828125, 2.943023681640625, 3.029296875]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 4.0, 7.0, 12.0, 10.0, 15.0, 14.0, 18.0, 16.0, 19.0, 28.0, 32.0, 29.0, 29.0, 28.0, 50.0, 33.0, 42.0, 51.0, 45.0, 42.0, 46.0, 37.0, 53.0, 38.0, 20.0, 34.0, 37.0, 29.0, 31.0, 23.0, 19.0, 21.0, 17.0, 14.0, 17.0, 7.0, 4.0, 10.0, 8.0, 4.0, 3.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.486328125, -1.4350738525390625, -1.383819580078125, -1.3325653076171875, -1.28131103515625, -1.2300567626953125, -1.178802490234375, -1.1275482177734375, -1.0762939453125, -1.0250396728515625, -0.973785400390625, -0.9225311279296875, -0.87127685546875, -0.8200225830078125, -0.768768310546875, -0.7175140380859375, -0.666259765625, -0.6150054931640625, -0.563751220703125, -0.5124969482421875, -0.46124267578125, -0.4099884033203125, -0.358734130859375, -0.3074798583984375, -0.2562255859375, -0.2049713134765625, -0.153717041015625, -0.1024627685546875, -0.05120849609375, 4.57763671875e-05, 0.051300048828125, 0.1025543212890625, 0.15380859375, 0.2050628662109375, 0.256317138671875, 0.3075714111328125, 0.35882568359375, 0.4100799560546875, 0.461334228515625, 0.5125885009765625, 0.5638427734375, 0.6150970458984375, 0.666351318359375, 0.7176055908203125, 0.76885986328125, 0.8201141357421875, 0.871368408203125, 0.9226226806640625, 0.973876953125, 1.0251312255859375, 1.076385498046875, 1.1276397705078125, 1.17889404296875, 1.2301483154296875, 1.281402587890625, 1.3326568603515625, 1.3839111328125, 1.4351654052734375, 1.486419677734375, 1.5376739501953125, 1.58892822265625, 1.6401824951171875, 1.691436767578125, 1.7426910400390625, 1.7939453125]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 2.0, 5.0, 1.0, 3.0, 6.0, 7.0, 11.0, 17.0, 18.0, 35.0, 27.0, 55.0, 103.0, 123.0, 193.0, 308.0, 476.0, 778.0, 1405.0, 2578.0, 4799.0, 9749.0, 18924.0, 38252.0, 76608.0, 141917.0, 209805.0, 217278.0, 152867.0, 85219.0, 42924.0, 20902.0, 10711.0, 5514.0, 2990.0, 1554.0, 894.0, 549.0, 323.0, 228.0, 129.0, 87.0, 50.0, 42.0, 28.0, 20.0, 10.0, 12.0, 7.0, 7.0, 6.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.544921875, -1.493560791015625, -1.44219970703125, -1.390838623046875, -1.3394775390625, -1.288116455078125, -1.23675537109375, -1.185394287109375, -1.134033203125, -1.082672119140625, -1.03131103515625, -0.979949951171875, -0.9285888671875, -0.877227783203125, -0.82586669921875, -0.774505615234375, -0.72314453125, -0.671783447265625, -0.62042236328125, -0.569061279296875, -0.5177001953125, -0.466339111328125, -0.41497802734375, -0.363616943359375, -0.312255859375, -0.260894775390625, -0.20953369140625, -0.158172607421875, -0.1068115234375, -0.055450439453125, -0.00408935546875, 0.047271728515625, 0.0986328125, 0.149993896484375, 0.20135498046875, 0.252716064453125, 0.3040771484375, 0.355438232421875, 0.40679931640625, 0.458160400390625, 0.509521484375, 0.560882568359375, 0.61224365234375, 0.663604736328125, 0.7149658203125, 0.766326904296875, 0.81768798828125, 0.869049072265625, 0.92041015625, 0.971771240234375, 1.02313232421875, 1.074493408203125, 1.1258544921875, 1.177215576171875, 1.22857666015625, 1.279937744140625, 1.331298828125, 1.382659912109375, 1.43402099609375, 1.485382080078125, 1.5367431640625, 1.588104248046875, 1.63946533203125, 1.690826416015625, 1.7421875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 5.0, 2.0, 3.0, 3.0, 6.0, 7.0, 3.0, 6.0, 11.0, 29.0, 31.0, 30.0, 48.0, 63.0, 70.0, 79.0, 92.0, 89.0, 104.0, 68.0, 43.0, 54.0, 44.0, 28.0, 24.0, 21.0, 14.0, 7.0, 12.0, 5.0, 4.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.00025773048400878906, -0.0002516061067581177, -0.0002454817295074463, -0.0002393573522567749, -0.00023323297500610352, -0.00022710859775543213, -0.00022098422050476074, -0.00021485984325408936, -0.00020873546600341797, -0.00020261108875274658, -0.0001964867115020752, -0.0001903623342514038, -0.00018423795700073242, -0.00017811357975006104, -0.00017198920249938965, -0.00016586482524871826, -0.00015974044799804688, -0.0001536160707473755, -0.0001474916934967041, -0.00014136731624603271, -0.00013524293899536133, -0.00012911856174468994, -0.00012299418449401855, -0.00011686980724334717, -0.00011074542999267578, -0.0001046210527420044, -9.849667549133301e-05, -9.237229824066162e-05, -8.624792098999023e-05, -8.012354373931885e-05, -7.399916648864746e-05, -6.787478923797607e-05, -6.175041198730469e-05, -5.56260347366333e-05, -4.9501657485961914e-05, -4.337728023529053e-05, -3.725290298461914e-05, -3.1128525733947754e-05, -2.5004148483276367e-05, -1.887977123260498e-05, -1.2755393981933594e-05, -6.631016731262207e-06, -5.066394805908203e-07, 5.617737770080566e-06, 1.1742115020751953e-05, 1.786649227142334e-05, 2.3990869522094727e-05, 3.0115246772766113e-05, 3.62396240234375e-05, 4.236400127410889e-05, 4.8488378524780273e-05, 5.461275577545166e-05, 6.073713302612305e-05, 6.686151027679443e-05, 7.298588752746582e-05, 7.911026477813721e-05, 8.52346420288086e-05, 9.135901927947998e-05, 9.748339653015137e-05, 0.00010360777378082275, 0.00010973215103149414, 0.00011585652828216553, 0.00012198090553283691, 0.0001281052827835083, 0.0001342296600341797]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 3.0, 4.0, 5.0, 13.0, 24.0, 35.0, 48.0, 65.0, 75.0, 128.0, 184.0, 222.0, 320.0, 425.0, 650.0, 1016.0, 1487.0, 2266.0, 3319.0, 5322.0, 8555.0, 13729.0, 22411.0, 36628.0, 58198.0, 88354.0, 122337.0, 146812.0, 149223.0, 127579.0, 93483.0, 62004.0, 39277.0, 24089.0, 14731.0, 9036.0, 5527.0, 3593.0, 2348.0, 1561.0, 1018.0, 742.0, 481.0, 380.0, 237.0, 187.0, 114.0, 99.0, 67.0, 47.0, 39.0, 19.0, 22.0, 11.0, 7.0, 4.0, 6.0, 1.0, 1.0, 2.0], "bins": [-1.07421875, -1.0407257080078125, -1.007232666015625, -0.9737396240234375, -0.94024658203125, -0.9067535400390625, -0.873260498046875, -0.8397674560546875, -0.8062744140625, -0.7727813720703125, -0.739288330078125, -0.7057952880859375, -0.67230224609375, -0.6388092041015625, -0.605316162109375, -0.5718231201171875, -0.538330078125, -0.5048370361328125, -0.471343994140625, -0.4378509521484375, -0.40435791015625, -0.3708648681640625, -0.337371826171875, -0.3038787841796875, -0.2703857421875, -0.2368927001953125, -0.203399658203125, -0.1699066162109375, -0.13641357421875, -0.1029205322265625, -0.069427490234375, -0.0359344482421875, -0.00244140625, 0.0310516357421875, 0.064544677734375, 0.0980377197265625, 0.13153076171875, 0.1650238037109375, 0.198516845703125, 0.2320098876953125, 0.2655029296875, 0.2989959716796875, 0.332489013671875, 0.3659820556640625, 0.39947509765625, 0.4329681396484375, 0.466461181640625, 0.4999542236328125, 0.533447265625, 0.5669403076171875, 0.600433349609375, 0.6339263916015625, 0.66741943359375, 0.7009124755859375, 0.734405517578125, 0.7678985595703125, 0.8013916015625, 0.8348846435546875, 0.868377685546875, 0.9018707275390625, 0.93536376953125, 0.9688568115234375, 1.002349853515625, 1.0358428955078125, 1.0693359375]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 6.0, 8.0, 9.0, 5.0, 4.0, 12.0, 13.0, 18.0, 22.0, 27.0, 30.0, 39.0, 36.0, 32.0, 54.0, 47.0, 59.0, 52.0, 74.0, 41.0, 59.0, 53.0, 50.0, 48.0, 46.0, 30.0, 29.0, 20.0, 15.0, 17.0, 13.0, 5.0, 8.0, 4.0, 3.0, 7.0, 4.0, 6.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3349609375, -0.3229255676269531, -0.31089019775390625, -0.2988548278808594, -0.2868194580078125, -0.2747840881347656, -0.26274871826171875, -0.2507133483886719, -0.238677978515625, -0.22664260864257812, -0.21460723876953125, -0.20257186889648438, -0.1905364990234375, -0.17850112915039062, -0.16646575927734375, -0.15443038940429688, -0.14239501953125, -0.13035964965820312, -0.11832427978515625, -0.10628890991210938, -0.0942535400390625, -0.08221817016601562, -0.07018280029296875, -0.058147430419921875, -0.046112060546875, -0.034076690673828125, -0.02204132080078125, -0.010005950927734375, 0.0020294189453125, 0.014064788818359375, 0.02610015869140625, 0.038135528564453125, 0.0501708984375, 0.062206268310546875, 0.07424163818359375, 0.08627700805664062, 0.0983123779296875, 0.11034774780273438, 0.12238311767578125, 0.13441848754882812, 0.146453857421875, 0.15848922729492188, 0.17052459716796875, 0.18255996704101562, 0.1945953369140625, 0.20663070678710938, 0.21866607666015625, 0.23070144653320312, 0.24273681640625, 0.2547721862792969, 0.26680755615234375, 0.2788429260253906, 0.2908782958984375, 0.3029136657714844, 0.31494903564453125, 0.3269844055175781, 0.339019775390625, 0.3510551452636719, 0.36309051513671875, 0.3751258850097656, 0.3871612548828125, 0.3991966247558594, 0.41123199462890625, 0.4232673645019531, 0.435302734375]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 5.0, 6.0, 2.0, 11.0, 14.0, 7.0, 14.0, 18.0, 22.0, 16.0, 20.0, 36.0, 28.0, 28.0, 40.0, 37.0, 51.0, 53.0, 58.0, 41.0, 56.0, 48.0, 50.0, 47.0, 44.0, 40.0, 27.0, 28.0, 20.0, 16.0, 19.0, 28.0, 12.0, 14.0, 8.0, 5.0, 7.0, 8.0, 7.0, 5.0, 9.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2837777137756348, -2.2020413875579834, -2.120305299758911, -2.0385689735412598, -1.956832766532898, -1.8750965595245361, -1.7933602333068848, -1.711624026298523, -1.6298878192901611, -1.5481516122817993, -1.4664154052734375, -1.3846790790557861, -1.3029428720474243, -1.2212066650390625, -1.1394703388214111, -1.0577341318130493, -0.9759979248046875, -0.8942617177963257, -0.8125254511833191, -0.7307891845703125, -0.6490529775619507, -0.5673167705535889, -0.4855805039405823, -0.4038442373275757, -0.32210803031921387, -0.24037179350852966, -0.15863555669784546, -0.07689931988716125, 0.004836916923522949, 0.08657315373420715, 0.16830939054489136, 0.25004565715789795, 0.33178210258483887, 0.41351833939552307, 0.4952545762062073, 0.5769908428192139, 0.6587270498275757, 0.7404632568359375, 0.8221995234489441, 0.9039357900619507, 0.9856719970703125, 1.0674082040786743, 1.1491444110870361, 1.2308807373046875, 1.3126169443130493, 1.3943531513214111, 1.4760894775390625, 1.5578256845474243, 1.6395618915557861, 1.721298098564148, 1.8030343055725098, 1.8847706317901611, 1.966506838798523, 2.0482430458068848, 2.129979372024536, 2.2117156982421875, 2.2934517860412598, 2.375188112258911, 2.4569242000579834, 2.5386605262756348, 2.620396614074707, 2.7021329402923584, 2.7838692665100098, 2.865605354309082, 2.9473416805267334]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 9.0, 4.0, 11.0, 10.0, 9.0, 13.0, 23.0, 19.0, 26.0, 22.0, 25.0, 36.0, 26.0, 28.0, 38.0, 35.0, 50.0, 45.0, 43.0, 37.0, 37.0, 44.0, 41.0, 32.0, 39.0, 41.0, 39.0, 31.0, 31.0, 19.0, 20.0, 23.0, 15.0, 11.0, 19.0, 17.0, 11.0, 10.0, 8.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.569464683532715, -2.4883816242218018, -2.4072985649108887, -2.3262155055999756, -2.2451324462890625, -2.1640493869781494, -2.0829663276672363, -2.0018832683563232, -1.9208002090454102, -1.839717149734497, -1.758634090423584, -1.677551031112671, -1.5964679718017578, -1.5153849124908447, -1.4343018531799316, -1.3532187938690186, -1.2721357345581055, -1.1910526752471924, -1.1099696159362793, -1.0288865566253662, -0.9478034973144531, -0.86672043800354, -0.785637378692627, -0.7045543193817139, -0.6234712600708008, -0.5423882007598877, -0.4613051414489746, -0.3802220821380615, -0.29913902282714844, -0.21805596351623535, -0.13697290420532227, -0.05588984489440918, 0.025193452835083008, 0.1062765121459961, 0.18735957145690918, 0.26844263076782227, 0.34952569007873535, 0.43060874938964844, 0.5116918087005615, 0.5927748680114746, 0.6738579273223877, 0.7549409866333008, 0.8360240459442139, 0.917107105255127, 0.99819016456604, 1.0792732238769531, 1.1603562831878662, 1.2414393424987793, 1.3225224018096924, 1.4036054611206055, 1.4846885204315186, 1.5657715797424316, 1.6468546390533447, 1.7279376983642578, 1.809020757675171, 1.890103816986084, 1.971186876296997, 2.05226993560791, 2.1333529949188232, 2.2144360542297363, 2.2955191135406494, 2.3766021728515625, 2.4576852321624756, 2.5387682914733887, 2.6198513507843018]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 4.0, 7.0, 7.0, 10.0, 32.0, 49.0, 50.0, 105.0, 167.0, 195.0, 330.0, 552.0, 782.0, 1209.0, 1879.0, 3002.0, 4584.0, 7221.0, 11596.0, 18315.0, 29540.0, 48357.0, 78664.0, 126930.0, 199750.0, 302039.0, 420982.0, 525037.0, 569729.0, 534538.0, 434877.0, 314966.0, 209544.0, 132487.0, 81685.0, 51024.0, 31195.0, 19390.0, 12129.0, 7661.0, 4775.0, 3136.0, 1926.0, 1324.0, 873.0, 632.0, 331.0, 248.0, 144.0, 106.0, 63.0, 43.0, 28.0, 20.0, 17.0, 5.0, 2.0, 4.0, 0.0, 1.0, 1.0], "bins": [-1.5791015625, -1.529052734375, -1.47900390625, -1.428955078125, -1.37890625, -1.328857421875, -1.27880859375, -1.228759765625, -1.1787109375, -1.128662109375, -1.07861328125, -1.028564453125, -0.978515625, -0.928466796875, -0.87841796875, -0.828369140625, -0.7783203125, -0.728271484375, -0.67822265625, -0.628173828125, -0.578125, -0.528076171875, -0.47802734375, -0.427978515625, -0.3779296875, -0.327880859375, -0.27783203125, -0.227783203125, -0.177734375, -0.127685546875, -0.07763671875, -0.027587890625, 0.0224609375, 0.072509765625, 0.12255859375, 0.172607421875, 0.22265625, 0.272705078125, 0.32275390625, 0.372802734375, 0.4228515625, 0.472900390625, 0.52294921875, 0.572998046875, 0.623046875, 0.673095703125, 0.72314453125, 0.773193359375, 0.8232421875, 0.873291015625, 0.92333984375, 0.973388671875, 1.0234375, 1.073486328125, 1.12353515625, 1.173583984375, 1.2236328125, 1.273681640625, 1.32373046875, 1.373779296875, 1.423828125, 1.473876953125, 1.52392578125, 1.573974609375, 1.6240234375]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 4.0, 10.0, 8.0, 9.0, 7.0, 11.0, 20.0, 21.0, 16.0, 23.0, 30.0, 27.0, 33.0, 28.0, 35.0, 31.0, 34.0, 42.0, 43.0, 53.0, 43.0, 37.0, 41.0, 38.0, 35.0, 44.0, 39.0, 38.0, 30.0, 23.0, 32.0, 16.0, 19.0, 20.0, 12.0, 15.0, 9.0, 10.0, 5.0, 6.0, 1.0, 1.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.35546875, -2.28692626953125, -2.2183837890625, -2.14984130859375, -2.081298828125, -2.01275634765625, -1.9442138671875, -1.87567138671875, -1.80712890625, -1.73858642578125, -1.6700439453125, -1.60150146484375, -1.532958984375, -1.46441650390625, -1.3958740234375, -1.32733154296875, -1.2587890625, -1.19024658203125, -1.1217041015625, -1.05316162109375, -0.984619140625, -0.91607666015625, -0.8475341796875, -0.77899169921875, -0.71044921875, -0.64190673828125, -0.5733642578125, -0.50482177734375, -0.436279296875, -0.36773681640625, -0.2991943359375, -0.23065185546875, -0.162109375, -0.09356689453125, -0.0250244140625, 0.04351806640625, 0.112060546875, 0.18060302734375, 0.2491455078125, 0.31768798828125, 0.38623046875, 0.45477294921875, 0.5233154296875, 0.59185791015625, 0.660400390625, 0.72894287109375, 0.7974853515625, 0.86602783203125, 0.9345703125, 1.00311279296875, 1.0716552734375, 1.14019775390625, 1.208740234375, 1.27728271484375, 1.3458251953125, 1.41436767578125, 1.48291015625, 1.55145263671875, 1.6199951171875, 1.68853759765625, 1.757080078125, 1.82562255859375, 1.8941650390625, 1.96270751953125, 2.03125]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 14.0, 6.0, 14.0, 24.0, 44.0, 74.0, 120.0, 186.0, 329.0, 424.0, 700.0, 1178.0, 1830.0, 3098.0, 4971.0, 8061.0, 13029.0, 21081.0, 33711.0, 53359.0, 84975.0, 133092.0, 201174.0, 293561.0, 402915.0, 503178.0, 552702.0, 518590.0, 427404.0, 317061.0, 219558.0, 146166.0, 93898.0, 59501.0, 37034.0, 23126.0, 14550.0, 9066.0, 5542.0, 3366.0, 2117.0, 1312.0, 847.0, 514.0, 303.0, 181.0, 138.0, 75.0, 41.0, 27.0, 10.0, 7.0, 7.0, 3.0, 2.0, 0.0, 1.0], "bins": [-1.9677734375, -1.9092254638671875, -1.850677490234375, -1.7921295166015625, -1.73358154296875, -1.6750335693359375, -1.616485595703125, -1.5579376220703125, -1.4993896484375, -1.4408416748046875, -1.382293701171875, -1.3237457275390625, -1.26519775390625, -1.2066497802734375, -1.148101806640625, -1.0895538330078125, -1.031005859375, -0.9724578857421875, -0.913909912109375, -0.8553619384765625, -0.79681396484375, -0.7382659912109375, -0.679718017578125, -0.6211700439453125, -0.5626220703125, -0.5040740966796875, -0.445526123046875, -0.3869781494140625, -0.32843017578125, -0.2698822021484375, -0.211334228515625, -0.1527862548828125, -0.09423828125, -0.0356903076171875, 0.022857666015625, 0.0814056396484375, 0.13995361328125, 0.1985015869140625, 0.257049560546875, 0.3155975341796875, 0.3741455078125, 0.4326934814453125, 0.491241455078125, 0.5497894287109375, 0.60833740234375, 0.6668853759765625, 0.725433349609375, 0.7839813232421875, 0.842529296875, 0.9010772705078125, 0.959625244140625, 1.0181732177734375, 1.07672119140625, 1.1352691650390625, 1.193817138671875, 1.2523651123046875, 1.3109130859375, 1.3694610595703125, 1.428009033203125, 1.4865570068359375, 1.54510498046875, 1.6036529541015625, 1.662200927734375, 1.7207489013671875, 1.779296875]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 3.0, 1.0, 8.0, 14.0, 13.0, 9.0, 14.0, 27.0, 34.0, 32.0, 42.0, 57.0, 68.0, 73.0, 91.0, 122.0, 143.0, 172.0, 187.0, 204.0, 221.0, 227.0, 240.0, 226.0, 202.0, 206.0, 229.0, 205.0, 151.0, 162.0, 102.0, 115.0, 104.0, 83.0, 66.0, 56.0, 44.0, 36.0, 23.0, 32.0, 9.0, 7.0, 11.0, 3.0, 2.0, 5.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.88720703125, -0.8587646484375, -0.830322265625, -0.8018798828125, -0.7734375, -0.7449951171875, -0.716552734375, -0.6881103515625, -0.65966796875, -0.6312255859375, -0.602783203125, -0.5743408203125, -0.5458984375, -0.5174560546875, -0.489013671875, -0.4605712890625, -0.43212890625, -0.4036865234375, -0.375244140625, -0.3468017578125, -0.318359375, -0.2899169921875, -0.261474609375, -0.2330322265625, -0.20458984375, -0.1761474609375, -0.147705078125, -0.1192626953125, -0.0908203125, -0.0623779296875, -0.033935546875, -0.0054931640625, 0.02294921875, 0.0513916015625, 0.079833984375, 0.1082763671875, 0.13671875, 0.1651611328125, 0.193603515625, 0.2220458984375, 0.25048828125, 0.2789306640625, 0.307373046875, 0.3358154296875, 0.3642578125, 0.3927001953125, 0.421142578125, 0.4495849609375, 0.47802734375, 0.5064697265625, 0.534912109375, 0.5633544921875, 0.591796875, 0.6202392578125, 0.648681640625, 0.6771240234375, 0.70556640625, 0.7340087890625, 0.762451171875, 0.7908935546875, 0.8193359375, 0.8477783203125, 0.876220703125, 0.9046630859375, 0.93310546875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 7.0, 6.0, 5.0, 13.0, 11.0, 11.0, 21.0, 25.0, 21.0, 38.0, 24.0, 50.0, 50.0, 46.0, 52.0, 40.0, 59.0, 50.0, 60.0, 38.0, 54.0, 39.0, 36.0, 38.0, 32.0, 29.0, 21.0, 23.0, 27.0, 12.0, 20.0, 12.0, 6.0, 8.0, 4.0, 6.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.0792129039764404, -1.9951753616333008, -1.9111379384994507, -1.827100396156311, -1.743062973022461, -1.6590254306793213, -1.5749878883361816, -1.490950345993042, -1.406912922859192, -1.3228753805160522, -1.2388379573822021, -1.1548004150390625, -1.0707628726959229, -0.9867254495620728, -0.9026879072189331, -0.8186504244804382, -0.7346129417419434, -0.6505754590034485, -0.5665379762649536, -0.48250043392181396, -0.3984629511833191, -0.3144254684448242, -0.23038792610168457, -0.1463504433631897, -0.062312960624694824, 0.021724537014961243, 0.10576203465461731, 0.18979954719543457, 0.27383702993392944, 0.3578745126724243, 0.44191205501556396, 0.5259495377540588, 0.6099870204925537, 0.6940245032310486, 0.7780619859695435, 0.8620995283126831, 0.946137011051178, 1.0301744937896729, 1.1142120361328125, 1.1982495784759521, 1.2822870016098022, 1.366324543952942, 1.450361967086792, 1.5343995094299316, 1.6184370517730713, 1.7024744749069214, 1.786512017250061, 1.8705494403839111, 1.9545869827270508, 2.0386245250701904, 2.12266206741333, 2.2066993713378906, 2.2907369136810303, 2.37477445602417, 2.4588119983673096, 2.542849540710449, 2.6268868446350098, 2.7109243869781494, 2.794961929321289, 2.8789992332458496, 2.9630367755889893, 3.047074317932129, 3.1311118602752686, 3.215149402618408, 3.299186944961548]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 5.0, 3.0, 3.0, 4.0, 8.0, 6.0, 17.0, 13.0, 15.0, 18.0, 21.0, 28.0, 27.0, 28.0, 28.0, 22.0, 38.0, 32.0, 36.0, 41.0, 28.0, 47.0, 44.0, 50.0, 29.0, 36.0, 25.0, 35.0, 35.0, 43.0, 25.0, 26.0, 32.0, 17.0, 25.0, 15.0, 21.0, 16.0, 22.0, 11.0, 10.0, 1.0, 0.0, 4.0, 6.0, 3.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.208658218383789, -2.1371073722839355, -2.065556526184082, -1.9940054416656494, -1.922454595565796, -1.8509037494659424, -1.7793527841567993, -1.7078018188476562, -1.6362509727478027, -1.5647001266479492, -1.4931491613388062, -1.421598196029663, -1.3500473499298096, -1.278496503829956, -1.206945538520813, -1.13539457321167, -1.0638437271118164, -0.9922928214073181, -0.9207419157028198, -0.8491910099983215, -0.7776401042938232, -0.706089198589325, -0.6345382928848267, -0.5629873871803284, -0.4914364814758301, -0.4198855757713318, -0.3483346700668335, -0.2767837643623352, -0.20523285865783691, -0.13368195295333862, -0.06213104724884033, 0.009419858455657959, 0.08097076416015625, 0.15252166986465454, 0.22407257556915283, 0.2956234812736511, 0.3671743869781494, 0.4387252926826477, 0.510276198387146, 0.5818271040916443, 0.6533780097961426, 0.7249289155006409, 0.7964798212051392, 0.8680307269096375, 0.9395816326141357, 1.0111324787139893, 1.0826834440231323, 1.1542344093322754, 1.225785255432129, 1.2973361015319824, 1.3688870668411255, 1.4404380321502686, 1.511988878250122, 1.5835397243499756, 1.6550906896591187, 1.7266416549682617, 1.7981925010681152, 1.8697433471679688, 1.9412943124771118, 2.012845277786255, 2.0843961238861084, 2.155946969985962, 2.2274980545043945, 2.299048900604248, 2.3705997467041016]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 9.0, 6.0, 13.0, 19.0, 28.0, 51.0, 58.0, 102.0, 152.0, 253.0, 394.0, 610.0, 940.0, 1462.0, 2498.0, 3994.0, 6663.0, 11328.0, 19444.0, 33360.0, 55782.0, 87372.0, 124924.0, 154525.0, 158498.0, 133294.0, 96623.0, 62799.0, 38329.0, 22432.0, 13148.0, 7500.0, 4533.0, 2766.0, 1751.0, 991.0, 653.0, 477.0, 251.0, 185.0, 136.0, 72.0, 54.0, 23.0, 25.0, 17.0, 4.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.87158203125, -0.844451904296875, -0.81732177734375, -0.790191650390625, -0.7630615234375, -0.735931396484375, -0.70880126953125, -0.681671142578125, -0.654541015625, -0.627410888671875, -0.60028076171875, -0.573150634765625, -0.5460205078125, -0.518890380859375, -0.49176025390625, -0.464630126953125, -0.4375, -0.410369873046875, -0.38323974609375, -0.356109619140625, -0.3289794921875, -0.301849365234375, -0.27471923828125, -0.247589111328125, -0.220458984375, -0.193328857421875, -0.16619873046875, -0.139068603515625, -0.1119384765625, -0.084808349609375, -0.05767822265625, -0.030548095703125, -0.00341796875, 0.023712158203125, 0.05084228515625, 0.077972412109375, 0.1051025390625, 0.132232666015625, 0.15936279296875, 0.186492919921875, 0.213623046875, 0.240753173828125, 0.26788330078125, 0.295013427734375, 0.3221435546875, 0.349273681640625, 0.37640380859375, 0.403533935546875, 0.4306640625, 0.457794189453125, 0.48492431640625, 0.512054443359375, 0.5391845703125, 0.566314697265625, 0.59344482421875, 0.620574951171875, 0.647705078125, 0.674835205078125, 0.70196533203125, 0.729095458984375, 0.7562255859375, 0.783355712890625, 0.81048583984375, 0.837615966796875, 0.86474609375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 6.0, 3.0, 1.0, 2.0, 5.0, 10.0, 9.0, 12.0, 7.0, 13.0, 22.0, 17.0, 31.0, 32.0, 22.0, 32.0, 34.0, 27.0, 33.0, 26.0, 31.0, 39.0, 59.0, 33.0, 38.0, 42.0, 38.0, 28.0, 42.0, 17.0, 38.0, 31.0, 24.0, 31.0, 23.0, 18.0, 18.0, 23.0, 27.0, 18.0, 11.0, 7.0, 8.0, 5.0, 9.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.236328125, -2.16400146484375, -2.0916748046875, -2.01934814453125, -1.947021484375, -1.87469482421875, -1.8023681640625, -1.73004150390625, -1.65771484375, -1.58538818359375, -1.5130615234375, -1.44073486328125, -1.368408203125, -1.29608154296875, -1.2237548828125, -1.15142822265625, -1.0791015625, -1.00677490234375, -0.9344482421875, -0.86212158203125, -0.789794921875, -0.71746826171875, -0.6451416015625, -0.57281494140625, -0.50048828125, -0.42816162109375, -0.3558349609375, -0.28350830078125, -0.211181640625, -0.13885498046875, -0.0665283203125, 0.00579833984375, 0.078125, 0.15045166015625, 0.2227783203125, 0.29510498046875, 0.367431640625, 0.43975830078125, 0.5120849609375, 0.58441162109375, 0.65673828125, 0.72906494140625, 0.8013916015625, 0.87371826171875, 0.946044921875, 1.01837158203125, 1.0906982421875, 1.16302490234375, 1.2353515625, 1.30767822265625, 1.3800048828125, 1.45233154296875, 1.524658203125, 1.59698486328125, 1.6693115234375, 1.74163818359375, 1.81396484375, 1.88629150390625, 1.9586181640625, 2.03094482421875, 2.103271484375, 2.17559814453125, 2.2479248046875, 2.32025146484375, 2.392578125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 8.0, 12.0, 12.0, 15.0, 30.0, 24.0, 31.0, 48.0, 66.0, 110.0, 123.0, 232.0, 385.0, 674.0, 1330.0, 2762.0, 5673.0, 12341.0, 26738.0, 131010.0, 789881.0, 42153.0, 18229.0, 8363.0, 4003.0, 1900.0, 992.0, 510.0, 336.0, 175.0, 117.0, 61.0, 49.0, 38.0, 34.0, 22.0, 23.0, 9.0, 5.0, 5.0, 7.0, 6.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.005859375, -2.91546630859375, -2.8250732421875, -2.73468017578125, -2.644287109375, -2.55389404296875, -2.4635009765625, -2.37310791015625, -2.28271484375, -2.19232177734375, -2.1019287109375, -2.01153564453125, -1.921142578125, -1.83074951171875, -1.7403564453125, -1.64996337890625, -1.5595703125, -1.46917724609375, -1.3787841796875, -1.28839111328125, -1.197998046875, -1.10760498046875, -1.0172119140625, -0.92681884765625, -0.83642578125, -0.74603271484375, -0.6556396484375, -0.56524658203125, -0.474853515625, -0.38446044921875, -0.2940673828125, -0.20367431640625, -0.11328125, -0.02288818359375, 0.0675048828125, 0.15789794921875, 0.248291015625, 0.33868408203125, 0.4290771484375, 0.51947021484375, 0.60986328125, 0.70025634765625, 0.7906494140625, 0.88104248046875, 0.971435546875, 1.06182861328125, 1.1522216796875, 1.24261474609375, 1.3330078125, 1.42340087890625, 1.5137939453125, 1.60418701171875, 1.694580078125, 1.78497314453125, 1.8753662109375, 1.96575927734375, 2.05615234375, 2.14654541015625, 2.2369384765625, 2.32733154296875, 2.417724609375, 2.50811767578125, 2.5985107421875, 2.68890380859375, 2.779296875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 4.0, 7.0, 6.0, 14.0, 11.0, 9.0, 11.0, 15.0, 21.0, 18.0, 25.0, 32.0, 31.0, 28.0, 35.0, 35.0, 31.0, 41.0, 37.0, 45.0, 39.0, 46.0, 39.0, 38.0, 40.0, 27.0, 30.0, 32.0, 29.0, 28.0, 35.0, 25.0, 24.0, 23.0, 15.0, 17.0, 12.0, 8.0, 7.0, 6.0, 5.0, 5.0, 3.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0], "bins": [-1.6728515625, -1.620849609375, -1.56884765625, -1.516845703125, -1.46484375, -1.412841796875, -1.36083984375, -1.308837890625, -1.2568359375, -1.204833984375, -1.15283203125, -1.100830078125, -1.048828125, -0.996826171875, -0.94482421875, -0.892822265625, -0.8408203125, -0.788818359375, -0.73681640625, -0.684814453125, -0.6328125, -0.580810546875, -0.52880859375, -0.476806640625, -0.4248046875, -0.372802734375, -0.32080078125, -0.268798828125, -0.216796875, -0.164794921875, -0.11279296875, -0.060791015625, -0.0087890625, 0.043212890625, 0.09521484375, 0.147216796875, 0.19921875, 0.251220703125, 0.30322265625, 0.355224609375, 0.4072265625, 0.459228515625, 0.51123046875, 0.563232421875, 0.615234375, 0.667236328125, 0.71923828125, 0.771240234375, 0.8232421875, 0.875244140625, 0.92724609375, 0.979248046875, 1.03125, 1.083251953125, 1.13525390625, 1.187255859375, 1.2392578125, 1.291259765625, 1.34326171875, 1.395263671875, 1.447265625, 1.499267578125, 1.55126953125, 1.603271484375, 1.6552734375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 3.0, 6.0, 6.0, 10.0, 9.0, 11.0, 22.0, 25.0, 42.0, 50.0, 100.0, 169.0, 304.0, 566.0, 1074.0, 2287.0, 5127.0, 13129.0, 39673.0, 789838.0, 156689.0, 23819.0, 8722.0, 3431.0, 1574.0, 780.0, 437.0, 229.0, 153.0, 97.0, 60.0, 39.0, 23.0, 14.0, 11.0, 12.0, 4.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.43115234375, -0.41910552978515625, -0.4070587158203125, -0.39501190185546875, -0.382965087890625, -0.37091827392578125, -0.3588714599609375, -0.34682464599609375, -0.33477783203125, -0.32273101806640625, -0.3106842041015625, -0.29863739013671875, -0.286590576171875, -0.27454376220703125, -0.2624969482421875, -0.25045013427734375, -0.2384033203125, -0.22635650634765625, -0.2143096923828125, -0.20226287841796875, -0.190216064453125, -0.17816925048828125, -0.1661224365234375, -0.15407562255859375, -0.14202880859375, -0.12998199462890625, -0.1179351806640625, -0.10588836669921875, -0.093841552734375, -0.08179473876953125, -0.0697479248046875, -0.05770111083984375, -0.045654296875, -0.03360748291015625, -0.0215606689453125, -0.00951385498046875, 0.002532958984375, 0.01457977294921875, 0.0266265869140625, 0.03867340087890625, 0.05072021484375, 0.06276702880859375, 0.0748138427734375, 0.08686065673828125, 0.098907470703125, 0.11095428466796875, 0.1230010986328125, 0.13504791259765625, 0.1470947265625, 0.15914154052734375, 0.1711883544921875, 0.18323516845703125, 0.195281982421875, 0.20732879638671875, 0.2193756103515625, 0.23142242431640625, 0.24346923828125, 0.25551605224609375, 0.2675628662109375, 0.27960968017578125, 0.291656494140625, 0.30370330810546875, 0.3157501220703125, 0.32779693603515625, 0.33984375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 0.0, 2.0, 4.0, 5.0, 4.0, 7.0, 10.0, 4.0, 11.0, 15.0, 26.0, 39.0, 32.0, 53.0, 71.0, 68.0, 109.0, 98.0, 71.0, 95.0, 70.0, 40.0, 47.0, 23.0, 21.0, 16.0, 23.0, 8.0, 4.0, 6.0, 8.0, 3.0, 2.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.6803226470947266e-05, -5.532149225473404e-05, -5.383975803852081e-05, -5.235802382230759e-05, -5.087628960609436e-05, -4.9394555389881134e-05, -4.791282117366791e-05, -4.643108695745468e-05, -4.4949352741241455e-05, -4.346761852502823e-05, -4.1985884308815e-05, -4.0504150092601776e-05, -3.902241587638855e-05, -3.7540681660175323e-05, -3.60589474439621e-05, -3.457721322774887e-05, -3.3095479011535645e-05, -3.161374479532242e-05, -3.0132010579109192e-05, -2.8650276362895966e-05, -2.716854214668274e-05, -2.5686807930469513e-05, -2.4205073714256287e-05, -2.272333949804306e-05, -2.1241605281829834e-05, -1.9759871065616608e-05, -1.827813684940338e-05, -1.6796402633190155e-05, -1.531466841697693e-05, -1.3832934200763702e-05, -1.2351199984550476e-05, -1.086946576833725e-05, -9.387731552124023e-06, -7.905997335910797e-06, -6.424263119697571e-06, -4.9425289034843445e-06, -3.460794687271118e-06, -1.979060471057892e-06, -4.973262548446655e-07, 9.844079613685608e-07, 2.466142177581787e-06, 3.9478763937950134e-06, 5.42961061000824e-06, 6.911344826221466e-06, 8.393079042434692e-06, 9.874813258647919e-06, 1.1356547474861145e-05, 1.2838281691074371e-05, 1.4320015907287598e-05, 1.5801750123500824e-05, 1.728348433971405e-05, 1.8765218555927277e-05, 2.0246952772140503e-05, 2.172868698835373e-05, 2.3210421204566956e-05, 2.4692155420780182e-05, 2.6173889636993408e-05, 2.7655623853206635e-05, 2.913735806941986e-05, 3.061909228563309e-05, 3.2100826501846313e-05, 3.358256071805954e-05, 3.5064294934272766e-05, 3.654602915048599e-05, 3.802776336669922e-05]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 8.0, 11.0, 12.0, 22.0, 35.0, 48.0, 70.0, 116.0, 157.0, 251.0, 414.0, 684.0, 1026.0, 1623.0, 2768.0, 4194.0, 6918.0, 11504.0, 19242.0, 31324.0, 50232.0, 78773.0, 115098.0, 149301.0, 158663.0, 137553.0, 101615.0, 67474.0, 42368.0, 26112.0, 15763.0, 9562.0, 5856.0, 3617.0, 2255.0, 1394.0, 860.0, 594.0, 341.0, 232.0, 158.0, 111.0, 74.0, 40.0, 27.0, 23.0, 15.0, 13.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1456298828125, -0.14097976684570312, -0.13632965087890625, -0.13167953491210938, -0.1270294189453125, -0.12237930297851562, -0.11772918701171875, -0.11307907104492188, -0.108428955078125, -0.10377883911132812, -0.09912872314453125, -0.09447860717773438, -0.0898284912109375, -0.08517837524414062, -0.08052825927734375, -0.07587814331054688, -0.07122802734375, -0.06657791137695312, -0.06192779541015625, -0.057277679443359375, -0.0526275634765625, -0.047977447509765625, -0.04332733154296875, -0.038677215576171875, -0.034027099609375, -0.029376983642578125, -0.02472686767578125, -0.020076751708984375, -0.0154266357421875, -0.010776519775390625, -0.00612640380859375, -0.001476287841796875, 0.003173828125, 0.007823944091796875, 0.01247406005859375, 0.017124176025390625, 0.0217742919921875, 0.026424407958984375, 0.03107452392578125, 0.035724639892578125, 0.040374755859375, 0.045024871826171875, 0.04967498779296875, 0.054325103759765625, 0.0589752197265625, 0.06362533569335938, 0.06827545166015625, 0.07292556762695312, 0.07757568359375, 0.08222579956054688, 0.08687591552734375, 0.09152603149414062, 0.0961761474609375, 0.10082626342773438, 0.10547637939453125, 0.11012649536132812, 0.114776611328125, 0.11942672729492188, 0.12407684326171875, 0.12872695922851562, 0.1333770751953125, 0.13802719116210938, 0.14267730712890625, 0.14732742309570312, 0.1519775390625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 8.0, 7.0, 8.0, 6.0, 17.0, 20.0, 22.0, 16.0, 26.0, 33.0, 37.0, 41.0, 46.0, 42.0, 49.0, 56.0, 59.0, 54.0, 56.0, 45.0, 38.0, 45.0, 43.0, 30.0, 29.0, 29.0, 29.0, 27.0, 14.0, 19.0, 16.0, 6.0, 6.0, 6.0, 4.0, 8.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.06219482421875, -0.06032419204711914, -0.05845355987548828, -0.05658292770385742, -0.05471229553222656, -0.0528416633605957, -0.050971031188964844, -0.049100399017333984, -0.047229766845703125, -0.045359134674072266, -0.043488502502441406, -0.04161787033081055, -0.03974723815917969, -0.03787660598754883, -0.03600597381591797, -0.03413534164428711, -0.03226470947265625, -0.03039407730102539, -0.02852344512939453, -0.026652812957763672, -0.024782180786132812, -0.022911548614501953, -0.021040916442871094, -0.019170284271240234, -0.017299652099609375, -0.015429019927978516, -0.013558387756347656, -0.011687755584716797, -0.009817123413085938, -0.007946491241455078, -0.006075859069824219, -0.004205226898193359, -0.0023345947265625, -0.0004639625549316406, 0.0014066696166992188, 0.003277301788330078, 0.0051479339599609375, 0.007018566131591797, 0.008889198303222656, 0.010759830474853516, 0.012630462646484375, 0.014501094818115234, 0.016371726989746094, 0.018242359161376953, 0.020112991333007812, 0.021983623504638672, 0.02385425567626953, 0.02572488784790039, 0.02759552001953125, 0.02946615219116211, 0.03133678436279297, 0.03320741653442383, 0.03507804870605469, 0.03694868087768555, 0.038819313049316406, 0.040689945220947266, 0.042560577392578125, 0.044431209564208984, 0.046301841735839844, 0.0481724739074707, 0.05004310607910156, 0.05191373825073242, 0.05378437042236328, 0.05565500259399414, 0.057525634765625]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 6.0, 9.0, 7.0, 12.0, 14.0, 20.0, 20.0, 22.0, 27.0, 40.0, 36.0, 44.0, 51.0, 49.0, 54.0, 58.0, 63.0, 42.0, 37.0, 42.0, 54.0, 42.0, 29.0, 32.0, 28.0, 26.0, 25.0, 21.0, 22.0, 13.0, 13.0, 12.0, 4.0, 4.0, 6.0, 8.0, 3.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.067145347595215, -1.9843353033065796, -1.9015253782272339, -1.8187153339385986, -1.735905408859253, -1.6530953645706177, -1.5702853202819824, -1.4874753952026367, -1.4046653509140015, -1.3218553066253662, -1.2390453815460205, -1.1562353372573853, -1.07342529296875, -0.9906153678894043, -0.907805323600769, -0.8249953389167786, -0.7421853542327881, -0.6593753695487976, -0.5765653848648071, -0.4937553405761719, -0.4109453558921814, -0.3281353712081909, -0.24532535672187805, -0.16251534223556519, -0.07970535755157471, 0.0031046420335769653, 0.08591464161872864, 0.1687246412038803, 0.251534640789032, 0.33434462547302246, 0.4171546399593353, 0.4999646544456482, 0.5827746391296387, 0.6655846238136292, 0.7483946084976196, 0.8312046527862549, 0.9140146374702454, 0.9968246221542358, 1.079634666442871, 1.1624445915222168, 1.245254635810852, 1.3280646800994873, 1.410874605178833, 1.4936846494674683, 1.5764946937561035, 1.6593046188354492, 1.7421146631240845, 1.8249247074127197, 1.9077346324920654, 1.9905446767807007, 2.073354721069336, 2.1561646461486816, 2.2389745712280273, 2.321784496307373, 2.404594659805298, 2.4874045848846436, 2.5702147483825684, 2.653024673461914, 2.735834836959839, 2.8186447620391846, 2.9014546871185303, 2.984264850616455, 3.067074775695801, 3.1498847007751465, 3.232694625854492]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 6.0, 2.0, 4.0, 3.0, 5.0, 5.0, 7.0, 16.0, 11.0, 18.0, 14.0, 25.0, 23.0, 28.0, 26.0, 26.0, 28.0, 35.0, 34.0, 33.0, 38.0, 34.0, 48.0, 39.0, 50.0, 35.0, 36.0, 25.0, 30.0, 38.0, 42.0, 26.0, 31.0, 25.0, 24.0, 21.0, 19.0, 23.0, 12.0, 23.0, 11.0, 10.0, 2.0, 0.0, 3.0, 5.0, 7.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.195040702819824, -2.123992919921875, -2.052945375442505, -1.9818977117538452, -1.9108500480651855, -1.8398023843765259, -1.7687547206878662, -1.6977070569992065, -1.6266593933105469, -1.5556117296218872, -1.4845640659332275, -1.4135164022445679, -1.3424687385559082, -1.2714210748672485, -1.2003734111785889, -1.1293257474899292, -1.0582780838012695, -0.9872304201126099, -0.9161827564239502, -0.8451350927352905, -0.7740874290466309, -0.7030397653579712, -0.6319921016693115, -0.5609444379806519, -0.4898967742919922, -0.4188491106033325, -0.34780144691467285, -0.2767537832260132, -0.20570611953735352, -0.13465845584869385, -0.06361079216003418, 0.007436871528625488, 0.07848429679870605, 0.14953196048736572, 0.2205796241760254, 0.29162728786468506, 0.3626749515533447, 0.4337226152420044, 0.5047702789306641, 0.5758179426193237, 0.6468656063079834, 0.7179132699966431, 0.7889609336853027, 0.8600085973739624, 0.9310562610626221, 1.0021039247512817, 1.0731515884399414, 1.144199252128601, 1.2152469158172607, 1.2862945795059204, 1.35734224319458, 1.4283899068832397, 1.4994375705718994, 1.570485234260559, 1.6415328979492188, 1.7125805616378784, 1.783628225326538, 1.8546758890151978, 1.9257235527038574, 1.996771216392517, 2.0678188800811768, 2.138866424560547, 2.209914207458496, 2.2809619903564453, 2.3520095348358154]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 11.0, 16.0, 26.0, 40.0, 88.0, 113.0, 178.0, 312.0, 516.0, 835.0, 1436.0, 2248.0, 3715.0, 5787.0, 9254.0, 14543.0, 22035.0, 32394.0, 45671.0, 61570.0, 79416.0, 94671.0, 105414.0, 108825.0, 103892.0, 91772.0, 75726.0, 58396.0, 43251.0, 30193.0, 20450.0, 13285.0, 8503.0, 5403.0, 3344.0, 1978.0, 1297.0, 828.0, 467.0, 249.0, 172.0, 113.0, 57.0, 19.0, 18.0, 15.0, 7.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.466796875, -1.4200897216796875, -1.373382568359375, -1.3266754150390625, -1.27996826171875, -1.2332611083984375, -1.186553955078125, -1.1398468017578125, -1.0931396484375, -1.0464324951171875, -0.999725341796875, -0.9530181884765625, -0.90631103515625, -0.8596038818359375, -0.812896728515625, -0.7661895751953125, -0.719482421875, -0.6727752685546875, -0.626068115234375, -0.5793609619140625, -0.53265380859375, -0.4859466552734375, -0.439239501953125, -0.3925323486328125, -0.3458251953125, -0.2991180419921875, -0.252410888671875, -0.2057037353515625, -0.15899658203125, -0.1122894287109375, -0.065582275390625, -0.0188751220703125, 0.02783203125, 0.0745391845703125, 0.121246337890625, 0.1679534912109375, 0.21466064453125, 0.2613677978515625, 0.308074951171875, 0.3547821044921875, 0.4014892578125, 0.4481964111328125, 0.494903564453125, 0.5416107177734375, 0.58831787109375, 0.6350250244140625, 0.681732177734375, 0.7284393310546875, 0.775146484375, 0.8218536376953125, 0.868560791015625, 0.9152679443359375, 0.96197509765625, 1.0086822509765625, 1.055389404296875, 1.1020965576171875, 1.1488037109375, 1.1955108642578125, 1.242218017578125, 1.2889251708984375, 1.33563232421875, 1.3823394775390625, 1.429046630859375, 1.4757537841796875, 1.5224609375]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 5.0, 2.0, 3.0, 12.0, 13.0, 10.0, 16.0, 14.0, 19.0, 24.0, 24.0, 26.0, 29.0, 23.0, 36.0, 41.0, 35.0, 37.0, 29.0, 53.0, 43.0, 44.0, 38.0, 38.0, 37.0, 48.0, 35.0, 39.0, 42.0, 25.0, 23.0, 17.0, 17.0, 14.0, 21.0, 19.0, 13.0, 10.0, 8.0, 4.0, 5.0, 0.0, 2.0, 4.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.419921875, -2.3441162109375, -2.268310546875, -2.1925048828125, -2.11669921875, -2.0408935546875, -1.965087890625, -1.8892822265625, -1.8134765625, -1.7376708984375, -1.661865234375, -1.5860595703125, -1.51025390625, -1.4344482421875, -1.358642578125, -1.2828369140625, -1.20703125, -1.1312255859375, -1.055419921875, -0.9796142578125, -0.90380859375, -0.8280029296875, -0.752197265625, -0.6763916015625, -0.6005859375, -0.5247802734375, -0.448974609375, -0.3731689453125, -0.29736328125, -0.2215576171875, -0.145751953125, -0.0699462890625, 0.005859375, 0.0816650390625, 0.157470703125, 0.2332763671875, 0.30908203125, 0.3848876953125, 0.460693359375, 0.5364990234375, 0.6123046875, 0.6881103515625, 0.763916015625, 0.8397216796875, 0.91552734375, 0.9913330078125, 1.067138671875, 1.1429443359375, 1.21875, 1.2945556640625, 1.370361328125, 1.4461669921875, 1.52197265625, 1.5977783203125, 1.673583984375, 1.7493896484375, 1.8251953125, 1.9010009765625, 1.976806640625, 2.0526123046875, 2.12841796875, 2.2042236328125, 2.280029296875, 2.3558349609375, 2.431640625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 5.0, 10.0, 12.0, 14.0, 34.0, 46.0, 78.0, 175.0, 286.0, 481.0, 960.0, 1833.0, 3381.0, 6166.0, 11371.0, 20585.0, 35003.0, 58070.0, 88284.0, 120951.0, 145283.0, 149955.0, 133238.0, 101971.0, 69462.0, 43499.0, 25681.0, 14541.0, 7837.0, 4246.0, 2321.0, 1241.0, 710.0, 376.0, 190.0, 115.0, 53.0, 37.0, 27.0, 9.0, 6.0, 12.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.52734375, -2.4575347900390625, -2.387725830078125, -2.3179168701171875, -2.24810791015625, -2.1782989501953125, -2.108489990234375, -2.0386810302734375, -1.9688720703125, -1.8990631103515625, -1.829254150390625, -1.7594451904296875, -1.68963623046875, -1.6198272705078125, -1.550018310546875, -1.4802093505859375, -1.410400390625, -1.3405914306640625, -1.270782470703125, -1.2009735107421875, -1.13116455078125, -1.0613555908203125, -0.991546630859375, -0.9217376708984375, -0.8519287109375, -0.7821197509765625, -0.712310791015625, -0.6425018310546875, -0.57269287109375, -0.5028839111328125, -0.433074951171875, -0.3632659912109375, -0.29345703125, -0.2236480712890625, -0.153839111328125, -0.0840301513671875, -0.01422119140625, 0.0555877685546875, 0.125396728515625, 0.1952056884765625, 0.2650146484375, 0.3348236083984375, 0.404632568359375, 0.4744415283203125, 0.54425048828125, 0.6140594482421875, 0.683868408203125, 0.7536773681640625, 0.823486328125, 0.8932952880859375, 0.963104248046875, 1.0329132080078125, 1.10272216796875, 1.1725311279296875, 1.242340087890625, 1.3121490478515625, 1.3819580078125, 1.4517669677734375, 1.521575927734375, 1.5913848876953125, 1.66119384765625, 1.7310028076171875, 1.800811767578125, 1.8706207275390625, 1.9404296875]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 8.0, 4.0, 5.0, 6.0, 4.0, 7.0, 6.0, 11.0, 14.0, 11.0, 19.0, 25.0, 29.0, 23.0, 27.0, 25.0, 33.0, 40.0, 33.0, 34.0, 30.0, 36.0, 39.0, 39.0, 36.0, 37.0, 39.0, 40.0, 34.0, 34.0, 37.0, 20.0, 28.0, 23.0, 22.0, 17.0, 15.0, 22.0, 12.0, 10.0, 12.0, 9.0, 11.0, 9.0, 4.0, 7.0, 8.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.3466796875, -1.3033294677734375, -1.259979248046875, -1.2166290283203125, -1.17327880859375, -1.1299285888671875, -1.086578369140625, -1.0432281494140625, -0.9998779296875, -0.9565277099609375, -0.913177490234375, -0.8698272705078125, -0.82647705078125, -0.7831268310546875, -0.739776611328125, -0.6964263916015625, -0.653076171875, -0.6097259521484375, -0.566375732421875, -0.5230255126953125, -0.47967529296875, -0.4363250732421875, -0.392974853515625, -0.3496246337890625, -0.3062744140625, -0.2629241943359375, -0.219573974609375, -0.1762237548828125, -0.13287353515625, -0.0895233154296875, -0.046173095703125, -0.0028228759765625, 0.04052734375, 0.0838775634765625, 0.127227783203125, 0.1705780029296875, 0.21392822265625, 0.2572784423828125, 0.300628662109375, 0.3439788818359375, 0.3873291015625, 0.4306793212890625, 0.474029541015625, 0.5173797607421875, 0.56072998046875, 0.6040802001953125, 0.647430419921875, 0.6907806396484375, 0.734130859375, 0.7774810791015625, 0.820831298828125, 0.8641815185546875, 0.90753173828125, 0.9508819580078125, 0.994232177734375, 1.0375823974609375, 1.0809326171875, 1.1242828369140625, 1.167633056640625, 1.2109832763671875, 1.25433349609375, 1.2976837158203125, 1.341033935546875, 1.3843841552734375, 1.427734375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 8.0, 11.0, 12.0, 17.0, 20.0, 30.0, 54.0, 76.0, 88.0, 144.0, 211.0, 315.0, 459.0, 757.0, 1166.0, 1782.0, 2788.0, 4328.0, 7426.0, 12198.0, 19736.0, 32213.0, 50678.0, 75366.0, 104817.0, 130468.0, 141732.0, 132527.0, 108852.0, 78943.0, 53176.0, 33397.0, 20854.0, 12843.0, 7770.0, 4846.0, 2981.0, 1875.0, 1285.0, 779.0, 527.0, 301.0, 222.0, 160.0, 108.0, 79.0, 40.0, 31.0, 30.0, 17.0, 8.0, 4.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.85888671875, -0.830780029296875, -0.80267333984375, -0.774566650390625, -0.7464599609375, -0.718353271484375, -0.69024658203125, -0.662139892578125, -0.634033203125, -0.605926513671875, -0.57781982421875, -0.549713134765625, -0.5216064453125, -0.493499755859375, -0.46539306640625, -0.437286376953125, -0.4091796875, -0.381072998046875, -0.35296630859375, -0.324859619140625, -0.2967529296875, -0.268646240234375, -0.24053955078125, -0.212432861328125, -0.184326171875, -0.156219482421875, -0.12811279296875, -0.100006103515625, -0.0718994140625, -0.043792724609375, -0.01568603515625, 0.012420654296875, 0.04052734375, 0.068634033203125, 0.09674072265625, 0.124847412109375, 0.1529541015625, 0.181060791015625, 0.20916748046875, 0.237274169921875, 0.265380859375, 0.293487548828125, 0.32159423828125, 0.349700927734375, 0.3778076171875, 0.405914306640625, 0.43402099609375, 0.462127685546875, 0.490234375, 0.518341064453125, 0.54644775390625, 0.574554443359375, 0.6026611328125, 0.630767822265625, 0.65887451171875, 0.686981201171875, 0.715087890625, 0.743194580078125, 0.77130126953125, 0.799407958984375, 0.8275146484375, 0.855621337890625, 0.88372802734375, 0.911834716796875, 0.93994140625]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 8.0, 2.0, 4.0, 4.0, 10.0, 5.0, 16.0, 11.0, 23.0, 26.0, 32.0, 26.0, 48.0, 51.0, 56.0, 60.0, 59.0, 73.0, 49.0, 64.0, 69.0, 53.0, 47.0, 48.0, 34.0, 29.0, 13.0, 28.0, 13.0, 11.0, 10.0, 4.0, 4.0, 8.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.00014519691467285156, -0.00014136359095573425, -0.00013753026723861694, -0.00013369694352149963, -0.00012986361980438232, -0.00012603029608726501, -0.0001221969723701477, -0.0001183636486530304, -0.00011453032493591309, -0.00011069700121879578, -0.00010686367750167847, -0.00010303035378456116, -9.919703006744385e-05, -9.536370635032654e-05, -9.153038263320923e-05, -8.769705891609192e-05, -8.386373519897461e-05, -8.00304114818573e-05, -7.619708776473999e-05, -7.236376404762268e-05, -6.853044033050537e-05, -6.469711661338806e-05, -6.086379289627075e-05, -5.703046917915344e-05, -5.319714546203613e-05, -4.936382174491882e-05, -4.5530498027801514e-05, -4.1697174310684204e-05, -3.7863850593566895e-05, -3.4030526876449585e-05, -3.0197203159332275e-05, -2.6363879442214966e-05, -2.2530555725097656e-05, -1.8697232007980347e-05, -1.4863908290863037e-05, -1.1030584573745728e-05, -7.197260856628418e-06, -3.3639371395111084e-06, 4.6938657760620117e-07, 4.302710294723511e-06, 8.13603401184082e-06, 1.196935772895813e-05, 1.580268144607544e-05, 1.963600516319275e-05, 2.346932888031006e-05, 2.7302652597427368e-05, 3.113597631454468e-05, 3.496930003166199e-05, 3.88026237487793e-05, 4.2635947465896606e-05, 4.6469271183013916e-05, 5.0302594900131226e-05, 5.4135918617248535e-05, 5.7969242334365845e-05, 6.180256605148315e-05, 6.563588976860046e-05, 6.946921348571777e-05, 7.330253720283508e-05, 7.713586091995239e-05, 8.09691846370697e-05, 8.480250835418701e-05, 8.863583207130432e-05, 9.246915578842163e-05, 9.630247950553894e-05, 0.00010013580322265625]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 1.0, 9.0, 18.0, 18.0, 30.0, 32.0, 58.0, 73.0, 104.0, 196.0, 293.0, 504.0, 834.0, 1466.0, 2468.0, 4444.0, 7831.0, 13918.0, 24632.0, 41364.0, 66870.0, 99260.0, 131804.0, 150803.0, 147855.0, 123353.0, 88450.0, 58841.0, 35392.0, 20418.0, 11750.0, 6600.0, 3724.0, 2049.0, 1225.0, 700.0, 406.0, 262.0, 171.0, 94.0, 62.0, 45.0, 30.0, 32.0, 19.0, 10.0, 11.0, 8.0, 4.0, 4.0, 3.0, 3.0, 2.0, 1.0, 3.0, 3.0], "bins": [-0.97412109375, -0.9435348510742188, -0.9129486083984375, -0.8823623657226562, -0.851776123046875, -0.8211898803710938, -0.7906036376953125, -0.7600173950195312, -0.72943115234375, -0.6988449096679688, -0.6682586669921875, -0.6376724243164062, -0.607086181640625, -0.5764999389648438, -0.5459136962890625, -0.5153274536132812, -0.4847412109375, -0.45415496826171875, -0.4235687255859375, -0.39298248291015625, -0.362396240234375, -0.33180999755859375, -0.3012237548828125, -0.27063751220703125, -0.24005126953125, -0.20946502685546875, -0.1788787841796875, -0.14829254150390625, -0.117706298828125, -0.08712005615234375, -0.0565338134765625, -0.02594757080078125, 0.004638671875, 0.03522491455078125, 0.0658111572265625, 0.09639739990234375, 0.126983642578125, 0.15756988525390625, 0.1881561279296875, 0.21874237060546875, 0.24932861328125, 0.27991485595703125, 0.3105010986328125, 0.34108734130859375, 0.371673583984375, 0.40225982666015625, 0.4328460693359375, 0.46343231201171875, 0.4940185546875, 0.5246047973632812, 0.5551910400390625, 0.5857772827148438, 0.616363525390625, 0.6469497680664062, 0.6775360107421875, 0.7081222534179688, 0.73870849609375, 0.7692947387695312, 0.7998809814453125, 0.8304672241210938, 0.861053466796875, 0.8916397094726562, 0.9222259521484375, 0.9528121948242188, 0.9833984375]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 10.0, 7.0, 6.0, 3.0, 7.0, 7.0, 9.0, 13.0, 13.0, 17.0, 34.0, 19.0, 15.0, 33.0, 30.0, 32.0, 39.0, 43.0, 49.0, 41.0, 43.0, 46.0, 39.0, 36.0, 48.0, 50.0, 39.0, 31.0, 44.0, 24.0, 19.0, 30.0, 25.0, 11.0, 14.0, 9.0, 14.0, 4.0, 9.0, 12.0, 10.0, 4.0, 5.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2685546875, -0.25974273681640625, -0.2509307861328125, -0.24211883544921875, -0.233306884765625, -0.22449493408203125, -0.2156829833984375, -0.20687103271484375, -0.19805908203125, -0.18924713134765625, -0.1804351806640625, -0.17162322998046875, -0.162811279296875, -0.15399932861328125, -0.1451873779296875, -0.13637542724609375, -0.1275634765625, -0.11875152587890625, -0.1099395751953125, -0.10112762451171875, -0.092315673828125, -0.08350372314453125, -0.0746917724609375, -0.06587982177734375, -0.05706787109375, -0.04825592041015625, -0.0394439697265625, -0.03063201904296875, -0.021820068359375, -0.01300811767578125, -0.0041961669921875, 0.00461578369140625, 0.013427734375, 0.02223968505859375, 0.0310516357421875, 0.03986358642578125, 0.048675537109375, 0.05748748779296875, 0.0662994384765625, 0.07511138916015625, 0.08392333984375, 0.09273529052734375, 0.1015472412109375, 0.11035919189453125, 0.119171142578125, 0.12798309326171875, 0.1367950439453125, 0.14560699462890625, 0.1544189453125, 0.16323089599609375, 0.1720428466796875, 0.18085479736328125, 0.189666748046875, 0.19847869873046875, 0.2072906494140625, 0.21610260009765625, 0.22491455078125, 0.23372650146484375, 0.2425384521484375, 0.25135040283203125, 0.260162353515625, 0.26897430419921875, 0.2777862548828125, 0.28659820556640625, 0.29541015625]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 3.0, 6.0, 4.0, 11.0, 7.0, 18.0, 14.0, 15.0, 13.0, 18.0, 30.0, 33.0, 43.0, 52.0, 42.0, 34.0, 45.0, 48.0, 49.0, 45.0, 41.0, 60.0, 48.0, 37.0, 44.0, 41.0, 32.0, 30.0, 26.0, 12.0, 20.0, 18.0, 15.0, 9.0, 5.0, 7.0, 3.0, 10.0, 8.0, 2.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0593392848968506, -1.9821583032608032, -1.9049773216247559, -1.827796220779419, -1.7506152391433716, -1.6734342575073242, -1.5962531566619873, -1.51907217502594, -1.4418911933898926, -1.3647102117538452, -1.2875292301177979, -1.210348129272461, -1.1331671476364136, -1.0559861660003662, -0.9788051247596741, -0.9016240835189819, -0.8244431018829346, -0.7472621202468872, -0.6700810790061951, -0.5929000377655029, -0.5157190561294556, -0.4385380446910858, -0.36135703325271606, -0.2841759920120239, -0.20699501037597656, -0.1298139989376068, -0.05263298749923706, 0.02454802393913269, 0.10172903537750244, 0.1789100468158722, 0.25609105825424194, 0.3332720994949341, 0.41045284271240234, 0.4876338541507721, 0.5648148655891418, 0.641995906829834, 0.7191768884658813, 0.7963578701019287, 0.8735389113426208, 0.950719952583313, 1.0279009342193604, 1.1050819158554077, 1.182262897491455, 1.259443998336792, 1.3366249799728394, 1.4138059616088867, 1.4909870624542236, 1.568168044090271, 1.6453490257263184, 1.7225300073623657, 1.799710988998413, 1.87689208984375, 1.9540730714797974, 2.0312540531158447, 2.1084351539611816, 2.1856160163879395, 2.2627971172332764, 2.3399782180786133, 2.417159080505371, 2.494340181350708, 2.571521282196045, 2.6487021446228027, 2.7258832454681396, 2.8030643463134766, 2.8802452087402344]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 2.0, 5.0, 5.0, 10.0, 14.0, 7.0, 6.0, 11.0, 9.0, 24.0, 18.0, 25.0, 23.0, 21.0, 27.0, 26.0, 29.0, 41.0, 32.0, 44.0, 45.0, 41.0, 42.0, 37.0, 43.0, 33.0, 45.0, 47.0, 27.0, 32.0, 36.0, 27.0, 22.0, 20.0, 25.0, 18.0, 20.0, 13.0, 11.0, 10.0, 13.0, 2.0, 5.0, 4.0, 5.0, 3.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4597015380859375, -2.3847670555114746, -2.3098325729370117, -2.234898090362549, -2.159963607788086, -2.085029125213623, -2.01009464263916, -1.9351601600646973, -1.8602256774902344, -1.7852911949157715, -1.7103567123413086, -1.6354222297668457, -1.5604877471923828, -1.48555326461792, -1.410618782043457, -1.3356842994689941, -1.2607496976852417, -1.1858152151107788, -1.110880732536316, -1.035946249961853, -0.9610117673873901, -0.8860772848129272, -0.8111427426338196, -0.7362082600593567, -0.6612737774848938, -0.5863392949104309, -0.511404812335968, -0.43647029995918274, -0.36153581738471985, -0.28660133481025696, -0.21166682243347168, -0.1367323398590088, -0.0617978572845459, 0.013136632740497589, 0.08807112276554108, 0.16300562024116516, 0.23794010281562805, 0.31287458539009094, 0.3878090977668762, 0.4627435803413391, 0.537678062915802, 0.6126125454902649, 0.6875470280647278, 0.7624815702438354, 0.8374160528182983, 0.9123505353927612, 0.9872850179672241, 1.062219500541687, 1.13715398311615, 1.2120884656906128, 1.2870229482650757, 1.3619574308395386, 1.4368919134140015, 1.5118263959884644, 1.5867609977722168, 1.6616954803466797, 1.7366299629211426, 1.8115644454956055, 1.8864989280700684, 1.9614334106445312, 2.036367893218994, 2.111302375793457, 2.18623685836792, 2.261171340942383, 2.3361058235168457]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 7.0, 9.0, 9.0, 25.0, 27.0, 63.0, 122.0, 190.0, 288.0, 469.0, 704.0, 1181.0, 1918.0, 3042.0, 5000.0, 8266.0, 13489.0, 22044.0, 37155.0, 61732.0, 102619.0, 167660.0, 264732.0, 392162.0, 515503.0, 589658.0, 575448.0, 478223.0, 350960.0, 232871.0, 144663.0, 88618.0, 53221.0, 31791.0, 19403.0, 11840.0, 7170.0, 4509.0, 2770.0, 1699.0, 1137.0, 725.0, 419.0, 290.0, 158.0, 100.0, 73.0, 50.0, 31.0, 23.0, 9.0, 10.0, 3.0, 2.0, 6.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.525390625, -1.4742889404296875, -1.423187255859375, -1.3720855712890625, -1.32098388671875, -1.2698822021484375, -1.218780517578125, -1.1676788330078125, -1.1165771484375, -1.0654754638671875, -1.014373779296875, -0.9632720947265625, -0.91217041015625, -0.8610687255859375, -0.809967041015625, -0.7588653564453125, -0.707763671875, -0.6566619873046875, -0.605560302734375, -0.5544586181640625, -0.50335693359375, -0.4522552490234375, -0.401153564453125, -0.3500518798828125, -0.2989501953125, -0.2478485107421875, -0.196746826171875, -0.1456451416015625, -0.09454345703125, -0.0434417724609375, 0.007659912109375, 0.0587615966796875, 0.10986328125, 0.1609649658203125, 0.212066650390625, 0.2631683349609375, 0.31427001953125, 0.3653717041015625, 0.416473388671875, 0.4675750732421875, 0.5186767578125, 0.5697784423828125, 0.620880126953125, 0.6719818115234375, 0.72308349609375, 0.7741851806640625, 0.825286865234375, 0.8763885498046875, 0.927490234375, 0.9785919189453125, 1.029693603515625, 1.0807952880859375, 1.13189697265625, 1.1829986572265625, 1.234100341796875, 1.2852020263671875, 1.3363037109375, 1.3874053955078125, 1.438507080078125, 1.4896087646484375, 1.54071044921875, 1.5918121337890625, 1.642913818359375, 1.6940155029296875, 1.7451171875]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 6.0, 4.0, 1.0, 3.0, 5.0, 6.0, 8.0, 10.0, 8.0, 9.0, 5.0, 13.0, 10.0, 28.0, 21.0, 21.0, 21.0, 20.0, 23.0, 37.0, 42.0, 39.0, 38.0, 41.0, 34.0, 30.0, 47.0, 33.0, 38.0, 40.0, 40.0, 32.0, 37.0, 24.0, 29.0, 29.0, 27.0, 30.0, 23.0, 17.0, 15.0, 13.0, 12.0, 11.0, 5.0, 6.0, 5.0, 4.0, 10.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.90625, -1.845794677734375, -1.78533935546875, -1.724884033203125, -1.6644287109375, -1.603973388671875, -1.54351806640625, -1.483062744140625, -1.422607421875, -1.362152099609375, -1.30169677734375, -1.241241455078125, -1.1807861328125, -1.120330810546875, -1.05987548828125, -0.999420166015625, -0.93896484375, -0.878509521484375, -0.81805419921875, -0.757598876953125, -0.6971435546875, -0.636688232421875, -0.57623291015625, -0.515777587890625, -0.455322265625, -0.394866943359375, -0.33441162109375, -0.273956298828125, -0.2135009765625, -0.153045654296875, -0.09259033203125, -0.032135009765625, 0.0283203125, 0.088775634765625, 0.14923095703125, 0.209686279296875, 0.2701416015625, 0.330596923828125, 0.39105224609375, 0.451507568359375, 0.511962890625, 0.572418212890625, 0.63287353515625, 0.693328857421875, 0.7537841796875, 0.814239501953125, 0.87469482421875, 0.935150146484375, 0.99560546875, 1.056060791015625, 1.11651611328125, 1.176971435546875, 1.2374267578125, 1.297882080078125, 1.35833740234375, 1.418792724609375, 1.479248046875, 1.539703369140625, 1.60015869140625, 1.660614013671875, 1.7210693359375, 1.781524658203125, 1.84197998046875, 1.902435302734375, 1.962890625]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [2.0, 2.0, 10.0, 9.0, 15.0, 28.0, 42.0, 62.0, 115.0, 191.0, 347.0, 530.0, 896.0, 1600.0, 2712.0, 4563.0, 7977.0, 13923.0, 23835.0, 41627.0, 70564.0, 118673.0, 194613.0, 303897.0, 441019.0, 566467.0, 621354.0, 564559.0, 438146.0, 299597.0, 192860.0, 117179.0, 69909.0, 40771.0, 23712.0, 13475.0, 8068.0, 4483.0, 2663.0, 1548.0, 905.0, 562.0, 324.0, 184.0, 121.0, 67.0, 37.0, 17.0, 20.0, 10.0, 8.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6962890625, -1.6322479248046875, -1.568206787109375, -1.5041656494140625, -1.44012451171875, -1.3760833740234375, -1.312042236328125, -1.2480010986328125, -1.1839599609375, -1.1199188232421875, -1.055877685546875, -0.9918365478515625, -0.92779541015625, -0.8637542724609375, -0.799713134765625, -0.7356719970703125, -0.671630859375, -0.6075897216796875, -0.543548583984375, -0.4795074462890625, -0.41546630859375, -0.3514251708984375, -0.287384033203125, -0.2233428955078125, -0.1593017578125, -0.0952606201171875, -0.031219482421875, 0.0328216552734375, 0.09686279296875, 0.1609039306640625, 0.224945068359375, 0.2889862060546875, 0.35302734375, 0.4170684814453125, 0.481109619140625, 0.5451507568359375, 0.60919189453125, 0.6732330322265625, 0.737274169921875, 0.8013153076171875, 0.8653564453125, 0.9293975830078125, 0.993438720703125, 1.0574798583984375, 1.12152099609375, 1.1855621337890625, 1.249603271484375, 1.3136444091796875, 1.377685546875, 1.4417266845703125, 1.505767822265625, 1.5698089599609375, 1.63385009765625, 1.6978912353515625, 1.761932373046875, 1.8259735107421875, 1.8900146484375, 1.9540557861328125, 2.018096923828125, 2.0821380615234375, 2.14617919921875, 2.2102203369140625, 2.274261474609375, 2.3383026123046875, 2.40234375]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 7.0, 7.0, 15.0, 13.0, 20.0, 34.0, 39.0, 40.0, 57.0, 61.0, 90.0, 102.0, 120.0, 156.0, 170.0, 184.0, 198.0, 222.0, 253.0, 259.0, 234.0, 240.0, 214.0, 235.0, 199.0, 149.0, 138.0, 124.0, 92.0, 87.0, 68.0, 68.0, 42.0, 27.0, 26.0, 18.0, 15.0, 14.0, 11.0, 8.0, 4.0, 1.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.79345703125, -0.7649612426757812, -0.7364654541015625, -0.7079696655273438, -0.679473876953125, -0.6509780883789062, -0.6224822998046875, -0.5939865112304688, -0.56549072265625, -0.5369949340820312, -0.5084991455078125, -0.48000335693359375, -0.451507568359375, -0.42301177978515625, -0.3945159912109375, -0.36602020263671875, -0.3375244140625, -0.30902862548828125, -0.2805328369140625, -0.25203704833984375, -0.223541259765625, -0.19504547119140625, -0.1665496826171875, -0.13805389404296875, -0.10955810546875, -0.08106231689453125, -0.0525665283203125, -0.02407073974609375, 0.004425048828125, 0.03292083740234375, 0.0614166259765625, 0.08991241455078125, 0.118408203125, 0.14690399169921875, 0.1753997802734375, 0.20389556884765625, 0.232391357421875, 0.26088714599609375, 0.2893829345703125, 0.31787872314453125, 0.34637451171875, 0.37487030029296875, 0.4033660888671875, 0.43186187744140625, 0.460357666015625, 0.48885345458984375, 0.5173492431640625, 0.5458450317382812, 0.5743408203125, 0.6028366088867188, 0.6313323974609375, 0.6598281860351562, 0.688323974609375, 0.7168197631835938, 0.7453155517578125, 0.7738113403320312, 0.80230712890625, 0.8308029174804688, 0.8592987060546875, 0.8877944946289062, 0.916290283203125, 0.9447860717773438, 0.9732818603515625, 1.0017776489257812, 1.0302734375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 6.0, 5.0, 9.0, 8.0, 9.0, 12.0, 18.0, 21.0, 18.0, 23.0, 30.0, 28.0, 28.0, 34.0, 40.0, 27.0, 40.0, 49.0, 57.0, 52.0, 47.0, 46.0, 51.0, 45.0, 36.0, 31.0, 33.0, 32.0, 20.0, 19.0, 21.0, 23.0, 17.0, 8.0, 8.0, 10.0, 6.0, 8.0, 7.0, 5.0, 3.0, 7.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.179861545562744, -2.1089839935302734, -2.0381064414978027, -1.9672290086746216, -1.8963515758514404, -1.8254740238189697, -1.754596471786499, -1.6837189197540283, -1.6128414869308472, -1.5419639348983765, -1.4710865020751953, -1.4002089500427246, -1.329331398010254, -1.2584539651870728, -1.187576413154602, -1.116698980331421, -1.0458214282989502, -0.9749439358711243, -0.9040664434432983, -0.8331888914108276, -0.7623113989830017, -0.6914339065551758, -0.6205563545227051, -0.5496788620948792, -0.4788013696670532, -0.4079238772392273, -0.337046355009079, -0.26616883277893066, -0.19529134035110474, -0.12441384792327881, -0.05353632569313049, 0.017341196537017822, 0.08821845054626465, 0.15909595787525177, 0.2299734652042389, 0.3008509874343872, 0.37172847986221313, 0.44260597229003906, 0.5134835243225098, 0.5843610167503357, 0.6552385091781616, 0.7261160016059875, 0.7969934940338135, 0.8678710460662842, 0.9387485384941101, 1.009626030921936, 1.0805035829544067, 1.151381015777588, 1.2222585678100586, 1.2931361198425293, 1.3640135526657104, 1.4348911046981812, 1.5057685375213623, 1.576646089553833, 1.6475236415863037, 1.7184011936187744, 1.7892786264419556, 1.8601561784744263, 1.9310336112976074, 2.001911163330078, 2.072788715362549, 2.1436662673950195, 2.214543581008911, 2.285421133041382, 2.3562986850738525]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 5.0, 3.0, 9.0, 8.0, 3.0, 11.0, 7.0, 18.0, 10.0, 18.0, 21.0, 23.0, 21.0, 26.0, 40.0, 28.0, 32.0, 31.0, 28.0, 31.0, 42.0, 40.0, 41.0, 56.0, 40.0, 42.0, 29.0, 38.0, 35.0, 31.0, 25.0, 20.0, 42.0, 24.0, 17.0, 16.0, 23.0, 11.0, 7.0, 12.0, 12.0, 8.0, 3.0, 6.0, 2.0, 4.0, 3.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.021480083465576, -1.953728437423706, -1.8859769105911255, -1.818225383758545, -1.7504737377166748, -1.6827220916748047, -1.6149705648422241, -1.5472190380096436, -1.4794673919677734, -1.4117157459259033, -1.3439642190933228, -1.2762126922607422, -1.208461046218872, -1.140709400177002, -1.0729578733444214, -1.0052063465118408, -0.9374547004699707, -0.8697031140327454, -0.80195152759552, -0.7341999411582947, -0.6664483547210693, -0.598696768283844, -0.5309451818466187, -0.4631935954093933, -0.39544200897216797, -0.3276904225349426, -0.2599388360977173, -0.19218724966049194, -0.1244356632232666, -0.05668407678604126, 0.011067509651184082, 0.07881909608840942, 0.14657044410705566, 0.214322030544281, 0.28207361698150635, 0.3498252034187317, 0.41757678985595703, 0.4853283762931824, 0.5530799627304077, 0.6208315491676331, 0.6885831356048584, 0.7563347220420837, 0.8240863084793091, 0.8918378949165344, 0.9595894813537598, 1.0273411273956299, 1.0950926542282104, 1.162844181060791, 1.2305958271026611, 1.2983474731445312, 1.3660989999771118, 1.4338505268096924, 1.5016021728515625, 1.5693538188934326, 1.6371053457260132, 1.7048568725585938, 1.7726085186004639, 1.840360164642334, 1.9081116914749146, 1.9758632183074951, 2.0436148643493652, 2.1113665103912354, 2.1791181564331055, 2.2468695640563965, 2.3146212100982666]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 6.0, 3.0, 3.0, 6.0, 7.0, 14.0, 19.0, 28.0, 37.0, 51.0, 78.0, 124.0, 168.0, 282.0, 407.0, 701.0, 1090.0, 1739.0, 2760.0, 4513.0, 7636.0, 12469.0, 20483.0, 33042.0, 52395.0, 78806.0, 110339.0, 137201.0, 147135.0, 133418.0, 104183.0, 73174.0, 48114.0, 30026.0, 18408.0, 11499.0, 6843.0, 4269.0, 2728.0, 1598.0, 973.0, 634.0, 401.0, 270.0, 161.0, 122.0, 70.0, 38.0, 36.0, 26.0, 12.0, 11.0, 6.0, 3.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6240234375, -0.6035003662109375, -0.582977294921875, -0.5624542236328125, -0.54193115234375, -0.5214080810546875, -0.500885009765625, -0.4803619384765625, -0.4598388671875, -0.4393157958984375, -0.418792724609375, -0.3982696533203125, -0.37774658203125, -0.3572235107421875, -0.336700439453125, -0.3161773681640625, -0.295654296875, -0.2751312255859375, -0.254608154296875, -0.2340850830078125, -0.21356201171875, -0.1930389404296875, -0.172515869140625, -0.1519927978515625, -0.1314697265625, -0.1109466552734375, -0.090423583984375, -0.0699005126953125, -0.04937744140625, -0.0288543701171875, -0.008331298828125, 0.0121917724609375, 0.03271484375, 0.0532379150390625, 0.073760986328125, 0.0942840576171875, 0.11480712890625, 0.1353302001953125, 0.155853271484375, 0.1763763427734375, 0.1968994140625, 0.2174224853515625, 0.237945556640625, 0.2584686279296875, 0.27899169921875, 0.2995147705078125, 0.320037841796875, 0.3405609130859375, 0.361083984375, 0.3816070556640625, 0.402130126953125, 0.4226531982421875, 0.44317626953125, 0.4636993408203125, 0.484222412109375, 0.5047454833984375, 0.5252685546875, 0.5457916259765625, 0.566314697265625, 0.5868377685546875, 0.60736083984375, 0.6278839111328125, 0.648406982421875, 0.6689300537109375, 0.689453125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 6.0, 4.0, 7.0, 7.0, 4.0, 9.0, 12.0, 17.0, 19.0, 12.0, 18.0, 17.0, 25.0, 29.0, 28.0, 32.0, 38.0, 33.0, 30.0, 38.0, 31.0, 44.0, 52.0, 27.0, 31.0, 49.0, 41.0, 33.0, 35.0, 38.0, 24.0, 23.0, 26.0, 28.0, 24.0, 19.0, 12.0, 19.0, 8.0, 13.0, 9.0, 4.0, 4.0, 5.0, 4.0, 8.0, 1.0, 1.0, 5.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-2.255859375, -2.186920166015625, -2.11798095703125, -2.049041748046875, -1.9801025390625, -1.911163330078125, -1.84222412109375, -1.773284912109375, -1.704345703125, -1.635406494140625, -1.56646728515625, -1.497528076171875, -1.4285888671875, -1.359649658203125, -1.29071044921875, -1.221771240234375, -1.15283203125, -1.083892822265625, -1.01495361328125, -0.946014404296875, -0.8770751953125, -0.808135986328125, -0.73919677734375, -0.670257568359375, -0.601318359375, -0.532379150390625, -0.46343994140625, -0.394500732421875, -0.3255615234375, -0.256622314453125, -0.18768310546875, -0.118743896484375, -0.0498046875, 0.019134521484375, 0.08807373046875, 0.157012939453125, 0.2259521484375, 0.294891357421875, 0.36383056640625, 0.432769775390625, 0.501708984375, 0.570648193359375, 0.63958740234375, 0.708526611328125, 0.7774658203125, 0.846405029296875, 0.91534423828125, 0.984283447265625, 1.05322265625, 1.122161865234375, 1.19110107421875, 1.260040283203125, 1.3289794921875, 1.397918701171875, 1.46685791015625, 1.535797119140625, 1.604736328125, 1.673675537109375, 1.74261474609375, 1.811553955078125, 1.8804931640625, 1.949432373046875, 2.01837158203125, 2.087310791015625, 2.15625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 6.0, 1.0, 5.0, 4.0, 5.0, 3.0, 11.0, 7.0, 5.0, 12.0, 28.0, 28.0, 28.0, 44.0, 52.0, 74.0, 84.0, 140.0, 229.0, 364.0, 567.0, 1068.0, 2061.0, 4201.0, 8810.0, 18263.0, 41835.0, 788282.0, 130692.0, 26567.0, 12455.0, 6001.0, 2999.0, 1437.0, 819.0, 461.0, 294.0, 163.0, 117.0, 81.0, 64.0, 51.0, 33.0, 38.0, 19.0, 15.0, 11.0, 9.0, 5.0, 5.0, 5.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.330078125, -2.251739501953125, -2.17340087890625, -2.095062255859375, -2.0167236328125, -1.938385009765625, -1.86004638671875, -1.781707763671875, -1.703369140625, -1.625030517578125, -1.54669189453125, -1.468353271484375, -1.3900146484375, -1.311676025390625, -1.23333740234375, -1.154998779296875, -1.07666015625, -0.998321533203125, -0.91998291015625, -0.841644287109375, -0.7633056640625, -0.684967041015625, -0.60662841796875, -0.528289794921875, -0.449951171875, -0.371612548828125, -0.29327392578125, -0.214935302734375, -0.1365966796875, -0.058258056640625, 0.02008056640625, 0.098419189453125, 0.1767578125, 0.255096435546875, 0.33343505859375, 0.411773681640625, 0.4901123046875, 0.568450927734375, 0.64678955078125, 0.725128173828125, 0.803466796875, 0.881805419921875, 0.96014404296875, 1.038482666015625, 1.1168212890625, 1.195159912109375, 1.27349853515625, 1.351837158203125, 1.43017578125, 1.508514404296875, 1.58685302734375, 1.665191650390625, 1.7435302734375, 1.821868896484375, 1.90020751953125, 1.978546142578125, 2.056884765625, 2.135223388671875, 2.21356201171875, 2.291900634765625, 2.3702392578125, 2.448577880859375, 2.52691650390625, 2.605255126953125, 2.68359375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 4.0, 6.0, 8.0, 13.0, 9.0, 11.0, 11.0, 25.0, 18.0, 12.0, 21.0, 32.0, 24.0, 32.0, 31.0, 35.0, 51.0, 40.0, 47.0, 44.0, 33.0, 32.0, 40.0, 46.0, 41.0, 39.0, 41.0, 24.0, 28.0, 30.0, 31.0, 17.0, 17.0, 20.0, 18.0, 18.0, 16.0, 14.0, 8.0, 6.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6845703125, -1.6329193115234375, -1.581268310546875, -1.5296173095703125, -1.47796630859375, -1.4263153076171875, -1.374664306640625, -1.3230133056640625, -1.2713623046875, -1.2197113037109375, -1.168060302734375, -1.1164093017578125, -1.06475830078125, -1.0131072998046875, -0.961456298828125, -0.9098052978515625, -0.858154296875, -0.8065032958984375, -0.754852294921875, -0.7032012939453125, -0.65155029296875, -0.5998992919921875, -0.548248291015625, -0.4965972900390625, -0.4449462890625, -0.3932952880859375, -0.341644287109375, -0.2899932861328125, -0.23834228515625, -0.1866912841796875, -0.135040283203125, -0.0833892822265625, -0.03173828125, 0.0199127197265625, 0.071563720703125, 0.1232147216796875, 0.17486572265625, 0.2265167236328125, 0.278167724609375, 0.3298187255859375, 0.3814697265625, 0.4331207275390625, 0.484771728515625, 0.5364227294921875, 0.58807373046875, 0.6397247314453125, 0.691375732421875, 0.7430267333984375, 0.794677734375, 0.8463287353515625, 0.897979736328125, 0.9496307373046875, 1.00128173828125, 1.0529327392578125, 1.104583740234375, 1.1562347412109375, 1.2078857421875, 1.2595367431640625, 1.311187744140625, 1.3628387451171875, 1.41448974609375, 1.4661407470703125, 1.517791748046875, 1.5694427490234375, 1.62109375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 5.0, 8.0, 7.0, 21.0, 21.0, 23.0, 27.0, 45.0, 49.0, 83.0, 101.0, 126.0, 207.0, 322.0, 413.0, 589.0, 938.0, 1373.0, 2058.0, 3243.0, 4857.0, 7983.0, 13083.0, 22930.0, 68260.0, 693405.0, 157098.0, 29269.0, 15551.0, 9489.0, 5869.0, 3755.0, 2399.0, 1556.0, 1051.0, 697.0, 486.0, 344.0, 271.0, 161.0, 117.0, 73.0, 60.0, 42.0, 38.0, 18.0, 21.0, 4.0, 4.0, 7.0, 4.0, 6.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1419677734375, -0.13718223571777344, -0.13239669799804688, -0.1276111602783203, -0.12282562255859375, -0.11804008483886719, -0.11325454711914062, -0.10846900939941406, -0.1036834716796875, -0.09889793395996094, -0.09411239624023438, -0.08932685852050781, -0.08454132080078125, -0.07975578308105469, -0.07497024536132812, -0.07018470764160156, -0.065399169921875, -0.06061363220214844, -0.055828094482421875, -0.05104255676269531, -0.04625701904296875, -0.04147148132324219, -0.036685943603515625, -0.03190040588378906, -0.0271148681640625, -0.022329330444335938, -0.017543792724609375, -0.012758255004882812, -0.00797271728515625, -0.0031871795654296875, 0.001598358154296875, 0.0063838958740234375, 0.01116943359375, 0.015954971313476562, 0.020740509033203125, 0.025526046752929688, 0.03031158447265625, 0.03509712219238281, 0.039882659912109375, 0.04466819763183594, 0.0494537353515625, 0.05423927307128906, 0.059024810791015625, 0.06381034851074219, 0.06859588623046875, 0.07338142395019531, 0.07816696166992188, 0.08295249938964844, 0.087738037109375, 0.09252357482910156, 0.09730911254882812, 0.10209465026855469, 0.10688018798828125, 0.11166572570800781, 0.11645126342773438, 0.12123680114746094, 0.1260223388671875, 0.13080787658691406, 0.13559341430664062, 0.1403789520263672, 0.14516448974609375, 0.1499500274658203, 0.15473556518554688, 0.15952110290527344, 0.164306640625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 5.0, 6.0, 10.0, 4.0, 8.0, 12.0, 14.0, 10.0, 14.0, 17.0, 31.0, 27.0, 39.0, 38.0, 46.0, 56.0, 50.0, 68.0, 33.0, 49.0, 52.0, 51.0, 37.0, 49.0, 31.0, 39.0, 27.0, 24.0, 32.0, 16.0, 14.0, 14.0, 15.0, 7.0, 5.0, 9.0, 8.0, 7.0, 6.0, 9.0, 6.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-2.2709369659423828e-05, -2.1996907889842987e-05, -2.1284446120262146e-05, -2.0571984350681305e-05, -1.9859522581100464e-05, -1.9147060811519623e-05, -1.8434599041938782e-05, -1.772213727235794e-05, -1.70096755027771e-05, -1.629721373319626e-05, -1.5584751963615417e-05, -1.4872290194034576e-05, -1.4159828424453735e-05, -1.3447366654872894e-05, -1.2734904885292053e-05, -1.2022443115711212e-05, -1.1309981346130371e-05, -1.059751957654953e-05, -9.885057806968689e-06, -9.172596037387848e-06, -8.460134267807007e-06, -7.747672498226166e-06, -7.035210728645325e-06, -6.322748959064484e-06, -5.610287189483643e-06, -4.8978254199028015e-06, -4.1853636503219604e-06, -3.4729018807411194e-06, -2.7604401111602783e-06, -2.0479783415794373e-06, -1.3355165719985962e-06, -6.230548024177551e-07, 8.940696716308594e-08, 8.01868736743927e-07, 1.514330506324768e-06, 2.226792275905609e-06, 2.93925404548645e-06, 3.6517158150672913e-06, 4.364177584648132e-06, 5.076639354228973e-06, 5.7891011238098145e-06, 6.5015628933906555e-06, 7.214024662971497e-06, 7.926486432552338e-06, 8.638948202133179e-06, 9.35140997171402e-06, 1.006387174129486e-05, 1.0776333510875702e-05, 1.1488795280456543e-05, 1.2201257050037384e-05, 1.2913718819618225e-05, 1.3626180589199066e-05, 1.4338642358779907e-05, 1.5051104128360748e-05, 1.576356589794159e-05, 1.647602766752243e-05, 1.718848943710327e-05, 1.7900951206684113e-05, 1.8613412976264954e-05, 1.9325874745845795e-05, 2.0038336515426636e-05, 2.0750798285007477e-05, 2.1463260054588318e-05, 2.217572182416916e-05, 2.288818359375e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 4.0, 14.0, 6.0, 7.0, 13.0, 26.0, 39.0, 82.0, 113.0, 226.0, 348.0, 595.0, 1038.0, 1785.0, 3221.0, 5657.0, 9879.0, 17169.0, 29943.0, 51138.0, 82678.0, 123065.0, 159053.0, 167132.0, 142193.0, 99722.0, 63415.0, 38215.0, 22065.0, 12865.0, 7130.0, 4093.0, 2382.0, 1350.0, 809.0, 422.0, 254.0, 159.0, 89.0, 52.0, 42.0, 28.0, 15.0, 10.0, 5.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.1474609375, -0.14315223693847656, -0.13884353637695312, -0.1345348358154297, -0.13022613525390625, -0.1259174346923828, -0.12160873413085938, -0.11730003356933594, -0.1129913330078125, -0.10868263244628906, -0.10437393188476562, -0.10006523132324219, -0.09575653076171875, -0.09144783020019531, -0.08713912963867188, -0.08283042907714844, -0.078521728515625, -0.07421302795410156, -0.06990432739257812, -0.06559562683105469, -0.06128692626953125, -0.05697822570800781, -0.052669525146484375, -0.04836082458496094, -0.0440521240234375, -0.03974342346191406, -0.035434722900390625, -0.031126022338867188, -0.02681732177734375, -0.022508621215820312, -0.018199920654296875, -0.013891220092773438, -0.00958251953125, -0.0052738189697265625, -0.000965118408203125, 0.0033435821533203125, 0.00765228271484375, 0.011960983276367188, 0.016269683837890625, 0.020578384399414062, 0.0248870849609375, 0.029195785522460938, 0.033504486083984375, 0.03781318664550781, 0.04212188720703125, 0.04643058776855469, 0.050739288330078125, 0.05504798889160156, 0.059356689453125, 0.06366539001464844, 0.06797409057617188, 0.07228279113769531, 0.07659149169921875, 0.08090019226074219, 0.08520889282226562, 0.08951759338378906, 0.0938262939453125, 0.09813499450683594, 0.10244369506835938, 0.10675239562988281, 0.11106109619140625, 0.11536979675292969, 0.11967849731445312, 0.12398719787597656, 0.1282958984375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 6.0, 4.0, 8.0, 8.0, 13.0, 12.0, 19.0, 20.0, 22.0, 16.0, 28.0, 34.0, 31.0, 39.0, 46.0, 40.0, 39.0, 37.0, 43.0, 34.0, 38.0, 46.0, 44.0, 44.0, 40.0, 48.0, 31.0, 30.0, 38.0, 22.0, 14.0, 17.0, 17.0, 18.0, 10.0, 15.0, 6.0, 8.0, 3.0, 6.0, 3.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.046478271484375, -0.04496192932128906, -0.043445587158203125, -0.04192924499511719, -0.04041290283203125, -0.03889656066894531, -0.037380218505859375, -0.03586387634277344, -0.0343475341796875, -0.03283119201660156, -0.031314849853515625, -0.029798507690429688, -0.02828216552734375, -0.026765823364257812, -0.025249481201171875, -0.023733139038085938, -0.022216796875, -0.020700454711914062, -0.019184112548828125, -0.017667770385742188, -0.01615142822265625, -0.014635086059570312, -0.013118743896484375, -0.011602401733398438, -0.0100860595703125, -0.008569717407226562, -0.007053375244140625, -0.0055370330810546875, -0.00402069091796875, -0.0025043487548828125, -0.000988006591796875, 0.0005283355712890625, 0.002044677734375, 0.0035610198974609375, 0.005077362060546875, 0.0065937042236328125, 0.00811004638671875, 0.009626388549804688, 0.011142730712890625, 0.012659072875976562, 0.0141754150390625, 0.015691757202148438, 0.017208099365234375, 0.018724441528320312, 0.02024078369140625, 0.021757125854492188, 0.023273468017578125, 0.024789810180664062, 0.02630615234375, 0.027822494506835938, 0.029338836669921875, 0.030855178833007812, 0.03237152099609375, 0.03388786315917969, 0.035404205322265625, 0.03692054748535156, 0.0384368896484375, 0.03995323181152344, 0.041469573974609375, 0.04298591613769531, 0.04450225830078125, 0.04601860046386719, 0.047534942626953125, 0.04905128479003906, 0.050567626953125]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 5.0, 8.0, 7.0, 10.0, 9.0, 4.0, 20.0, 23.0, 13.0, 21.0, 21.0, 29.0, 30.0, 33.0, 33.0, 36.0, 38.0, 39.0, 49.0, 62.0, 41.0, 46.0, 42.0, 47.0, 42.0, 30.0, 35.0, 35.0, 28.0, 22.0, 26.0, 24.0, 17.0, 10.0, 11.0, 10.0, 9.0, 8.0, 5.0, 7.0, 2.0, 2.0, 9.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1136229038238525, -2.044271945953369, -1.9749209880828857, -1.9055700302124023, -1.836219072341919, -1.7668681144714355, -1.6975171566009521, -1.6281661987304688, -1.5588152408599854, -1.489464282989502, -1.4201133251190186, -1.3507623672485352, -1.2814114093780518, -1.2120604515075684, -1.142709493637085, -1.0733585357666016, -1.0040075778961182, -0.9346566200256348, -0.8653056621551514, -0.795954704284668, -0.7266037464141846, -0.6572527885437012, -0.5879018306732178, -0.5185508728027344, -0.449199914932251, -0.3798489570617676, -0.3104979991912842, -0.24114704132080078, -0.17179608345031738, -0.10244512557983398, -0.033094167709350586, 0.03625679016113281, 0.10560750961303711, 0.1749584674835205, 0.2443094253540039, 0.3136603832244873, 0.3830113410949707, 0.4523622989654541, 0.5217132568359375, 0.5910642147064209, 0.6604151725769043, 0.7297661304473877, 0.7991170883178711, 0.8684680461883545, 0.9378190040588379, 1.0071699619293213, 1.0765209197998047, 1.145871877670288, 1.2152228355407715, 1.2845737934112549, 1.3539247512817383, 1.4232757091522217, 1.492626667022705, 1.5619776248931885, 1.6313285827636719, 1.7006795406341553, 1.7700304985046387, 1.839381456375122, 1.9087324142456055, 1.9780833721160889, 2.0474343299865723, 2.1167852878570557, 2.186136245727539, 2.2554872035980225, 2.324838161468506]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 3.0, 4.0, 7.0, 7.0, 5.0, 9.0, 7.0, 16.0, 14.0, 17.0, 23.0, 16.0, 24.0, 24.0, 35.0, 36.0, 34.0, 19.0, 37.0, 32.0, 39.0, 38.0, 39.0, 51.0, 57.0, 33.0, 33.0, 34.0, 33.0, 34.0, 23.0, 27.0, 29.0, 31.0, 24.0, 16.0, 18.0, 13.0, 7.0, 9.0, 15.0, 9.0, 3.0, 7.0, 1.0, 6.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.016432046890259, -1.9491982460021973, -1.8819643259048462, -1.8147305250167847, -1.7474966049194336, -1.680262804031372, -1.6130290031433105, -1.545795202255249, -1.478561282157898, -1.4113274812698364, -1.3440935611724854, -1.2768597602844238, -1.2096259593963623, -1.1423920392990112, -1.0751582384109497, -1.0079243183135986, -0.9406905174255371, -0.8734566569328308, -0.8062227964401245, -0.738988995552063, -0.6717551350593567, -0.6045212745666504, -0.5372874736785889, -0.47005361318588257, -0.40281975269317627, -0.33558589220046997, -0.26835206151008606, -0.20111821591854095, -0.13388437032699585, -0.06665050983428955, 0.0005833208560943604, 0.06781715154647827, 0.13505101203918457, 0.20228485763072968, 0.2695187032222748, 0.3367525339126587, 0.403986394405365, 0.4712202548980713, 0.5384540557861328, 0.6056879162788391, 0.6729217767715454, 0.7401556372642517, 0.807389497756958, 0.8746232986450195, 0.9418571591377258, 1.0090910196304321, 1.0763248205184937, 1.1435587406158447, 1.2107925415039062, 1.2780263423919678, 1.3452602624893188, 1.4124940633773804, 1.4797279834747314, 1.546961784362793, 1.6141955852508545, 1.681429386138916, 1.748663306236267, 1.8158971071243286, 1.8831310272216797, 1.9503648281097412, 2.0175986289978027, 2.0848326683044434, 2.152066469192505, 2.2193002700805664, 2.286534070968628]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 6.0, 11.0, 12.0, 21.0, 49.0, 59.0, 107.0, 143.0, 240.0, 369.0, 573.0, 886.0, 1405.0, 2315.0, 3565.0, 5451.0, 8438.0, 12903.0, 18788.0, 27558.0, 38664.0, 51745.0, 66894.0, 81874.0, 93467.0, 100613.0, 100776.0, 95317.0, 83436.0, 69101.0, 54504.0, 40823.0, 28944.0, 20167.0, 13722.0, 9046.0, 5832.0, 3906.0, 2490.0, 1655.0, 946.0, 635.0, 405.0, 234.0, 170.0, 107.0, 61.0, 50.0, 24.0, 18.0, 15.0, 7.0, 2.0, 4.0, 2.0, 1.0, 1.0, 3.0], "bins": [-1.3115234375, -1.2706451416015625, -1.229766845703125, -1.1888885498046875, -1.14801025390625, -1.1071319580078125, -1.066253662109375, -1.0253753662109375, -0.9844970703125, -0.9436187744140625, -0.902740478515625, -0.8618621826171875, -0.82098388671875, -0.7801055908203125, -0.739227294921875, -0.6983489990234375, -0.657470703125, -0.6165924072265625, -0.575714111328125, -0.5348358154296875, -0.49395751953125, -0.4530792236328125, -0.412200927734375, -0.3713226318359375, -0.3304443359375, -0.2895660400390625, -0.248687744140625, -0.2078094482421875, -0.16693115234375, -0.1260528564453125, -0.085174560546875, -0.0442962646484375, -0.00341796875, 0.0374603271484375, 0.078338623046875, 0.1192169189453125, 0.16009521484375, 0.2009735107421875, 0.241851806640625, 0.2827301025390625, 0.3236083984375, 0.3644866943359375, 0.405364990234375, 0.4462432861328125, 0.48712158203125, 0.5279998779296875, 0.568878173828125, 0.6097564697265625, 0.650634765625, 0.6915130615234375, 0.732391357421875, 0.7732696533203125, 0.81414794921875, 0.8550262451171875, 0.895904541015625, 0.9367828369140625, 0.9776611328125, 1.0185394287109375, 1.059417724609375, 1.1002960205078125, 1.14117431640625, 1.1820526123046875, 1.222930908203125, 1.2638092041015625, 1.3046875]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 7.0, 6.0, 6.0, 5.0, 8.0, 10.0, 20.0, 17.0, 11.0, 16.0, 20.0, 20.0, 25.0, 25.0, 30.0, 35.0, 33.0, 24.0, 40.0, 35.0, 52.0, 45.0, 39.0, 36.0, 41.0, 46.0, 41.0, 30.0, 24.0, 26.0, 35.0, 29.0, 18.0, 19.0, 16.0, 16.0, 19.0, 14.0, 14.0, 7.0, 12.0, 6.0, 5.0, 7.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.10546875, -2.03814697265625, -1.9708251953125, -1.90350341796875, -1.836181640625, -1.76885986328125, -1.7015380859375, -1.63421630859375, -1.56689453125, -1.49957275390625, -1.4322509765625, -1.36492919921875, -1.297607421875, -1.23028564453125, -1.1629638671875, -1.09564208984375, -1.0283203125, -0.96099853515625, -0.8936767578125, -0.82635498046875, -0.759033203125, -0.69171142578125, -0.6243896484375, -0.55706787109375, -0.48974609375, -0.42242431640625, -0.3551025390625, -0.28778076171875, -0.220458984375, -0.15313720703125, -0.0858154296875, -0.01849365234375, 0.048828125, 0.11614990234375, 0.1834716796875, 0.25079345703125, 0.318115234375, 0.38543701171875, 0.4527587890625, 0.52008056640625, 0.58740234375, 0.65472412109375, 0.7220458984375, 0.78936767578125, 0.856689453125, 0.92401123046875, 0.9913330078125, 1.05865478515625, 1.1259765625, 1.19329833984375, 1.2606201171875, 1.32794189453125, 1.395263671875, 1.46258544921875, 1.5299072265625, 1.59722900390625, 1.66455078125, 1.73187255859375, 1.7991943359375, 1.86651611328125, 1.933837890625, 2.00115966796875, 2.0684814453125, 2.13580322265625, 2.203125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 4.0, 8.0, 14.0, 24.0, 25.0, 40.0, 91.0, 139.0, 224.0, 394.0, 595.0, 1125.0, 1774.0, 2966.0, 5168.0, 8407.0, 14137.0, 22890.0, 35714.0, 52780.0, 74875.0, 97936.0, 117192.0, 127325.0, 122301.0, 105992.0, 83476.0, 60733.0, 41800.0, 27183.0, 17290.0, 10293.0, 6359.0, 3753.0, 2306.0, 1292.0, 785.0, 435.0, 266.0, 166.0, 104.0, 75.0, 32.0, 29.0, 11.0, 16.0, 5.0, 5.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7216796875, -1.6673583984375, -1.613037109375, -1.5587158203125, -1.50439453125, -1.4500732421875, -1.395751953125, -1.3414306640625, -1.287109375, -1.2327880859375, -1.178466796875, -1.1241455078125, -1.06982421875, -1.0155029296875, -0.961181640625, -0.9068603515625, -0.8525390625, -0.7982177734375, -0.743896484375, -0.6895751953125, -0.63525390625, -0.5809326171875, -0.526611328125, -0.4722900390625, -0.41796875, -0.3636474609375, -0.309326171875, -0.2550048828125, -0.20068359375, -0.1463623046875, -0.092041015625, -0.0377197265625, 0.0166015625, 0.0709228515625, 0.125244140625, 0.1795654296875, 0.23388671875, 0.2882080078125, 0.342529296875, 0.3968505859375, 0.451171875, 0.5054931640625, 0.559814453125, 0.6141357421875, 0.66845703125, 0.7227783203125, 0.777099609375, 0.8314208984375, 0.8857421875, 0.9400634765625, 0.994384765625, 1.0487060546875, 1.10302734375, 1.1573486328125, 1.211669921875, 1.2659912109375, 1.3203125, 1.3746337890625, 1.428955078125, 1.4832763671875, 1.53759765625, 1.5919189453125, 1.646240234375, 1.7005615234375, 1.7548828125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 4.0, 1.0, 3.0, 4.0, 3.0, 9.0, 4.0, 7.0, 5.0, 3.0, 12.0, 6.0, 14.0, 12.0, 11.0, 21.0, 28.0, 21.0, 20.0, 27.0, 27.0, 37.0, 34.0, 40.0, 44.0, 22.0, 29.0, 31.0, 31.0, 30.0, 38.0, 36.0, 35.0, 42.0, 21.0, 28.0, 28.0, 39.0, 28.0, 24.0, 25.0, 19.0, 17.0, 16.0, 11.0, 10.0, 6.0, 7.0, 10.0, 9.0, 3.0, 5.0, 6.0, 2.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-1.2158203125, -1.174957275390625, -1.13409423828125, -1.093231201171875, -1.0523681640625, -1.011505126953125, -0.97064208984375, -0.929779052734375, -0.888916015625, -0.848052978515625, -0.80718994140625, -0.766326904296875, -0.7254638671875, -0.684600830078125, -0.64373779296875, -0.602874755859375, -0.56201171875, -0.521148681640625, -0.48028564453125, -0.439422607421875, -0.3985595703125, -0.357696533203125, -0.31683349609375, -0.275970458984375, -0.235107421875, -0.194244384765625, -0.15338134765625, -0.112518310546875, -0.0716552734375, -0.030792236328125, 0.01007080078125, 0.050933837890625, 0.091796875, 0.132659912109375, 0.17352294921875, 0.214385986328125, 0.2552490234375, 0.296112060546875, 0.33697509765625, 0.377838134765625, 0.418701171875, 0.459564208984375, 0.50042724609375, 0.541290283203125, 0.5821533203125, 0.623016357421875, 0.66387939453125, 0.704742431640625, 0.74560546875, 0.786468505859375, 0.82733154296875, 0.868194580078125, 0.9090576171875, 0.949920654296875, 0.99078369140625, 1.031646728515625, 1.072509765625, 1.113372802734375, 1.15423583984375, 1.195098876953125, 1.2359619140625, 1.276824951171875, 1.31768798828125, 1.358551025390625, 1.3994140625]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 3.0, 11.0, 14.0, 18.0, 38.0, 61.0, 83.0, 133.0, 217.0, 348.0, 588.0, 1021.0, 1736.0, 3073.0, 5804.0, 10938.0, 21018.0, 38364.0, 68155.0, 109598.0, 152640.0, 175413.0, 161737.0, 121140.0, 78613.0, 45168.0, 24186.0, 12953.0, 6899.0, 3694.0, 1999.0, 1156.0, 678.0, 411.0, 240.0, 143.0, 87.0, 64.0, 32.0, 25.0, 16.0, 16.0, 12.0, 10.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.962890625, -0.9324493408203125, -0.902008056640625, -0.8715667724609375, -0.84112548828125, -0.8106842041015625, -0.780242919921875, -0.7498016357421875, -0.7193603515625, -0.6889190673828125, -0.658477783203125, -0.6280364990234375, -0.59759521484375, -0.5671539306640625, -0.536712646484375, -0.5062713623046875, -0.475830078125, -0.4453887939453125, -0.414947509765625, -0.3845062255859375, -0.35406494140625, -0.3236236572265625, -0.293182373046875, -0.2627410888671875, -0.2322998046875, -0.2018585205078125, -0.171417236328125, -0.1409759521484375, -0.11053466796875, -0.0800933837890625, -0.049652099609375, -0.0192108154296875, 0.01123046875, 0.0416717529296875, 0.072113037109375, 0.1025543212890625, 0.13299560546875, 0.1634368896484375, 0.193878173828125, 0.2243194580078125, 0.2547607421875, 0.2852020263671875, 0.315643310546875, 0.3460845947265625, 0.37652587890625, 0.4069671630859375, 0.437408447265625, 0.4678497314453125, 0.498291015625, 0.5287322998046875, 0.559173583984375, 0.5896148681640625, 0.62005615234375, 0.6504974365234375, 0.680938720703125, 0.7113800048828125, 0.7418212890625, 0.7722625732421875, 0.802703857421875, 0.8331451416015625, 0.86358642578125, 0.8940277099609375, 0.924468994140625, 0.9549102783203125, 0.9853515625]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 6.0, 10.0, 7.0, 5.0, 15.0, 11.0, 16.0, 13.0, 17.0, 18.0, 25.0, 36.0, 26.0, 30.0, 43.0, 44.0, 50.0, 42.0, 52.0, 44.0, 50.0, 47.0, 47.0, 44.0, 41.0, 40.0, 30.0, 28.0, 22.0, 26.0, 21.0, 18.0, 13.0, 8.0, 11.0, 8.0, 7.0, 6.0, 6.0, 5.0, 3.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-7.706880569458008e-05, -7.456168532371521e-05, -7.205456495285034e-05, -6.954744458198547e-05, -6.70403242111206e-05, -6.453320384025574e-05, -6.202608346939087e-05, -5.9518963098526e-05, -5.701184272766113e-05, -5.4504722356796265e-05, -5.1997601985931396e-05, -4.949048161506653e-05, -4.698336124420166e-05, -4.447624087333679e-05, -4.1969120502471924e-05, -3.9462000131607056e-05, -3.695487976074219e-05, -3.444775938987732e-05, -3.194063901901245e-05, -2.9433518648147583e-05, -2.6926398277282715e-05, -2.4419277906417847e-05, -2.191215753555298e-05, -1.940503716468811e-05, -1.6897916793823242e-05, -1.4390796422958374e-05, -1.1883676052093506e-05, -9.376555681228638e-06, -6.8694353103637695e-06, -4.362314939498901e-06, -1.8551945686340332e-06, 6.51925802230835e-07, 3.159046173095703e-06, 5.666166543960571e-06, 8.17328691482544e-06, 1.0680407285690308e-05, 1.3187527656555176e-05, 1.5694648027420044e-05, 1.8201768398284912e-05, 2.070888876914978e-05, 2.321600914001465e-05, 2.5723129510879517e-05, 2.8230249881744385e-05, 3.073737025260925e-05, 3.324449062347412e-05, 3.575161099433899e-05, 3.825873136520386e-05, 4.0765851736068726e-05, 4.3272972106933594e-05, 4.578009247779846e-05, 4.828721284866333e-05, 5.07943332195282e-05, 5.3301453590393066e-05, 5.5808573961257935e-05, 5.83156943321228e-05, 6.082281470298767e-05, 6.332993507385254e-05, 6.583705544471741e-05, 6.834417581558228e-05, 7.085129618644714e-05, 7.335841655731201e-05, 7.586553692817688e-05, 7.837265729904175e-05, 8.087977766990662e-05, 8.338689804077148e-05]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 12.0, 11.0, 21.0, 21.0, 41.0, 53.0, 90.0, 148.0, 209.0, 320.0, 535.0, 788.0, 1170.0, 1914.0, 2889.0, 4676.0, 7244.0, 11350.0, 17447.0, 26368.0, 39158.0, 56080.0, 75878.0, 95789.0, 111378.0, 118252.0, 113440.0, 99228.0, 79769.0, 59628.0, 42208.0, 28654.0, 19228.0, 12318.0, 7966.0, 5111.0, 3285.0, 2134.0, 1327.0, 891.0, 536.0, 352.0, 230.0, 144.0, 103.0, 67.0, 33.0, 17.0, 17.0, 15.0, 7.0, 7.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.63916015625, -0.6189346313476562, -0.5987091064453125, -0.5784835815429688, -0.558258056640625, -0.5380325317382812, -0.5178070068359375, -0.49758148193359375, -0.47735595703125, -0.45713043212890625, -0.4369049072265625, -0.41667938232421875, -0.396453857421875, -0.37622833251953125, -0.3560028076171875, -0.33577728271484375, -0.3155517578125, -0.29532623291015625, -0.2751007080078125, -0.25487518310546875, -0.234649658203125, -0.21442413330078125, -0.1941986083984375, -0.17397308349609375, -0.15374755859375, -0.13352203369140625, -0.1132965087890625, -0.09307098388671875, -0.072845458984375, -0.05261993408203125, -0.0323944091796875, -0.01216888427734375, 0.008056640625, 0.02828216552734375, 0.0485076904296875, 0.06873321533203125, 0.088958740234375, 0.10918426513671875, 0.1294097900390625, 0.14963531494140625, 0.16986083984375, 0.19008636474609375, 0.2103118896484375, 0.23053741455078125, 0.250762939453125, 0.27098846435546875, 0.2912139892578125, 0.31143951416015625, 0.3316650390625, 0.35189056396484375, 0.3721160888671875, 0.39234161376953125, 0.412567138671875, 0.43279266357421875, 0.4530181884765625, 0.47324371337890625, 0.49346923828125, 0.5136947631835938, 0.5339202880859375, 0.5541458129882812, 0.574371337890625, 0.5945968627929688, 0.6148223876953125, 0.6350479125976562, 0.6552734375]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 2.0, 6.0, 6.0, 3.0, 9.0, 13.0, 16.0, 19.0, 17.0, 21.0, 23.0, 32.0, 27.0, 30.0, 49.0, 47.0, 59.0, 52.0, 48.0, 47.0, 52.0, 54.0, 50.0, 48.0, 29.0, 37.0, 36.0, 26.0, 31.0, 23.0, 20.0, 10.0, 10.0, 10.0, 6.0, 10.0, 3.0, 9.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.329345703125, -0.31974029541015625, -0.3101348876953125, -0.30052947998046875, -0.290924072265625, -0.28131866455078125, -0.2717132568359375, -0.26210784912109375, -0.25250244140625, -0.24289703369140625, -0.2332916259765625, -0.22368621826171875, -0.214080810546875, -0.20447540283203125, -0.1948699951171875, -0.18526458740234375, -0.1756591796875, -0.16605377197265625, -0.1564483642578125, -0.14684295654296875, -0.137237548828125, -0.12763214111328125, -0.1180267333984375, -0.10842132568359375, -0.09881591796875, -0.08921051025390625, -0.0796051025390625, -0.06999969482421875, -0.060394287109375, -0.05078887939453125, -0.0411834716796875, -0.03157806396484375, -0.02197265625, -0.01236724853515625, -0.0027618408203125, 0.00684356689453125, 0.016448974609375, 0.02605438232421875, 0.0356597900390625, 0.04526519775390625, 0.05487060546875, 0.06447601318359375, 0.0740814208984375, 0.08368682861328125, 0.093292236328125, 0.10289764404296875, 0.1125030517578125, 0.12210845947265625, 0.1317138671875, 0.14131927490234375, 0.1509246826171875, 0.16053009033203125, 0.170135498046875, 0.17974090576171875, 0.1893463134765625, 0.19895172119140625, 0.20855712890625, 0.21816253662109375, 0.2277679443359375, 0.23737335205078125, 0.246978759765625, 0.25658416748046875, 0.2661895751953125, 0.27579498291015625, 0.285400390625]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 3.0, 4.0, 9.0, 9.0, 9.0, 11.0, 11.0, 10.0, 13.0, 12.0, 23.0, 27.0, 27.0, 29.0, 36.0, 35.0, 41.0, 49.0, 39.0, 42.0, 53.0, 47.0, 39.0, 48.0, 40.0, 34.0, 38.0, 31.0, 27.0, 35.0, 29.0, 23.0, 22.0, 12.0, 15.0, 13.0, 11.0, 9.0, 5.0, 4.0, 5.0, 4.0, 3.0, 4.0, 4.0, 5.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.0822019577026367, -2.015906572341919, -1.9496111869812012, -1.8833158016204834, -1.8170204162597656, -1.7507250308990479, -1.6844295263290405, -1.6181341409683228, -1.551838755607605, -1.4855433702468872, -1.4192479848861694, -1.3529525995254517, -1.2866570949554443, -1.2203617095947266, -1.1540663242340088, -1.087770938873291, -1.0214755535125732, -0.9551801681518555, -0.8888847827911377, -0.8225893378257751, -0.7562939524650574, -0.6899985671043396, -0.623703122138977, -0.5574077367782593, -0.4911123514175415, -0.42481696605682373, -0.35852155089378357, -0.2922261357307434, -0.22593075037002563, -0.15963536500930786, -0.0933399498462677, -0.02704453468322754, 0.039250850677490234, 0.1055462509393692, 0.17184165120124817, 0.23813705146312714, 0.3044324517250061, 0.3707278370857239, 0.43702325224876404, 0.5033186674118042, 0.569614052772522, 0.6359094381332397, 0.7022048234939575, 0.7685002684593201, 0.8347956538200378, 0.9010910391807556, 0.9673864841461182, 1.033681869506836, 1.0999772548675537, 1.1662726402282715, 1.2325680255889893, 1.298863410949707, 1.3651587963104248, 1.4314541816711426, 1.49774968624115, 1.5640450716018677, 1.6303404569625854, 1.6966358423233032, 1.762931227684021, 1.8292266130447388, 1.895522117614746, 1.9618175029754639, 2.0281128883361816, 2.0944082736968994, 2.160703659057617]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 5.0, 7.0, 10.0, 7.0, 22.0, 17.0, 22.0, 18.0, 20.0, 27.0, 26.0, 26.0, 35.0, 45.0, 47.0, 44.0, 49.0, 50.0, 47.0, 45.0, 44.0, 41.0, 53.0, 33.0, 37.0, 47.0, 35.0, 23.0, 22.0, 32.0, 14.0, 17.0, 7.0, 6.0, 6.0, 3.0, 5.0, 8.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.716916561126709, -2.6308350563049316, -2.5447535514831543, -2.458672046661377, -2.3725905418395996, -2.2865090370178223, -2.200427532196045, -2.1143457889556885, -2.028264284133911, -1.9421827793121338, -1.8561012744903564, -1.770019769668579, -1.6839381456375122, -1.5978566408157349, -1.5117751359939575, -1.4256935119628906, -1.3396121263504028, -1.2535306215286255, -1.1674491167068481, -1.0813674926757812, -0.9952859878540039, -0.9092044830322266, -0.8231229782104492, -0.7370414137840271, -0.6509599089622498, -0.5648784041404724, -0.4787968397140503, -0.39271533489227295, -0.3066338002681732, -0.2205522656440735, -0.13447076082229614, -0.04838919639587402, 0.03769230842590332, 0.12377383559942245, 0.2098553627729416, 0.2959368824958801, 0.38201841711997986, 0.4680999517440796, 0.5541814565658569, 0.640263020992279, 0.7263445258140564, 0.8124260306358337, 0.8985075950622559, 0.9845890998840332, 1.0706706047058105, 1.156752109527588, 1.2428336143493652, 1.3289152383804321, 1.4149967432022095, 1.5010782480239868, 1.5871597528457642, 1.673241376876831, 1.7593228816986084, 1.8454043865203857, 1.931485891342163, 2.0175673961639404, 2.1036489009857178, 2.189730405807495, 2.2758119106292725, 2.36189341545105, 2.447974920272827, 2.5340566635131836, 2.620138168334961, 2.7062196731567383, 2.7923011779785156]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 6.0, 5.0, 14.0, 18.0, 35.0, 42.0, 90.0, 161.0, 251.0, 406.0, 760.0, 1286.0, 2076.0, 3638.0, 6166.0, 10761.0, 18390.0, 32211.0, 56391.0, 98831.0, 170316.0, 282524.0, 433318.0, 581020.0, 656553.0, 606918.0, 467468.0, 313685.0, 190260.0, 110596.0, 63604.0, 36379.0, 20460.0, 12094.0, 7027.0, 4202.0, 2449.0, 1527.0, 852.0, 552.0, 345.0, 226.0, 159.0, 85.0, 46.0, 38.0, 24.0, 16.0, 3.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7470703125, -1.691802978515625, -1.63653564453125, -1.581268310546875, -1.5260009765625, -1.470733642578125, -1.41546630859375, -1.360198974609375, -1.304931640625, -1.249664306640625, -1.19439697265625, -1.139129638671875, -1.0838623046875, -1.028594970703125, -0.97332763671875, -0.918060302734375, -0.86279296875, -0.807525634765625, -0.75225830078125, -0.696990966796875, -0.6417236328125, -0.586456298828125, -0.53118896484375, -0.475921630859375, -0.420654296875, -0.365386962890625, -0.31011962890625, -0.254852294921875, -0.1995849609375, -0.144317626953125, -0.08905029296875, -0.033782958984375, 0.021484375, 0.076751708984375, 0.13201904296875, 0.187286376953125, 0.2425537109375, 0.297821044921875, 0.35308837890625, 0.408355712890625, 0.463623046875, 0.518890380859375, 0.57415771484375, 0.629425048828125, 0.6846923828125, 0.739959716796875, 0.79522705078125, 0.850494384765625, 0.90576171875, 0.961029052734375, 1.01629638671875, 1.071563720703125, 1.1268310546875, 1.182098388671875, 1.23736572265625, 1.292633056640625, 1.347900390625, 1.403167724609375, 1.45843505859375, 1.513702392578125, 1.5689697265625, 1.624237060546875, 1.67950439453125, 1.734771728515625, 1.7900390625]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 4.0, 10.0, 6.0, 11.0, 9.0, 11.0, 20.0, 22.0, 24.0, 26.0, 23.0, 29.0, 30.0, 39.0, 40.0, 40.0, 43.0, 35.0, 53.0, 35.0, 46.0, 45.0, 56.0, 40.0, 41.0, 36.0, 31.0, 40.0, 29.0, 25.0, 24.0, 28.0, 10.0, 8.0, 7.0, 5.0, 5.0, 5.0, 6.0, 7.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.3046875, -2.2344970703125, -2.164306640625, -2.0941162109375, -2.02392578125, -1.9537353515625, -1.883544921875, -1.8133544921875, -1.7431640625, -1.6729736328125, -1.602783203125, -1.5325927734375, -1.46240234375, -1.3922119140625, -1.322021484375, -1.2518310546875, -1.181640625, -1.1114501953125, -1.041259765625, -0.9710693359375, -0.90087890625, -0.8306884765625, -0.760498046875, -0.6903076171875, -0.6201171875, -0.5499267578125, -0.479736328125, -0.4095458984375, -0.33935546875, -0.2691650390625, -0.198974609375, -0.1287841796875, -0.05859375, 0.0115966796875, 0.081787109375, 0.1519775390625, 0.22216796875, 0.2923583984375, 0.362548828125, 0.4327392578125, 0.5029296875, 0.5731201171875, 0.643310546875, 0.7135009765625, 0.78369140625, 0.8538818359375, 0.924072265625, 0.9942626953125, 1.064453125, 1.1346435546875, 1.204833984375, 1.2750244140625, 1.34521484375, 1.4154052734375, 1.485595703125, 1.5557861328125, 1.6259765625, 1.6961669921875, 1.766357421875, 1.8365478515625, 1.90673828125, 1.9769287109375, 2.047119140625, 2.1173095703125, 2.1875]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 12.0, 6.0, 19.0, 49.0, 58.0, 82.0, 149.0, 266.0, 398.0, 729.0, 1198.0, 2057.0, 3665.0, 6431.0, 10973.0, 19278.0, 33559.0, 57987.0, 100224.0, 167184.0, 268680.0, 403880.0, 545410.0, 630562.0, 600570.0, 479166.0, 334418.0, 214773.0, 130629.0, 76582.0, 44838.0, 25559.0, 14852.0, 8435.0, 4856.0, 2850.0, 1599.0, 926.0, 555.0, 320.0, 210.0, 112.0, 74.0, 44.0, 31.0, 13.0, 15.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.03515625, -1.9710693359375, -1.906982421875, -1.8428955078125, -1.77880859375, -1.7147216796875, -1.650634765625, -1.5865478515625, -1.5224609375, -1.4583740234375, -1.394287109375, -1.3302001953125, -1.26611328125, -1.2020263671875, -1.137939453125, -1.0738525390625, -1.009765625, -0.9456787109375, -0.881591796875, -0.8175048828125, -0.75341796875, -0.6893310546875, -0.625244140625, -0.5611572265625, -0.4970703125, -0.4329833984375, -0.368896484375, -0.3048095703125, -0.24072265625, -0.1766357421875, -0.112548828125, -0.0484619140625, 0.015625, 0.0797119140625, 0.143798828125, 0.2078857421875, 0.27197265625, 0.3360595703125, 0.400146484375, 0.4642333984375, 0.5283203125, 0.5924072265625, 0.656494140625, 0.7205810546875, 0.78466796875, 0.8487548828125, 0.912841796875, 0.9769287109375, 1.041015625, 1.1051025390625, 1.169189453125, 1.2332763671875, 1.29736328125, 1.3614501953125, 1.425537109375, 1.4896240234375, 1.5537109375, 1.6177978515625, 1.681884765625, 1.7459716796875, 1.81005859375, 1.8741455078125, 1.938232421875, 2.0023193359375, 2.06640625]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 1.0, 4.0, 1.0, 4.0, 8.0, 14.0, 14.0, 10.0, 17.0, 21.0, 35.0, 40.0, 41.0, 78.0, 62.0, 87.0, 76.0, 99.0, 144.0, 133.0, 142.0, 185.0, 187.0, 208.0, 213.0, 240.0, 223.0, 227.0, 205.0, 191.0, 197.0, 147.0, 125.0, 124.0, 109.0, 98.0, 71.0, 70.0, 51.0, 33.0, 25.0, 26.0, 22.0, 17.0, 15.0, 11.0, 5.0, 10.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.76806640625, -0.74224853515625, -0.7164306640625, -0.69061279296875, -0.664794921875, -0.63897705078125, -0.6131591796875, -0.58734130859375, -0.5615234375, -0.53570556640625, -0.5098876953125, -0.48406982421875, -0.458251953125, -0.43243408203125, -0.4066162109375, -0.38079833984375, -0.35498046875, -0.32916259765625, -0.3033447265625, -0.27752685546875, -0.251708984375, -0.22589111328125, -0.2000732421875, -0.17425537109375, -0.1484375, -0.12261962890625, -0.0968017578125, -0.07098388671875, -0.045166015625, -0.01934814453125, 0.0064697265625, 0.03228759765625, 0.05810546875, 0.08392333984375, 0.1097412109375, 0.13555908203125, 0.161376953125, 0.18719482421875, 0.2130126953125, 0.23883056640625, 0.2646484375, 0.29046630859375, 0.3162841796875, 0.34210205078125, 0.367919921875, 0.39373779296875, 0.4195556640625, 0.44537353515625, 0.47119140625, 0.49700927734375, 0.5228271484375, 0.54864501953125, 0.574462890625, 0.60028076171875, 0.6260986328125, 0.65191650390625, 0.677734375, 0.70355224609375, 0.7293701171875, 0.75518798828125, 0.781005859375, 0.80682373046875, 0.8326416015625, 0.85845947265625, 0.88427734375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 10.0, 9.0, 5.0, 11.0, 14.0, 21.0, 17.0, 28.0, 26.0, 24.0, 29.0, 26.0, 37.0, 44.0, 47.0, 31.0, 50.0, 47.0, 54.0, 42.0, 43.0, 47.0, 37.0, 38.0, 25.0, 30.0, 36.0, 26.0, 23.0, 18.0, 18.0, 18.0, 11.0, 11.0, 13.0, 3.0, 4.0, 6.0, 4.0, 5.0, 6.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0932209491729736, -2.026160955429077, -1.9591008424758911, -1.8920408487319946, -1.8249807357788086, -1.757920742034912, -1.6908607482910156, -1.6238006353378296, -1.5567405223846436, -1.489680528640747, -1.422620415687561, -1.3555604219436646, -1.2885003089904785, -1.221440315246582, -1.1543803215026855, -1.0873202085494995, -1.020260214805603, -0.9532001614570618, -0.8861401081085205, -0.819080114364624, -0.752020001411438, -0.6849600076675415, -0.6178999543190002, -0.550839900970459, -0.4837798476219177, -0.41671979427337646, -0.3496597409248352, -0.28259971737861633, -0.21553966403007507, -0.1484796106815338, -0.08141958713531494, -0.014359533786773682, 0.05270051956176758, 0.11976056545972824, 0.1868206113576889, 0.25388064980506897, 0.32094070315361023, 0.3880007565021515, 0.45506078004837036, 0.5221208333969116, 0.5891808867454529, 0.6562409400939941, 0.7233009934425354, 0.7903610467910767, 0.8574210405349731, 0.9244811534881592, 0.9915411472320557, 1.0586011409759521, 1.1256612539291382, 1.1927212476730347, 1.2597813606262207, 1.3268413543701172, 1.3939014673233032, 1.4609614610671997, 1.5280215740203857, 1.5950815677642822, 1.6621415615081787, 1.7292015552520752, 1.7962616682052612, 1.8633216619491577, 1.9303817749023438, 1.9974417686462402, 2.0645017623901367, 2.131561756134033, 2.198621988296509]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 1.0, 2.0, 5.0, 4.0, 11.0, 6.0, 10.0, 14.0, 20.0, 19.0, 22.0, 17.0, 26.0, 35.0, 43.0, 41.0, 48.0, 29.0, 53.0, 58.0, 43.0, 56.0, 54.0, 53.0, 47.0, 38.0, 32.0, 37.0, 39.0, 26.0, 16.0, 19.0, 16.0, 20.0, 13.0, 13.0, 3.0, 3.0, 5.0, 6.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7041358947753906, -2.6193795204162598, -2.534623146057129, -2.449867010116577, -2.3651106357574463, -2.2803542613983154, -2.1955981254577637, -2.110841751098633, -2.026085376739502, -1.941329002380371, -1.8565727472305298, -1.7718164920806885, -1.6870601177215576, -1.6023037433624268, -1.5175474882125854, -1.4327912330627441, -1.3480348587036133, -1.2632784843444824, -1.1785222291946411, -1.0937659740447998, -1.009009599685669, -0.9242532849311829, -0.8394969701766968, -0.7547406554222107, -0.6699843406677246, -0.5852280259132385, -0.5004717111587524, -0.41571539640426636, -0.3309590816497803, -0.2462027668952942, -0.1614464521408081, -0.07669013738632202, 0.008065938949584961, 0.09282225370407104, 0.17757856845855713, 0.2623348832130432, 0.3470911979675293, 0.4318475127220154, 0.5166038274765015, 0.6013601422309875, 0.6861164569854736, 0.7708727717399597, 0.8556290864944458, 0.9403854012489319, 1.025141716003418, 1.1098980903625488, 1.1946543455123901, 1.2794106006622314, 1.3641669750213623, 1.4489233493804932, 1.5336796045303345, 1.6184358596801758, 1.7031922340393066, 1.7879486083984375, 1.8727048635482788, 1.9574611186981201, 2.042217493057251, 2.126973867416382, 2.2117300033569336, 2.2964863777160645, 2.3812427520751953, 2.465999126434326, 2.550755500793457, 2.635511636734009, 2.7202680110931396]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 7.0, 10.0, 15.0, 10.0, 17.0, 30.0, 48.0, 55.0, 81.0, 112.0, 184.0, 269.0, 434.0, 613.0, 1051.0, 1673.0, 2654.0, 4266.0, 6774.0, 10970.0, 17395.0, 27545.0, 42298.0, 62406.0, 87304.0, 113266.0, 131290.0, 133284.0, 117435.0, 92189.0, 66904.0, 45718.0, 30216.0, 19263.0, 12262.0, 7499.0, 4829.0, 3049.0, 1753.0, 1187.0, 716.0, 501.0, 345.0, 216.0, 146.0, 98.0, 69.0, 43.0, 18.0, 19.0, 9.0, 7.0, 13.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.484619140625, -0.4695243835449219, -0.45442962646484375, -0.4393348693847656, -0.4242401123046875, -0.4091453552246094, -0.39405059814453125, -0.3789558410644531, -0.363861083984375, -0.3487663269042969, -0.33367156982421875, -0.3185768127441406, -0.3034820556640625, -0.2883872985839844, -0.27329254150390625, -0.2581977844238281, -0.24310302734375, -0.22800827026367188, -0.21291351318359375, -0.19781875610351562, -0.1827239990234375, -0.16762924194335938, -0.15253448486328125, -0.13743972778320312, -0.122344970703125, -0.10725021362304688, -0.09215545654296875, -0.07706069946289062, -0.0619659423828125, -0.046871185302734375, -0.03177642822265625, -0.016681671142578125, -0.0015869140625, 0.013507843017578125, 0.02860260009765625, 0.043697357177734375, 0.0587921142578125, 0.07388687133789062, 0.08898162841796875, 0.10407638549804688, 0.119171142578125, 0.13426589965820312, 0.14936065673828125, 0.16445541381835938, 0.1795501708984375, 0.19464492797851562, 0.20973968505859375, 0.22483444213867188, 0.23992919921875, 0.2550239562988281, 0.27011871337890625, 0.2852134704589844, 0.3003082275390625, 0.3154029846191406, 0.33049774169921875, 0.3455924987792969, 0.360687255859375, 0.3757820129394531, 0.39087677001953125, 0.4059715270996094, 0.4210662841796875, 0.4361610412597656, 0.45125579833984375, 0.4663505554199219, 0.4814453125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 7.0, 3.0, 10.0, 7.0, 19.0, 18.0, 29.0, 17.0, 35.0, 30.0, 44.0, 41.0, 46.0, 65.0, 60.0, 57.0, 52.0, 55.0, 66.0, 58.0, 38.0, 45.0, 49.0, 27.0, 21.0, 18.0, 26.0, 15.0, 12.0, 12.0, 12.0, 4.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.955078125, -2.85455322265625, -2.7540283203125, -2.65350341796875, -2.552978515625, -2.45245361328125, -2.3519287109375, -2.25140380859375, -2.15087890625, -2.05035400390625, -1.9498291015625, -1.84930419921875, -1.748779296875, -1.64825439453125, -1.5477294921875, -1.44720458984375, -1.3466796875, -1.24615478515625, -1.1456298828125, -1.04510498046875, -0.944580078125, -0.84405517578125, -0.7435302734375, -0.64300537109375, -0.54248046875, -0.44195556640625, -0.3414306640625, -0.24090576171875, -0.140380859375, -0.03985595703125, 0.0606689453125, 0.16119384765625, 0.26171875, 0.36224365234375, 0.4627685546875, 0.56329345703125, 0.663818359375, 0.76434326171875, 0.8648681640625, 0.96539306640625, 1.06591796875, 1.16644287109375, 1.2669677734375, 1.36749267578125, 1.468017578125, 1.56854248046875, 1.6690673828125, 1.76959228515625, 1.8701171875, 1.97064208984375, 2.0711669921875, 2.17169189453125, 2.272216796875, 2.37274169921875, 2.4732666015625, 2.57379150390625, 2.67431640625, 2.77484130859375, 2.8753662109375, 2.97589111328125, 3.076416015625, 3.17694091796875, 3.2774658203125, 3.37799072265625, 3.478515625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 4.0, 5.0, 13.0, 16.0, 24.0, 29.0, 32.0, 50.0, 69.0, 114.0, 139.0, 235.0, 401.0, 703.0, 1689.0, 3396.0, 8007.0, 18819.0, 49053.0, 852727.0, 72701.0, 22661.0, 9442.0, 4140.0, 1916.0, 901.0, 448.0, 245.0, 178.0, 109.0, 77.0, 60.0, 29.0, 28.0, 29.0, 18.0, 8.0, 14.0, 7.0, 5.0, 3.0, 5.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-2.615234375, -2.541778564453125, -2.46832275390625, -2.394866943359375, -2.3214111328125, -2.247955322265625, -2.17449951171875, -2.101043701171875, -2.027587890625, -1.954132080078125, -1.88067626953125, -1.807220458984375, -1.7337646484375, -1.660308837890625, -1.58685302734375, -1.513397216796875, -1.43994140625, -1.366485595703125, -1.29302978515625, -1.219573974609375, -1.1461181640625, -1.072662353515625, -0.99920654296875, -0.925750732421875, -0.852294921875, -0.778839111328125, -0.70538330078125, -0.631927490234375, -0.5584716796875, -0.485015869140625, -0.41156005859375, -0.338104248046875, -0.2646484375, -0.191192626953125, -0.11773681640625, -0.044281005859375, 0.0291748046875, 0.102630615234375, 0.17608642578125, 0.249542236328125, 0.322998046875, 0.396453857421875, 0.46990966796875, 0.543365478515625, 0.6168212890625, 0.690277099609375, 0.76373291015625, 0.837188720703125, 0.91064453125, 0.984100341796875, 1.05755615234375, 1.131011962890625, 1.2044677734375, 1.277923583984375, 1.35137939453125, 1.424835205078125, 1.498291015625, 1.571746826171875, 1.64520263671875, 1.718658447265625, 1.7921142578125, 1.865570068359375, 1.93902587890625, 2.012481689453125, 2.0859375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 6.0, 6.0, 8.0, 5.0, 10.0, 10.0, 13.0, 12.0, 17.0, 18.0, 26.0, 21.0, 22.0, 29.0, 25.0, 36.0, 38.0, 32.0, 38.0, 49.0, 31.0, 47.0, 40.0, 45.0, 36.0, 42.0, 45.0, 39.0, 33.0, 32.0, 26.0, 29.0, 11.0, 27.0, 22.0, 7.0, 17.0, 15.0, 7.0, 8.0, 7.0, 4.0, 5.0, 5.0, 6.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6796875, -1.6269378662109375, -1.574188232421875, -1.5214385986328125, -1.46868896484375, -1.4159393310546875, -1.363189697265625, -1.3104400634765625, -1.2576904296875, -1.2049407958984375, -1.152191162109375, -1.0994415283203125, -1.04669189453125, -0.9939422607421875, -0.941192626953125, -0.8884429931640625, -0.835693359375, -0.7829437255859375, -0.730194091796875, -0.6774444580078125, -0.62469482421875, -0.5719451904296875, -0.519195556640625, -0.4664459228515625, -0.4136962890625, -0.3609466552734375, -0.308197021484375, -0.2554473876953125, -0.20269775390625, -0.1499481201171875, -0.097198486328125, -0.0444488525390625, 0.00830078125, 0.0610504150390625, 0.113800048828125, 0.1665496826171875, 0.21929931640625, 0.2720489501953125, 0.324798583984375, 0.3775482177734375, 0.4302978515625, 0.4830474853515625, 0.535797119140625, 0.5885467529296875, 0.64129638671875, 0.6940460205078125, 0.746795654296875, 0.7995452880859375, 0.852294921875, 0.9050445556640625, 0.957794189453125, 1.0105438232421875, 1.06329345703125, 1.1160430908203125, 1.168792724609375, 1.2215423583984375, 1.2742919921875, 1.3270416259765625, 1.379791259765625, 1.4325408935546875, 1.48529052734375, 1.5380401611328125, 1.590789794921875, 1.6435394287109375, 1.6962890625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 5.0, 2.0, 1.0, 2.0, 5.0, 6.0, 11.0, 8.0, 17.0, 12.0, 14.0, 37.0, 45.0, 66.0, 97.0, 177.0, 298.0, 497.0, 1142.0, 2604.0, 6677.0, 18473.0, 65826.0, 879947.0, 47725.0, 14899.0, 5495.0, 2251.0, 1021.0, 484.0, 255.0, 166.0, 82.0, 63.0, 38.0, 27.0, 12.0, 12.0, 9.0, 7.0, 8.0, 6.0, 5.0, 7.0, 3.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0], "bins": [-0.2705078125, -0.2621612548828125, -0.253814697265625, -0.2454681396484375, -0.23712158203125, -0.2287750244140625, -0.220428466796875, -0.2120819091796875, -0.2037353515625, -0.1953887939453125, -0.187042236328125, -0.1786956787109375, -0.17034912109375, -0.1620025634765625, -0.153656005859375, -0.1453094482421875, -0.136962890625, -0.1286163330078125, -0.120269775390625, -0.1119232177734375, -0.10357666015625, -0.0952301025390625, -0.086883544921875, -0.0785369873046875, -0.0701904296875, -0.0618438720703125, -0.053497314453125, -0.0451507568359375, -0.03680419921875, -0.0284576416015625, -0.020111083984375, -0.0117645263671875, -0.00341796875, 0.0049285888671875, 0.013275146484375, 0.0216217041015625, 0.02996826171875, 0.0383148193359375, 0.046661376953125, 0.0550079345703125, 0.0633544921875, 0.0717010498046875, 0.080047607421875, 0.0883941650390625, 0.09674072265625, 0.1050872802734375, 0.113433837890625, 0.1217803955078125, 0.130126953125, 0.1384735107421875, 0.146820068359375, 0.1551666259765625, 0.16351318359375, 0.1718597412109375, 0.180206298828125, 0.1885528564453125, 0.1968994140625, 0.2052459716796875, 0.213592529296875, 0.2219390869140625, 0.23028564453125, 0.2386322021484375, 0.246978759765625, 0.2553253173828125, 0.263671875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 3.0, 2.0, 4.0, 1.0, 4.0, 6.0, 6.0, 18.0, 7.0, 17.0, 15.0, 19.0, 22.0, 28.0, 31.0, 45.0, 35.0, 45.0, 50.0, 45.0, 46.0, 47.0, 60.0, 56.0, 40.0, 44.0, 51.0, 39.0, 24.0, 34.0, 31.0, 31.0, 17.0, 12.0, 10.0, 9.0, 14.0, 9.0, 8.0, 4.0, 2.0, 5.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5497207641601562e-05, -1.5028752386569977e-05, -1.4560297131538391e-05, -1.4091841876506805e-05, -1.362338662147522e-05, -1.3154931366443634e-05, -1.2686476111412048e-05, -1.2218020856380463e-05, -1.1749565601348877e-05, -1.1281110346317291e-05, -1.0812655091285706e-05, -1.034419983625412e-05, -9.875744581222534e-06, -9.407289326190948e-06, -8.938834071159363e-06, -8.470378816127777e-06, -8.001923561096191e-06, -7.533468306064606e-06, -7.06501305103302e-06, -6.596557796001434e-06, -6.128102540969849e-06, -5.659647285938263e-06, -5.191192030906677e-06, -4.7227367758750916e-06, -4.254281520843506e-06, -3.78582626581192e-06, -3.3173710107803345e-06, -2.8489157557487488e-06, -2.380460500717163e-06, -1.9120052456855774e-06, -1.4435499906539917e-06, -9.75094735622406e-07, -5.066394805908203e-07, -3.818422555923462e-08, 4.302710294723511e-07, 8.987262845039368e-07, 1.3671815395355225e-06, 1.8356367945671082e-06, 2.304092049598694e-06, 2.7725473046302795e-06, 3.2410025596618652e-06, 3.709457814693451e-06, 4.177913069725037e-06, 4.646368324756622e-06, 5.114823579788208e-06, 5.583278834819794e-06, 6.051734089851379e-06, 6.520189344882965e-06, 6.988644599914551e-06, 7.4570998549461365e-06, 7.925555109977722e-06, 8.394010365009308e-06, 8.862465620040894e-06, 9.33092087507248e-06, 9.799376130104065e-06, 1.026783138513565e-05, 1.0736286640167236e-05, 1.1204741895198822e-05, 1.1673197150230408e-05, 1.2141652405261993e-05, 1.2610107660293579e-05, 1.3078562915325165e-05, 1.354701817035675e-05, 1.4015473425388336e-05, 1.4483928680419922e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 7.0, 3.0, 12.0, 15.0, 22.0, 26.0, 37.0, 67.0, 96.0, 148.0, 219.0, 290.0, 546.0, 815.0, 1340.0, 2106.0, 3672.0, 6126.0, 10167.0, 17792.0, 29826.0, 49942.0, 80457.0, 119996.0, 155090.0, 163226.0, 140951.0, 101375.0, 65864.0, 40036.0, 23670.0, 14033.0, 8160.0, 4781.0, 2885.0, 1718.0, 1082.0, 687.0, 421.0, 289.0, 172.0, 124.0, 96.0, 59.0, 45.0, 24.0, 18.0, 16.0, 8.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1273193359375, -0.12337493896484375, -0.1194305419921875, -0.11548614501953125, -0.111541748046875, -0.10759735107421875, -0.1036529541015625, -0.09970855712890625, -0.09576416015625, -0.09181976318359375, -0.0878753662109375, -0.08393096923828125, -0.079986572265625, -0.07604217529296875, -0.0720977783203125, -0.06815338134765625, -0.064208984375, -0.06026458740234375, -0.0563201904296875, -0.05237579345703125, -0.048431396484375, -0.04448699951171875, -0.0405426025390625, -0.03659820556640625, -0.03265380859375, -0.02870941162109375, -0.0247650146484375, -0.02082061767578125, -0.016876220703125, -0.01293182373046875, -0.0089874267578125, -0.00504302978515625, -0.0010986328125, 0.00284576416015625, 0.0067901611328125, 0.01073455810546875, 0.014678955078125, 0.01862335205078125, 0.0225677490234375, 0.02651214599609375, 0.03045654296875, 0.03440093994140625, 0.0383453369140625, 0.04228973388671875, 0.046234130859375, 0.05017852783203125, 0.0541229248046875, 0.05806732177734375, 0.06201171875, 0.06595611572265625, 0.0699005126953125, 0.07384490966796875, 0.077789306640625, 0.08173370361328125, 0.0856781005859375, 0.08962249755859375, 0.09356689453125, 0.09751129150390625, 0.1014556884765625, 0.10540008544921875, 0.109344482421875, 0.11328887939453125, 0.1172332763671875, 0.12117767333984375, 0.1251220703125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 9.0, 7.0, 6.0, 7.0, 11.0, 6.0, 17.0, 23.0, 22.0, 34.0, 35.0, 45.0, 53.0, 61.0, 60.0, 61.0, 54.0, 75.0, 53.0, 56.0, 51.0, 44.0, 47.0, 26.0, 40.0, 15.0, 15.0, 14.0, 12.0, 13.0, 11.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.055084228515625, -0.05327606201171875, -0.0514678955078125, -0.04965972900390625, -0.0478515625, -0.04604339599609375, -0.0442352294921875, -0.04242706298828125, -0.040618896484375, -0.03881072998046875, -0.0370025634765625, -0.03519439697265625, -0.03338623046875, -0.03157806396484375, -0.0297698974609375, -0.02796173095703125, -0.026153564453125, -0.02434539794921875, -0.0225372314453125, -0.02072906494140625, -0.0189208984375, -0.01711273193359375, -0.0153045654296875, -0.01349639892578125, -0.011688232421875, -0.00988006591796875, -0.0080718994140625, -0.00626373291015625, -0.00445556640625, -0.00264739990234375, -0.0008392333984375, 0.00096893310546875, 0.002777099609375, 0.00458526611328125, 0.0063934326171875, 0.00820159912109375, 0.010009765625, 0.01181793212890625, 0.0136260986328125, 0.01543426513671875, 0.017242431640625, 0.01905059814453125, 0.0208587646484375, 0.02266693115234375, 0.02447509765625, 0.02628326416015625, 0.0280914306640625, 0.02989959716796875, 0.031707763671875, 0.03351593017578125, 0.0353240966796875, 0.03713226318359375, 0.0389404296875, 0.04074859619140625, 0.0425567626953125, 0.04436492919921875, 0.046173095703125, 0.04798126220703125, 0.0497894287109375, 0.05159759521484375, 0.05340576171875, 0.05521392822265625, 0.0570220947265625, 0.05883026123046875, 0.060638427734375]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 4.0, 1.0, 5.0, 5.0, 8.0, 7.0, 8.0, 14.0, 14.0, 12.0, 24.0, 25.0, 25.0, 23.0, 26.0, 27.0, 28.0, 37.0, 44.0, 37.0, 51.0, 42.0, 39.0, 43.0, 45.0, 43.0, 42.0, 40.0, 29.0, 26.0, 27.0, 29.0, 22.0, 24.0, 27.0, 7.0, 22.0, 14.0, 14.0, 10.0, 11.0, 1.0, 4.0, 6.0, 3.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9304888248443604, -1.8680355548858643, -1.8055821657180786, -1.7431288957595825, -1.6806755065917969, -1.6182222366333008, -1.5557689666748047, -1.493315577507019, -1.4308621883392334, -1.3684089183807373, -1.3059555292129517, -1.2435022592544556, -1.18104887008667, -1.1185956001281738, -1.0561423301696777, -0.9936889410018921, -0.931235671043396, -0.8687823414802551, -0.8063290119171143, -0.7438757419586182, -0.6814223527908325, -0.6189690828323364, -0.5565157532691956, -0.4940624237060547, -0.4316090941429138, -0.36915576457977295, -0.3067024350166321, -0.2442491352558136, -0.18179580569267273, -0.11934247612953186, -0.05688917636871338, 0.00556415319442749, 0.06801748275756836, 0.13047081232070923, 0.1929241269826889, 0.2553774416446686, 0.31783077120780945, 0.3802841007709503, 0.4427374005317688, 0.5051907300949097, 0.5676440596580505, 0.6300973892211914, 0.6925507187843323, 0.7550040483474731, 0.8174573183059692, 0.8799107074737549, 0.942363977432251, 1.004817247390747, 1.0672706365585327, 1.1297239065170288, 1.1921772956848145, 1.2546305656433105, 1.3170839548110962, 1.3795372247695923, 1.441990613937378, 1.504443883895874, 1.5668971538543701, 1.6293504238128662, 1.6918038129806519, 1.754257082939148, 1.8167104721069336, 1.8791637420654297, 1.9416170120239258, 2.004070281982422, 2.066523790359497]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 4.0, 6.0, 7.0, 9.0, 7.0, 15.0, 20.0, 18.0, 18.0, 21.0, 27.0, 30.0, 36.0, 43.0, 52.0, 34.0, 44.0, 57.0, 49.0, 56.0, 48.0, 52.0, 52.0, 41.0, 26.0, 38.0, 36.0, 31.0, 21.0, 22.0, 13.0, 14.0, 19.0, 17.0, 4.0, 3.0, 4.0, 4.0, 6.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7020034790039062, -2.6178953647613525, -2.533787250518799, -2.449679374694824, -2.3655712604522705, -2.281463146209717, -2.197355031967163, -2.1132469177246094, -2.0291390419006348, -1.945030927658081, -1.860922932624817, -1.7768148183822632, -1.692706823348999, -1.6085987091064453, -1.5244905948638916, -1.4403825998306274, -1.3562744855880737, -1.27216637134552, -1.1880583763122559, -1.1039502620697021, -1.019842267036438, -0.9357341527938843, -0.8516260981559753, -0.7675180435180664, -0.6834099888801575, -0.5993019342422485, -0.5151938796043396, -0.4310857951641083, -0.34697774052619934, -0.2628696858882904, -0.17876160144805908, -0.09465354681015015, -0.010545492172241211, 0.07356256991624832, 0.15767063200473785, 0.24177870154380798, 0.3258867561817169, 0.40999481081962585, 0.4941028952598572, 0.5782109498977661, 0.662319004535675, 0.746427059173584, 0.8305351138114929, 0.9146431684494019, 0.9987512826919556, 1.0828592777252197, 1.1669673919677734, 1.2510755062103271, 1.3351835012435913, 1.419291615486145, 1.5033996105194092, 1.587507724761963, 1.671615719795227, 1.7557238340377808, 1.839831829071045, 1.9239399433135986, 2.0080480575561523, 2.092156171798706, 2.1762642860412598, 2.2603721618652344, 2.344480276107788, 2.428588390350342, 2.5126965045928955, 2.596804618835449, 2.680912494659424]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 9.0, 4.0, 13.0, 16.0, 24.0, 44.0, 53.0, 105.0, 149.0, 191.0, 346.0, 557.0, 929.0, 1340.0, 2166.0, 3378.0, 5083.0, 7901.0, 11591.0, 16959.0, 24625.0, 34073.0, 46539.0, 60295.0, 74979.0, 87941.0, 96718.0, 99206.0, 96807.0, 87510.0, 74234.0, 60015.0, 45625.0, 34389.0, 24298.0, 16983.0, 11469.0, 7673.0, 5127.0, 3265.0, 2142.0, 1379.0, 895.0, 547.0, 345.0, 235.0, 159.0, 77.0, 47.0, 47.0, 23.0, 18.0, 14.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.0830078125, -1.0462799072265625, -1.009552001953125, -0.9728240966796875, -0.93609619140625, -0.8993682861328125, -0.862640380859375, -0.8259124755859375, -0.7891845703125, -0.7524566650390625, -0.715728759765625, -0.6790008544921875, -0.64227294921875, -0.6055450439453125, -0.568817138671875, -0.5320892333984375, -0.495361328125, -0.4586334228515625, -0.421905517578125, -0.3851776123046875, -0.34844970703125, -0.3117218017578125, -0.274993896484375, -0.2382659912109375, -0.2015380859375, -0.1648101806640625, -0.128082275390625, -0.0913543701171875, -0.05462646484375, -0.0178985595703125, 0.018829345703125, 0.0555572509765625, 0.09228515625, 0.1290130615234375, 0.165740966796875, 0.2024688720703125, 0.23919677734375, 0.2759246826171875, 0.312652587890625, 0.3493804931640625, 0.3861083984375, 0.4228363037109375, 0.459564208984375, 0.4962921142578125, 0.53302001953125, 0.5697479248046875, 0.606475830078125, 0.6432037353515625, 0.679931640625, 0.7166595458984375, 0.753387451171875, 0.7901153564453125, 0.82684326171875, 0.8635711669921875, 0.900299072265625, 0.9370269775390625, 0.9737548828125, 1.0104827880859375, 1.047210693359375, 1.0839385986328125, 1.12066650390625, 1.1573944091796875, 1.194122314453125, 1.2308502197265625, 1.267578125]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 3.0, 6.0, 7.0, 9.0, 15.0, 15.0, 16.0, 17.0, 20.0, 29.0, 36.0, 29.0, 41.0, 42.0, 54.0, 44.0, 53.0, 57.0, 56.0, 40.0, 52.0, 54.0, 50.0, 38.0, 30.0, 30.0, 29.0, 30.0, 14.0, 18.0, 18.0, 15.0, 7.0, 10.0, 7.0, 3.0, 3.0, 5.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.638671875, -2.551177978515625, -2.46368408203125, -2.376190185546875, -2.2886962890625, -2.201202392578125, -2.11370849609375, -2.026214599609375, -1.938720703125, -1.851226806640625, -1.76373291015625, -1.676239013671875, -1.5887451171875, -1.501251220703125, -1.41375732421875, -1.326263427734375, -1.23876953125, -1.151275634765625, -1.06378173828125, -0.976287841796875, -0.8887939453125, -0.801300048828125, -0.71380615234375, -0.626312255859375, -0.538818359375, -0.451324462890625, -0.36383056640625, -0.276336669921875, -0.1888427734375, -0.101348876953125, -0.01385498046875, 0.073638916015625, 0.1611328125, 0.248626708984375, 0.33612060546875, 0.423614501953125, 0.5111083984375, 0.598602294921875, 0.68609619140625, 0.773590087890625, 0.861083984375, 0.948577880859375, 1.03607177734375, 1.123565673828125, 1.2110595703125, 1.298553466796875, 1.38604736328125, 1.473541259765625, 1.56103515625, 1.648529052734375, 1.73602294921875, 1.823516845703125, 1.9110107421875, 1.998504638671875, 2.08599853515625, 2.173492431640625, 2.260986328125, 2.348480224609375, 2.43597412109375, 2.523468017578125, 2.6109619140625, 2.698455810546875, 2.78594970703125, 2.873443603515625, 2.9609375]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 4.0, 5.0, 11.0, 9.0, 14.0, 18.0, 16.0, 32.0, 51.0, 79.0, 123.0, 197.0, 307.0, 465.0, 738.0, 1131.0, 1677.0, 2675.0, 4109.0, 6515.0, 9811.0, 15032.0, 21584.0, 31697.0, 44645.0, 60601.0, 77062.0, 92506.0, 103854.0, 108051.0, 103061.0, 90826.0, 75622.0, 58707.0, 43522.0, 30993.0, 21448.0, 14472.0, 9244.0, 6173.0, 4067.0, 2667.0, 1611.0, 1089.0, 721.0, 437.0, 292.0, 205.0, 128.0, 100.0, 51.0, 38.0, 25.0, 18.0, 10.0, 10.0, 1.0, 5.0, 2.0, 2.0, 3.0], "bins": [-1.3828125, -1.3402099609375, -1.297607421875, -1.2550048828125, -1.21240234375, -1.1697998046875, -1.127197265625, -1.0845947265625, -1.0419921875, -0.9993896484375, -0.956787109375, -0.9141845703125, -0.87158203125, -0.8289794921875, -0.786376953125, -0.7437744140625, -0.701171875, -0.6585693359375, -0.615966796875, -0.5733642578125, -0.53076171875, -0.4881591796875, -0.445556640625, -0.4029541015625, -0.3603515625, -0.3177490234375, -0.275146484375, -0.2325439453125, -0.18994140625, -0.1473388671875, -0.104736328125, -0.0621337890625, -0.01953125, 0.0230712890625, 0.065673828125, 0.1082763671875, 0.15087890625, 0.1934814453125, 0.236083984375, 0.2786865234375, 0.3212890625, 0.3638916015625, 0.406494140625, 0.4490966796875, 0.49169921875, 0.5343017578125, 0.576904296875, 0.6195068359375, 0.662109375, 0.7047119140625, 0.747314453125, 0.7899169921875, 0.83251953125, 0.8751220703125, 0.917724609375, 0.9603271484375, 1.0029296875, 1.0455322265625, 1.088134765625, 1.1307373046875, 1.17333984375, 1.2159423828125, 1.258544921875, 1.3011474609375, 1.34375]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 5.0, 7.0, 9.0, 10.0, 7.0, 15.0, 12.0, 15.0, 23.0, 23.0, 39.0, 38.0, 29.0, 40.0, 34.0, 39.0, 45.0, 34.0, 43.0, 55.0, 40.0, 43.0, 37.0, 37.0, 47.0, 38.0, 31.0, 32.0, 29.0, 29.0, 19.0, 18.0, 19.0, 7.0, 15.0, 12.0, 10.0, 3.0, 3.0, 9.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8408203125, -1.7874603271484375, -1.734100341796875, -1.6807403564453125, -1.62738037109375, -1.5740203857421875, -1.520660400390625, -1.4673004150390625, -1.4139404296875, -1.3605804443359375, -1.307220458984375, -1.2538604736328125, -1.20050048828125, -1.1471405029296875, -1.093780517578125, -1.0404205322265625, -0.987060546875, -0.9337005615234375, -0.880340576171875, -0.8269805908203125, -0.77362060546875, -0.7202606201171875, -0.666900634765625, -0.6135406494140625, -0.5601806640625, -0.5068206787109375, -0.453460693359375, -0.4001007080078125, -0.34674072265625, -0.2933807373046875, -0.240020751953125, -0.1866607666015625, -0.13330078125, -0.0799407958984375, -0.026580810546875, 0.0267791748046875, 0.08013916015625, 0.1334991455078125, 0.186859130859375, 0.2402191162109375, 0.2935791015625, 0.3469390869140625, 0.400299072265625, 0.4536590576171875, 0.50701904296875, 0.5603790283203125, 0.613739013671875, 0.6670989990234375, 0.720458984375, 0.7738189697265625, 0.827178955078125, 0.8805389404296875, 0.93389892578125, 0.9872589111328125, 1.040618896484375, 1.0939788818359375, 1.1473388671875, 1.2006988525390625, 1.254058837890625, 1.3074188232421875, 1.36077880859375, 1.4141387939453125, 1.467498779296875, 1.5208587646484375, 1.57421875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 3.0, 6.0, 11.0, 10.0, 15.0, 11.0, 35.0, 35.0, 70.0, 106.0, 137.0, 207.0, 336.0, 537.0, 882.0, 1516.0, 2295.0, 4027.0, 6628.0, 11138.0, 17739.0, 28318.0, 43918.0, 64018.0, 86500.0, 108975.0, 124159.0, 126966.0, 116153.0, 94804.0, 71684.0, 50328.0, 33177.0, 20803.0, 13106.0, 7924.0, 4653.0, 2849.0, 1698.0, 1027.0, 613.0, 382.0, 261.0, 158.0, 117.0, 68.0, 53.0, 39.0, 17.0, 17.0, 16.0, 5.0, 6.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.572265625, -0.5532989501953125, -0.534332275390625, -0.5153656005859375, -0.49639892578125, -0.4774322509765625, -0.458465576171875, -0.4394989013671875, -0.4205322265625, -0.4015655517578125, -0.382598876953125, -0.3636322021484375, -0.34466552734375, -0.3256988525390625, -0.306732177734375, -0.2877655029296875, -0.268798828125, -0.2498321533203125, -0.230865478515625, -0.2118988037109375, -0.19293212890625, -0.1739654541015625, -0.154998779296875, -0.1360321044921875, -0.1170654296875, -0.0980987548828125, -0.079132080078125, -0.0601654052734375, -0.04119873046875, -0.0222320556640625, -0.003265380859375, 0.0157012939453125, 0.03466796875, 0.0536346435546875, 0.072601318359375, 0.0915679931640625, 0.11053466796875, 0.1295013427734375, 0.148468017578125, 0.1674346923828125, 0.1864013671875, 0.2053680419921875, 0.224334716796875, 0.2433013916015625, 0.26226806640625, 0.2812347412109375, 0.300201416015625, 0.3191680908203125, 0.338134765625, 0.3571014404296875, 0.376068115234375, 0.3950347900390625, 0.41400146484375, 0.4329681396484375, 0.451934814453125, 0.4709014892578125, 0.4898681640625, 0.5088348388671875, 0.527801513671875, 0.5467681884765625, 0.56573486328125, 0.5847015380859375, 0.603668212890625, 0.6226348876953125, 0.6416015625]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 7.0, 10.0, 16.0, 9.0, 18.0, 15.0, 24.0, 26.0, 40.0, 29.0, 31.0, 66.0, 45.0, 49.0, 56.0, 61.0, 62.0, 46.0, 66.0, 48.0, 43.0, 26.0, 40.0, 34.0, 36.0, 25.0, 17.0, 12.0, 11.0, 12.0, 4.0, 6.0, 6.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.499622344970703e-05, -8.261669427156448e-05, -8.023716509342194e-05, -7.785763591527939e-05, -7.547810673713684e-05, -7.309857755899429e-05, -7.071904838085175e-05, -6.83395192027092e-05, -6.595999002456665e-05, -6.35804608464241e-05, -6.120093166828156e-05, -5.882140249013901e-05, -5.644187331199646e-05, -5.406234413385391e-05, -5.1682814955711365e-05, -4.930328577756882e-05, -4.692375659942627e-05, -4.454422742128372e-05, -4.2164698243141174e-05, -3.978516906499863e-05, -3.740563988685608e-05, -3.502611070871353e-05, -3.2646581530570984e-05, -3.0267052352428436e-05, -2.788752317428589e-05, -2.550799399614334e-05, -2.3128464818000793e-05, -2.0748935639858246e-05, -1.8369406461715698e-05, -1.598987728357315e-05, -1.3610348105430603e-05, -1.1230818927288055e-05, -8.851289749145508e-06, -6.47176057100296e-06, -4.092231392860413e-06, -1.712702214717865e-06, 6.668269634246826e-07, 3.0463561415672302e-06, 5.425885319709778e-06, 7.805414497852325e-06, 1.0184943675994873e-05, 1.256447285413742e-05, 1.4944002032279968e-05, 1.7323531210422516e-05, 1.9703060388565063e-05, 2.208258956670761e-05, 2.446211874485016e-05, 2.6841647922992706e-05, 2.9221177101135254e-05, 3.16007062792778e-05, 3.398023545742035e-05, 3.63597646355629e-05, 3.8739293813705444e-05, 4.111882299184799e-05, 4.349835216999054e-05, 4.587788134813309e-05, 4.8257410526275635e-05, 5.063693970441818e-05, 5.301646888256073e-05, 5.539599806070328e-05, 5.7775527238845825e-05, 6.015505641698837e-05, 6.253458559513092e-05, 6.491411477327347e-05, 6.729364395141602e-05]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 4.0, 2.0, 3.0, 5.0, 12.0, 19.0, 29.0, 29.0, 65.0, 101.0, 173.0, 275.0, 440.0, 710.0, 1130.0, 1804.0, 3008.0, 4875.0, 7965.0, 12379.0, 19056.0, 29304.0, 42622.0, 59965.0, 78786.0, 98157.0, 111645.0, 115582.0, 110401.0, 96174.0, 77030.0, 57682.0, 41003.0, 28013.0, 18703.0, 11772.0, 7570.0, 4671.0, 2802.0, 1713.0, 1108.0, 679.0, 411.0, 253.0, 157.0, 98.0, 57.0, 39.0, 26.0, 28.0, 4.0, 6.0, 9.0, 4.0, 2.0, 2.0, 5.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.53662109375, -0.5189971923828125, -0.501373291015625, -0.4837493896484375, -0.46612548828125, -0.4485015869140625, -0.430877685546875, -0.4132537841796875, -0.3956298828125, -0.3780059814453125, -0.360382080078125, -0.3427581787109375, -0.32513427734375, -0.3075103759765625, -0.289886474609375, -0.2722625732421875, -0.254638671875, -0.2370147705078125, -0.219390869140625, -0.2017669677734375, -0.18414306640625, -0.1665191650390625, -0.148895263671875, -0.1312713623046875, -0.1136474609375, -0.0960235595703125, -0.078399658203125, -0.0607757568359375, -0.04315185546875, -0.0255279541015625, -0.007904052734375, 0.0097198486328125, 0.02734375, 0.0449676513671875, 0.062591552734375, 0.0802154541015625, 0.09783935546875, 0.1154632568359375, 0.133087158203125, 0.1507110595703125, 0.1683349609375, 0.1859588623046875, 0.203582763671875, 0.2212066650390625, 0.23883056640625, 0.2564544677734375, 0.274078369140625, 0.2917022705078125, 0.309326171875, 0.3269500732421875, 0.344573974609375, 0.3621978759765625, 0.37982177734375, 0.3974456787109375, 0.415069580078125, 0.4326934814453125, 0.4503173828125, 0.4679412841796875, 0.485565185546875, 0.5031890869140625, 0.52081298828125, 0.5384368896484375, 0.556060791015625, 0.5736846923828125, 0.59130859375]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 1.0, 3.0, 2.0, 6.0, 7.0, 8.0, 10.0, 8.0, 16.0, 21.0, 23.0, 23.0, 27.0, 26.0, 41.0, 51.0, 40.0, 33.0, 47.0, 41.0, 47.0, 54.0, 51.0, 41.0, 38.0, 38.0, 48.0, 50.0, 24.0, 36.0, 33.0, 23.0, 17.0, 17.0, 11.0, 12.0, 5.0, 8.0, 5.0, 4.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.282958984375, -0.2747211456298828, -0.2664833068847656, -0.25824546813964844, -0.25000762939453125, -0.24176979064941406, -0.23353195190429688, -0.2252941131591797, -0.2170562744140625, -0.2088184356689453, -0.20058059692382812, -0.19234275817871094, -0.18410491943359375, -0.17586708068847656, -0.16762924194335938, -0.1593914031982422, -0.151153564453125, -0.1429157257080078, -0.13467788696289062, -0.12644004821777344, -0.11820220947265625, -0.10996437072753906, -0.10172653198242188, -0.09348869323730469, -0.0852508544921875, -0.07701301574707031, -0.06877517700195312, -0.06053733825683594, -0.05229949951171875, -0.04406166076660156, -0.035823822021484375, -0.027585983276367188, -0.01934814453125, -0.011110305786132812, -0.002872467041015625, 0.0053653717041015625, 0.01360321044921875, 0.021841049194335938, 0.030078887939453125, 0.03831672668457031, 0.0465545654296875, 0.05479240417480469, 0.06303024291992188, 0.07126808166503906, 0.07950592041015625, 0.08774375915527344, 0.09598159790039062, 0.10421943664550781, 0.112457275390625, 0.12069511413574219, 0.12893295288085938, 0.13717079162597656, 0.14540863037109375, 0.15364646911621094, 0.16188430786132812, 0.1701221466064453, 0.1783599853515625, 0.1865978240966797, 0.19483566284179688, 0.20307350158691406, 0.21131134033203125, 0.21954917907714844, 0.22778701782226562, 0.2360248565673828, 0.2442626953125]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 4.0, 1.0, 4.0, 9.0, 10.0, 9.0, 11.0, 14.0, 20.0, 27.0, 21.0, 23.0, 27.0, 30.0, 22.0, 37.0, 35.0, 29.0, 47.0, 37.0, 38.0, 34.0, 32.0, 42.0, 49.0, 44.0, 28.0, 28.0, 26.0, 43.0, 18.0, 24.0, 23.0, 28.0, 29.0, 13.0, 15.0, 15.0, 12.0, 7.0, 4.0, 3.0, 9.0, 3.0, 4.0, 7.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0], "bins": [-2.021284341812134, -1.96177339553833, -1.9022623300552368, -1.842751383781433, -1.7832403182983398, -1.7237293720245361, -1.6642184257507324, -1.6047073602676392, -1.545196294784546, -1.4856853485107422, -1.426174283027649, -1.3666633367538452, -1.307152271270752, -1.2476413249969482, -1.1881303787231445, -1.1286193132400513, -1.0691083669662476, -1.0095974206924438, -0.9500863552093506, -0.8905754089355469, -0.8310643434524536, -0.7715533971786499, -0.7120423913002014, -0.6525313854217529, -0.5930203795433044, -0.533509373664856, -0.47399836778640747, -0.41448739171028137, -0.3549763858318329, -0.2954653799533844, -0.2359544038772583, -0.17644339799880981, -0.11693227291107178, -0.05742127448320389, 0.0020897239446640015, 0.061600714921951294, 0.12111172080039978, 0.18062272667884827, 0.24013370275497437, 0.29964470863342285, 0.35915571451187134, 0.4186667203903198, 0.4781777262687683, 0.5376887321472168, 0.5971996784210205, 0.6567107439041138, 0.7162216901779175, 0.775732696056366, 0.8352437019348145, 0.8947547078132629, 0.9542657136917114, 1.0137766599655151, 1.0732877254486084, 1.132798671722412, 1.1923096179962158, 1.251820683479309, 1.3113317489624023, 1.370842695236206, 1.4303537607192993, 1.489864706993103, 1.5493757724761963, 1.60888671875, 1.6683976650238037, 1.727908730506897, 1.7874196767807007]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 3.0, 6.0, 3.0, 4.0, 11.0, 14.0, 16.0, 21.0, 27.0, 21.0, 25.0, 31.0, 37.0, 42.0, 39.0, 40.0, 46.0, 45.0, 56.0, 39.0, 64.0, 36.0, 58.0, 49.0, 40.0, 42.0, 33.0, 29.0, 25.0, 15.0, 25.0, 8.0, 17.0, 8.0, 7.0, 9.0, 6.0, 2.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.84936785697937, -2.758127212524414, -2.666886329650879, -2.575645685195923, -2.484405040740967, -2.3931643962860107, -2.3019235134124756, -2.2106828689575195, -2.1194422245025635, -2.0282015800476074, -1.9369608163833618, -1.8457200527191162, -1.7544794082641602, -1.6632386445999146, -1.571997880935669, -1.480757236480713, -1.3895164728164673, -1.2982757091522217, -1.2070350646972656, -1.11579430103302, -1.024553656578064, -0.9333128929138184, -0.8420721888542175, -0.7508314847946167, -0.6595907807350159, -0.568350076675415, -0.4771093726158142, -0.385868638753891, -0.29462793469429016, -0.20338723063468933, -0.11214649677276611, -0.020905792713165283, 0.07033491134643555, 0.16157561540603638, 0.2528163194656372, 0.3440570533275604, 0.43529775738716125, 0.5265384912490845, 0.6177791953086853, 0.7090198993682861, 0.800260603427887, 0.8915013074874878, 0.9827420115470886, 1.0739827156066895, 1.165223479270935, 1.2564641237258911, 1.3477048873901367, 1.4389455318450928, 1.5301862955093384, 1.621427059173584, 1.71266770362854, 1.8039084672927856, 1.8951491117477417, 1.9863898754119873, 2.0776305198669434, 2.1688714027404785, 2.2601120471954346, 2.3513526916503906, 2.442593574523926, 2.533834218978882, 2.625074863433838, 2.716315507888794, 2.807556390762329, 2.898797035217285, 2.990037679672241]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 5.0, 7.0, 10.0, 21.0, 21.0, 35.0, 71.0, 118.0, 160.0, 269.0, 478.0, 683.0, 1072.0, 1793.0, 2726.0, 4496.0, 7238.0, 11453.0, 18547.0, 29771.0, 48497.0, 78818.0, 125040.0, 196693.0, 295286.0, 407473.0, 510218.0, 557130.0, 528329.0, 438226.0, 324283.0, 220768.0, 143726.0, 90169.0, 55919.0, 34841.0, 21946.0, 13856.0, 8632.0, 5559.0, 3562.0, 2301.0, 1475.0, 940.0, 558.0, 376.0, 257.0, 172.0, 114.0, 64.0, 36.0, 21.0, 14.0, 7.0, 7.0, 5.0, 4.0, 0.0, 1.0, 1.0], "bins": [-1.4970703125, -1.44976806640625, -1.4024658203125, -1.35516357421875, -1.307861328125, -1.26055908203125, -1.2132568359375, -1.16595458984375, -1.11865234375, -1.07135009765625, -1.0240478515625, -0.97674560546875, -0.929443359375, -0.88214111328125, -0.8348388671875, -0.78753662109375, -0.740234375, -0.69293212890625, -0.6456298828125, -0.59832763671875, -0.551025390625, -0.50372314453125, -0.4564208984375, -0.40911865234375, -0.36181640625, -0.31451416015625, -0.2672119140625, -0.21990966796875, -0.172607421875, -0.12530517578125, -0.0780029296875, -0.03070068359375, 0.0166015625, 0.06390380859375, 0.1112060546875, 0.15850830078125, 0.205810546875, 0.25311279296875, 0.3004150390625, 0.34771728515625, 0.39501953125, 0.44232177734375, 0.4896240234375, 0.53692626953125, 0.584228515625, 0.63153076171875, 0.6788330078125, 0.72613525390625, 0.7734375, 0.82073974609375, 0.8680419921875, 0.91534423828125, 0.962646484375, 1.00994873046875, 1.0572509765625, 1.10455322265625, 1.15185546875, 1.19915771484375, 1.2464599609375, 1.29376220703125, 1.341064453125, 1.38836669921875, 1.4356689453125, 1.48297119140625, 1.5302734375]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 7.0, 4.0, 5.0, 3.0, 9.0, 11.0, 10.0, 13.0, 18.0, 22.0, 27.0, 34.0, 25.0, 39.0, 38.0, 45.0, 50.0, 41.0, 44.0, 36.0, 45.0, 46.0, 47.0, 48.0, 50.0, 46.0, 37.0, 36.0, 30.0, 21.0, 23.0, 13.0, 19.0, 16.0, 14.0, 9.0, 6.0, 4.0, 8.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.3203125, -2.24603271484375, -2.1717529296875, -2.09747314453125, -2.023193359375, -1.94891357421875, -1.8746337890625, -1.80035400390625, -1.72607421875, -1.65179443359375, -1.5775146484375, -1.50323486328125, -1.428955078125, -1.35467529296875, -1.2803955078125, -1.20611572265625, -1.1318359375, -1.05755615234375, -0.9832763671875, -0.90899658203125, -0.834716796875, -0.76043701171875, -0.6861572265625, -0.61187744140625, -0.53759765625, -0.46331787109375, -0.3890380859375, -0.31475830078125, -0.240478515625, -0.16619873046875, -0.0919189453125, -0.01763916015625, 0.056640625, 0.13092041015625, 0.2052001953125, 0.27947998046875, 0.353759765625, 0.42803955078125, 0.5023193359375, 0.57659912109375, 0.65087890625, 0.72515869140625, 0.7994384765625, 0.87371826171875, 0.947998046875, 1.02227783203125, 1.0965576171875, 1.17083740234375, 1.2451171875, 1.31939697265625, 1.3936767578125, 1.46795654296875, 1.542236328125, 1.61651611328125, 1.6907958984375, 1.76507568359375, 1.83935546875, 1.91363525390625, 1.9879150390625, 2.06219482421875, 2.136474609375, 2.21075439453125, 2.2850341796875, 2.35931396484375, 2.43359375]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 4.0, 5.0, 8.0, 11.0, 24.0, 40.0, 66.0, 112.0, 158.0, 258.0, 425.0, 690.0, 1057.0, 1793.0, 2827.0, 4520.0, 7552.0, 12102.0, 19608.0, 31879.0, 51963.0, 82228.0, 130234.0, 199160.0, 292348.0, 399818.0, 497987.0, 546310.0, 520442.0, 434149.0, 325796.0, 227270.0, 149664.0, 95945.0, 60367.0, 37574.0, 23042.0, 14058.0, 8710.0, 5353.0, 3312.0, 2101.0, 1284.0, 781.0, 502.0, 282.0, 158.0, 108.0, 78.0, 48.0, 28.0, 18.0, 6.0, 16.0, 6.0, 4.0, 3.0, 4.0, 1.0, 2.0], "bins": [-1.783203125, -1.7268829345703125, -1.670562744140625, -1.6142425537109375, -1.55792236328125, -1.5016021728515625, -1.445281982421875, -1.3889617919921875, -1.3326416015625, -1.2763214111328125, -1.220001220703125, -1.1636810302734375, -1.10736083984375, -1.0510406494140625, -0.994720458984375, -0.9384002685546875, -0.882080078125, -0.8257598876953125, -0.769439697265625, -0.7131195068359375, -0.65679931640625, -0.6004791259765625, -0.544158935546875, -0.4878387451171875, -0.4315185546875, -0.3751983642578125, -0.318878173828125, -0.2625579833984375, -0.20623779296875, -0.1499176025390625, -0.093597412109375, -0.0372772216796875, 0.01904296875, 0.0753631591796875, 0.131683349609375, 0.1880035400390625, 0.24432373046875, 0.3006439208984375, 0.356964111328125, 0.4132843017578125, 0.4696044921875, 0.5259246826171875, 0.582244873046875, 0.6385650634765625, 0.69488525390625, 0.7512054443359375, 0.807525634765625, 0.8638458251953125, 0.920166015625, 0.9764862060546875, 1.032806396484375, 1.0891265869140625, 1.14544677734375, 1.2017669677734375, 1.258087158203125, 1.3144073486328125, 1.3707275390625, 1.4270477294921875, 1.483367919921875, 1.5396881103515625, 1.59600830078125, 1.6523284912109375, 1.708648681640625, 1.7649688720703125, 1.8212890625]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 6.0, 11.0, 12.0, 16.0, 14.0, 14.0, 38.0, 37.0, 36.0, 50.0, 63.0, 85.0, 100.0, 96.0, 130.0, 139.0, 136.0, 152.0, 191.0, 200.0, 223.0, 199.0, 190.0, 195.0, 203.0, 207.0, 177.0, 196.0, 132.0, 158.0, 115.0, 105.0, 84.0, 60.0, 70.0, 54.0, 26.0, 33.0, 32.0, 32.0, 13.0, 8.0, 12.0, 7.0, 10.0, 3.0, 0.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.79296875, -0.7668609619140625, -0.740753173828125, -0.7146453857421875, -0.68853759765625, -0.6624298095703125, -0.636322021484375, -0.6102142333984375, -0.5841064453125, -0.5579986572265625, -0.531890869140625, -0.5057830810546875, -0.47967529296875, -0.4535675048828125, -0.427459716796875, -0.4013519287109375, -0.375244140625, -0.3491363525390625, -0.323028564453125, -0.2969207763671875, -0.27081298828125, -0.2447052001953125, -0.218597412109375, -0.1924896240234375, -0.1663818359375, -0.1402740478515625, -0.114166259765625, -0.0880584716796875, -0.06195068359375, -0.0358428955078125, -0.009735107421875, 0.0163726806640625, 0.04248046875, 0.0685882568359375, 0.094696044921875, 0.1208038330078125, 0.14691162109375, 0.1730194091796875, 0.199127197265625, 0.2252349853515625, 0.2513427734375, 0.2774505615234375, 0.303558349609375, 0.3296661376953125, 0.35577392578125, 0.3818817138671875, 0.407989501953125, 0.4340972900390625, 0.460205078125, 0.4863128662109375, 0.512420654296875, 0.5385284423828125, 0.56463623046875, 0.5907440185546875, 0.616851806640625, 0.6429595947265625, 0.6690673828125, 0.6951751708984375, 0.721282958984375, 0.7473907470703125, 0.77349853515625, 0.7996063232421875, 0.825714111328125, 0.8518218994140625, 0.8779296875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 3.0, 5.0, 3.0, 7.0, 5.0, 10.0, 3.0, 14.0, 14.0, 16.0, 16.0, 28.0, 15.0, 30.0, 23.0, 31.0, 28.0, 35.0, 31.0, 37.0, 40.0, 47.0, 39.0, 42.0, 43.0, 41.0, 41.0, 36.0, 27.0, 39.0, 37.0, 28.0, 27.0, 17.0, 30.0, 20.0, 26.0, 10.0, 7.0, 8.0, 6.0, 10.0, 6.0, 5.0, 4.0, 6.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.142209053039551, -2.0780487060546875, -2.0138885974884033, -1.9497283697128296, -1.8855681419372559, -1.8214077949523926, -1.7572475671768188, -1.6930873394012451, -1.6289271116256714, -1.5647668838500977, -1.500606656074524, -1.4364464282989502, -1.372286081314087, -1.3081259727478027, -1.2439656257629395, -1.1798053979873657, -1.115645170211792, -1.0514849424362183, -0.9873247146606445, -0.923164427280426, -0.8590041995048523, -0.7948439717292786, -0.7306836843490601, -0.6665234565734863, -0.6023632287979126, -0.5382030010223389, -0.47404274344444275, -0.40988248586654663, -0.3457222580909729, -0.28156203031539917, -0.21740177273750305, -0.15324151515960693, -0.0890815258026123, -0.02492128312587738, 0.039238959550857544, 0.10339920222759247, 0.1675594449043274, 0.23171967267990112, 0.29587993025779724, 0.36004018783569336, 0.4242004156112671, 0.4883606433868408, 0.5525208711624146, 0.6166811585426331, 0.6808413863182068, 0.7450016140937805, 0.809161901473999, 0.8733221292495728, 0.9374823570251465, 1.0016425848007202, 1.065802812576294, 1.1299630403518677, 1.1941232681274414, 1.2582836151123047, 1.3224438428878784, 1.3866040706634521, 1.4507642984390259, 1.5149245262145996, 1.5790847539901733, 1.643244981765747, 1.7074053287506104, 1.7715654373168945, 1.8357257843017578, 1.8998860120773315, 1.9640462398529053]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 6.0, 4.0, 12.0, 9.0, 6.0, 10.0, 13.0, 9.0, 24.0, 18.0, 21.0, 33.0, 32.0, 25.0, 41.0, 43.0, 38.0, 48.0, 45.0, 47.0, 42.0, 49.0, 40.0, 43.0, 37.0, 35.0, 38.0, 21.0, 49.0, 33.0, 22.0, 22.0, 22.0, 10.0, 10.0, 11.0, 10.0, 10.0, 7.0, 4.0, 3.0, 5.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.4738821983337402, -2.393336772918701, -2.312791347503662, -2.232245922088623, -2.151700258255005, -2.071154832839966, -1.9906094074249268, -1.9100639820098877, -1.8295185565948486, -1.7489731311798096, -1.668427586555481, -1.587882161140442, -1.5073367357254028, -1.4267911911010742, -1.3462457656860352, -1.265700340270996, -1.1851547956466675, -1.1046093702316284, -1.0240638256072998, -0.9435184001922607, -0.8629729747772217, -0.7824274897575378, -0.701882004737854, -0.6213365793228149, -0.5407910943031311, -0.46024563908576965, -0.3797001838684082, -0.29915469884872437, -0.21860924363136292, -0.13806378841400146, -0.05751830339431763, 0.023027122020721436, 0.10357260704040527, 0.18411806225776672, 0.2646635174751282, 0.345209002494812, 0.42575445771217346, 0.5062999129295349, 0.5868453979492188, 0.6673908233642578, 0.7479363083839417, 0.8284817934036255, 0.9090272188186646, 0.9895727038383484, 1.0701181888580322, 1.1506636142730713, 1.2312090396881104, 1.3117544651031494, 1.392300009727478, 1.472845435142517, 1.5533909797668457, 1.6339364051818848, 1.7144818305969238, 1.795027256011963, 1.8755728006362915, 1.9561182260513306, 2.036663770675659, 2.1172091960906982, 2.1977546215057373, 2.2783002853393555, 2.3588457107543945, 2.4393911361694336, 2.5199365615844727, 2.6004819869995117, 2.681027412414551]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 4.0, 2.0, 6.0, 10.0, 12.0, 10.0, 17.0, 13.0, 19.0, 33.0, 47.0, 71.0, 96.0, 143.0, 223.0, 310.0, 483.0, 789.0, 1179.0, 1940.0, 3269.0, 5982.0, 10462.0, 19648.0, 36310.0, 66146.0, 112032.0, 166500.0, 194134.0, 167730.0, 112389.0, 66543.0, 36604.0, 19947.0, 10738.0, 5938.0, 3347.0, 1958.0, 1217.0, 797.0, 484.0, 283.0, 203.0, 157.0, 103.0, 80.0, 46.0, 37.0, 19.0, 20.0, 12.0, 9.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.5927734375, -0.5739593505859375, -0.555145263671875, -0.5363311767578125, -0.51751708984375, -0.4987030029296875, -0.479888916015625, -0.4610748291015625, -0.4422607421875, -0.4234466552734375, -0.404632568359375, -0.3858184814453125, -0.36700439453125, -0.3481903076171875, -0.329376220703125, -0.3105621337890625, -0.291748046875, -0.2729339599609375, -0.254119873046875, -0.2353057861328125, -0.21649169921875, -0.1976776123046875, -0.178863525390625, -0.1600494384765625, -0.1412353515625, -0.1224212646484375, -0.103607177734375, -0.0847930908203125, -0.06597900390625, -0.0471649169921875, -0.028350830078125, -0.0095367431640625, 0.00927734375, 0.0280914306640625, 0.046905517578125, 0.0657196044921875, 0.08453369140625, 0.1033477783203125, 0.122161865234375, 0.1409759521484375, 0.1597900390625, 0.1786041259765625, 0.197418212890625, 0.2162322998046875, 0.23504638671875, 0.2538604736328125, 0.272674560546875, 0.2914886474609375, 0.310302734375, 0.3291168212890625, 0.347930908203125, 0.3667449951171875, 0.38555908203125, 0.4043731689453125, 0.423187255859375, 0.4420013427734375, 0.4608154296875, 0.4796295166015625, 0.498443603515625, 0.5172576904296875, 0.53607177734375, 0.5548858642578125, 0.573699951171875, 0.5925140380859375, 0.611328125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 5.0, 6.0, 8.0, 4.0, 16.0, 15.0, 15.0, 22.0, 19.0, 23.0, 25.0, 27.0, 39.0, 36.0, 43.0, 49.0, 48.0, 39.0, 48.0, 58.0, 43.0, 47.0, 35.0, 35.0, 34.0, 31.0, 29.0, 29.0, 25.0, 37.0, 20.0, 14.0, 21.0, 13.0, 12.0, 6.0, 3.0, 5.0, 6.0, 5.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.462890625, -2.379119873046875, -2.29534912109375, -2.211578369140625, -2.1278076171875, -2.044036865234375, -1.96026611328125, -1.876495361328125, -1.792724609375, -1.708953857421875, -1.62518310546875, -1.541412353515625, -1.4576416015625, -1.373870849609375, -1.29010009765625, -1.206329345703125, -1.12255859375, -1.038787841796875, -0.95501708984375, -0.871246337890625, -0.7874755859375, -0.703704833984375, -0.61993408203125, -0.536163330078125, -0.452392578125, -0.368621826171875, -0.28485107421875, -0.201080322265625, -0.1173095703125, -0.033538818359375, 0.05023193359375, 0.134002685546875, 0.2177734375, 0.301544189453125, 0.38531494140625, 0.469085693359375, 0.5528564453125, 0.636627197265625, 0.72039794921875, 0.804168701171875, 0.887939453125, 0.971710205078125, 1.05548095703125, 1.139251708984375, 1.2230224609375, 1.306793212890625, 1.39056396484375, 1.474334716796875, 1.55810546875, 1.641876220703125, 1.72564697265625, 1.809417724609375, 1.8931884765625, 1.976959228515625, 2.06072998046875, 2.144500732421875, 2.228271484375, 2.312042236328125, 2.39581298828125, 2.479583740234375, 2.5633544921875, 2.647125244140625, 2.73089599609375, 2.814666748046875, 2.8984375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 5.0, 6.0, 4.0, 8.0, 11.0, 17.0, 13.0, 25.0, 22.0, 50.0, 60.0, 75.0, 84.0, 114.0, 231.0, 328.0, 591.0, 1189.0, 2681.0, 6905.0, 19844.0, 89562.0, 867047.0, 38949.0, 12245.0, 4358.0, 1924.0, 896.0, 451.0, 251.0, 178.0, 109.0, 77.0, 62.0, 39.0, 40.0, 22.0, 18.0, 21.0, 11.0, 10.0, 7.0, 7.0, 6.0, 3.0, 1.0, 1.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.568359375, -2.483551025390625, -2.39874267578125, -2.313934326171875, -2.2291259765625, -2.144317626953125, -2.05950927734375, -1.974700927734375, -1.889892578125, -1.805084228515625, -1.72027587890625, -1.635467529296875, -1.5506591796875, -1.465850830078125, -1.38104248046875, -1.296234130859375, -1.21142578125, -1.126617431640625, -1.04180908203125, -0.957000732421875, -0.8721923828125, -0.787384033203125, -0.70257568359375, -0.617767333984375, -0.532958984375, -0.448150634765625, -0.36334228515625, -0.278533935546875, -0.1937255859375, -0.108917236328125, -0.02410888671875, 0.060699462890625, 0.1455078125, 0.230316162109375, 0.31512451171875, 0.399932861328125, 0.4847412109375, 0.569549560546875, 0.65435791015625, 0.739166259765625, 0.823974609375, 0.908782958984375, 0.99359130859375, 1.078399658203125, 1.1632080078125, 1.248016357421875, 1.33282470703125, 1.417633056640625, 1.50244140625, 1.587249755859375, 1.67205810546875, 1.756866455078125, 1.8416748046875, 1.926483154296875, 2.01129150390625, 2.096099853515625, 2.180908203125, 2.265716552734375, 2.35052490234375, 2.435333251953125, 2.5201416015625, 2.604949951171875, 2.68975830078125, 2.774566650390625, 2.859375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 5.0, 3.0, 6.0, 5.0, 6.0, 10.0, 6.0, 14.0, 9.0, 13.0, 12.0, 15.0, 17.0, 24.0, 35.0, 30.0, 26.0, 37.0, 28.0, 44.0, 43.0, 46.0, 37.0, 34.0, 40.0, 39.0, 30.0, 41.0, 33.0, 30.0, 37.0, 29.0, 30.0, 27.0, 17.0, 27.0, 24.0, 14.0, 16.0, 18.0, 9.0, 13.0, 8.0, 5.0, 4.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5595703125, -1.5070648193359375, -1.454559326171875, -1.4020538330078125, -1.34954833984375, -1.2970428466796875, -1.244537353515625, -1.1920318603515625, -1.1395263671875, -1.0870208740234375, -1.034515380859375, -0.9820098876953125, -0.92950439453125, -0.8769989013671875, -0.824493408203125, -0.7719879150390625, -0.719482421875, -0.6669769287109375, -0.614471435546875, -0.5619659423828125, -0.50946044921875, -0.4569549560546875, -0.404449462890625, -0.3519439697265625, -0.2994384765625, -0.2469329833984375, -0.194427490234375, -0.1419219970703125, -0.08941650390625, -0.0369110107421875, 0.015594482421875, 0.0680999755859375, 0.12060546875, 0.1731109619140625, 0.225616455078125, 0.2781219482421875, 0.33062744140625, 0.3831329345703125, 0.435638427734375, 0.4881439208984375, 0.5406494140625, 0.5931549072265625, 0.645660400390625, 0.6981658935546875, 0.75067138671875, 0.8031768798828125, 0.855682373046875, 0.9081878662109375, 0.960693359375, 1.0131988525390625, 1.065704345703125, 1.1182098388671875, 1.17071533203125, 1.2232208251953125, 1.275726318359375, 1.3282318115234375, 1.3807373046875, 1.4332427978515625, 1.485748291015625, 1.5382537841796875, 1.59075927734375, 1.6432647705078125, 1.695770263671875, 1.7482757568359375, 1.80078125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 6.0, 6.0, 9.0, 10.0, 14.0, 15.0, 23.0, 37.0, 35.0, 49.0, 63.0, 106.0, 182.0, 263.0, 391.0, 690.0, 1204.0, 2223.0, 4103.0, 8293.0, 17330.0, 42086.0, 778535.0, 141696.0, 26270.0, 11948.0, 5921.0, 3043.0, 1587.0, 899.0, 523.0, 344.0, 191.0, 131.0, 99.0, 48.0, 41.0, 39.0, 23.0, 27.0, 17.0, 9.0, 3.0, 9.0, 5.0, 5.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1402587890625, -0.1356983184814453, -0.13113784790039062, -0.12657737731933594, -0.12201690673828125, -0.11745643615722656, -0.11289596557617188, -0.10833549499511719, -0.1037750244140625, -0.09921455383300781, -0.09465408325195312, -0.09009361267089844, -0.08553314208984375, -0.08097267150878906, -0.07641220092773438, -0.07185173034667969, -0.067291259765625, -0.06273078918457031, -0.058170318603515625, -0.05360984802246094, -0.04904937744140625, -0.04448890686035156, -0.039928436279296875, -0.03536796569824219, -0.0308074951171875, -0.026247024536132812, -0.021686553955078125, -0.017126083374023438, -0.01256561279296875, -0.008005142211914062, -0.003444671630859375, 0.0011157989501953125, 0.00567626953125, 0.010236740112304688, 0.014797210693359375, 0.019357681274414062, 0.02391815185546875, 0.028478622436523438, 0.033039093017578125, 0.03759956359863281, 0.0421600341796875, 0.04672050476074219, 0.051280975341796875, 0.05584144592285156, 0.06040191650390625, 0.06496238708496094, 0.06952285766601562, 0.07408332824707031, 0.078643798828125, 0.08320426940917969, 0.08776473999023438, 0.09232521057128906, 0.09688568115234375, 0.10144615173339844, 0.10600662231445312, 0.11056709289550781, 0.1151275634765625, 0.11968803405761719, 0.12424850463867188, 0.12880897521972656, 0.13336944580078125, 0.13792991638183594, 0.14249038696289062, 0.1470508575439453, 0.151611328125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 1.0, 3.0, 4.0, 7.0, 8.0, 7.0, 8.0, 17.0, 11.0, 16.0, 15.0, 27.0, 23.0, 25.0, 27.0, 30.0, 53.0, 38.0, 39.0, 41.0, 47.0, 66.0, 42.0, 39.0, 43.0, 58.0, 43.0, 37.0, 34.0, 29.0, 34.0, 20.0, 25.0, 18.0, 15.0, 14.0, 6.0, 5.0, 7.0, 6.0, 4.0, 5.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0132789611816406e-05, -9.821727871894836e-06, -9.510666131973267e-06, -9.199604392051697e-06, -8.888542652130127e-06, -8.577480912208557e-06, -8.266419172286987e-06, -7.955357432365417e-06, -7.644295692443848e-06, -7.333233952522278e-06, -7.022172212600708e-06, -6.711110472679138e-06, -6.400048732757568e-06, -6.0889869928359985e-06, -5.777925252914429e-06, -5.466863512992859e-06, -5.155801773071289e-06, -4.844740033149719e-06, -4.533678293228149e-06, -4.22261655330658e-06, -3.91155481338501e-06, -3.60049307346344e-06, -3.28943133354187e-06, -2.9783695936203003e-06, -2.6673078536987305e-06, -2.3562461137771606e-06, -2.045184373855591e-06, -1.734122633934021e-06, -1.4230608940124512e-06, -1.1119991540908813e-06, -8.009374141693115e-07, -4.898756742477417e-07, -1.7881393432617188e-07, 1.3224780559539795e-07, 4.4330954551696777e-07, 7.543712854385376e-07, 1.0654330253601074e-06, 1.3764947652816772e-06, 1.687556505203247e-06, 1.998618245124817e-06, 2.3096799850463867e-06, 2.6207417249679565e-06, 2.9318034648895264e-06, 3.242865204811096e-06, 3.553926944732666e-06, 3.864988684654236e-06, 4.176050424575806e-06, 4.4871121644973755e-06, 4.798173904418945e-06, 5.109235644340515e-06, 5.420297384262085e-06, 5.731359124183655e-06, 6.042420864105225e-06, 6.3534826040267944e-06, 6.664544343948364e-06, 6.975606083869934e-06, 7.286667823791504e-06, 7.597729563713074e-06, 7.908791303634644e-06, 8.219853043556213e-06, 8.530914783477783e-06, 8.841976523399353e-06, 9.153038263320923e-06, 9.464100003242493e-06, 9.775161743164062e-06]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 4.0, 5.0, 5.0, 0.0, 8.0, 18.0, 15.0, 38.0, 53.0, 64.0, 79.0, 117.0, 193.0, 286.0, 428.0, 616.0, 885.0, 1267.0, 2072.0, 3249.0, 5099.0, 8316.0, 14204.0, 23951.0, 41902.0, 72931.0, 124670.0, 185410.0, 199853.0, 147974.0, 89872.0, 51093.0, 29185.0, 16922.0, 10292.0, 6282.0, 3873.0, 2466.0, 1645.0, 997.0, 703.0, 466.0, 310.0, 225.0, 169.0, 101.0, 73.0, 52.0, 40.0, 32.0, 17.0, 17.0, 12.0, 5.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1253662109375, -0.12107086181640625, -0.1167755126953125, -0.11248016357421875, -0.108184814453125, -0.10388946533203125, -0.0995941162109375, -0.09529876708984375, -0.09100341796875, -0.08670806884765625, -0.0824127197265625, -0.07811737060546875, -0.073822021484375, -0.06952667236328125, -0.0652313232421875, -0.06093597412109375, -0.056640625, -0.05234527587890625, -0.0480499267578125, -0.04375457763671875, -0.039459228515625, -0.03516387939453125, -0.0308685302734375, -0.02657318115234375, -0.02227783203125, -0.01798248291015625, -0.0136871337890625, -0.00939178466796875, -0.005096435546875, -0.00080108642578125, 0.0034942626953125, 0.00778961181640625, 0.0120849609375, 0.01638031005859375, 0.0206756591796875, 0.02497100830078125, 0.029266357421875, 0.03356170654296875, 0.0378570556640625, 0.04215240478515625, 0.04644775390625, 0.05074310302734375, 0.0550384521484375, 0.05933380126953125, 0.063629150390625, 0.06792449951171875, 0.0722198486328125, 0.07651519775390625, 0.080810546875, 0.08510589599609375, 0.0894012451171875, 0.09369659423828125, 0.097991943359375, 0.10228729248046875, 0.1065826416015625, 0.11087799072265625, 0.11517333984375, 0.11946868896484375, 0.1237640380859375, 0.12805938720703125, 0.132354736328125, 0.13665008544921875, 0.1409454345703125, 0.14524078369140625, 0.1495361328125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 2.0, 4.0, 9.0, 4.0, 7.0, 10.0, 15.0, 11.0, 11.0, 12.0, 33.0, 21.0, 42.0, 62.0, 48.0, 69.0, 49.0, 74.0, 62.0, 61.0, 63.0, 62.0, 47.0, 41.0, 35.0, 31.0, 30.0, 18.0, 20.0, 14.0, 9.0, 11.0, 5.0, 3.0, 3.0, 5.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.040863037109375, -0.03951549530029297, -0.03816795349121094, -0.036820411682128906, -0.035472869873046875, -0.034125328063964844, -0.03277778625488281, -0.03143024444580078, -0.03008270263671875, -0.02873516082763672, -0.027387619018554688, -0.026040077209472656, -0.024692535400390625, -0.023344993591308594, -0.021997451782226562, -0.02064990997314453, -0.0193023681640625, -0.01795482635498047, -0.016607284545898438, -0.015259742736816406, -0.013912200927734375, -0.012564659118652344, -0.011217117309570312, -0.009869575500488281, -0.00852203369140625, -0.007174491882324219, -0.0058269500732421875, -0.004479408264160156, -0.003131866455078125, -0.0017843246459960938, -0.0004367828369140625, 0.0009107589721679688, 0.00225830078125, 0.0036058425903320312, 0.0049533843994140625, 0.006300926208496094, 0.007648468017578125, 0.008996009826660156, 0.010343551635742188, 0.011691093444824219, 0.01303863525390625, 0.014386177062988281, 0.015733718872070312, 0.017081260681152344, 0.018428802490234375, 0.019776344299316406, 0.021123886108398438, 0.02247142791748047, 0.0238189697265625, 0.02516651153564453, 0.026514053344726562, 0.027861595153808594, 0.029209136962890625, 0.030556678771972656, 0.03190422058105469, 0.03325176239013672, 0.03459930419921875, 0.03594684600830078, 0.03729438781738281, 0.038641929626464844, 0.039989471435546875, 0.041337013244628906, 0.04268455505371094, 0.04403209686279297, 0.045379638671875]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 1.0, 6.0, 4.0, 2.0, 5.0, 6.0, 8.0, 9.0, 8.0, 12.0, 15.0, 18.0, 27.0, 19.0, 32.0, 21.0, 23.0, 28.0, 38.0, 26.0, 40.0, 39.0, 41.0, 46.0, 40.0, 47.0, 37.0, 38.0, 43.0, 29.0, 36.0, 38.0, 22.0, 33.0, 27.0, 20.0, 26.0, 26.0, 10.0, 7.0, 5.0, 7.0, 8.0, 7.0, 7.0, 2.0, 7.0, 5.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 3.0], "bins": [-2.134416103363037, -2.0708911418914795, -2.007366180419922, -1.9438414573669434, -1.8803164958953857, -1.8167915344238281, -1.75326669216156, -1.689741849899292, -1.6262168884277344, -1.5626919269561768, -1.4991670846939087, -1.4356422424316406, -1.372117280960083, -1.3085923194885254, -1.2450674772262573, -1.1815426349639893, -1.1180176734924316, -1.054492712020874, -0.990967869758606, -0.9274429678916931, -0.8639180660247803, -0.8003931641578674, -0.7368682622909546, -0.6733433604240417, -0.6098184585571289, -0.5462935566902161, -0.4827686548233032, -0.4192437529563904, -0.35571885108947754, -0.2921939492225647, -0.22866904735565186, -0.165144145488739, -0.10161900520324707, -0.03809410333633423, 0.025430798530578613, 0.08895570039749146, 0.1524806022644043, 0.21600550413131714, 0.27953040599823, 0.3430553078651428, 0.40658020973205566, 0.4701051115989685, 0.5336300134658813, 0.5971549153327942, 0.660679817199707, 0.7242047190666199, 0.7877296209335327, 0.8512545228004456, 0.9147794246673584, 0.9783043265342712, 1.041829228401184, 1.1053540706634521, 1.1688790321350098, 1.2324039936065674, 1.2959288358688354, 1.3594536781311035, 1.4229786396026611, 1.4865036010742188, 1.5500284433364868, 1.6135532855987549, 1.6770782470703125, 1.7406032085418701, 1.8041280508041382, 1.8676528930664062, 1.9311778545379639]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 6.0, 2.0, 15.0, 9.0, 6.0, 10.0, 13.0, 9.0, 20.0, 21.0, 23.0, 32.0, 32.0, 24.0, 43.0, 45.0, 39.0, 45.0, 46.0, 45.0, 44.0, 44.0, 46.0, 42.0, 33.0, 37.0, 36.0, 25.0, 46.0, 32.0, 23.0, 19.0, 24.0, 9.0, 9.0, 12.0, 9.0, 10.0, 9.0, 4.0, 2.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.432574510574341, -2.3530755043029785, -2.273576259613037, -2.194077253341675, -2.1145780086517334, -2.035079002380371, -1.9555797576904297, -1.8760807514190674, -1.796581506729126, -1.7170823812484741, -1.6375832557678223, -1.5580841302871704, -1.4785850048065186, -1.3990858793258667, -1.3195867538452148, -1.2400877475738525, -1.1605886220932007, -1.0810894966125488, -1.001590371131897, -0.9220912456512451, -0.8425921201705933, -0.7630929946899414, -0.6835939288139343, -0.6040948033332825, -0.5245956778526306, -0.44509655237197876, -0.3655974268913269, -0.28609833121299744, -0.20659920573234558, -0.12710008025169373, -0.04760098457336426, 0.0318981409072876, 0.11139726638793945, 0.1908963918685913, 0.27039551734924316, 0.34989461302757263, 0.4293937385082245, 0.5088928937911987, 0.5883919596672058, 0.6678910851478577, 0.7473902106285095, 0.8268893361091614, 0.9063884615898132, 0.9858875274658203, 1.0653866529464722, 1.144885778427124, 1.2243849039077759, 1.3038840293884277, 1.3833831548690796, 1.4628822803497314, 1.5423814058303833, 1.6218805313110352, 1.701379656791687, 1.7808787822723389, 1.8603777885437012, 1.9398770332336426, 2.019376039505005, 2.098875045776367, 2.1783742904663086, 2.257873296737671, 2.3373725414276123, 2.4168715476989746, 2.496370792388916, 2.5758697986602783, 2.6553690433502197]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 13.0, 16.0, 23.0, 45.0, 78.0, 100.0, 178.0, 265.0, 498.0, 668.0, 1007.0, 1775.0, 2563.0, 3885.0, 6133.0, 9160.0, 14035.0, 20095.0, 28446.0, 39045.0, 51873.0, 65358.0, 79701.0, 89837.0, 96405.0, 96761.0, 91913.0, 82246.0, 69316.0, 55386.0, 42504.0, 31510.0, 22250.0, 15242.0, 10524.0, 6975.0, 4458.0, 2897.0, 1897.0, 1257.0, 755.0, 541.0, 319.0, 221.0, 130.0, 81.0, 65.0, 29.0, 32.0, 17.0, 3.0, 7.0, 10.0, 5.0, 1.0, 3.0], "bins": [-1.162109375, -1.127044677734375, -1.09197998046875, -1.056915283203125, -1.0218505859375, -0.986785888671875, -0.95172119140625, -0.916656494140625, -0.881591796875, -0.846527099609375, -0.81146240234375, -0.776397705078125, -0.7413330078125, -0.706268310546875, -0.67120361328125, -0.636138916015625, -0.60107421875, -0.566009521484375, -0.53094482421875, -0.495880126953125, -0.4608154296875, -0.425750732421875, -0.39068603515625, -0.355621337890625, -0.320556640625, -0.285491943359375, -0.25042724609375, -0.215362548828125, -0.1802978515625, -0.145233154296875, -0.11016845703125, -0.075103759765625, -0.0400390625, -0.004974365234375, 0.03009033203125, 0.065155029296875, 0.1002197265625, 0.135284423828125, 0.17034912109375, 0.205413818359375, 0.240478515625, 0.275543212890625, 0.31060791015625, 0.345672607421875, 0.3807373046875, 0.415802001953125, 0.45086669921875, 0.485931396484375, 0.52099609375, 0.556060791015625, 0.59112548828125, 0.626190185546875, 0.6612548828125, 0.696319580078125, 0.73138427734375, 0.766448974609375, 0.801513671875, 0.836578369140625, 0.87164306640625, 0.906707763671875, 0.9417724609375, 0.976837158203125, 1.01190185546875, 1.046966552734375, 1.08203125]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 8.0, 8.0, 9.0, 8.0, 8.0, 8.0, 15.0, 19.0, 19.0, 21.0, 25.0, 32.0, 36.0, 40.0, 39.0, 37.0, 42.0, 35.0, 28.0, 48.0, 38.0, 47.0, 47.0, 44.0, 47.0, 35.0, 34.0, 22.0, 26.0, 29.0, 31.0, 18.0, 15.0, 13.0, 18.0, 13.0, 2.0, 4.0, 9.0, 3.0, 13.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.19140625, -2.113677978515625, -2.03594970703125, -1.958221435546875, -1.8804931640625, -1.802764892578125, -1.72503662109375, -1.647308349609375, -1.569580078125, -1.491851806640625, -1.41412353515625, -1.336395263671875, -1.2586669921875, -1.180938720703125, -1.10321044921875, -1.025482177734375, -0.94775390625, -0.870025634765625, -0.79229736328125, -0.714569091796875, -0.6368408203125, -0.559112548828125, -0.48138427734375, -0.403656005859375, -0.325927734375, -0.248199462890625, -0.17047119140625, -0.092742919921875, -0.0150146484375, 0.062713623046875, 0.14044189453125, 0.218170166015625, 0.2958984375, 0.373626708984375, 0.45135498046875, 0.529083251953125, 0.6068115234375, 0.684539794921875, 0.76226806640625, 0.839996337890625, 0.917724609375, 0.995452880859375, 1.07318115234375, 1.150909423828125, 1.2286376953125, 1.306365966796875, 1.38409423828125, 1.461822509765625, 1.53955078125, 1.617279052734375, 1.69500732421875, 1.772735595703125, 1.8504638671875, 1.928192138671875, 2.00592041015625, 2.083648681640625, 2.161376953125, 2.239105224609375, 2.31683349609375, 2.394561767578125, 2.4722900390625, 2.550018310546875, 2.62774658203125, 2.705474853515625, 2.783203125]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 2.0, 6.0, 7.0, 11.0, 10.0, 14.0, 32.0, 59.0, 69.0, 98.0, 177.0, 261.0, 430.0, 675.0, 1094.0, 1635.0, 2562.0, 4179.0, 6624.0, 10049.0, 15351.0, 23055.0, 34061.0, 47830.0, 64925.0, 82673.0, 98616.0, 109067.0, 111257.0, 103389.0, 89221.0, 71221.0, 53636.0, 38823.0, 26738.0, 18019.0, 11939.0, 7509.0, 4860.0, 3076.0, 1879.0, 1199.0, 774.0, 524.0, 338.0, 181.0, 140.0, 93.0, 59.0, 35.0, 24.0, 18.0, 17.0, 8.0, 4.0, 9.0, 2.0, 0.0, 2.0, 3.0], "bins": [-1.38671875, -1.3436279296875, -1.300537109375, -1.2574462890625, -1.21435546875, -1.1712646484375, -1.128173828125, -1.0850830078125, -1.0419921875, -0.9989013671875, -0.955810546875, -0.9127197265625, -0.86962890625, -0.8265380859375, -0.783447265625, -0.7403564453125, -0.697265625, -0.6541748046875, -0.611083984375, -0.5679931640625, -0.52490234375, -0.4818115234375, -0.438720703125, -0.3956298828125, -0.3525390625, -0.3094482421875, -0.266357421875, -0.2232666015625, -0.18017578125, -0.1370849609375, -0.093994140625, -0.0509033203125, -0.0078125, 0.0352783203125, 0.078369140625, 0.1214599609375, 0.16455078125, 0.2076416015625, 0.250732421875, 0.2938232421875, 0.3369140625, 0.3800048828125, 0.423095703125, 0.4661865234375, 0.50927734375, 0.5523681640625, 0.595458984375, 0.6385498046875, 0.681640625, 0.7247314453125, 0.767822265625, 0.8109130859375, 0.85400390625, 0.8970947265625, 0.940185546875, 0.9832763671875, 1.0263671875, 1.0694580078125, 1.112548828125, 1.1556396484375, 1.19873046875, 1.2418212890625, 1.284912109375, 1.3280029296875, 1.37109375]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 7.0, 8.0, 13.0, 12.0, 14.0, 16.0, 16.0, 16.0, 40.0, 23.0, 27.0, 39.0, 33.0, 45.0, 34.0, 38.0, 47.0, 42.0, 47.0, 34.0, 35.0, 40.0, 48.0, 39.0, 35.0, 39.0, 27.0, 39.0, 18.0, 13.0, 22.0, 22.0, 13.0, 15.0, 13.0, 8.0, 12.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.677734375, -1.62445068359375, -1.5711669921875, -1.51788330078125, -1.464599609375, -1.41131591796875, -1.3580322265625, -1.30474853515625, -1.25146484375, -1.19818115234375, -1.1448974609375, -1.09161376953125, -1.038330078125, -0.98504638671875, -0.9317626953125, -0.87847900390625, -0.8251953125, -0.77191162109375, -0.7186279296875, -0.66534423828125, -0.612060546875, -0.55877685546875, -0.5054931640625, -0.45220947265625, -0.39892578125, -0.34564208984375, -0.2923583984375, -0.23907470703125, -0.185791015625, -0.13250732421875, -0.0792236328125, -0.02593994140625, 0.02734375, 0.08062744140625, 0.1339111328125, 0.18719482421875, 0.240478515625, 0.29376220703125, 0.3470458984375, 0.40032958984375, 0.45361328125, 0.50689697265625, 0.5601806640625, 0.61346435546875, 0.666748046875, 0.72003173828125, 0.7733154296875, 0.82659912109375, 0.8798828125, 0.93316650390625, 0.9864501953125, 1.03973388671875, 1.093017578125, 1.14630126953125, 1.1995849609375, 1.25286865234375, 1.30615234375, 1.35943603515625, 1.4127197265625, 1.46600341796875, 1.519287109375, 1.57257080078125, 1.6258544921875, 1.67913818359375, 1.732421875]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 8.0, 5.0, 12.0, 16.0, 32.0, 33.0, 52.0, 75.0, 124.0, 207.0, 324.0, 504.0, 853.0, 1388.0, 2368.0, 3927.0, 6516.0, 10890.0, 18154.0, 28911.0, 43807.0, 63714.0, 88094.0, 109439.0, 123497.0, 126473.0, 115559.0, 95054.0, 71395.0, 50228.0, 33306.0, 21108.0, 12862.0, 7824.0, 4719.0, 2771.0, 1649.0, 1000.0, 643.0, 379.0, 243.0, 131.0, 96.0, 67.0, 47.0, 30.0, 13.0, 8.0, 1.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.5654296875, -0.5472869873046875, -0.529144287109375, -0.5110015869140625, -0.49285888671875, -0.4747161865234375, -0.456573486328125, -0.4384307861328125, -0.4202880859375, -0.4021453857421875, -0.384002685546875, -0.3658599853515625, -0.34771728515625, -0.3295745849609375, -0.311431884765625, -0.2932891845703125, -0.275146484375, -0.2570037841796875, -0.238861083984375, -0.2207183837890625, -0.20257568359375, -0.1844329833984375, -0.166290283203125, -0.1481475830078125, -0.1300048828125, -0.1118621826171875, -0.093719482421875, -0.0755767822265625, -0.05743408203125, -0.0392913818359375, -0.021148681640625, -0.0030059814453125, 0.01513671875, 0.0332794189453125, 0.051422119140625, 0.0695648193359375, 0.08770751953125, 0.1058502197265625, 0.123992919921875, 0.1421356201171875, 0.1602783203125, 0.1784210205078125, 0.196563720703125, 0.2147064208984375, 0.23284912109375, 0.2509918212890625, 0.269134521484375, 0.2872772216796875, 0.305419921875, 0.3235626220703125, 0.341705322265625, 0.3598480224609375, 0.37799072265625, 0.3961334228515625, 0.414276123046875, 0.4324188232421875, 0.4505615234375, 0.4687042236328125, 0.486846923828125, 0.5049896240234375, 0.52313232421875, 0.5412750244140625, 0.559417724609375, 0.5775604248046875, 0.595703125]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 1.0, 1.0, 6.0, 8.0, 11.0, 15.0, 17.0, 31.0, 25.0, 27.0, 38.0, 28.0, 35.0, 57.0, 56.0, 58.0, 65.0, 56.0, 52.0, 63.0, 57.0, 37.0, 42.0, 36.0, 32.0, 26.0, 28.0, 21.0, 16.0, 11.0, 9.0, 10.0, 9.0, 5.0, 6.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.289648056030273e-05, -7.047690451145172e-05, -6.805732846260071e-05, -6.56377524137497e-05, -6.321817636489868e-05, -6.079860031604767e-05, -5.8379024267196655e-05, -5.595944821834564e-05, -5.353987216949463e-05, -5.1120296120643616e-05, -4.87007200717926e-05, -4.628114402294159e-05, -4.3861567974090576e-05, -4.144199192523956e-05, -3.902241587638855e-05, -3.660283982753754e-05, -3.4183263778686523e-05, -3.176368772983551e-05, -2.9344111680984497e-05, -2.6924535632133484e-05, -2.450495958328247e-05, -2.2085383534431458e-05, -1.9665807485580444e-05, -1.724623143672943e-05, -1.4826655387878418e-05, -1.2407079339027405e-05, -9.987503290176392e-06, -7.567927241325378e-06, -5.148351192474365e-06, -2.728775143623352e-06, -3.0919909477233887e-07, 2.1103769540786743e-06, 4.5299530029296875e-06, 6.949529051780701e-06, 9.369105100631714e-06, 1.1788681149482727e-05, 1.420825719833374e-05, 1.6627833247184753e-05, 1.9047409296035767e-05, 2.146698534488678e-05, 2.3886561393737793e-05, 2.6306137442588806e-05, 2.872571349143982e-05, 3.114528954029083e-05, 3.3564865589141846e-05, 3.598444163799286e-05, 3.840401768684387e-05, 4.0823593735694885e-05, 4.32431697845459e-05, 4.566274583339691e-05, 4.8082321882247925e-05, 5.050189793109894e-05, 5.292147397994995e-05, 5.5341050028800964e-05, 5.776062607765198e-05, 6.018020212650299e-05, 6.2599778175354e-05, 6.501935422420502e-05, 6.743893027305603e-05, 6.985850632190704e-05, 7.227808237075806e-05, 7.469765841960907e-05, 7.711723446846008e-05, 7.95368105173111e-05, 8.195638656616211e-05]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 9.0, 10.0, 17.0, 36.0, 48.0, 78.0, 158.0, 247.0, 368.0, 612.0, 912.0, 1433.0, 2509.0, 3979.0, 6337.0, 10293.0, 16119.0, 25169.0, 38730.0, 55776.0, 76376.0, 96875.0, 114040.0, 121599.0, 117235.0, 101802.0, 80761.0, 59752.0, 41648.0, 27657.0, 17864.0, 11382.0, 7076.0, 4434.0, 2715.0, 1742.0, 1070.0, 621.0, 379.0, 248.0, 157.0, 124.0, 57.0, 40.0, 18.0, 22.0, 12.0, 5.0, 6.0, 2.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.62255859375, -0.604034423828125, -0.58551025390625, -0.566986083984375, -0.5484619140625, -0.529937744140625, -0.51141357421875, -0.492889404296875, -0.474365234375, -0.455841064453125, -0.43731689453125, -0.418792724609375, -0.4002685546875, -0.381744384765625, -0.36322021484375, -0.344696044921875, -0.326171875, -0.307647705078125, -0.28912353515625, -0.270599365234375, -0.2520751953125, -0.233551025390625, -0.21502685546875, -0.196502685546875, -0.177978515625, -0.159454345703125, -0.14093017578125, -0.122406005859375, -0.1038818359375, -0.085357666015625, -0.06683349609375, -0.048309326171875, -0.02978515625, -0.011260986328125, 0.00726318359375, 0.025787353515625, 0.0443115234375, 0.062835693359375, 0.08135986328125, 0.099884033203125, 0.118408203125, 0.136932373046875, 0.15545654296875, 0.173980712890625, 0.1925048828125, 0.211029052734375, 0.22955322265625, 0.248077392578125, 0.2666015625, 0.285125732421875, 0.30364990234375, 0.322174072265625, 0.3406982421875, 0.359222412109375, 0.37774658203125, 0.396270751953125, 0.414794921875, 0.433319091796875, 0.45184326171875, 0.470367431640625, 0.4888916015625, 0.507415771484375, 0.52593994140625, 0.544464111328125, 0.56298828125]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 5.0, 2.0, 4.0, 5.0, 4.0, 3.0, 14.0, 16.0, 11.0, 21.0, 30.0, 34.0, 33.0, 44.0, 56.0, 51.0, 67.0, 57.0, 80.0, 60.0, 70.0, 62.0, 49.0, 45.0, 44.0, 34.0, 26.0, 24.0, 9.0, 14.0, 5.0, 6.0, 4.0, 3.0, 1.0, 3.0, 0.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.30859375, -0.2978324890136719, -0.28707122802734375, -0.2763099670410156, -0.2655487060546875, -0.2547874450683594, -0.24402618408203125, -0.23326492309570312, -0.222503662109375, -0.21174240112304688, -0.20098114013671875, -0.19021987915039062, -0.1794586181640625, -0.16869735717773438, -0.15793609619140625, -0.14717483520507812, -0.13641357421875, -0.12565231323242188, -0.11489105224609375, -0.10412979125976562, -0.0933685302734375, -0.08260726928710938, -0.07184600830078125, -0.061084747314453125, -0.050323486328125, -0.039562225341796875, -0.02880096435546875, -0.018039703369140625, -0.0072784423828125, 0.003482818603515625, 0.01424407958984375, 0.025005340576171875, 0.0357666015625, 0.046527862548828125, 0.05728912353515625, 0.06805038452148438, 0.0788116455078125, 0.08957290649414062, 0.10033416748046875, 0.11109542846679688, 0.121856689453125, 0.13261795043945312, 0.14337921142578125, 0.15414047241210938, 0.1649017333984375, 0.17566299438476562, 0.18642425537109375, 0.19718551635742188, 0.20794677734375, 0.21870803833007812, 0.22946929931640625, 0.24023056030273438, 0.2509918212890625, 0.2617530822753906, 0.27251434326171875, 0.2832756042480469, 0.294036865234375, 0.3047981262207031, 0.31555938720703125, 0.3263206481933594, 0.3370819091796875, 0.3478431701660156, 0.35860443115234375, 0.3693656921386719, 0.380126953125]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 4.0, 5.0, 4.0, 3.0, 1.0, 11.0, 7.0, 8.0, 23.0, 18.0, 32.0, 34.0, 31.0, 31.0, 24.0, 33.0, 39.0, 31.0, 46.0, 49.0, 51.0, 45.0, 53.0, 41.0, 46.0, 49.0, 38.0, 33.0, 32.0, 34.0, 33.0, 19.0, 26.0, 15.0, 10.0, 11.0, 3.0, 11.0, 6.0, 6.0, 3.0, 5.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0], "bins": [-2.708096981048584, -2.635241746902466, -2.5623865127563477, -2.4895312786102295, -2.4166760444641113, -2.343820810317993, -2.270965576171875, -2.198110580444336, -2.1252551078796387, -2.0523998737335205, -1.9795446395874023, -1.9066894054412842, -1.833834171295166, -1.7609789371490479, -1.6881238222122192, -1.615268588066101, -1.5424134731292725, -1.4695582389831543, -1.3967030048370361, -1.323847770690918, -1.2509925365447998, -1.1781373023986816, -1.105282187461853, -1.0324269533157349, -0.9595717191696167, -0.8867164850234985, -0.8138612508773804, -0.741006076335907, -0.6681508421897888, -0.5952956080436707, -0.5224404335021973, -0.4495851993560791, -0.3767298460006714, -0.3038746118545532, -0.23101940751075745, -0.15816418826580048, -0.0853089690208435, -0.012453734874725342, 0.060401469469070435, 0.1332566738128662, 0.20611190795898438, 0.27896714210510254, 0.3518223464488983, 0.4246775507926941, 0.49753278493881226, 0.5703880190849304, 0.6432431936264038, 0.716098427772522, 0.7889536619186401, 0.8618088960647583, 0.9346641302108765, 1.0075193643569946, 1.0803744792938232, 1.1532297134399414, 1.2260849475860596, 1.2989401817321777, 1.371795415878296, 1.444650650024414, 1.5175058841705322, 1.5903611183166504, 1.6632163524627686, 1.7360715866088867, 1.8089267015457153, 1.8817819356918335, 1.9546371698379517]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 4.0, 6.0, 6.0, 8.0, 9.0, 6.0, 8.0, 8.0, 11.0, 25.0, 16.0, 22.0, 21.0, 27.0, 34.0, 34.0, 33.0, 33.0, 38.0, 36.0, 42.0, 46.0, 44.0, 36.0, 42.0, 34.0, 38.0, 36.0, 38.0, 24.0, 35.0, 32.0, 28.0, 21.0, 22.0, 14.0, 21.0, 13.0, 12.0, 10.0, 3.0, 5.0, 6.0, 5.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2908196449279785, -2.2137062549591064, -2.1365926265716553, -2.059479236602783, -1.9823658466339111, -1.9052523374557495, -1.828138828277588, -1.7510254383087158, -1.6739120483398438, -1.5967985391616821, -1.51968514919281, -1.4425716400146484, -1.3654582500457764, -1.2883447408676147, -1.2112312316894531, -1.134117841720581, -1.0570043325424194, -0.9798908829689026, -0.9027774333953857, -0.8256639242172241, -0.748550534248352, -0.6714370250701904, -0.5943235754966736, -0.5172101259231567, -0.4400966763496399, -0.36298322677612305, -0.2858697772026062, -0.20875629782676697, -0.13164284825325012, -0.054529398679733276, 0.022584080696105957, 0.0996975302696228, 0.17681097984313965, 0.2539244294166565, 0.33103787899017334, 0.4081513583660126, 0.4852648079395294, 0.5623782873153687, 0.6394917368888855, 0.7166051864624023, 0.7937186360359192, 0.870832085609436, 0.9479455351829529, 1.0250589847564697, 1.1021724939346313, 1.1792858839035034, 1.256399393081665, 1.333512783050537, 1.4106262922286987, 1.4877398014068604, 1.5648531913757324, 1.641966700553894, 1.7190800905227661, 1.7961935997009277, 1.8733069896697998, 1.9504204988479614, 2.027534008026123, 2.104647397994995, 2.1817610263824463, 2.2588744163513184, 2.3359878063201904, 2.4131011962890625, 2.4902148246765137, 2.5673282146453857, 2.644441604614258]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 5.0, 5.0, 3.0, 6.0, 23.0, 31.0, 42.0, 66.0, 97.0, 144.0, 262.0, 412.0, 612.0, 985.0, 1584.0, 2369.0, 3922.0, 6297.0, 10273.0, 16903.0, 27997.0, 46369.0, 76744.0, 125116.0, 201740.0, 310336.0, 437572.0, 546087.0, 591437.0, 544248.0, 431763.0, 302487.0, 196216.0, 121929.0, 73498.0, 44429.0, 27411.0, 16512.0, 10361.0, 6444.0, 4166.0, 2627.0, 1654.0, 1056.0, 673.0, 495.0, 309.0, 213.0, 113.0, 85.0, 61.0, 40.0, 22.0, 16.0, 8.0, 7.0, 5.0, 4.0, 1.0, 1.0, 4.0], "bins": [-1.6201171875, -1.5686492919921875, -1.517181396484375, -1.4657135009765625, -1.41424560546875, -1.3627777099609375, -1.311309814453125, -1.2598419189453125, -1.2083740234375, -1.1569061279296875, -1.105438232421875, -1.0539703369140625, -1.00250244140625, -0.9510345458984375, -0.899566650390625, -0.8480987548828125, -0.796630859375, -0.7451629638671875, -0.693695068359375, -0.6422271728515625, -0.59075927734375, -0.5392913818359375, -0.487823486328125, -0.4363555908203125, -0.3848876953125, -0.3334197998046875, -0.281951904296875, -0.2304840087890625, -0.17901611328125, -0.1275482177734375, -0.076080322265625, -0.0246124267578125, 0.02685546875, 0.0783233642578125, 0.129791259765625, 0.1812591552734375, 0.23272705078125, 0.2841949462890625, 0.335662841796875, 0.3871307373046875, 0.4385986328125, 0.4900665283203125, 0.541534423828125, 0.5930023193359375, 0.64447021484375, 0.6959381103515625, 0.747406005859375, 0.7988739013671875, 0.850341796875, 0.9018096923828125, 0.953277587890625, 1.0047454833984375, 1.05621337890625, 1.1076812744140625, 1.159149169921875, 1.2106170654296875, 1.2620849609375, 1.3135528564453125, 1.365020751953125, 1.4164886474609375, 1.46795654296875, 1.5194244384765625, 1.570892333984375, 1.6223602294921875, 1.673828125]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 6.0, 8.0, 3.0, 9.0, 12.0, 12.0, 12.0, 12.0, 18.0, 28.0, 29.0, 27.0, 21.0, 39.0, 35.0, 33.0, 36.0, 32.0, 51.0, 37.0, 41.0, 35.0, 37.0, 41.0, 46.0, 38.0, 31.0, 33.0, 42.0, 22.0, 23.0, 28.0, 20.0, 22.0, 18.0, 14.0, 11.0, 3.0, 12.0, 3.0, 3.0, 7.0, 4.0, 3.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-2.06640625, -1.998016357421875, -1.92962646484375, -1.861236572265625, -1.7928466796875, -1.724456787109375, -1.65606689453125, -1.587677001953125, -1.519287109375, -1.450897216796875, -1.38250732421875, -1.314117431640625, -1.2457275390625, -1.177337646484375, -1.10894775390625, -1.040557861328125, -0.97216796875, -0.903778076171875, -0.83538818359375, -0.766998291015625, -0.6986083984375, -0.630218505859375, -0.56182861328125, -0.493438720703125, -0.425048828125, -0.356658935546875, -0.28826904296875, -0.219879150390625, -0.1514892578125, -0.083099365234375, -0.01470947265625, 0.053680419921875, 0.1220703125, 0.190460205078125, 0.25885009765625, 0.327239990234375, 0.3956298828125, 0.464019775390625, 0.53240966796875, 0.600799560546875, 0.669189453125, 0.737579345703125, 0.80596923828125, 0.874359130859375, 0.9427490234375, 1.011138916015625, 1.07952880859375, 1.147918701171875, 1.21630859375, 1.284698486328125, 1.35308837890625, 1.421478271484375, 1.4898681640625, 1.558258056640625, 1.62664794921875, 1.695037841796875, 1.763427734375, 1.831817626953125, 1.90020751953125, 1.968597412109375, 2.0369873046875, 2.105377197265625, 2.17376708984375, 2.242156982421875, 2.310546875]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 6.0, 3.0, 3.0, 3.0, 7.0, 28.0, 25.0, 55.0, 73.0, 104.0, 219.0, 336.0, 630.0, 1008.0, 1740.0, 2880.0, 5043.0, 8627.0, 15017.0, 26236.0, 44996.0, 76161.0, 127421.0, 206013.0, 318793.0, 450685.0, 566291.0, 606654.0, 547212.0, 423543.0, 294315.0, 189640.0, 116010.0, 68949.0, 40315.0, 23166.0, 13290.0, 7809.0, 4503.0, 2623.0, 1552.0, 890.0, 556.0, 301.0, 233.0, 138.0, 70.0, 48.0, 34.0, 16.0, 13.0, 6.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-2.052734375, -1.98736572265625, -1.9219970703125, -1.85662841796875, -1.791259765625, -1.72589111328125, -1.6605224609375, -1.59515380859375, -1.52978515625, -1.46441650390625, -1.3990478515625, -1.33367919921875, -1.268310546875, -1.20294189453125, -1.1375732421875, -1.07220458984375, -1.0068359375, -0.94146728515625, -0.8760986328125, -0.81072998046875, -0.745361328125, -0.67999267578125, -0.6146240234375, -0.54925537109375, -0.48388671875, -0.41851806640625, -0.3531494140625, -0.28778076171875, -0.222412109375, -0.15704345703125, -0.0916748046875, -0.02630615234375, 0.0390625, 0.10443115234375, 0.1697998046875, 0.23516845703125, 0.300537109375, 0.36590576171875, 0.4312744140625, 0.49664306640625, 0.56201171875, 0.62738037109375, 0.6927490234375, 0.75811767578125, 0.823486328125, 0.88885498046875, 0.9542236328125, 1.01959228515625, 1.0849609375, 1.15032958984375, 1.2156982421875, 1.28106689453125, 1.346435546875, 1.41180419921875, 1.4771728515625, 1.54254150390625, 1.60791015625, 1.67327880859375, 1.7386474609375, 1.80401611328125, 1.869384765625, 1.93475341796875, 2.0001220703125, 2.06549072265625, 2.130859375]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 5.0, 9.0, 8.0, 11.0, 24.0, 26.0, 31.0, 37.0, 66.0, 59.0, 66.0, 99.0, 112.0, 130.0, 148.0, 156.0, 195.0, 193.0, 186.0, 206.0, 224.0, 219.0, 210.0, 221.0, 208.0, 175.0, 180.0, 153.0, 121.0, 95.0, 100.0, 85.0, 67.0, 60.0, 39.0, 42.0, 31.0, 25.0, 10.0, 12.0, 10.0, 7.0, 3.0, 3.0, 5.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.99853515625, -0.9693374633789062, -0.9401397705078125, -0.9109420776367188, -0.881744384765625, -0.8525466918945312, -0.8233489990234375, -0.7941513061523438, -0.76495361328125, -0.7357559204101562, -0.7065582275390625, -0.6773605346679688, -0.648162841796875, -0.6189651489257812, -0.5897674560546875, -0.5605697631835938, -0.5313720703125, -0.5021743774414062, -0.4729766845703125, -0.44377899169921875, -0.414581298828125, -0.38538360595703125, -0.3561859130859375, -0.32698822021484375, -0.29779052734375, -0.26859283447265625, -0.2393951416015625, -0.21019744873046875, -0.180999755859375, -0.15180206298828125, -0.1226043701171875, -0.09340667724609375, -0.064208984375, -0.03501129150390625, -0.0058135986328125, 0.02338409423828125, 0.052581787109375, 0.08177947998046875, 0.1109771728515625, 0.14017486572265625, 0.16937255859375, 0.19857025146484375, 0.2277679443359375, 0.25696563720703125, 0.286163330078125, 0.31536102294921875, 0.3445587158203125, 0.37375640869140625, 0.4029541015625, 0.43215179443359375, 0.4613494873046875, 0.49054718017578125, 0.519744873046875, 0.5489425659179688, 0.5781402587890625, 0.6073379516601562, 0.63653564453125, 0.6657333374023438, 0.6949310302734375, 0.7241287231445312, 0.753326416015625, 0.7825241088867188, 0.8117218017578125, 0.8409194946289062, 0.8701171875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 8.0, 3.0, 3.0, 6.0, 5.0, 13.0, 7.0, 16.0, 28.0, 19.0, 25.0, 24.0, 39.0, 38.0, 46.0, 52.0, 37.0, 44.0, 49.0, 60.0, 65.0, 48.0, 55.0, 45.0, 36.0, 37.0, 31.0, 36.0, 32.0, 27.0, 20.0, 11.0, 10.0, 10.0, 7.0, 7.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7574942111968994, -2.6728153228759766, -2.5881361961364746, -2.5034573078155518, -2.41877818107605, -2.334099292755127, -2.249420166015625, -2.164741277694702, -2.0800623893737793, -1.995383381843567, -1.9107043743133545, -1.8260254859924316, -1.7413463592529297, -1.6566674709320068, -1.5719884634017944, -1.487309455871582, -1.40263032913208, -1.3179513216018677, -1.2332723140716553, -1.1485934257507324, -1.0639142990112305, -0.9792353510856628, -0.8945564031600952, -0.8098773956298828, -0.7251983880996704, -0.640519380569458, -0.5558403730392456, -0.471161425113678, -0.3864824175834656, -0.3018034100532532, -0.21712446212768555, -0.13244545459747314, -0.047766685485839844, 0.036912307143211365, 0.12159129977226257, 0.2062702775001526, 0.290949285030365, 0.3756282925605774, 0.460307240486145, 0.5449862480163574, 0.6296652555465698, 0.7143442630767822, 0.7990232706069946, 0.8837022185325623, 0.9683812260627747, 1.0530602931976318, 1.1377391815185547, 1.222418189048767, 1.3070971965789795, 1.391776204109192, 1.4764552116394043, 1.5611340999603271, 1.645813226699829, 1.730492115020752, 1.8151711225509644, 1.8998501300811768, 1.9845291376113892, 2.0692081451416016, 2.1538870334625244, 2.2385661602020264, 2.323245048522949, 2.407924175262451, 2.492603063583374, 2.577281951904297, 2.661961078643799]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 5.0, 8.0, 7.0, 10.0, 8.0, 9.0, 9.0, 15.0, 21.0, 27.0, 24.0, 28.0, 17.0, 38.0, 33.0, 42.0, 27.0, 45.0, 51.0, 37.0, 49.0, 43.0, 52.0, 42.0, 39.0, 36.0, 30.0, 36.0, 35.0, 29.0, 26.0, 22.0, 19.0, 11.0, 12.0, 8.0, 7.0, 10.0, 6.0, 3.0, 3.0, 4.0, 2.0, 6.0, 2.0, 1.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.431406021118164, -2.3538308143615723, -2.2762553691864014, -2.1986801624298096, -2.1211049556732178, -2.043529510498047, -1.965954303741455, -1.8883789777755737, -1.8108036518096924, -1.733228325843811, -1.6556531190872192, -1.578077793121338, -1.5005024671554565, -1.4229271411895752, -1.3453519344329834, -1.267776608467102, -1.1902014017105103, -1.112626075744629, -1.035050868988037, -0.9574755430221558, -0.8799002170562744, -0.8023249506950378, -0.7247496843338013, -0.6471743583679199, -0.5695990920066833, -0.4920237958431244, -0.41444849967956543, -0.33687323331832886, -0.2592979371547699, -0.18172264099121094, -0.10414737462997437, -0.026572048664093018, 0.051003217697143555, 0.12857851386070251, 0.20615379512310028, 0.28372907638549805, 0.361304372549057, 0.43887966871261597, 0.5164549350738525, 0.5940302610397339, 0.6716055274009705, 0.749180793762207, 0.8267561197280884, 0.904331386089325, 0.9819066524505615, 1.0594819784164429, 1.1370573043823242, 1.214632511138916, 1.2922078371047974, 1.3697831630706787, 1.4473583698272705, 1.5249336957931519, 1.6025090217590332, 1.680084228515625, 1.7576595544815063, 1.8352348804473877, 1.9128100872039795, 1.9903854131698608, 2.067960739135742, 2.145535945892334, 2.223111152648926, 2.3006865978240967, 2.3782618045806885, 2.4558372497558594, 2.533412456512451]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 8.0, 10.0, 18.0, 29.0, 26.0, 40.0, 65.0, 89.0, 150.0, 254.0, 419.0, 679.0, 1082.0, 1947.0, 3175.0, 5803.0, 10345.0, 19769.0, 36251.0, 66035.0, 113815.0, 171393.0, 199026.0, 167689.0, 110187.0, 63415.0, 34770.0, 18547.0, 10247.0, 5654.0, 3118.0, 1703.0, 1035.0, 643.0, 442.0, 261.0, 156.0, 80.0, 54.0, 42.0, 32.0, 23.0, 15.0, 8.0, 6.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5341796875, -0.5186805725097656, -0.5031814575195312, -0.4876823425292969, -0.4721832275390625, -0.4566841125488281, -0.44118499755859375, -0.4256858825683594, -0.410186767578125, -0.3946876525878906, -0.37918853759765625, -0.3636894226074219, -0.3481903076171875, -0.3326911926269531, -0.31719207763671875, -0.3016929626464844, -0.28619384765625, -0.2706947326660156, -0.25519561767578125, -0.23969650268554688, -0.2241973876953125, -0.20869827270507812, -0.19319915771484375, -0.17770004272460938, -0.162200927734375, -0.14670181274414062, -0.13120269775390625, -0.11570358276367188, -0.1002044677734375, -0.08470535278320312, -0.06920623779296875, -0.053707122802734375, -0.0382080078125, -0.022708892822265625, -0.00720977783203125, 0.008289337158203125, 0.0237884521484375, 0.039287567138671875, 0.05478668212890625, 0.07028579711914062, 0.085784912109375, 0.10128402709960938, 0.11678314208984375, 0.13228225708007812, 0.1477813720703125, 0.16328048706054688, 0.17877960205078125, 0.19427871704101562, 0.20977783203125, 0.22527694702148438, 0.24077606201171875, 0.2562751770019531, 0.2717742919921875, 0.2872734069824219, 0.30277252197265625, 0.3182716369628906, 0.333770751953125, 0.3492698669433594, 0.36476898193359375, 0.3802680969238281, 0.3957672119140625, 0.4112663269042969, 0.42676544189453125, 0.4422645568847656, 0.457763671875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 1.0, 3.0, 12.0, 10.0, 7.0, 13.0, 20.0, 19.0, 19.0, 17.0, 22.0, 30.0, 22.0, 37.0, 32.0, 44.0, 39.0, 42.0, 49.0, 65.0, 40.0, 39.0, 44.0, 34.0, 42.0, 44.0, 30.0, 30.0, 26.0, 31.0, 31.0, 23.0, 8.0, 9.0, 15.0, 7.0, 6.0, 9.0, 5.0, 10.0, 5.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.58203125, -2.499053955078125, -2.41607666015625, -2.333099365234375, -2.2501220703125, -2.167144775390625, -2.08416748046875, -2.001190185546875, -1.918212890625, -1.835235595703125, -1.75225830078125, -1.669281005859375, -1.5863037109375, -1.503326416015625, -1.42034912109375, -1.337371826171875, -1.25439453125, -1.171417236328125, -1.08843994140625, -1.005462646484375, -0.9224853515625, -0.839508056640625, -0.75653076171875, -0.673553466796875, -0.590576171875, -0.507598876953125, -0.42462158203125, -0.341644287109375, -0.2586669921875, -0.175689697265625, -0.09271240234375, -0.009735107421875, 0.0732421875, 0.156219482421875, 0.23919677734375, 0.322174072265625, 0.4051513671875, 0.488128662109375, 0.57110595703125, 0.654083251953125, 0.737060546875, 0.820037841796875, 0.90301513671875, 0.985992431640625, 1.0689697265625, 1.151947021484375, 1.23492431640625, 1.317901611328125, 1.40087890625, 1.483856201171875, 1.56683349609375, 1.649810791015625, 1.7327880859375, 1.815765380859375, 1.89874267578125, 1.981719970703125, 2.064697265625, 2.147674560546875, 2.23065185546875, 2.313629150390625, 2.3966064453125, 2.479583740234375, 2.56256103515625, 2.645538330078125, 2.728515625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 6.0, 2.0, 0.0, 3.0, 9.0, 10.0, 16.0, 23.0, 33.0, 45.0, 79.0, 110.0, 196.0, 364.0, 707.0, 1807.0, 5112.0, 15648.0, 60564.0, 894297.0, 48572.0, 13528.0, 4421.0, 1558.0, 670.0, 309.0, 171.0, 100.0, 68.0, 38.0, 22.0, 19.0, 21.0, 7.0, 7.0, 2.0, 3.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.125, -2.057403564453125, -1.98980712890625, -1.922210693359375, -1.8546142578125, -1.787017822265625, -1.71942138671875, -1.651824951171875, -1.584228515625, -1.516632080078125, -1.44903564453125, -1.381439208984375, -1.3138427734375, -1.246246337890625, -1.17864990234375, -1.111053466796875, -1.04345703125, -0.975860595703125, -0.90826416015625, -0.840667724609375, -0.7730712890625, -0.705474853515625, -0.63787841796875, -0.570281982421875, -0.502685546875, -0.435089111328125, -0.36749267578125, -0.299896240234375, -0.2322998046875, -0.164703369140625, -0.09710693359375, -0.029510498046875, 0.0380859375, 0.105682373046875, 0.17327880859375, 0.240875244140625, 0.3084716796875, 0.376068115234375, 0.44366455078125, 0.511260986328125, 0.578857421875, 0.646453857421875, 0.71405029296875, 0.781646728515625, 0.8492431640625, 0.916839599609375, 0.98443603515625, 1.052032470703125, 1.11962890625, 1.187225341796875, 1.25482177734375, 1.322418212890625, 1.3900146484375, 1.457611083984375, 1.52520751953125, 1.592803955078125, 1.660400390625, 1.727996826171875, 1.79559326171875, 1.863189697265625, 1.9307861328125, 1.998382568359375, 2.06597900390625, 2.133575439453125, 2.201171875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 3.0, 4.0, 4.0, 7.0, 8.0, 5.0, 12.0, 10.0, 9.0, 20.0, 17.0, 28.0, 24.0, 21.0, 32.0, 37.0, 31.0, 47.0, 33.0, 43.0, 33.0, 42.0, 46.0, 41.0, 48.0, 39.0, 41.0, 47.0, 32.0, 35.0, 31.0, 22.0, 23.0, 19.0, 11.0, 16.0, 19.0, 15.0, 12.0, 9.0, 3.0, 5.0, 9.0, 2.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.6005859375, -1.5468292236328125, -1.493072509765625, -1.4393157958984375, -1.38555908203125, -1.3318023681640625, -1.278045654296875, -1.2242889404296875, -1.1705322265625, -1.1167755126953125, -1.063018798828125, -1.0092620849609375, -0.95550537109375, -0.9017486572265625, -0.847991943359375, -0.7942352294921875, -0.740478515625, -0.6867218017578125, -0.632965087890625, -0.5792083740234375, -0.52545166015625, -0.4716949462890625, -0.417938232421875, -0.3641815185546875, -0.3104248046875, -0.2566680908203125, -0.202911376953125, -0.1491546630859375, -0.09539794921875, -0.0416412353515625, 0.012115478515625, 0.0658721923828125, 0.11962890625, 0.1733856201171875, 0.227142333984375, 0.2808990478515625, 0.33465576171875, 0.3884124755859375, 0.442169189453125, 0.4959259033203125, 0.5496826171875, 0.6034393310546875, 0.657196044921875, 0.7109527587890625, 0.76470947265625, 0.8184661865234375, 0.872222900390625, 0.9259796142578125, 0.979736328125, 1.0334930419921875, 1.087249755859375, 1.1410064697265625, 1.19476318359375, 1.2485198974609375, 1.302276611328125, 1.3560333251953125, 1.4097900390625, 1.4635467529296875, 1.517303466796875, 1.5710601806640625, 1.62481689453125, 1.6785736083984375, 1.732330322265625, 1.7860870361328125, 1.83984375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 4.0, 9.0, 6.0, 9.0, 15.0, 16.0, 23.0, 35.0, 32.0, 81.0, 116.0, 181.0, 346.0, 667.0, 1431.0, 3374.0, 9694.0, 30289.0, 772185.0, 194231.0, 23001.0, 7619.0, 2680.0, 1152.0, 539.0, 329.0, 139.0, 116.0, 81.0, 31.0, 37.0, 24.0, 17.0, 11.0, 7.0, 8.0, 3.0, 4.0, 5.0, 2.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26123046875, -0.25328636169433594, -0.24534225463867188, -0.2373981475830078, -0.22945404052734375, -0.2215099334716797, -0.21356582641601562, -0.20562171936035156, -0.1976776123046875, -0.18973350524902344, -0.18178939819335938, -0.1738452911376953, -0.16590118408203125, -0.1579570770263672, -0.15001296997070312, -0.14206886291503906, -0.134124755859375, -0.12618064880371094, -0.11823654174804688, -0.11029243469238281, -0.10234832763671875, -0.09440422058105469, -0.08646011352539062, -0.07851600646972656, -0.0705718994140625, -0.06262779235839844, -0.054683685302734375, -0.04673957824707031, -0.03879547119140625, -0.030851364135742188, -0.022907257080078125, -0.014963150024414062, -0.00701904296875, 0.0009250640869140625, 0.008869171142578125, 0.016813278198242188, 0.02475738525390625, 0.03270149230957031, 0.040645599365234375, 0.04858970642089844, 0.0565338134765625, 0.06447792053222656, 0.07242202758789062, 0.08036613464355469, 0.08831024169921875, 0.09625434875488281, 0.10419845581054688, 0.11214256286621094, 0.120086669921875, 0.12803077697753906, 0.13597488403320312, 0.1439189910888672, 0.15186309814453125, 0.1598072052001953, 0.16775131225585938, 0.17569541931152344, 0.1836395263671875, 0.19158363342285156, 0.19952774047851562, 0.2074718475341797, 0.21541595458984375, 0.2233600616455078, 0.23130416870117188, 0.23924827575683594, 0.2471923828125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 6.0, 6.0, 12.0, 8.0, 6.0, 14.0, 12.0, 19.0, 17.0, 17.0, 25.0, 29.0, 28.0, 27.0, 41.0, 34.0, 51.0, 38.0, 58.0, 42.0, 36.0, 44.0, 44.0, 39.0, 43.0, 38.0, 39.0, 35.0, 29.0, 29.0, 16.0, 24.0, 14.0, 12.0, 10.0, 18.0, 12.0, 5.0, 9.0, 4.0, 2.0, 4.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.781650543212891e-06, -5.570240318775177e-06, -5.358830094337463e-06, -5.14741986989975e-06, -4.936009645462036e-06, -4.7245994210243225e-06, -4.513189196586609e-06, -4.301778972148895e-06, -4.090368747711182e-06, -3.878958523273468e-06, -3.6675482988357544e-06, -3.4561380743980408e-06, -3.244727849960327e-06, -3.0333176255226135e-06, -2.8219074010849e-06, -2.6104971766471863e-06, -2.3990869522094727e-06, -2.187676727771759e-06, -1.9762665033340454e-06, -1.7648562788963318e-06, -1.5534460544586182e-06, -1.3420358300209045e-06, -1.130625605583191e-06, -9.192153811454773e-07, -7.078051567077637e-07, -4.9639493227005e-07, -2.849847078323364e-07, -7.35744833946228e-08, 1.3783574104309082e-07, 3.4924596548080444e-07, 5.606561899185181e-07, 7.720664143562317e-07, 9.834766387939453e-07, 1.194886863231659e-06, 1.4062970876693726e-06, 1.6177073121070862e-06, 1.8291175365447998e-06, 2.0405277609825134e-06, 2.251937985420227e-06, 2.4633482098579407e-06, 2.6747584342956543e-06, 2.886168658733368e-06, 3.0975788831710815e-06, 3.308989107608795e-06, 3.520399332046509e-06, 3.7318095564842224e-06, 3.943219780921936e-06, 4.15463000535965e-06, 4.366040229797363e-06, 4.577450454235077e-06, 4.7888606786727905e-06, 5.000270903110504e-06, 5.211681127548218e-06, 5.423091351985931e-06, 5.634501576423645e-06, 5.845911800861359e-06, 6.057322025299072e-06, 6.268732249736786e-06, 6.4801424741744995e-06, 6.691552698612213e-06, 6.902962923049927e-06, 7.11437314748764e-06, 7.325783371925354e-06, 7.537193596363068e-06, 7.748603820800781e-06]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 8.0, 8.0, 10.0, 23.0, 27.0, 51.0, 63.0, 91.0, 120.0, 168.0, 296.0, 402.0, 558.0, 820.0, 1219.0, 1916.0, 2797.0, 4251.0, 6546.0, 9924.0, 15191.0, 23594.0, 36852.0, 57952.0, 89128.0, 128578.0, 161326.0, 156569.0, 119849.0, 81231.0, 52750.0, 33691.0, 21789.0, 14163.0, 9005.0, 5909.0, 3887.0, 2555.0, 1661.0, 1189.0, 764.0, 536.0, 331.0, 260.0, 172.0, 102.0, 78.0, 47.0, 40.0, 22.0, 23.0, 8.0, 6.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.1107177734375, -0.10724639892578125, -0.1037750244140625, -0.10030364990234375, -0.096832275390625, -0.09336090087890625, -0.0898895263671875, -0.08641815185546875, -0.08294677734375, -0.07947540283203125, -0.0760040283203125, -0.07253265380859375, -0.069061279296875, -0.06558990478515625, -0.0621185302734375, -0.05864715576171875, -0.05517578125, -0.05170440673828125, -0.0482330322265625, -0.04476165771484375, -0.041290283203125, -0.03781890869140625, -0.0343475341796875, -0.03087615966796875, -0.02740478515625, -0.02393341064453125, -0.0204620361328125, -0.01699066162109375, -0.013519287109375, -0.01004791259765625, -0.0065765380859375, -0.00310516357421875, 0.0003662109375, 0.00383758544921875, 0.0073089599609375, 0.01078033447265625, 0.014251708984375, 0.01772308349609375, 0.0211944580078125, 0.02466583251953125, 0.02813720703125, 0.03160858154296875, 0.0350799560546875, 0.03855133056640625, 0.042022705078125, 0.04549407958984375, 0.0489654541015625, 0.05243682861328125, 0.055908203125, 0.05937957763671875, 0.0628509521484375, 0.06632232666015625, 0.069793701171875, 0.07326507568359375, 0.0767364501953125, 0.08020782470703125, 0.08367919921875, 0.08715057373046875, 0.0906219482421875, 0.09409332275390625, 0.097564697265625, 0.10103607177734375, 0.1045074462890625, 0.10797882080078125, 0.1114501953125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 3.0, 1.0, 4.0, 4.0, 3.0, 6.0, 5.0, 8.0, 7.0, 14.0, 12.0, 18.0, 25.0, 15.0, 21.0, 34.0, 38.0, 49.0, 42.0, 47.0, 63.0, 51.0, 41.0, 57.0, 61.0, 61.0, 48.0, 35.0, 46.0, 30.0, 29.0, 17.0, 17.0, 14.0, 17.0, 14.0, 9.0, 9.0, 6.0, 5.0, 3.0, 8.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.05401611328125, -0.052278995513916016, -0.05054187774658203, -0.04880475997924805, -0.04706764221191406, -0.04533052444458008, -0.043593406677246094, -0.04185628890991211, -0.040119171142578125, -0.03838205337524414, -0.036644935607910156, -0.03490781784057617, -0.03317070007324219, -0.0314335823059082, -0.02969646453857422, -0.027959346771240234, -0.02622222900390625, -0.024485111236572266, -0.02274799346923828, -0.021010875701904297, -0.019273757934570312, -0.017536640167236328, -0.015799522399902344, -0.01406240463256836, -0.012325286865234375, -0.01058816909790039, -0.008851051330566406, -0.007113933563232422, -0.0053768157958984375, -0.003639698028564453, -0.0019025802612304688, -0.00016546249389648438, 0.0015716552734375, 0.0033087730407714844, 0.005045890808105469, 0.006783008575439453, 0.008520126342773438, 0.010257244110107422, 0.011994361877441406, 0.01373147964477539, 0.015468597412109375, 0.01720571517944336, 0.018942832946777344, 0.020679950714111328, 0.022417068481445312, 0.024154186248779297, 0.02589130401611328, 0.027628421783447266, 0.02936553955078125, 0.031102657318115234, 0.03283977508544922, 0.0345768928527832, 0.03631401062011719, 0.03805112838745117, 0.039788246154785156, 0.04152536392211914, 0.043262481689453125, 0.04499959945678711, 0.046736717224121094, 0.04847383499145508, 0.05021095275878906, 0.05194807052612305, 0.05368518829345703, 0.055422306060791016, 0.057159423828125]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 7.0, 6.0, 1.0, 4.0, 8.0, 12.0, 7.0, 15.0, 20.0, 24.0, 23.0, 29.0, 26.0, 42.0, 36.0, 58.0, 37.0, 32.0, 49.0, 57.0, 51.0, 61.0, 48.0, 41.0, 45.0, 37.0, 35.0, 29.0, 33.0, 36.0, 26.0, 16.0, 12.0, 13.0, 6.0, 7.0, 9.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.587836503982544, -2.507200241088867, -2.4265642166137695, -2.3459279537200928, -2.265291929244995, -2.1846556663513184, -2.1040196418762207, -2.023383378982544, -1.9427472352981567, -1.8621110916137695, -1.7814749479293823, -1.7008388042449951, -1.6202025413513184, -1.5395665168762207, -1.458930253982544, -1.3782941102981567, -1.2976579666137695, -1.2170218229293823, -1.1363856792449951, -1.055749535560608, -0.9751133322715759, -0.8944771885871887, -0.8138409852981567, -0.7332048416137695, -0.6525686979293823, -0.5719325542449951, -0.4912963807582855, -0.4106602072715759, -0.3300240635871887, -0.2493879199028015, -0.16875174641609192, -0.08811557292938232, -0.007479667663574219, 0.07315649092197418, 0.15379264950752258, 0.23442880809307098, 0.3150649666786194, 0.3957011103630066, 0.4763372838497162, 0.5569734573364258, 0.637609601020813, 0.7182457447052002, 0.7988818883895874, 0.8795180916786194, 0.9601542353630066, 1.040790319442749, 1.1214265823364258, 1.202062726020813, 1.2826988697052002, 1.3633350133895874, 1.4439711570739746, 1.5246073007583618, 1.605243444442749, 1.6858797073364258, 1.766515851020813, 1.8471519947052002, 1.9277881383895874, 2.0084242820739746, 2.0890605449676514, 2.169696569442749, 2.250332832336426, 2.3309688568115234, 2.4116051197052, 2.492241382598877, 2.5728774070739746]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 9.0, 5.0, 10.0, 9.0, 7.0, 10.0, 7.0, 13.0, 19.0, 26.0, 28.0, 26.0, 21.0, 35.0, 37.0, 32.0, 37.0, 41.0, 54.0, 36.0, 52.0, 39.0, 52.0, 37.0, 47.0, 34.0, 33.0, 33.0, 40.0, 28.0, 33.0, 16.0, 19.0, 13.0, 9.0, 8.0, 8.0, 8.0, 9.0, 1.0, 3.0, 3.0, 5.0, 6.0, 0.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.462100028991699, -2.384106159210205, -2.30611252784729, -2.228118658065796, -2.150125026702881, -2.0721311569213867, -1.9941374063491821, -1.9161436557769775, -1.8381497859954834, -1.7601560354232788, -1.6821622848510742, -1.60416841506958, -1.5261746644973755, -1.448180913925171, -1.3701871633529663, -1.2921934127807617, -1.2141996622085571, -1.1362059116363525, -1.058212161064148, -0.9802183508872986, -0.9022245407104492, -0.8242307901382446, -0.74623703956604, -0.6682432293891907, -0.5902494788169861, -0.5122557282447815, -0.43426191806793213, -0.35626816749572754, -0.27827438712120056, -0.20028060674667358, -0.122286856174469, -0.04429304599761963, 0.03370070457458496, 0.11169447749853134, 0.18968825042247772, 0.2676820158958435, 0.3456757962703705, 0.42366957664489746, 0.501663327217102, 0.5796571373939514, 0.657650887966156, 0.7356446385383606, 0.81363844871521, 0.8916321992874146, 0.9696259498596191, 1.0476198196411133, 1.1256134510040283, 1.2036073207855225, 1.281601071357727, 1.3595948219299316, 1.4375885725021362, 1.5155823230743408, 1.593576192855835, 1.6715699434280396, 1.7495636940002441, 1.8275575637817383, 1.9055511951446533, 1.983544945716858, 2.0615386962890625, 2.1395325660705566, 2.2175261974334717, 2.295520067214966, 2.373513698577881, 2.451507568359375, 2.529501438140869]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 11.0, 12.0, 18.0, 31.0, 56.0, 70.0, 107.0, 177.0, 347.0, 494.0, 695.0, 1046.0, 1688.0, 2536.0, 4060.0, 5982.0, 8992.0, 13389.0, 19377.0, 27498.0, 37116.0, 49323.0, 62921.0, 75430.0, 86827.0, 94393.0, 95537.0, 92263.0, 83202.0, 71584.0, 58480.0, 45214.0, 33799.0, 24213.0, 17030.0, 11763.0, 7851.0, 5216.0, 3537.0, 2285.0, 1415.0, 883.0, 641.0, 370.0, 253.0, 179.0, 79.0, 77.0, 36.0, 21.0, 14.0, 11.0, 12.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.0732421875, -1.0378570556640625, -1.002471923828125, -0.9670867919921875, -0.93170166015625, -0.8963165283203125, -0.860931396484375, -0.8255462646484375, -0.7901611328125, -0.7547760009765625, -0.719390869140625, -0.6840057373046875, -0.64862060546875, -0.6132354736328125, -0.577850341796875, -0.5424652099609375, -0.507080078125, -0.4716949462890625, -0.436309814453125, -0.4009246826171875, -0.36553955078125, -0.3301544189453125, -0.294769287109375, -0.2593841552734375, -0.2239990234375, -0.1886138916015625, -0.153228759765625, -0.1178436279296875, -0.08245849609375, -0.0470733642578125, -0.011688232421875, 0.0236968994140625, 0.05908203125, 0.0944671630859375, 0.129852294921875, 0.1652374267578125, 0.20062255859375, 0.2360076904296875, 0.271392822265625, 0.3067779541015625, 0.3421630859375, 0.3775482177734375, 0.412933349609375, 0.4483184814453125, 0.48370361328125, 0.5190887451171875, 0.554473876953125, 0.5898590087890625, 0.625244140625, 0.6606292724609375, 0.696014404296875, 0.7313995361328125, 0.76678466796875, 0.8021697998046875, 0.837554931640625, 0.8729400634765625, 0.9083251953125, 0.9437103271484375, 0.979095458984375, 1.0144805908203125, 1.04986572265625, 1.0852508544921875, 1.120635986328125, 1.1560211181640625, 1.19140625]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 3.0, 9.0, 11.0, 8.0, 7.0, 7.0, 8.0, 9.0, 17.0, 15.0, 13.0, 27.0, 24.0, 38.0, 27.0, 38.0, 36.0, 35.0, 33.0, 48.0, 44.0, 51.0, 37.0, 41.0, 39.0, 51.0, 38.0, 37.0, 38.0, 34.0, 38.0, 29.0, 23.0, 15.0, 21.0, 5.0, 12.0, 11.0, 4.0, 2.0, 4.0, 3.0, 1.0, 3.0, 2.0, 4.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.357421875, -2.278289794921875, -2.19915771484375, -2.120025634765625, -2.0408935546875, -1.961761474609375, -1.88262939453125, -1.803497314453125, -1.724365234375, -1.645233154296875, -1.56610107421875, -1.486968994140625, -1.4078369140625, -1.328704833984375, -1.24957275390625, -1.170440673828125, -1.09130859375, -1.012176513671875, -0.93304443359375, -0.853912353515625, -0.7747802734375, -0.695648193359375, -0.61651611328125, -0.537384033203125, -0.458251953125, -0.379119873046875, -0.29998779296875, -0.220855712890625, -0.1417236328125, -0.062591552734375, 0.01654052734375, 0.095672607421875, 0.1748046875, 0.253936767578125, 0.33306884765625, 0.412200927734375, 0.4913330078125, 0.570465087890625, 0.64959716796875, 0.728729248046875, 0.807861328125, 0.886993408203125, 0.96612548828125, 1.045257568359375, 1.1243896484375, 1.203521728515625, 1.28265380859375, 1.361785888671875, 1.44091796875, 1.520050048828125, 1.59918212890625, 1.678314208984375, 1.7574462890625, 1.836578369140625, 1.91571044921875, 1.994842529296875, 2.073974609375, 2.153106689453125, 2.23223876953125, 2.311370849609375, 2.3905029296875, 2.469635009765625, 2.54876708984375, 2.627899169921875, 2.70703125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 9.0, 12.0, 19.0, 32.0, 42.0, 72.0, 86.0, 146.0, 225.0, 402.0, 542.0, 925.0, 1426.0, 2160.0, 3263.0, 4983.0, 7896.0, 11668.0, 17247.0, 24929.0, 35308.0, 48266.0, 62454.0, 77760.0, 90770.0, 100214.0, 102339.0, 97189.0, 87080.0, 72814.0, 57464.0, 43173.0, 31092.0, 22068.0, 15040.0, 10234.0, 6652.0, 4347.0, 2971.0, 1853.0, 1210.0, 798.0, 547.0, 331.0, 166.0, 128.0, 96.0, 48.0, 24.0, 18.0, 11.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0], "bins": [-1.337890625, -1.2977447509765625, -1.257598876953125, -1.2174530029296875, -1.17730712890625, -1.1371612548828125, -1.097015380859375, -1.0568695068359375, -1.0167236328125, -0.9765777587890625, -0.936431884765625, -0.8962860107421875, -0.85614013671875, -0.8159942626953125, -0.775848388671875, -0.7357025146484375, -0.695556640625, -0.6554107666015625, -0.615264892578125, -0.5751190185546875, -0.53497314453125, -0.4948272705078125, -0.454681396484375, -0.4145355224609375, -0.3743896484375, -0.3342437744140625, -0.294097900390625, -0.2539520263671875, -0.21380615234375, -0.1736602783203125, -0.133514404296875, -0.0933685302734375, -0.05322265625, -0.0130767822265625, 0.027069091796875, 0.0672149658203125, 0.10736083984375, 0.1475067138671875, 0.187652587890625, 0.2277984619140625, 0.2679443359375, 0.3080902099609375, 0.348236083984375, 0.3883819580078125, 0.42852783203125, 0.4686737060546875, 0.508819580078125, 0.5489654541015625, 0.589111328125, 0.6292572021484375, 0.669403076171875, 0.7095489501953125, 0.74969482421875, 0.7898406982421875, 0.829986572265625, 0.8701324462890625, 0.9102783203125, 0.9504241943359375, 0.990570068359375, 1.0307159423828125, 1.07086181640625, 1.1110076904296875, 1.151153564453125, 1.1912994384765625, 1.2314453125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 5.0, 9.0, 8.0, 11.0, 12.0, 10.0, 13.0, 19.0, 17.0, 13.0, 23.0, 22.0, 34.0, 33.0, 43.0, 38.0, 34.0, 46.0, 39.0, 32.0, 49.0, 47.0, 40.0, 46.0, 36.0, 34.0, 45.0, 29.0, 30.0, 21.0, 27.0, 20.0, 22.0, 23.0, 11.0, 10.0, 7.0, 8.0, 8.0, 4.0, 5.0, 5.0, 4.0, 4.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.5986328125, -1.54925537109375, -1.4998779296875, -1.45050048828125, -1.401123046875, -1.35174560546875, -1.3023681640625, -1.25299072265625, -1.20361328125, -1.15423583984375, -1.1048583984375, -1.05548095703125, -1.006103515625, -0.95672607421875, -0.9073486328125, -0.85797119140625, -0.80859375, -0.75921630859375, -0.7098388671875, -0.66046142578125, -0.611083984375, -0.56170654296875, -0.5123291015625, -0.46295166015625, -0.41357421875, -0.36419677734375, -0.3148193359375, -0.26544189453125, -0.216064453125, -0.16668701171875, -0.1173095703125, -0.06793212890625, -0.0185546875, 0.03082275390625, 0.0802001953125, 0.12957763671875, 0.178955078125, 0.22833251953125, 0.2777099609375, 0.32708740234375, 0.37646484375, 0.42584228515625, 0.4752197265625, 0.52459716796875, 0.573974609375, 0.62335205078125, 0.6727294921875, 0.72210693359375, 0.771484375, 0.82086181640625, 0.8702392578125, 0.91961669921875, 0.968994140625, 1.01837158203125, 1.0677490234375, 1.11712646484375, 1.16650390625, 1.21588134765625, 1.2652587890625, 1.31463623046875, 1.364013671875, 1.41339111328125, 1.4627685546875, 1.51214599609375, 1.5615234375]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 7.0, 16.0, 18.0, 19.0, 33.0, 44.0, 87.0, 167.0, 276.0, 428.0, 757.0, 1303.0, 2246.0, 3873.0, 6251.0, 10489.0, 16995.0, 26249.0, 39208.0, 56205.0, 76058.0, 95131.0, 110692.0, 117557.0, 113668.0, 100836.0, 82823.0, 62471.0, 44406.0, 30177.0, 19493.0, 12201.0, 7432.0, 4494.0, 2623.0, 1552.0, 935.0, 563.0, 325.0, 198.0, 101.0, 64.0, 39.0, 25.0, 12.0, 6.0, 4.0, 7.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.580078125, -0.5633430480957031, -0.5466079711914062, -0.5298728942871094, -0.5131378173828125, -0.4964027404785156, -0.47966766357421875, -0.4629325866699219, -0.446197509765625, -0.4294624328613281, -0.41272735595703125, -0.3959922790527344, -0.3792572021484375, -0.3625221252441406, -0.34578704833984375, -0.3290519714355469, -0.31231689453125, -0.2955818176269531, -0.27884674072265625, -0.2621116638183594, -0.2453765869140625, -0.22864151000976562, -0.21190643310546875, -0.19517135620117188, -0.178436279296875, -0.16170120239257812, -0.14496612548828125, -0.12823104858398438, -0.1114959716796875, -0.09476089477539062, -0.07802581787109375, -0.061290740966796875, -0.0445556640625, -0.027820587158203125, -0.01108551025390625, 0.005649566650390625, 0.0223846435546875, 0.039119720458984375, 0.05585479736328125, 0.07258987426757812, 0.089324951171875, 0.10606002807617188, 0.12279510498046875, 0.13953018188476562, 0.1562652587890625, 0.17300033569335938, 0.18973541259765625, 0.20647048950195312, 0.22320556640625, 0.23994064331054688, 0.25667572021484375, 0.2734107971191406, 0.2901458740234375, 0.3068809509277344, 0.32361602783203125, 0.3403511047363281, 0.357086181640625, 0.3738212585449219, 0.39055633544921875, 0.4072914123535156, 0.4240264892578125, 0.4407615661621094, 0.45749664306640625, 0.4742317199707031, 0.490966796875]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 6.0, 6.0, 5.0, 9.0, 10.0, 17.0, 22.0, 19.0, 28.0, 33.0, 36.0, 40.0, 58.0, 57.0, 47.0, 52.0, 69.0, 79.0, 52.0, 62.0, 43.0, 53.0, 41.0, 28.0, 27.0, 30.0, 19.0, 15.0, 8.0, 8.0, 9.0, 9.0, 2.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.03795051574707e-05, -5.781091749668121e-05, -5.5242329835891724e-05, -5.2673742175102234e-05, -5.0105154514312744e-05, -4.7536566853523254e-05, -4.4967979192733765e-05, -4.2399391531944275e-05, -3.9830803871154785e-05, -3.7262216210365295e-05, -3.4693628549575806e-05, -3.2125040888786316e-05, -2.9556453227996826e-05, -2.6987865567207336e-05, -2.4419277906417847e-05, -2.1850690245628357e-05, -1.9282102584838867e-05, -1.6713514924049377e-05, -1.4144927263259888e-05, -1.1576339602470398e-05, -9.007751941680908e-06, -6.4391642808914185e-06, -3.870576620101929e-06, -1.301988959312439e-06, 1.2665987014770508e-06, 3.8351863622665405e-06, 6.40377402305603e-06, 8.97236168384552e-06, 1.154094934463501e-05, 1.41095370054245e-05, 1.667812466621399e-05, 1.924671232700348e-05, 2.181529998779297e-05, 2.438388764858246e-05, 2.6952475309371948e-05, 2.9521062970161438e-05, 3.208965063095093e-05, 3.465823829174042e-05, 3.722682595252991e-05, 3.97954136133194e-05, 4.236400127410889e-05, 4.4932588934898376e-05, 4.7501176595687866e-05, 5.0069764256477356e-05, 5.2638351917266846e-05, 5.5206939578056335e-05, 5.7775527238845825e-05, 6.0344114899635315e-05, 6.29127025604248e-05, 6.54812902212143e-05, 6.804987788200378e-05, 7.061846554279327e-05, 7.318705320358276e-05, 7.575564086437225e-05, 7.832422852516174e-05, 8.089281618595123e-05, 8.346140384674072e-05, 8.602999150753021e-05, 8.85985791683197e-05, 9.116716682910919e-05, 9.373575448989868e-05, 9.630434215068817e-05, 9.887292981147766e-05, 0.00010144151747226715, 0.00010401010513305664]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 5.0, 13.0, 15.0, 36.0, 75.0, 123.0, 188.0, 287.0, 530.0, 780.0, 1309.0, 2141.0, 3291.0, 5287.0, 8271.0, 12763.0, 19508.0, 28187.0, 39833.0, 54419.0, 70094.0, 85083.0, 97262.0, 104512.0, 103647.0, 95727.0, 82374.0, 66697.0, 51307.0, 37669.0, 26429.0, 17824.0, 12012.0, 7701.0, 4984.0, 3167.0, 1940.0, 1176.0, 739.0, 466.0, 279.0, 171.0, 93.0, 58.0, 32.0, 21.0, 12.0, 9.0, 5.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.5126953125, -0.4966278076171875, -0.480560302734375, -0.4644927978515625, -0.44842529296875, -0.4323577880859375, -0.416290283203125, -0.4002227783203125, -0.3841552734375, -0.3680877685546875, -0.352020263671875, -0.3359527587890625, -0.31988525390625, -0.3038177490234375, -0.287750244140625, -0.2716827392578125, -0.255615234375, -0.2395477294921875, -0.223480224609375, -0.2074127197265625, -0.19134521484375, -0.1752777099609375, -0.159210205078125, -0.1431427001953125, -0.1270751953125, -0.1110076904296875, -0.094940185546875, -0.0788726806640625, -0.06280517578125, -0.0467376708984375, -0.030670166015625, -0.0146026611328125, 0.00146484375, 0.0175323486328125, 0.033599853515625, 0.0496673583984375, 0.06573486328125, 0.0818023681640625, 0.097869873046875, 0.1139373779296875, 0.1300048828125, 0.1460723876953125, 0.162139892578125, 0.1782073974609375, 0.19427490234375, 0.2103424072265625, 0.226409912109375, 0.2424774169921875, 0.258544921875, 0.2746124267578125, 0.290679931640625, 0.3067474365234375, 0.32281494140625, 0.3388824462890625, 0.354949951171875, 0.3710174560546875, 0.3870849609375, 0.4031524658203125, 0.419219970703125, 0.4352874755859375, 0.45135498046875, 0.4674224853515625, 0.483489990234375, 0.4995574951171875, 0.515625]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 9.0, 3.0, 12.0, 19.0, 18.0, 21.0, 21.0, 28.0, 33.0, 37.0, 45.0, 59.0, 63.0, 52.0, 48.0, 42.0, 51.0, 39.0, 48.0, 47.0, 40.0, 55.0, 34.0, 38.0, 31.0, 15.0, 22.0, 13.0, 8.0, 13.0, 13.0, 5.0, 2.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.2978515625, -0.2892417907714844, -0.28063201904296875, -0.2720222473144531, -0.2634124755859375, -0.2548027038574219, -0.24619293212890625, -0.23758316040039062, -0.228973388671875, -0.22036361694335938, -0.21175384521484375, -0.20314407348632812, -0.1945343017578125, -0.18592453002929688, -0.17731475830078125, -0.16870498657226562, -0.16009521484375, -0.15148544311523438, -0.14287567138671875, -0.13426589965820312, -0.1256561279296875, -0.11704635620117188, -0.10843658447265625, -0.09982681274414062, -0.091217041015625, -0.08260726928710938, -0.07399749755859375, -0.06538772583007812, -0.0567779541015625, -0.048168182373046875, -0.03955841064453125, -0.030948638916015625, -0.0223388671875, -0.013729095458984375, -0.00511932373046875, 0.003490447998046875, 0.0121002197265625, 0.020709991455078125, 0.02931976318359375, 0.037929534912109375, 0.046539306640625, 0.055149078369140625, 0.06375885009765625, 0.07236862182617188, 0.0809783935546875, 0.08958816528320312, 0.09819793701171875, 0.10680770874023438, 0.11541748046875, 0.12402725219726562, 0.13263702392578125, 0.14124679565429688, 0.1498565673828125, 0.15846633911132812, 0.16707611083984375, 0.17568588256835938, 0.184295654296875, 0.19290542602539062, 0.20151519775390625, 0.21012496948242188, 0.2187347412109375, 0.22734451293945312, 0.23595428466796875, 0.24456405639648438, 0.253173828125]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 6.0, 8.0, 7.0, 8.0, 14.0, 19.0, 22.0, 23.0, 26.0, 27.0, 27.0, 31.0, 37.0, 43.0, 44.0, 49.0, 57.0, 47.0, 38.0, 54.0, 50.0, 41.0, 35.0, 43.0, 37.0, 28.0, 32.0, 38.0, 26.0, 17.0, 13.0, 15.0, 10.0, 6.0, 6.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.377398729324341, -2.3006482124328613, -2.223897695541382, -2.1471471786499023, -2.0703964233398438, -1.9936460256576538, -1.9168953895568848, -1.8401448726654053, -1.7633943557739258, -1.6866438388824463, -1.6098933219909668, -1.5331426858901978, -1.4563921689987183, -1.3796416521072388, -1.3028910160064697, -1.2261404991149902, -1.1493899822235107, -1.0726394653320312, -0.995888888835907, -0.9191383123397827, -0.8423877954483032, -0.7656372785568237, -0.6888867020606995, -0.6121361255645752, -0.5353856086730957, -0.4586350619792938, -0.38188451528549194, -0.30513396859169006, -0.22838342189788818, -0.1516328752040863, -0.07488232851028442, 0.0018682479858398438, 0.07861900329589844, 0.15536954998970032, 0.2321200966835022, 0.3088706433773041, 0.38562119007110596, 0.46237173676490784, 0.5391222834587097, 0.615872859954834, 0.6926233768463135, 0.769373893737793, 0.8461244702339172, 0.9228750467300415, 0.999625563621521, 1.0763760805130005, 1.1531267166137695, 1.229877233505249, 1.3066277503967285, 1.383378267288208, 1.4601287841796875, 1.5368794202804565, 1.613629937171936, 1.6903804540634155, 1.7671310901641846, 1.843881607055664, 1.9206321239471436, 1.997382640838623, 2.0741331577301025, 2.150883674621582, 2.2276344299316406, 2.30438494682312, 2.3811354637145996, 2.457885980606079, 2.5346364974975586]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 2.0, 4.0, 3.0, 4.0, 7.0, 9.0, 8.0, 10.0, 18.0, 23.0, 14.0, 21.0, 29.0, 24.0, 40.0, 31.0, 36.0, 37.0, 41.0, 42.0, 29.0, 52.0, 48.0, 49.0, 49.0, 41.0, 43.0, 34.0, 46.0, 33.0, 26.0, 26.0, 24.0, 15.0, 12.0, 19.0, 5.0, 5.0, 6.0, 7.0, 12.0, 4.0, 5.0, 1.0, 3.0, 0.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.768204689025879, -2.6827192306518555, -2.597234010696411, -2.5117485523223877, -2.4262630939483643, -2.34077787399292, -2.2552924156188965, -2.169806957244873, -2.0843214988708496, -1.9988361597061157, -1.9133507013320923, -1.8278653621673584, -1.742379903793335, -1.656894564628601, -1.5714092254638672, -1.4859237670898438, -1.4004385471343994, -1.3149532079696655, -1.229467749595642, -1.1439824104309082, -1.0584969520568848, -0.9730116128921509, -0.887526273727417, -0.8020408749580383, -0.7165554761886597, -0.631070077419281, -0.5455846786499023, -0.46009933948516846, -0.3746139407157898, -0.28912854194641113, -0.20364320278167725, -0.11815780401229858, -0.03267264366149902, 0.052812740206718445, 0.1382981240749359, 0.2237834930419922, 0.30926889181137085, 0.3947542905807495, 0.4802396297454834, 0.5657250285148621, 0.6512104272842407, 0.7366958260536194, 0.822181224822998, 0.9076665639877319, 0.9931519627571106, 1.0786373615264893, 1.1641227006912231, 1.249608039855957, 1.3350934982299805, 1.4205788373947144, 1.5060642957687378, 1.5915496349334717, 1.6770350933074951, 1.762520432472229, 1.848005771636963, 1.9334912300109863, 2.0189766883850098, 2.104462146759033, 2.1899473667144775, 2.275432825088501, 2.3609182834625244, 2.4464035034179688, 2.531888961791992, 2.6173744201660156, 2.70285964012146]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 6.0, 8.0, 11.0, 18.0, 34.0, 48.0, 59.0, 113.0, 200.0, 267.0, 451.0, 726.0, 1246.0, 1940.0, 3334.0, 5459.0, 9218.0, 15644.0, 26806.0, 45980.0, 78738.0, 133646.0, 223951.0, 350797.0, 498537.0, 611238.0, 627329.0, 537251.0, 390915.0, 254375.0, 154449.0, 91114.0, 53324.0, 31136.0, 18245.0, 10755.0, 6514.0, 3928.0, 2387.0, 1504.0, 915.0, 613.0, 374.0, 251.0, 138.0, 105.0, 66.0, 46.0, 30.0, 17.0, 10.0, 7.0, 5.0, 5.0, 3.0, 4.0, 1.0, 0.0, 3.0, 0.0, 2.0], "bins": [-1.736328125, -1.6767578125, -1.6171875, -1.5576171875, -1.498046875, -1.4384765625, -1.37890625, -1.3193359375, -1.259765625, -1.2001953125, -1.140625, -1.0810546875, -1.021484375, -0.9619140625, -0.90234375, -0.8427734375, -0.783203125, -0.7236328125, -0.6640625, -0.6044921875, -0.544921875, -0.4853515625, -0.42578125, -0.3662109375, -0.306640625, -0.2470703125, -0.1875, -0.1279296875, -0.068359375, -0.0087890625, 0.05078125, 0.1103515625, 0.169921875, 0.2294921875, 0.2890625, 0.3486328125, 0.408203125, 0.4677734375, 0.52734375, 0.5869140625, 0.646484375, 0.7060546875, 0.765625, 0.8251953125, 0.884765625, 0.9443359375, 1.00390625, 1.0634765625, 1.123046875, 1.1826171875, 1.2421875, 1.3017578125, 1.361328125, 1.4208984375, 1.48046875, 1.5400390625, 1.599609375, 1.6591796875, 1.71875, 1.7783203125, 1.837890625, 1.8974609375, 1.95703125, 2.0166015625, 2.076171875]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 6.0, 3.0, 3.0, 4.0, 12.0, 11.0, 12.0, 16.0, 18.0, 14.0, 9.0, 31.0, 23.0, 36.0, 36.0, 35.0, 39.0, 45.0, 48.0, 46.0, 39.0, 58.0, 34.0, 52.0, 52.0, 47.0, 43.0, 24.0, 31.0, 35.0, 25.0, 17.0, 18.0, 18.0, 9.0, 9.0, 13.0, 7.0, 12.0, 1.0, 5.0, 1.0, 3.0, 8.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0], "bins": [-2.845703125, -2.765289306640625, -2.68487548828125, -2.604461669921875, -2.5240478515625, -2.443634033203125, -2.36322021484375, -2.282806396484375, -2.202392578125, -2.121978759765625, -2.04156494140625, -1.961151123046875, -1.8807373046875, -1.800323486328125, -1.71990966796875, -1.639495849609375, -1.55908203125, -1.478668212890625, -1.39825439453125, -1.317840576171875, -1.2374267578125, -1.157012939453125, -1.07659912109375, -0.996185302734375, -0.915771484375, -0.835357666015625, -0.75494384765625, -0.674530029296875, -0.5941162109375, -0.513702392578125, -0.43328857421875, -0.352874755859375, -0.2724609375, -0.192047119140625, -0.11163330078125, -0.031219482421875, 0.0491943359375, 0.129608154296875, 0.21002197265625, 0.290435791015625, 0.370849609375, 0.451263427734375, 0.53167724609375, 0.612091064453125, 0.6925048828125, 0.772918701171875, 0.85333251953125, 0.933746337890625, 1.01416015625, 1.094573974609375, 1.17498779296875, 1.255401611328125, 1.3358154296875, 1.416229248046875, 1.49664306640625, 1.577056884765625, 1.657470703125, 1.737884521484375, 1.81829833984375, 1.898712158203125, 1.9791259765625, 2.059539794921875, 2.13995361328125, 2.220367431640625, 2.30078125]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 4.0, 10.0, 15.0, 14.0, 15.0, 28.0, 70.0, 90.0, 161.0, 228.0, 425.0, 694.0, 1121.0, 1963.0, 3307.0, 5553.0, 9145.0, 15408.0, 26019.0, 44149.0, 72535.0, 118390.0, 185470.0, 281233.0, 397337.0, 504526.0, 565457.0, 545822.0, 454883.0, 340855.0, 232785.0, 150476.0, 93752.0, 57194.0, 34482.0, 20620.0, 12161.0, 7147.0, 4364.0, 2558.0, 1541.0, 924.0, 554.0, 302.0, 198.0, 112.0, 75.0, 50.0, 28.0, 19.0, 16.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9677734375, -1.9016571044921875, -1.835540771484375, -1.7694244384765625, -1.70330810546875, -1.6371917724609375, -1.571075439453125, -1.5049591064453125, -1.4388427734375, -1.3727264404296875, -1.306610107421875, -1.2404937744140625, -1.17437744140625, -1.1082611083984375, -1.042144775390625, -0.9760284423828125, -0.909912109375, -0.8437957763671875, -0.777679443359375, -0.7115631103515625, -0.64544677734375, -0.5793304443359375, -0.513214111328125, -0.4470977783203125, -0.3809814453125, -0.3148651123046875, -0.248748779296875, -0.1826324462890625, -0.11651611328125, -0.0503997802734375, 0.015716552734375, 0.0818328857421875, 0.14794921875, 0.2140655517578125, 0.280181884765625, 0.3462982177734375, 0.41241455078125, 0.4785308837890625, 0.544647216796875, 0.6107635498046875, 0.6768798828125, 0.7429962158203125, 0.809112548828125, 0.8752288818359375, 0.94134521484375, 1.0074615478515625, 1.073577880859375, 1.1396942138671875, 1.205810546875, 1.2719268798828125, 1.338043212890625, 1.4041595458984375, 1.47027587890625, 1.5363922119140625, 1.602508544921875, 1.6686248779296875, 1.7347412109375, 1.8008575439453125, 1.866973876953125, 1.9330902099609375, 1.99920654296875, 2.0653228759765625, 2.131439208984375, 2.1975555419921875, 2.263671875]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 8.0, 7.0, 12.0, 15.0, 18.0, 27.0, 19.0, 41.0, 41.0, 59.0, 88.0, 93.0, 109.0, 143.0, 147.0, 160.0, 208.0, 188.0, 227.0, 201.0, 276.0, 237.0, 201.0, 198.0, 214.0, 187.0, 150.0, 149.0, 115.0, 114.0, 96.0, 88.0, 58.0, 48.0, 36.0, 19.0, 25.0, 17.0, 12.0, 8.0, 5.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.1328125, -1.099609375, -1.06640625, -1.033203125, -1.0, -0.966796875, -0.93359375, -0.900390625, -0.8671875, -0.833984375, -0.80078125, -0.767578125, -0.734375, -0.701171875, -0.66796875, -0.634765625, -0.6015625, -0.568359375, -0.53515625, -0.501953125, -0.46875, -0.435546875, -0.40234375, -0.369140625, -0.3359375, -0.302734375, -0.26953125, -0.236328125, -0.203125, -0.169921875, -0.13671875, -0.103515625, -0.0703125, -0.037109375, -0.00390625, 0.029296875, 0.0625, 0.095703125, 0.12890625, 0.162109375, 0.1953125, 0.228515625, 0.26171875, 0.294921875, 0.328125, 0.361328125, 0.39453125, 0.427734375, 0.4609375, 0.494140625, 0.52734375, 0.560546875, 0.59375, 0.626953125, 0.66015625, 0.693359375, 0.7265625, 0.759765625, 0.79296875, 0.826171875, 0.859375, 0.892578125, 0.92578125, 0.958984375, 0.9921875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 5.0, 7.0, 5.0, 5.0, 7.0, 5.0, 14.0, 21.0, 17.0, 17.0, 20.0, 26.0, 35.0, 34.0, 44.0, 46.0, 41.0, 38.0, 50.0, 40.0, 60.0, 40.0, 46.0, 53.0, 49.0, 45.0, 30.0, 33.0, 28.0, 22.0, 23.0, 26.0, 18.0, 12.0, 10.0, 12.0, 6.0, 2.0, 4.0, 4.0, 3.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.924391269683838, -2.841459035873413, -2.7585268020629883, -2.6755948066711426, -2.5926625728607178, -2.509730339050293, -2.426798105239868, -2.3438658714294434, -2.2609338760375977, -2.178001642227173, -2.095069408416748, -2.0121374130249023, -1.9292051792144775, -1.8462729454040527, -1.763340711593628, -1.6804084777832031, -1.5974762439727783, -1.5145440101623535, -1.4316118955612183, -1.3486796617507935, -1.2657475471496582, -1.1828153133392334, -1.0998830795288086, -1.0169508457183838, -0.9340187311172485, -0.8510865569114685, -0.7681543827056885, -0.6852221488952637, -0.6022899746894836, -0.5193578004837036, -0.4364255964756012, -0.3534933924674988, -0.27056145668029785, -0.18762926757335663, -0.1046970784664154, -0.021764889359474182, 0.06116729974746704, 0.14409947395324707, 0.2270316779613495, 0.3099638819694519, 0.39289605617523193, 0.47582823038101196, 0.558760404586792, 0.6416926383972168, 0.7246248126029968, 0.8075569868087769, 0.8904892206192017, 0.9734213948249817, 1.0563535690307617, 1.1392858028411865, 1.2222179174423218, 1.3051501512527466, 1.3880822658538818, 1.4710144996643066, 1.5539467334747314, 1.6368789672851562, 1.7198110818862915, 1.8027433156967163, 1.8856754302978516, 1.9686076641082764, 2.051539897918701, 2.134471893310547, 2.2174041271209717, 2.3003363609313965, 2.3832685947418213]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 2.0, 5.0, 4.0, 5.0, 11.0, 17.0, 14.0, 17.0, 15.0, 18.0, 20.0, 25.0, 29.0, 21.0, 32.0, 25.0, 37.0, 55.0, 42.0, 46.0, 44.0, 42.0, 38.0, 55.0, 54.0, 40.0, 26.0, 38.0, 38.0, 32.0, 22.0, 17.0, 20.0, 10.0, 17.0, 17.0, 15.0, 7.0, 6.0, 7.0, 8.0, 5.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.689835548400879, -2.6031672954559326, -2.5164992809295654, -2.429831027984619, -2.343163013458252, -2.2564947605133057, -2.1698265075683594, -2.083158493041992, -1.996490240097046, -1.9098221063613892, -1.8231539726257324, -1.7364857196807861, -1.6498175859451294, -1.5631494522094727, -1.4764811992645264, -1.3898130655288696, -1.303144931793213, -1.2164767980575562, -1.1298086643218994, -1.0431404113769531, -0.9564722776412964, -0.8698041439056396, -0.7831359505653381, -0.6964677572250366, -0.6097996234893799, -0.5231314897537231, -0.43646329641342163, -0.3497951328754425, -0.2631269693374634, -0.17645880579948425, -0.08979064226150513, -0.0031224489212036133, 0.08354544639587402, 0.17021360993385315, 0.2568817734718323, 0.3435499370098114, 0.4302181005477905, 0.5168862342834473, 0.6035544276237488, 0.6902226209640503, 0.776890754699707, 0.8635588884353638, 0.9502270817756653, 1.0368952751159668, 1.1235634088516235, 1.2102315425872803, 1.2968997955322266, 1.3835679292678833, 1.47023606300354, 1.5569041967391968, 1.6435723304748535, 1.7302405834197998, 1.8169087171554565, 1.9035768508911133, 1.9902451038360596, 2.076913356781006, 2.163581371307373, 2.2502496242523193, 2.3369176387786865, 2.423585891723633, 2.51025390625, 2.5969221591949463, 2.6835904121398926, 2.7702584266662598, 2.856926679611206]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 8.0, 5.0, 4.0, 10.0, 9.0, 27.0, 27.0, 55.0, 52.0, 73.0, 101.0, 187.0, 248.0, 359.0, 533.0, 797.0, 1118.0, 1694.0, 2513.0, 3865.0, 5760.0, 8915.0, 13897.0, 21337.0, 32955.0, 49867.0, 72580.0, 99925.0, 124565.0, 135828.0, 128890.0, 105648.0, 78376.0, 54610.0, 36179.0, 23620.0, 15110.0, 9926.0, 6339.0, 4171.0, 2715.0, 1787.0, 1184.0, 850.0, 566.0, 401.0, 246.0, 218.0, 129.0, 96.0, 61.0, 51.0, 37.0, 16.0, 11.0, 7.0, 5.0, 3.0, 4.0], "bins": [-0.331787109375, -0.3222007751464844, -0.31261444091796875, -0.3030281066894531, -0.2934417724609375, -0.2838554382324219, -0.27426910400390625, -0.2646827697753906, -0.255096435546875, -0.24551010131835938, -0.23592376708984375, -0.22633743286132812, -0.2167510986328125, -0.20716476440429688, -0.19757843017578125, -0.18799209594726562, -0.17840576171875, -0.16881942749023438, -0.15923309326171875, -0.14964675903320312, -0.1400604248046875, -0.13047409057617188, -0.12088775634765625, -0.11130142211914062, -0.101715087890625, -0.09212875366210938, -0.08254241943359375, -0.07295608520507812, -0.0633697509765625, -0.053783416748046875, -0.04419708251953125, -0.034610748291015625, -0.0250244140625, -0.015438079833984375, -0.00585174560546875, 0.003734588623046875, 0.0133209228515625, 0.022907257080078125, 0.03249359130859375, 0.042079925537109375, 0.051666259765625, 0.061252593994140625, 0.07083892822265625, 0.08042526245117188, 0.0900115966796875, 0.09959793090820312, 0.10918426513671875, 0.11877059936523438, 0.12835693359375, 0.13794326782226562, 0.14752960205078125, 0.15711593627929688, 0.1667022705078125, 0.17628860473632812, 0.18587493896484375, 0.19546127319335938, 0.205047607421875, 0.21463394165039062, 0.22422027587890625, 0.23380661010742188, 0.2433929443359375, 0.2529792785644531, 0.26256561279296875, 0.2721519470214844, 0.28173828125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 7.0, 0.0, 2.0, 2.0, 13.0, 6.0, 8.0, 9.0, 12.0, 15.0, 17.0, 31.0, 19.0, 34.0, 21.0, 34.0, 39.0, 35.0, 45.0, 50.0, 41.0, 51.0, 41.0, 60.0, 40.0, 55.0, 46.0, 35.0, 41.0, 30.0, 31.0, 21.0, 23.0, 21.0, 8.0, 13.0, 9.0, 11.0, 7.0, 11.0, 6.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.94140625, -2.84454345703125, -2.7476806640625, -2.65081787109375, -2.553955078125, -2.45709228515625, -2.3602294921875, -2.26336669921875, -2.16650390625, -2.06964111328125, -1.9727783203125, -1.87591552734375, -1.779052734375, -1.68218994140625, -1.5853271484375, -1.48846435546875, -1.3916015625, -1.29473876953125, -1.1978759765625, -1.10101318359375, -1.004150390625, -0.90728759765625, -0.8104248046875, -0.71356201171875, -0.61669921875, -0.51983642578125, -0.4229736328125, -0.32611083984375, -0.229248046875, -0.13238525390625, -0.0355224609375, 0.06134033203125, 0.158203125, 0.25506591796875, 0.3519287109375, 0.44879150390625, 0.545654296875, 0.64251708984375, 0.7393798828125, 0.83624267578125, 0.93310546875, 1.02996826171875, 1.1268310546875, 1.22369384765625, 1.320556640625, 1.41741943359375, 1.5142822265625, 1.61114501953125, 1.7080078125, 1.80487060546875, 1.9017333984375, 1.99859619140625, 2.095458984375, 2.19232177734375, 2.2891845703125, 2.38604736328125, 2.48291015625, 2.57977294921875, 2.6766357421875, 2.77349853515625, 2.870361328125, 2.96722412109375, 3.0640869140625, 3.16094970703125, 3.2578125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 4.0, 6.0, 7.0, 13.0, 15.0, 17.0, 25.0, 39.0, 61.0, 123.0, 208.0, 339.0, 470.0, 855.0, 1471.0, 2827.0, 5179.0, 9802.0, 19655.0, 52126.0, 715498.0, 180547.0, 29305.0, 13924.0, 7229.0, 3719.0, 2130.0, 1220.0, 656.0, 404.0, 227.0, 144.0, 117.0, 56.0, 42.0, 29.0, 19.0, 11.0, 9.0, 8.0, 6.0, 2.0, 5.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0556640625, -1.024383544921875, -0.99310302734375, -0.961822509765625, -0.9305419921875, -0.899261474609375, -0.86798095703125, -0.836700439453125, -0.805419921875, -0.774139404296875, -0.74285888671875, -0.711578369140625, -0.6802978515625, -0.649017333984375, -0.61773681640625, -0.586456298828125, -0.55517578125, -0.523895263671875, -0.49261474609375, -0.461334228515625, -0.4300537109375, -0.398773193359375, -0.36749267578125, -0.336212158203125, -0.304931640625, -0.273651123046875, -0.24237060546875, -0.211090087890625, -0.1798095703125, -0.148529052734375, -0.11724853515625, -0.085968017578125, -0.0546875, -0.023406982421875, 0.00787353515625, 0.039154052734375, 0.0704345703125, 0.101715087890625, 0.13299560546875, 0.164276123046875, 0.195556640625, 0.226837158203125, 0.25811767578125, 0.289398193359375, 0.3206787109375, 0.351959228515625, 0.38323974609375, 0.414520263671875, 0.44580078125, 0.477081298828125, 0.50836181640625, 0.539642333984375, 0.5709228515625, 0.602203369140625, 0.63348388671875, 0.664764404296875, 0.696044921875, 0.727325439453125, 0.75860595703125, 0.789886474609375, 0.8211669921875, 0.852447509765625, 0.88372802734375, 0.915008544921875, 0.9462890625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 3.0, 5.0, 9.0, 5.0, 15.0, 11.0, 12.0, 10.0, 8.0, 20.0, 23.0, 16.0, 26.0, 23.0, 24.0, 34.0, 27.0, 33.0, 43.0, 36.0, 30.0, 27.0, 32.0, 39.0, 33.0, 42.0, 38.0, 36.0, 32.0, 37.0, 27.0, 34.0, 29.0, 22.0, 20.0, 22.0, 21.0, 16.0, 12.0, 11.0, 10.0, 20.0, 4.0, 4.0, 3.0, 7.0, 7.0, 3.0, 7.0, 2.0, 2.0, 2.0], "bins": [-1.8525390625, -1.800628662109375, -1.74871826171875, -1.696807861328125, -1.6448974609375, -1.592987060546875, -1.54107666015625, -1.489166259765625, -1.437255859375, -1.385345458984375, -1.33343505859375, -1.281524658203125, -1.2296142578125, -1.177703857421875, -1.12579345703125, -1.073883056640625, -1.02197265625, -0.970062255859375, -0.91815185546875, -0.866241455078125, -0.8143310546875, -0.762420654296875, -0.71051025390625, -0.658599853515625, -0.606689453125, -0.554779052734375, -0.50286865234375, -0.450958251953125, -0.3990478515625, -0.347137451171875, -0.29522705078125, -0.243316650390625, -0.19140625, -0.139495849609375, -0.08758544921875, -0.035675048828125, 0.0162353515625, 0.068145751953125, 0.12005615234375, 0.171966552734375, 0.223876953125, 0.275787353515625, 0.32769775390625, 0.379608154296875, 0.4315185546875, 0.483428955078125, 0.53533935546875, 0.587249755859375, 0.63916015625, 0.691070556640625, 0.74298095703125, 0.794891357421875, 0.8468017578125, 0.898712158203125, 0.95062255859375, 1.002532958984375, 1.054443359375, 1.106353759765625, 1.15826416015625, 1.210174560546875, 1.2620849609375, 1.313995361328125, 1.36590576171875, 1.417816162109375, 1.4697265625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 7.0, 7.0, 12.0, 8.0, 13.0, 26.0, 24.0, 42.0, 61.0, 97.0, 115.0, 201.0, 289.0, 507.0, 691.0, 1169.0, 1787.0, 3109.0, 5297.0, 8797.0, 15071.0, 26969.0, 125031.0, 758774.0, 48354.0, 21676.0, 12167.0, 7100.0, 4314.0, 2595.0, 1499.0, 984.0, 577.0, 384.0, 257.0, 174.0, 99.0, 79.0, 45.0, 42.0, 29.0, 25.0, 15.0, 14.0, 11.0, 4.0, 5.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.10675048828125, -0.103546142578125, -0.100341796875, -0.097137451171875, -0.09393310546875, -0.090728759765625, -0.0875244140625, -0.084320068359375, -0.08111572265625, -0.077911376953125, -0.07470703125, -0.071502685546875, -0.06829833984375, -0.065093994140625, -0.0618896484375, -0.058685302734375, -0.05548095703125, -0.052276611328125, -0.049072265625, -0.045867919921875, -0.04266357421875, -0.039459228515625, -0.0362548828125, -0.033050537109375, -0.02984619140625, -0.026641845703125, -0.0234375, -0.020233154296875, -0.01702880859375, -0.013824462890625, -0.0106201171875, -0.007415771484375, -0.00421142578125, -0.001007080078125, 0.002197265625, 0.005401611328125, 0.00860595703125, 0.011810302734375, 0.0150146484375, 0.018218994140625, 0.02142333984375, 0.024627685546875, 0.02783203125, 0.031036376953125, 0.03424072265625, 0.037445068359375, 0.0406494140625, 0.043853759765625, 0.04705810546875, 0.050262451171875, 0.053466796875, 0.056671142578125, 0.05987548828125, 0.063079833984375, 0.0662841796875, 0.069488525390625, 0.07269287109375, 0.075897216796875, 0.0791015625, 0.082305908203125, 0.08551025390625, 0.088714599609375, 0.0919189453125, 0.095123291015625, 0.09832763671875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 3.0, 3.0, 5.0, 6.0, 5.0, 9.0, 15.0, 12.0, 15.0, 16.0, 34.0, 32.0, 30.0, 27.0, 28.0, 43.0, 37.0, 29.0, 35.0, 47.0, 37.0, 39.0, 42.0, 35.0, 42.0, 43.0, 38.0, 35.0, 35.0, 41.0, 29.0, 23.0, 23.0, 21.0, 16.0, 15.0, 16.0, 10.0, 9.0, 8.0, 6.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.7220458984375e-06, -5.543231964111328e-06, -5.364418029785156e-06, -5.185604095458984e-06, -5.0067901611328125e-06, -4.827976226806641e-06, -4.649162292480469e-06, -4.470348358154297e-06, -4.291534423828125e-06, -4.112720489501953e-06, -3.933906555175781e-06, -3.7550926208496094e-06, -3.5762786865234375e-06, -3.3974647521972656e-06, -3.2186508178710938e-06, -3.039836883544922e-06, -2.86102294921875e-06, -2.682209014892578e-06, -2.5033950805664062e-06, -2.3245811462402344e-06, -2.1457672119140625e-06, -1.9669532775878906e-06, -1.7881393432617188e-06, -1.6093254089355469e-06, -1.430511474609375e-06, -1.2516975402832031e-06, -1.0728836059570312e-06, -8.940696716308594e-07, -7.152557373046875e-07, -5.364418029785156e-07, -3.5762786865234375e-07, -1.7881393432617188e-07, 0.0, 1.7881393432617188e-07, 3.5762786865234375e-07, 5.364418029785156e-07, 7.152557373046875e-07, 8.940696716308594e-07, 1.0728836059570312e-06, 1.2516975402832031e-06, 1.430511474609375e-06, 1.6093254089355469e-06, 1.7881393432617188e-06, 1.9669532775878906e-06, 2.1457672119140625e-06, 2.3245811462402344e-06, 2.5033950805664062e-06, 2.682209014892578e-06, 2.86102294921875e-06, 3.039836883544922e-06, 3.2186508178710938e-06, 3.3974647521972656e-06, 3.5762786865234375e-06, 3.7550926208496094e-06, 3.933906555175781e-06, 4.112720489501953e-06, 4.291534423828125e-06, 4.470348358154297e-06, 4.649162292480469e-06, 4.827976226806641e-06, 5.0067901611328125e-06, 5.185604095458984e-06, 5.364418029785156e-06, 5.543231964111328e-06, 5.7220458984375e-06]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 6.0, 15.0, 11.0, 23.0, 33.0, 37.0, 71.0, 128.0, 214.0, 296.0, 498.0, 898.0, 1627.0, 2845.0, 5217.0, 9441.0, 16735.0, 29566.0, 51537.0, 88367.0, 141122.0, 191110.0, 184378.0, 132696.0, 81985.0, 47574.0, 26994.0, 15383.0, 8552.0, 4817.0, 2742.0, 1554.0, 869.0, 481.0, 291.0, 163.0, 91.0, 62.0, 55.0, 25.0, 12.0, 11.0, 10.0, 6.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.09686279296875, -0.09362602233886719, -0.09038925170898438, -0.08715248107910156, -0.08391571044921875, -0.08067893981933594, -0.07744216918945312, -0.07420539855957031, -0.0709686279296875, -0.06773185729980469, -0.06449508666992188, -0.06125831604003906, -0.05802154541015625, -0.05478477478027344, -0.051548004150390625, -0.04831123352050781, -0.045074462890625, -0.04183769226074219, -0.038600921630859375, -0.03536415100097656, -0.03212738037109375, -0.028890609741210938, -0.025653839111328125, -0.022417068481445312, -0.0191802978515625, -0.015943527221679688, -0.012706756591796875, -0.009469985961914062, -0.00623321533203125, -0.0029964447021484375, 0.000240325927734375, 0.0034770965576171875, 0.0067138671875, 0.009950637817382812, 0.013187408447265625, 0.016424179077148438, 0.01966094970703125, 0.022897720336914062, 0.026134490966796875, 0.029371261596679688, 0.0326080322265625, 0.03584480285644531, 0.039081573486328125, 0.04231834411621094, 0.04555511474609375, 0.04879188537597656, 0.052028656005859375, 0.05526542663574219, 0.058502197265625, 0.06173896789550781, 0.06497573852539062, 0.06821250915527344, 0.07144927978515625, 0.07468605041503906, 0.07792282104492188, 0.08115959167480469, 0.0843963623046875, 0.08763313293457031, 0.09086990356445312, 0.09410667419433594, 0.09734344482421875, 0.10058021545410156, 0.10381698608398438, 0.10705375671386719, 0.11029052734375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 5.0, 5.0, 5.0, 5.0, 7.0, 12.0, 15.0, 16.0, 11.0, 18.0, 23.0, 25.0, 18.0, 28.0, 33.0, 40.0, 70.0, 63.0, 58.0, 48.0, 51.0, 54.0, 50.0, 60.0, 44.0, 47.0, 33.0, 39.0, 23.0, 21.0, 11.0, 16.0, 12.0, 4.0, 12.0, 7.0, 5.0, 1.0, 1.0, 3.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03204345703125, -0.031035900115966797, -0.030028343200683594, -0.02902078628540039, -0.028013229370117188, -0.027005672454833984, -0.02599811553955078, -0.024990558624267578, -0.023983001708984375, -0.022975444793701172, -0.02196788787841797, -0.020960330963134766, -0.019952774047851562, -0.01894521713256836, -0.017937660217285156, -0.016930103302001953, -0.01592254638671875, -0.014914989471435547, -0.013907432556152344, -0.01289987564086914, -0.011892318725585938, -0.010884761810302734, -0.009877204895019531, -0.008869647979736328, -0.007862091064453125, -0.006854534149169922, -0.005846977233886719, -0.004839420318603516, -0.0038318634033203125, -0.0028243064880371094, -0.0018167495727539062, -0.0008091926574707031, 0.0001983642578125, 0.0012059211730957031, 0.0022134780883789062, 0.0032210350036621094, 0.0042285919189453125, 0.005236148834228516, 0.006243705749511719, 0.007251262664794922, 0.008258819580078125, 0.009266376495361328, 0.010273933410644531, 0.011281490325927734, 0.012289047241210938, 0.01329660415649414, 0.014304161071777344, 0.015311717987060547, 0.01631927490234375, 0.017326831817626953, 0.018334388732910156, 0.01934194564819336, 0.020349502563476562, 0.021357059478759766, 0.02236461639404297, 0.023372173309326172, 0.024379730224609375, 0.025387287139892578, 0.02639484405517578, 0.027402400970458984, 0.028409957885742188, 0.02941751480102539, 0.030425071716308594, 0.0314326286315918, 0.032440185546875]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 7.0, 7.0, 3.0, 7.0, 17.0, 16.0, 17.0, 18.0, 17.0, 30.0, 30.0, 41.0, 45.0, 44.0, 47.0, 30.0, 55.0, 42.0, 56.0, 41.0, 42.0, 57.0, 46.0, 41.0, 37.0, 31.0, 31.0, 26.0, 22.0, 20.0, 15.0, 11.0, 11.0, 14.0, 6.0, 2.0, 4.0, 6.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.919909954071045, -2.836925506591797, -2.753941297531128, -2.67095685005188, -2.587972640991211, -2.504988193511963, -2.422003746032715, -2.339019298553467, -2.256035089492798, -2.17305064201355, -2.090066432952881, -2.007081985473633, -1.9240976572036743, -1.8411133289337158, -1.7581288814544678, -1.6751445531845093, -1.5921602249145508, -1.5091758966445923, -1.4261915683746338, -1.3432071208953857, -1.2602227926254272, -1.1772384643554688, -1.0942540168762207, -1.0112696886062622, -0.9282853603363037, -0.8453010320663452, -0.7623166441917419, -0.6793322563171387, -0.5963479280471802, -0.5133635997772217, -0.4303792119026184, -0.34739482402801514, -0.26441025733947754, -0.18142589926719666, -0.09844154119491577, -0.015457183122634888, 0.067527174949646, 0.15051153302192688, 0.23349589109420776, 0.31648027896881104, 0.39946460723876953, 0.4824489653110504, 0.5654333233833313, 0.6484177112579346, 0.7314020395278931, 0.8143863677978516, 0.8973707556724548, 0.9803551435470581, 1.0633394718170166, 1.146323800086975, 1.2293081283569336, 1.3122925758361816, 1.3952769041061401, 1.4782612323760986, 1.5612456798553467, 1.6442300081253052, 1.7272143363952637, 1.8101986646652222, 1.8931829929351807, 1.9761674404144287, 2.0591516494750977, 2.1421360969543457, 2.2251205444335938, 2.308104991912842, 2.3910892009735107]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 3.0, 5.0, 6.0, 3.0, 14.0, 14.0, 15.0, 15.0, 18.0, 16.0, 20.0, 26.0, 28.0, 19.0, 38.0, 21.0, 34.0, 58.0, 43.0, 43.0, 45.0, 42.0, 36.0, 55.0, 54.0, 38.0, 28.0, 36.0, 45.0, 26.0, 27.0, 16.0, 19.0, 8.0, 16.0, 18.0, 17.0, 4.0, 9.0, 7.0, 7.0, 5.0, 4.0, 2.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.689192533493042, -2.6032466888427734, -2.517300605773926, -2.4313547611236572, -2.3454089164733887, -2.259462833404541, -2.1735169887542725, -2.087571144104004, -2.0016250610351562, -1.9156790971755981, -1.8297332525253296, -1.7437872886657715, -1.657841444015503, -1.5718954801559448, -1.4859495162963867, -1.4000036716461182, -1.3140578269958496, -1.2281118631362915, -1.142166018486023, -1.0562200546264648, -0.9702741503715515, -0.8843282461166382, -0.7983822822570801, -0.7124363780021667, -0.6264904737472534, -0.5405445694923401, -0.45459863543510437, -0.36865270137786865, -0.2827067971229553, -0.196760892868042, -0.11081492900848389, -0.024869024753570557, 0.061077117919921875, 0.1470230370759964, 0.23296895623207092, 0.31891489028930664, 0.40486079454421997, 0.4908066987991333, 0.5767526626586914, 0.6626985669136047, 0.7486444711685181, 0.8345903754234314, 0.9205362796783447, 1.0064822435379028, 1.092428207397461, 1.1783740520477295, 1.2643200159072876, 1.3502659797668457, 1.4362118244171143, 1.5221577882766724, 1.608103632926941, 1.694049596786499, 1.7799954414367676, 1.8659414052963257, 1.9518873691558838, 2.0378332138061523, 2.123779296875, 2.2097251415252686, 2.295671224594116, 2.3816170692443848, 2.4675629138946533, 2.553508758544922, 2.6394548416137695, 2.725400686264038, 2.8113465309143066]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [5.0, 6.0, 6.0, 8.0, 8.0, 17.0, 28.0, 30.0, 60.0, 104.0, 151.0, 248.0, 380.0, 521.0, 878.0, 1181.0, 1813.0, 2658.0, 3882.0, 5727.0, 8244.0, 12009.0, 16334.0, 22665.0, 30532.0, 39901.0, 50692.0, 62027.0, 73266.0, 81600.0, 87151.0, 88243.0, 85261.0, 77595.0, 67471.0, 56195.0, 45350.0, 35261.0, 26501.0, 19372.0, 13904.0, 9807.0, 6961.0, 4748.0, 3249.0, 2174.0, 1489.0, 947.0, 643.0, 458.0, 284.0, 177.0, 125.0, 91.0, 48.0, 43.0, 18.0, 6.0, 7.0, 7.0, 2.0, 3.0, 2.0, 2.0], "bins": [-1.0751953125, -1.0407867431640625, -1.006378173828125, -0.9719696044921875, -0.93756103515625, -0.9031524658203125, -0.868743896484375, -0.8343353271484375, -0.7999267578125, -0.7655181884765625, -0.731109619140625, -0.6967010498046875, -0.66229248046875, -0.6278839111328125, -0.593475341796875, -0.5590667724609375, -0.524658203125, -0.4902496337890625, -0.455841064453125, -0.4214324951171875, -0.38702392578125, -0.3526153564453125, -0.318206787109375, -0.2837982177734375, -0.2493896484375, -0.2149810791015625, -0.180572509765625, -0.1461639404296875, -0.11175537109375, -0.0773468017578125, -0.042938232421875, -0.0085296630859375, 0.02587890625, 0.0602874755859375, 0.094696044921875, 0.1291046142578125, 0.16351318359375, 0.1979217529296875, 0.232330322265625, 0.2667388916015625, 0.3011474609375, 0.3355560302734375, 0.369964599609375, 0.4043731689453125, 0.43878173828125, 0.4731903076171875, 0.507598876953125, 0.5420074462890625, 0.576416015625, 0.6108245849609375, 0.645233154296875, 0.6796417236328125, 0.71405029296875, 0.7484588623046875, 0.782867431640625, 0.8172760009765625, 0.8516845703125, 0.8860931396484375, 0.920501708984375, 0.9549102783203125, 0.98931884765625, 1.0237274169921875, 1.058135986328125, 1.0925445556640625, 1.126953125]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 7.0, 1.0, 3.0, 5.0, 4.0, 5.0, 11.0, 10.0, 13.0, 9.0, 18.0, 18.0, 19.0, 26.0, 28.0, 20.0, 32.0, 30.0, 28.0, 51.0, 47.0, 41.0, 51.0, 34.0, 56.0, 49.0, 29.0, 48.0, 37.0, 40.0, 36.0, 29.0, 26.0, 24.0, 18.0, 24.0, 20.0, 9.0, 10.0, 9.0, 7.0, 7.0, 3.0, 6.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.84765625, -2.76055908203125, -2.6734619140625, -2.58636474609375, -2.499267578125, -2.41217041015625, -2.3250732421875, -2.23797607421875, -2.15087890625, -2.06378173828125, -1.9766845703125, -1.88958740234375, -1.802490234375, -1.71539306640625, -1.6282958984375, -1.54119873046875, -1.4541015625, -1.36700439453125, -1.2799072265625, -1.19281005859375, -1.105712890625, -1.01861572265625, -0.9315185546875, -0.84442138671875, -0.75732421875, -0.67022705078125, -0.5831298828125, -0.49603271484375, -0.408935546875, -0.32183837890625, -0.2347412109375, -0.14764404296875, -0.060546875, 0.02655029296875, 0.1136474609375, 0.20074462890625, 0.287841796875, 0.37493896484375, 0.4620361328125, 0.54913330078125, 0.63623046875, 0.72332763671875, 0.8104248046875, 0.89752197265625, 0.984619140625, 1.07171630859375, 1.1588134765625, 1.24591064453125, 1.3330078125, 1.42010498046875, 1.5072021484375, 1.59429931640625, 1.681396484375, 1.76849365234375, 1.8555908203125, 1.94268798828125, 2.02978515625, 2.11688232421875, 2.2039794921875, 2.29107666015625, 2.378173828125, 2.46527099609375, 2.5523681640625, 2.63946533203125, 2.7265625]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 8.0, 9.0, 18.0, 39.0, 46.0, 72.0, 112.0, 145.0, 232.0, 407.0, 609.0, 964.0, 1531.0, 2535.0, 3863.0, 5924.0, 9173.0, 13986.0, 20946.0, 30060.0, 42442.0, 57567.0, 74007.0, 88826.0, 100422.0, 105159.0, 102963.0, 93416.0, 78920.0, 62809.0, 47368.0, 34247.0, 23941.0, 16143.0, 10687.0, 6840.0, 4412.0, 2775.0, 1810.0, 1124.0, 743.0, 456.0, 303.0, 179.0, 106.0, 75.0, 52.0, 30.0, 21.0, 14.0, 8.0, 2.0, 5.0, 6.0, 2.0, 3.0], "bins": [-1.4677734375, -1.4241790771484375, -1.380584716796875, -1.3369903564453125, -1.29339599609375, -1.2498016357421875, -1.206207275390625, -1.1626129150390625, -1.1190185546875, -1.0754241943359375, -1.031829833984375, -0.9882354736328125, -0.94464111328125, -0.9010467529296875, -0.857452392578125, -0.8138580322265625, -0.770263671875, -0.7266693115234375, -0.683074951171875, -0.6394805908203125, -0.59588623046875, -0.5522918701171875, -0.508697509765625, -0.4651031494140625, -0.4215087890625, -0.3779144287109375, -0.334320068359375, -0.2907257080078125, -0.24713134765625, -0.2035369873046875, -0.159942626953125, -0.1163482666015625, -0.07275390625, -0.0291595458984375, 0.014434814453125, 0.0580291748046875, 0.10162353515625, 0.1452178955078125, 0.188812255859375, 0.2324066162109375, 0.2760009765625, 0.3195953369140625, 0.363189697265625, 0.4067840576171875, 0.45037841796875, 0.4939727783203125, 0.537567138671875, 0.5811614990234375, 0.624755859375, 0.6683502197265625, 0.711944580078125, 0.7555389404296875, 0.79913330078125, 0.8427276611328125, 0.886322021484375, 0.9299163818359375, 0.9735107421875, 1.0171051025390625, 1.060699462890625, 1.1042938232421875, 1.14788818359375, 1.1914825439453125, 1.235076904296875, 1.2786712646484375, 1.322265625]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 3.0, 9.0, 9.0, 13.0, 9.0, 15.0, 9.0, 27.0, 21.0, 23.0, 22.0, 26.0, 35.0, 28.0, 28.0, 41.0, 32.0, 36.0, 39.0, 43.0, 45.0, 36.0, 30.0, 40.0, 38.0, 42.0, 45.0, 34.0, 23.0, 38.0, 21.0, 17.0, 23.0, 14.0, 15.0, 14.0, 8.0, 14.0, 14.0, 6.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.666015625, -1.6128387451171875, -1.559661865234375, -1.5064849853515625, -1.45330810546875, -1.4001312255859375, -1.346954345703125, -1.2937774658203125, -1.2406005859375, -1.1874237060546875, -1.134246826171875, -1.0810699462890625, -1.02789306640625, -0.9747161865234375, -0.921539306640625, -0.8683624267578125, -0.815185546875, -0.7620086669921875, -0.708831787109375, -0.6556549072265625, -0.60247802734375, -0.5493011474609375, -0.496124267578125, -0.4429473876953125, -0.3897705078125, -0.3365936279296875, -0.283416748046875, -0.2302398681640625, -0.17706298828125, -0.1238861083984375, -0.070709228515625, -0.0175323486328125, 0.03564453125, 0.0888214111328125, 0.141998291015625, 0.1951751708984375, 0.24835205078125, 0.3015289306640625, 0.354705810546875, 0.4078826904296875, 0.4610595703125, 0.5142364501953125, 0.567413330078125, 0.6205902099609375, 0.67376708984375, 0.7269439697265625, 0.780120849609375, 0.8332977294921875, 0.886474609375, 0.9396514892578125, 0.992828369140625, 1.0460052490234375, 1.09918212890625, 1.1523590087890625, 1.205535888671875, 1.2587127685546875, 1.3118896484375, 1.3650665283203125, 1.418243408203125, 1.4714202880859375, 1.52459716796875, 1.5777740478515625, 1.630950927734375, 1.6841278076171875, 1.7373046875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 2.0, 3.0, 7.0, 2.0, 7.0, 12.0, 10.0, 26.0, 39.0, 62.0, 87.0, 160.0, 256.0, 401.0, 648.0, 1033.0, 1935.0, 3380.0, 5768.0, 9710.0, 16454.0, 26703.0, 42141.0, 61588.0, 84906.0, 107080.0, 123241.0, 127596.0, 118034.0, 99088.0, 75680.0, 52673.0, 35546.0, 22006.0, 13282.0, 7818.0, 4615.0, 2722.0, 1634.0, 876.0, 505.0, 327.0, 178.0, 118.0, 69.0, 45.0, 32.0, 20.0, 13.0, 8.0, 6.0, 3.0, 3.0, 4.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.6318359375, -0.6116485595703125, -0.591461181640625, -0.5712738037109375, -0.55108642578125, -0.5308990478515625, -0.510711669921875, -0.4905242919921875, -0.4703369140625, -0.4501495361328125, -0.429962158203125, -0.4097747802734375, -0.38958740234375, -0.3694000244140625, -0.349212646484375, -0.3290252685546875, -0.308837890625, -0.2886505126953125, -0.268463134765625, -0.2482757568359375, -0.22808837890625, -0.2079010009765625, -0.187713623046875, -0.1675262451171875, -0.1473388671875, -0.1271514892578125, -0.106964111328125, -0.0867767333984375, -0.06658935546875, -0.0464019775390625, -0.026214599609375, -0.0060272216796875, 0.01416015625, 0.0343475341796875, 0.054534912109375, 0.0747222900390625, 0.09490966796875, 0.1150970458984375, 0.135284423828125, 0.1554718017578125, 0.1756591796875, 0.1958465576171875, 0.216033935546875, 0.2362213134765625, 0.25640869140625, 0.2765960693359375, 0.296783447265625, 0.3169708251953125, 0.337158203125, 0.3573455810546875, 0.377532958984375, 0.3977203369140625, 0.41790771484375, 0.4380950927734375, 0.458282470703125, 0.4784698486328125, 0.4986572265625, 0.5188446044921875, 0.539031982421875, 0.5592193603515625, 0.57940673828125, 0.5995941162109375, 0.619781494140625, 0.6399688720703125, 0.66015625]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 5.0, 9.0, 9.0, 8.0, 16.0, 18.0, 19.0, 36.0, 27.0, 33.0, 30.0, 43.0, 43.0, 59.0, 62.0, 62.0, 52.0, 59.0, 58.0, 51.0, 48.0, 51.0, 32.0, 46.0, 22.0, 30.0, 14.0, 16.0, 8.0, 8.0, 8.0, 4.0, 6.0, 8.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.557868957519531e-05, -7.284712046384811e-05, -7.011555135250092e-05, -6.738398224115372e-05, -6.465241312980652e-05, -6.192084401845932e-05, -5.918927490711212e-05, -5.645770579576492e-05, -5.3726136684417725e-05, -5.0994567573070526e-05, -4.826299846172333e-05, -4.553142935037613e-05, -4.279986023902893e-05, -4.006829112768173e-05, -3.7336722016334534e-05, -3.4605152904987335e-05, -3.187358379364014e-05, -2.9142014682292938e-05, -2.641044557094574e-05, -2.367887645959854e-05, -2.0947307348251343e-05, -1.8215738236904144e-05, -1.5484169125556946e-05, -1.2752600014209747e-05, -1.0021030902862549e-05, -7.28946179151535e-06, -4.557892680168152e-06, -1.8263235688209534e-06, 9.052455425262451e-07, 3.6368146538734436e-06, 6.368383765220642e-06, 9.09995287656784e-06, 1.1831521987915039e-05, 1.4563091099262238e-05, 1.7294660210609436e-05, 2.0026229321956635e-05, 2.2757798433303833e-05, 2.548936754465103e-05, 2.822093665599823e-05, 3.095250576734543e-05, 3.368407487869263e-05, 3.6415643990039825e-05, 3.9147213101387024e-05, 4.187878221273422e-05, 4.461035132408142e-05, 4.734192043542862e-05, 5.007348954677582e-05, 5.2805058658123016e-05, 5.5536627769470215e-05, 5.826819688081741e-05, 6.099976599216461e-05, 6.373133510351181e-05, 6.646290421485901e-05, 6.919447332620621e-05, 7.19260424375534e-05, 7.46576115489006e-05, 7.73891806602478e-05, 8.0120749771595e-05, 8.28523188829422e-05, 8.55838879942894e-05, 8.83154571056366e-05, 9.10470262169838e-05, 9.3778595328331e-05, 9.651016443967819e-05, 9.924173355102539e-05]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 9.0, 8.0, 16.0, 40.0, 46.0, 61.0, 116.0, 170.0, 260.0, 467.0, 700.0, 1177.0, 1900.0, 3021.0, 4815.0, 7818.0, 12927.0, 20330.0, 31380.0, 45566.0, 63845.0, 83609.0, 102088.0, 114539.0, 116257.0, 109335.0, 93405.0, 73873.0, 54586.0, 38268.0, 25283.0, 16229.0, 10147.0, 6276.0, 3842.0, 2301.0, 1411.0, 902.0, 555.0, 350.0, 213.0, 135.0, 103.0, 64.0, 53.0, 26.0, 13.0, 4.0, 9.0, 2.0, 3.0, 2.0, 3.0, 0.0, 2.0, 2.0], "bins": [-0.654296875, -0.6340103149414062, -0.6137237548828125, -0.5934371948242188, -0.573150634765625, -0.5528640747070312, -0.5325775146484375, -0.5122909545898438, -0.49200439453125, -0.47171783447265625, -0.4514312744140625, -0.43114471435546875, -0.410858154296875, -0.39057159423828125, -0.3702850341796875, -0.34999847412109375, -0.3297119140625, -0.30942535400390625, -0.2891387939453125, -0.26885223388671875, -0.248565673828125, -0.22827911376953125, -0.2079925537109375, -0.18770599365234375, -0.16741943359375, -0.14713287353515625, -0.1268463134765625, -0.10655975341796875, -0.086273193359375, -0.06598663330078125, -0.0457000732421875, -0.02541351318359375, -0.005126953125, 0.01515960693359375, 0.0354461669921875, 0.05573272705078125, 0.076019287109375, 0.09630584716796875, 0.1165924072265625, 0.13687896728515625, 0.15716552734375, 0.17745208740234375, 0.1977386474609375, 0.21802520751953125, 0.238311767578125, 0.25859832763671875, 0.2788848876953125, 0.29917144775390625, 0.3194580078125, 0.33974456787109375, 0.3600311279296875, 0.38031768798828125, 0.400604248046875, 0.42089080810546875, 0.4411773681640625, 0.46146392822265625, 0.48175048828125, 0.5020370483398438, 0.5223236083984375, 0.5426101684570312, 0.562896728515625, 0.5831832885742188, 0.6034698486328125, 0.6237564086914062, 0.64404296875]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 7.0, 6.0, 10.0, 12.0, 9.0, 12.0, 21.0, 22.0, 23.0, 31.0, 35.0, 31.0, 39.0, 39.0, 54.0, 37.0, 50.0, 58.0, 56.0, 54.0, 35.0, 56.0, 41.0, 51.0, 44.0, 34.0, 26.0, 19.0, 21.0, 17.0, 15.0, 5.0, 16.0, 5.0, 5.0, 4.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36181640625, -0.3511772155761719, -0.34053802490234375, -0.3298988342285156, -0.3192596435546875, -0.3086204528808594, -0.29798126220703125, -0.2873420715332031, -0.276702880859375, -0.2660636901855469, -0.25542449951171875, -0.24478530883789062, -0.2341461181640625, -0.22350692749023438, -0.21286773681640625, -0.20222854614257812, -0.19158935546875, -0.18095016479492188, -0.17031097412109375, -0.15967178344726562, -0.1490325927734375, -0.13839340209960938, -0.12775421142578125, -0.11711502075195312, -0.106475830078125, -0.09583663940429688, -0.08519744873046875, -0.07455825805664062, -0.0639190673828125, -0.053279876708984375, -0.04264068603515625, -0.032001495361328125, -0.0213623046875, -0.010723114013671875, -8.392333984375e-05, 0.010555267333984375, 0.0211944580078125, 0.031833648681640625, 0.04247283935546875, 0.053112030029296875, 0.063751220703125, 0.07439041137695312, 0.08502960205078125, 0.09566879272460938, 0.1063079833984375, 0.11694717407226562, 0.12758636474609375, 0.13822555541992188, 0.14886474609375, 0.15950393676757812, 0.17014312744140625, 0.18078231811523438, 0.1914215087890625, 0.20206069946289062, 0.21269989013671875, 0.22333908081054688, 0.233978271484375, 0.24461746215820312, 0.25525665283203125, 0.2658958435058594, 0.2765350341796875, 0.2871742248535156, 0.29781341552734375, 0.3084526062011719, 0.319091796875]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 7.0, 5.0, 10.0, 8.0, 13.0, 13.0, 15.0, 14.0, 18.0, 17.0, 28.0, 37.0, 36.0, 41.0, 44.0, 41.0, 43.0, 52.0, 43.0, 45.0, 45.0, 34.0, 60.0, 46.0, 52.0, 35.0, 45.0, 25.0, 22.0, 19.0, 14.0, 11.0, 24.0, 11.0, 10.0, 5.0, 8.0, 2.0, 6.0, 1.0, 4.0, 0.0, 2.0, 1.0], "bins": [-3.257091522216797, -3.17411732673645, -3.0911428928375244, -3.0081686973571777, -2.925194501876831, -2.8422203063964844, -2.7592458724975586, -2.676271677017212, -2.5932974815368652, -2.5103232860565186, -2.4273488521575928, -2.344374656677246, -2.2614004611968994, -2.1784262657165527, -2.095451831817627, -2.0124776363372803, -1.9295032024383545, -1.8465288877487183, -1.7635546922683716, -1.6805803775787354, -1.5976061820983887, -1.5146318674087524, -1.4316575527191162, -1.3486833572387695, -1.2657090425491333, -1.182734727859497, -1.0997605323791504, -1.0167862176895142, -0.9338119626045227, -0.8508377075195312, -0.767863392829895, -0.6848891377449036, -0.6019151210784912, -0.5189408659934998, -0.4359665811061859, -0.35299229621887207, -0.2700180411338806, -0.18704378604888916, -0.10406950116157532, -0.021095216274261475, 0.06187903881072998, 0.14485330879688263, 0.22782757878303528, 0.3108018636703491, 0.3937761187553406, 0.47675037384033203, 0.5597246885299683, 0.6426989436149597, 0.7256731986999512, 0.8086474537849426, 0.8916217088699341, 0.9745960235595703, 1.057570219039917, 1.1405445337295532, 1.2235188484191895, 1.3064930438995361, 1.3894673585891724, 1.4724416732788086, 1.5554158687591553, 1.6383901834487915, 1.7213644981384277, 1.8043386936187744, 1.8873130083084106, 1.9702873229980469, 2.0532615184783936]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 1.0, 3.0, 5.0, 6.0, 4.0, 6.0, 9.0, 8.0, 14.0, 16.0, 15.0, 15.0, 21.0, 18.0, 25.0, 25.0, 31.0, 21.0, 36.0, 46.0, 36.0, 49.0, 44.0, 46.0, 29.0, 47.0, 42.0, 39.0, 43.0, 33.0, 30.0, 27.0, 27.0, 26.0, 21.0, 20.0, 20.0, 17.0, 14.0, 8.0, 14.0, 13.0, 11.0, 6.0, 0.0, 6.0, 5.0, 4.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.0123064517974854, -2.9227168560028076, -2.83312726020813, -2.7435379028320312, -2.6539483070373535, -2.564358711242676, -2.474769115447998, -2.3851795196533203, -2.2955899238586426, -2.206000328063965, -2.116410732269287, -2.0268211364746094, -1.9372317790985107, -1.847642183303833, -1.7580525875091553, -1.6684629917144775, -1.578873634338379, -1.4892840385437012, -1.399694561958313, -1.3101049661636353, -1.220515489578247, -1.1309258937835693, -1.0413362979888916, -0.9517467617988586, -0.8621572256088257, -0.7725676894187927, -0.6829781532287598, -0.593388557434082, -0.5037990212440491, -0.4142094850540161, -0.3246198892593384, -0.23503035306930542, -0.14544081687927246, -0.05585126578807831, 0.033738285303115845, 0.12332785129547119, 0.21291738748550415, 0.3025069236755371, 0.39209651947021484, 0.4816860556602478, 0.5712755918502808, 0.6608651280403137, 0.7504546642303467, 0.8400442600250244, 0.9296337962150574, 1.0192233324050903, 1.108812928199768, 1.1984024047851562, 1.287992000579834, 1.3775815963745117, 1.4671710729599, 1.5567606687545776, 1.6463501453399658, 1.7359397411346436, 1.8255293369293213, 1.915118932723999, 2.0047082901000977, 2.0942978858947754, 2.183887481689453, 2.273477077484131, 2.3630664348602295, 2.4526560306549072, 2.542245626449585, 2.6318352222442627, 2.7214248180389404]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 8.0, 12.0, 22.0, 37.0, 74.0, 95.0, 171.0, 316.0, 518.0, 881.0, 1383.0, 2508.0, 4244.0, 7564.0, 13029.0, 22589.0, 38848.0, 67364.0, 115844.0, 194032.0, 309135.0, 453945.0, 582798.0, 632237.0, 568839.0, 432763.0, 292830.0, 184342.0, 110837.0, 65190.0, 38297.0, 22227.0, 13047.0, 7477.0, 4430.0, 2543.0, 1548.0, 863.0, 549.0, 345.0, 214.0, 120.0, 71.0, 49.0, 23.0, 15.0, 10.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.166015625, -2.094879150390625, -2.02374267578125, -1.952606201171875, -1.8814697265625, -1.810333251953125, -1.73919677734375, -1.668060302734375, -1.596923828125, -1.525787353515625, -1.45465087890625, -1.383514404296875, -1.3123779296875, -1.241241455078125, -1.17010498046875, -1.098968505859375, -1.02783203125, -0.956695556640625, -0.88555908203125, -0.814422607421875, -0.7432861328125, -0.672149658203125, -0.60101318359375, -0.529876708984375, -0.458740234375, -0.387603759765625, -0.31646728515625, -0.245330810546875, -0.1741943359375, -0.103057861328125, -0.03192138671875, 0.039215087890625, 0.1103515625, 0.181488037109375, 0.25262451171875, 0.323760986328125, 0.3948974609375, 0.466033935546875, 0.53717041015625, 0.608306884765625, 0.679443359375, 0.750579833984375, 0.82171630859375, 0.892852783203125, 0.9639892578125, 1.035125732421875, 1.10626220703125, 1.177398681640625, 1.24853515625, 1.319671630859375, 1.39080810546875, 1.461944580078125, 1.5330810546875, 1.604217529296875, 1.67535400390625, 1.746490478515625, 1.817626953125, 1.888763427734375, 1.95989990234375, 2.031036376953125, 2.1021728515625, 2.173309326171875, 2.24444580078125, 2.315582275390625, 2.38671875]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 4.0, 1.0, 1.0, 3.0, 11.0, 8.0, 9.0, 10.0, 11.0, 19.0, 11.0, 10.0, 21.0, 30.0, 32.0, 30.0, 29.0, 32.0, 36.0, 36.0, 43.0, 41.0, 35.0, 45.0, 35.0, 42.0, 44.0, 47.0, 27.0, 28.0, 37.0, 24.0, 25.0, 21.0, 19.0, 20.0, 18.0, 14.0, 18.0, 11.0, 15.0, 10.0, 6.0, 7.0, 4.0, 5.0, 7.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.49609375, -2.41796875, -2.33984375, -2.26171875, -2.18359375, -2.10546875, -2.02734375, -1.94921875, -1.87109375, -1.79296875, -1.71484375, -1.63671875, -1.55859375, -1.48046875, -1.40234375, -1.32421875, -1.24609375, -1.16796875, -1.08984375, -1.01171875, -0.93359375, -0.85546875, -0.77734375, -0.69921875, -0.62109375, -0.54296875, -0.46484375, -0.38671875, -0.30859375, -0.23046875, -0.15234375, -0.07421875, 0.00390625, 0.08203125, 0.16015625, 0.23828125, 0.31640625, 0.39453125, 0.47265625, 0.55078125, 0.62890625, 0.70703125, 0.78515625, 0.86328125, 0.94140625, 1.01953125, 1.09765625, 1.17578125, 1.25390625, 1.33203125, 1.41015625, 1.48828125, 1.56640625, 1.64453125, 1.72265625, 1.80078125, 1.87890625, 1.95703125, 2.03515625, 2.11328125, 2.19140625, 2.26953125, 2.34765625, 2.42578125, 2.50390625]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 12.0, 13.0, 25.0, 47.0, 49.0, 116.0, 147.0, 253.0, 447.0, 660.0, 1059.0, 1782.0, 2723.0, 4521.0, 7284.0, 11631.0, 18616.0, 29804.0, 48023.0, 74936.0, 114591.0, 172496.0, 247383.0, 334928.0, 423550.0, 485742.0, 497691.0, 457418.0, 378971.0, 287524.0, 204540.0, 138259.0, 91616.0, 58382.0, 37676.0, 23211.0, 14412.0, 8823.0, 5566.0, 3580.0, 2188.0, 1343.0, 872.0, 493.0, 328.0, 212.0, 136.0, 74.0, 43.0, 31.0, 29.0, 14.0, 5.0, 8.0, 2.0, 3.0], "bins": [-2.337890625, -2.26959228515625, -2.2012939453125, -2.13299560546875, -2.064697265625, -1.99639892578125, -1.9281005859375, -1.85980224609375, -1.79150390625, -1.72320556640625, -1.6549072265625, -1.58660888671875, -1.518310546875, -1.45001220703125, -1.3817138671875, -1.31341552734375, -1.2451171875, -1.17681884765625, -1.1085205078125, -1.04022216796875, -0.971923828125, -0.90362548828125, -0.8353271484375, -0.76702880859375, -0.69873046875, -0.63043212890625, -0.5621337890625, -0.49383544921875, -0.425537109375, -0.35723876953125, -0.2889404296875, -0.22064208984375, -0.15234375, -0.08404541015625, -0.0157470703125, 0.05255126953125, 0.120849609375, 0.18914794921875, 0.2574462890625, 0.32574462890625, 0.39404296875, 0.46234130859375, 0.5306396484375, 0.59893798828125, 0.667236328125, 0.73553466796875, 0.8038330078125, 0.87213134765625, 0.9404296875, 1.00872802734375, 1.0770263671875, 1.14532470703125, 1.213623046875, 1.28192138671875, 1.3502197265625, 1.41851806640625, 1.48681640625, 1.55511474609375, 1.6234130859375, 1.69171142578125, 1.760009765625, 1.82830810546875, 1.8966064453125, 1.96490478515625, 2.033203125]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 4.0, 2.0, 3.0, 3.0, 6.0, 10.0, 17.0, 17.0, 17.0, 35.0, 32.0, 52.0, 74.0, 81.0, 108.0, 128.0, 147.0, 169.0, 202.0, 184.0, 207.0, 218.0, 212.0, 235.0, 238.0, 231.0, 206.0, 212.0, 188.0, 146.0, 129.0, 126.0, 96.0, 94.0, 57.0, 55.0, 21.0, 34.0, 20.0, 23.0, 11.0, 14.0, 2.0, 11.0, 6.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.291015625, -1.2513275146484375, -1.211639404296875, -1.1719512939453125, -1.13226318359375, -1.0925750732421875, -1.052886962890625, -1.0131988525390625, -0.9735107421875, -0.9338226318359375, -0.894134521484375, -0.8544464111328125, -0.81475830078125, -0.7750701904296875, -0.735382080078125, -0.6956939697265625, -0.656005859375, -0.6163177490234375, -0.576629638671875, -0.5369415283203125, -0.49725341796875, -0.4575653076171875, -0.417877197265625, -0.3781890869140625, -0.3385009765625, -0.2988128662109375, -0.259124755859375, -0.2194366455078125, -0.17974853515625, -0.1400604248046875, -0.100372314453125, -0.0606842041015625, -0.02099609375, 0.0186920166015625, 0.058380126953125, 0.0980682373046875, 0.13775634765625, 0.1774444580078125, 0.217132568359375, 0.2568206787109375, 0.2965087890625, 0.3361968994140625, 0.375885009765625, 0.4155731201171875, 0.45526123046875, 0.4949493408203125, 0.534637451171875, 0.5743255615234375, 0.614013671875, 0.6537017822265625, 0.693389892578125, 0.7330780029296875, 0.77276611328125, 0.8124542236328125, 0.852142333984375, 0.8918304443359375, 0.9315185546875, 0.9712066650390625, 1.010894775390625, 1.0505828857421875, 1.09027099609375, 1.1299591064453125, 1.169647216796875, 1.2093353271484375, 1.2490234375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 8.0, 7.0, 7.0, 16.0, 9.0, 15.0, 18.0, 19.0, 26.0, 25.0, 29.0, 33.0, 33.0, 35.0, 35.0, 41.0, 36.0, 41.0, 37.0, 47.0, 41.0, 43.0, 42.0, 44.0, 43.0, 25.0, 35.0, 36.0, 30.0, 22.0, 24.0, 16.0, 8.0, 13.0, 17.0, 6.0, 7.0, 7.0, 10.0, 5.0, 7.0, 4.0, 2.0, 3.0, 1.0, 0.0, 3.0], "bins": [-3.231991767883301, -3.1437156200408936, -3.0554394721984863, -2.967163324356079, -2.878887176513672, -2.7906112670898438, -2.7023351192474365, -2.6140589714050293, -2.525782823562622, -2.437506675720215, -2.3492305278778076, -2.2609543800354004, -2.1726784706115723, -2.084402322769165, -1.9961261749267578, -1.9078500270843506, -1.8195738792419434, -1.7312977313995361, -1.643021583557129, -1.5547455549240112, -1.466469407081604, -1.3781932592391968, -1.289917230606079, -1.2016410827636719, -1.1133649349212646, -1.0250887870788574, -0.936812698841095, -0.8485366106033325, -0.7602604627609253, -0.6719843149185181, -0.5837082266807556, -0.49543213844299316, -0.40715622901916504, -0.3188801109790802, -0.23060399293899536, -0.14232787489891052, -0.054051756858825684, 0.034224361181259155, 0.122500479221344, 0.21077656745910645, 0.29905271530151367, 0.3873288333415985, 0.47560495138168335, 0.5638810396194458, 0.652157187461853, 0.7404333353042603, 0.8287094235420227, 0.9169855117797852, 1.0052616596221924, 1.0935378074645996, 1.1818139553070068, 1.2700899839401245, 1.3583661317825317, 1.446642279624939, 1.5349183082580566, 1.6231944561004639, 1.711470603942871, 1.7997467517852783, 1.8880228996276855, 1.9762989282608032, 2.0645751953125, 2.152851104736328, 2.2411272525787354, 2.3294034004211426, 2.41767954826355]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 4.0, 6.0, 3.0, 2.0, 5.0, 9.0, 10.0, 11.0, 6.0, 14.0, 14.0, 14.0, 18.0, 24.0, 23.0, 17.0, 26.0, 32.0, 38.0, 35.0, 31.0, 32.0, 45.0, 32.0, 30.0, 38.0, 35.0, 38.0, 43.0, 45.0, 35.0, 39.0, 36.0, 29.0, 22.0, 28.0, 17.0, 16.0, 13.0, 14.0, 16.0, 11.0, 9.0, 12.0, 1.0, 5.0, 4.0, 3.0, 3.0, 8.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.8771049976348877, -2.7872562408447266, -2.6974077224731445, -2.6075589656829834, -2.5177102088928223, -2.427861452102661, -2.3380126953125, -2.248164176940918, -2.158315420150757, -2.0684666633605957, -1.9786180257797241, -1.8887693881988525, -1.7989206314086914, -1.7090718746185303, -1.6192232370376587, -1.529374599456787, -1.439525842666626, -1.3496770858764648, -1.2598284482955933, -1.1699798107147217, -1.0801310539245605, -0.9902823567390442, -0.9004336595535278, -0.8105849623680115, -0.7207362651824951, -0.6308875679969788, -0.5410388708114624, -0.45119017362594604, -0.3613414764404297, -0.27149277925491333, -0.18164408206939697, -0.09179538488388062, -0.0019466876983642578, 0.0879020094871521, 0.17775070667266846, 0.2675994038581848, 0.35744810104370117, 0.44729679822921753, 0.5371454954147339, 0.6269941926002502, 0.7168428897857666, 0.806691586971283, 0.8965402841567993, 0.9863889813423157, 1.076237678527832, 1.1660864353179932, 1.2559350728988647, 1.3457837104797363, 1.4356324672698975, 1.5254812240600586, 1.6153298616409302, 1.7051784992218018, 1.795027256011963, 1.884876012802124, 1.9747246503829956, 2.064573287963867, 2.1544220447540283, 2.2442708015441895, 2.3341193199157715, 2.4239680767059326, 2.5138168334960938, 2.603665590286255, 2.693514347076416, 2.783362865447998, 2.873211622238159]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 9.0, 9.0, 12.0, 12.0, 24.0, 42.0, 62.0, 98.0, 131.0, 184.0, 337.0, 540.0, 770.0, 1217.0, 1942.0, 2986.0, 4861.0, 7572.0, 12522.0, 20176.0, 32939.0, 53479.0, 82677.0, 118576.0, 149656.0, 156382.0, 132767.0, 97078.0, 64830.0, 40811.0, 24756.0, 15562.0, 9534.0, 5793.0, 3750.0, 2230.0, 1539.0, 994.0, 623.0, 394.0, 240.0, 151.0, 105.0, 51.0, 47.0, 30.0, 25.0, 14.0, 6.0, 6.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.4345703125, -0.42148590087890625, -0.4084014892578125, -0.39531707763671875, -0.382232666015625, -0.36914825439453125, -0.3560638427734375, -0.34297943115234375, -0.32989501953125, -0.31681060791015625, -0.3037261962890625, -0.29064178466796875, -0.277557373046875, -0.26447296142578125, -0.2513885498046875, -0.23830413818359375, -0.2252197265625, -0.21213531494140625, -0.1990509033203125, -0.18596649169921875, -0.172882080078125, -0.15979766845703125, -0.1467132568359375, -0.13362884521484375, -0.12054443359375, -0.10746002197265625, -0.0943756103515625, -0.08129119873046875, -0.068206787109375, -0.05512237548828125, -0.0420379638671875, -0.02895355224609375, -0.015869140625, -0.00278472900390625, 0.0102996826171875, 0.02338409423828125, 0.036468505859375, 0.04955291748046875, 0.0626373291015625, 0.07572174072265625, 0.08880615234375, 0.10189056396484375, 0.1149749755859375, 0.12805938720703125, 0.141143798828125, 0.15422821044921875, 0.1673126220703125, 0.18039703369140625, 0.1934814453125, 0.20656585693359375, 0.2196502685546875, 0.23273468017578125, 0.245819091796875, 0.25890350341796875, 0.2719879150390625, 0.28507232666015625, 0.29815673828125, 0.31124114990234375, 0.3243255615234375, 0.33740997314453125, 0.350494384765625, 0.36357879638671875, 0.3766632080078125, 0.38974761962890625, 0.40283203125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 6.0, 4.0, 13.0, 5.0, 6.0, 11.0, 9.0, 8.0, 13.0, 14.0, 16.0, 26.0, 25.0, 21.0, 38.0, 39.0, 32.0, 29.0, 24.0, 38.0, 26.0, 38.0, 23.0, 41.0, 43.0, 42.0, 44.0, 36.0, 43.0, 41.0, 38.0, 17.0, 23.0, 38.0, 11.0, 19.0, 12.0, 19.0, 15.0, 12.0, 7.0, 8.0, 4.0, 9.0, 8.0, 2.0, 2.0, 3.0, 7.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.990234375, -2.8946533203125, -2.799072265625, -2.7034912109375, -2.60791015625, -2.5123291015625, -2.416748046875, -2.3211669921875, -2.2255859375, -2.1300048828125, -2.034423828125, -1.9388427734375, -1.84326171875, -1.7476806640625, -1.652099609375, -1.5565185546875, -1.4609375, -1.3653564453125, -1.269775390625, -1.1741943359375, -1.07861328125, -0.9830322265625, -0.887451171875, -0.7918701171875, -0.6962890625, -0.6007080078125, -0.505126953125, -0.4095458984375, -0.31396484375, -0.2183837890625, -0.122802734375, -0.0272216796875, 0.068359375, 0.1639404296875, 0.259521484375, 0.3551025390625, 0.45068359375, 0.5462646484375, 0.641845703125, 0.7374267578125, 0.8330078125, 0.9285888671875, 1.024169921875, 1.1197509765625, 1.21533203125, 1.3109130859375, 1.406494140625, 1.5020751953125, 1.59765625, 1.6932373046875, 1.788818359375, 1.8843994140625, 1.97998046875, 2.0755615234375, 2.171142578125, 2.2667236328125, 2.3623046875, 2.4578857421875, 2.553466796875, 2.6490478515625, 2.74462890625, 2.8402099609375, 2.935791015625, 3.0313720703125, 3.126953125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 8.0, 1.0, 5.0, 6.0, 9.0, 16.0, 15.0, 27.0, 42.0, 55.0, 89.0, 154.0, 241.0, 418.0, 636.0, 1133.0, 1967.0, 3465.0, 6524.0, 12391.0, 25557.0, 106941.0, 758283.0, 81806.0, 23759.0, 11507.0, 5887.0, 3239.0, 1753.0, 1008.0, 607.0, 382.0, 225.0, 156.0, 85.0, 51.0, 36.0, 21.0, 16.0, 10.0, 9.0, 6.0, 5.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0341796875, -1.0023040771484375, -0.970428466796875, -0.9385528564453125, -0.90667724609375, -0.8748016357421875, -0.842926025390625, -0.8110504150390625, -0.7791748046875, -0.7472991943359375, -0.715423583984375, -0.6835479736328125, -0.65167236328125, -0.6197967529296875, -0.587921142578125, -0.5560455322265625, -0.524169921875, -0.4922943115234375, -0.460418701171875, -0.4285430908203125, -0.39666748046875, -0.3647918701171875, -0.332916259765625, -0.3010406494140625, -0.2691650390625, -0.2372894287109375, -0.205413818359375, -0.1735382080078125, -0.14166259765625, -0.1097869873046875, -0.077911376953125, -0.0460357666015625, -0.01416015625, 0.0177154541015625, 0.049591064453125, 0.0814666748046875, 0.11334228515625, 0.1452178955078125, 0.177093505859375, 0.2089691162109375, 0.2408447265625, 0.2727203369140625, 0.304595947265625, 0.3364715576171875, 0.36834716796875, 0.4002227783203125, 0.432098388671875, 0.4639739990234375, 0.495849609375, 0.5277252197265625, 0.559600830078125, 0.5914764404296875, 0.62335205078125, 0.6552276611328125, 0.687103271484375, 0.7189788818359375, 0.7508544921875, 0.7827301025390625, 0.814605712890625, 0.8464813232421875, 0.87835693359375, 0.9102325439453125, 0.942108154296875, 0.9739837646484375, 1.005859375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 6.0, 4.0, 7.0, 6.0, 3.0, 10.0, 13.0, 20.0, 21.0, 19.0, 23.0, 24.0, 22.0, 33.0, 35.0, 46.0, 33.0, 32.0, 43.0, 45.0, 47.0, 48.0, 37.0, 40.0, 41.0, 54.0, 30.0, 38.0, 40.0, 31.0, 24.0, 16.0, 13.0, 14.0, 20.0, 13.0, 12.0, 8.0, 11.0, 10.0, 3.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.091796875, -2.017303466796875, -1.94281005859375, -1.868316650390625, -1.7938232421875, -1.719329833984375, -1.64483642578125, -1.570343017578125, -1.495849609375, -1.421356201171875, -1.34686279296875, -1.272369384765625, -1.1978759765625, -1.123382568359375, -1.04888916015625, -0.974395751953125, -0.89990234375, -0.825408935546875, -0.75091552734375, -0.676422119140625, -0.6019287109375, -0.527435302734375, -0.45294189453125, -0.378448486328125, -0.303955078125, -0.229461669921875, -0.15496826171875, -0.080474853515625, -0.0059814453125, 0.068511962890625, 0.14300537109375, 0.217498779296875, 0.2919921875, 0.366485595703125, 0.44097900390625, 0.515472412109375, 0.5899658203125, 0.664459228515625, 0.73895263671875, 0.813446044921875, 0.887939453125, 0.962432861328125, 1.03692626953125, 1.111419677734375, 1.1859130859375, 1.260406494140625, 1.33489990234375, 1.409393310546875, 1.48388671875, 1.558380126953125, 1.63287353515625, 1.707366943359375, 1.7818603515625, 1.856353759765625, 1.93084716796875, 2.005340576171875, 2.079833984375, 2.154327392578125, 2.22882080078125, 2.303314208984375, 2.3778076171875, 2.452301025390625, 2.52679443359375, 2.601287841796875, 2.67578125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 0.0, 3.0, 7.0, 4.0, 9.0, 26.0, 23.0, 35.0, 47.0, 83.0, 111.0, 188.0, 353.0, 665.0, 1123.0, 2273.0, 4952.0, 10960.0, 25531.0, 120099.0, 812498.0, 39406.0, 15993.0, 7293.0, 3283.0, 1616.0, 829.0, 492.0, 229.0, 147.0, 98.0, 69.0, 37.0, 28.0, 7.0, 19.0, 7.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.196533203125, -0.18957138061523438, -0.18260955810546875, -0.17564773559570312, -0.1686859130859375, -0.16172409057617188, -0.15476226806640625, -0.14780044555664062, -0.140838623046875, -0.13387680053710938, -0.12691497802734375, -0.11995315551757812, -0.1129913330078125, -0.10602951049804688, -0.09906768798828125, -0.09210586547851562, -0.08514404296875, -0.07818222045898438, -0.07122039794921875, -0.06425857543945312, -0.0572967529296875, -0.050334930419921875, -0.04337310791015625, -0.036411285400390625, -0.029449462890625, -0.022487640380859375, -0.01552581787109375, -0.008563995361328125, -0.0016021728515625, 0.005359649658203125, 0.01232147216796875, 0.019283294677734375, 0.0262451171875, 0.033206939697265625, 0.04016876220703125, 0.047130584716796875, 0.0540924072265625, 0.061054229736328125, 0.06801605224609375, 0.07497787475585938, 0.081939697265625, 0.08890151977539062, 0.09586334228515625, 0.10282516479492188, 0.1097869873046875, 0.11674880981445312, 0.12371063232421875, 0.13067245483398438, 0.13763427734375, 0.14459609985351562, 0.15155792236328125, 0.15851974487304688, 0.1654815673828125, 0.17244338989257812, 0.17940521240234375, 0.18636703491210938, 0.193328857421875, 0.20029067993164062, 0.20725250244140625, 0.21421432495117188, 0.2211761474609375, 0.22813796997070312, 0.23509979248046875, 0.24206161499023438, 0.2490234375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 9.0, 6.0, 16.0, 9.0, 15.0, 19.0, 20.0, 23.0, 48.0, 41.0, 68.0, 48.0, 50.0, 56.0, 79.0, 62.0, 53.0, 59.0, 44.0, 57.0, 31.0, 47.0, 30.0, 30.0, 20.0, 20.0, 9.0, 11.0, 12.0, 11.0, 5.0, 5.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.64267349243164e-06, -8.373521268367767e-06, -8.104369044303894e-06, -7.83521682024002e-06, -7.5660645961761475e-06, -7.296912372112274e-06, -7.027760148048401e-06, -6.758607923984528e-06, -6.489455699920654e-06, -6.220303475856781e-06, -5.951151251792908e-06, -5.6819990277290344e-06, -5.412846803665161e-06, -5.143694579601288e-06, -4.8745423555374146e-06, -4.605390131473541e-06, -4.336237907409668e-06, -4.067085683345795e-06, -3.7979334592819214e-06, -3.528781235218048e-06, -3.259629011154175e-06, -2.9904767870903015e-06, -2.7213245630264282e-06, -2.452172338962555e-06, -2.1830201148986816e-06, -1.9138678908348083e-06, -1.644715666770935e-06, -1.3755634427070618e-06, -1.1064112186431885e-06, -8.372589945793152e-07, -5.681067705154419e-07, -2.989545464515686e-07, -2.9802322387695312e-08, 2.39349901676178e-07, 5.085021257400513e-07, 7.776543498039246e-07, 1.0468065738677979e-06, 1.3159587979316711e-06, 1.5851110219955444e-06, 1.8542632460594177e-06, 2.123415470123291e-06, 2.3925676941871643e-06, 2.6617199182510376e-06, 2.930872142314911e-06, 3.200024366378784e-06, 3.4691765904426575e-06, 3.7383288145065308e-06, 4.007481038570404e-06, 4.276633262634277e-06, 4.545785486698151e-06, 4.814937710762024e-06, 5.084089934825897e-06, 5.3532421588897705e-06, 5.622394382953644e-06, 5.891546607017517e-06, 6.16069883108139e-06, 6.429851055145264e-06, 6.699003279209137e-06, 6.96815550327301e-06, 7.2373077273368835e-06, 7.506459951400757e-06, 7.77561217546463e-06, 8.044764399528503e-06, 8.313916623592377e-06, 8.58306884765625e-06]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 8.0, 6.0, 17.0, 16.0, 26.0, 41.0, 63.0, 136.0, 167.0, 274.0, 412.0, 624.0, 939.0, 1430.0, 2210.0, 3469.0, 5151.0, 8028.0, 12234.0, 18701.0, 28454.0, 42938.0, 65823.0, 98607.0, 140992.0, 166971.0, 145875.0, 103678.0, 69341.0, 45796.0, 29441.0, 19333.0, 13134.0, 8453.0, 5591.0, 3529.0, 2248.0, 1495.0, 984.0, 642.0, 439.0, 293.0, 196.0, 122.0, 77.0, 54.0, 35.0, 26.0, 11.0, 9.0, 8.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.11199951171875, -0.10845088958740234, -0.10490226745605469, -0.10135364532470703, -0.09780502319335938, -0.09425640106201172, -0.09070777893066406, -0.0871591567993164, -0.08361053466796875, -0.0800619125366211, -0.07651329040527344, -0.07296466827392578, -0.06941604614257812, -0.06586742401123047, -0.06231880187988281, -0.058770179748535156, -0.0552215576171875, -0.051672935485839844, -0.04812431335449219, -0.04457569122314453, -0.041027069091796875, -0.03747844696044922, -0.03392982482910156, -0.030381202697753906, -0.02683258056640625, -0.023283958435058594, -0.019735336303710938, -0.01618671417236328, -0.012638092041015625, -0.009089469909667969, -0.0055408477783203125, -0.0019922256469726562, 0.001556396484375, 0.005105018615722656, 0.008653640747070312, 0.012202262878417969, 0.015750885009765625, 0.01929950714111328, 0.022848129272460938, 0.026396751403808594, 0.02994537353515625, 0.033493995666503906, 0.03704261779785156, 0.04059123992919922, 0.044139862060546875, 0.04768848419189453, 0.05123710632324219, 0.054785728454589844, 0.0583343505859375, 0.061882972717285156, 0.06543159484863281, 0.06898021697998047, 0.07252883911132812, 0.07607746124267578, 0.07962608337402344, 0.0831747055053711, 0.08672332763671875, 0.0902719497680664, 0.09382057189941406, 0.09736919403076172, 0.10091781616210938, 0.10446643829345703, 0.10801506042480469, 0.11156368255615234, 0.1151123046875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 4.0, 3.0, 4.0, 2.0, 6.0, 1.0, 7.0, 17.0, 14.0, 25.0, 19.0, 20.0, 29.0, 28.0, 32.0, 43.0, 49.0, 58.0, 62.0, 59.0, 59.0, 68.0, 74.0, 60.0, 47.0, 36.0, 29.0, 42.0, 17.0, 18.0, 21.0, 14.0, 10.0, 7.0, 8.0, 1.0, 8.0, 1.0, 2.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.056793212890625, -0.05508756637573242, -0.053381919860839844, -0.051676273345947266, -0.04997062683105469, -0.04826498031616211, -0.04655933380126953, -0.04485368728637695, -0.043148040771484375, -0.0414423942565918, -0.03973674774169922, -0.03803110122680664, -0.03632545471191406, -0.034619808197021484, -0.032914161682128906, -0.031208515167236328, -0.02950286865234375, -0.027797222137451172, -0.026091575622558594, -0.024385929107666016, -0.022680282592773438, -0.02097463607788086, -0.01926898956298828, -0.017563343048095703, -0.015857696533203125, -0.014152050018310547, -0.012446403503417969, -0.01074075698852539, -0.009035110473632812, -0.007329463958740234, -0.005623817443847656, -0.003918170928955078, -0.0022125244140625, -0.0005068778991699219, 0.0011987686157226562, 0.0029044151306152344, 0.0046100616455078125, 0.006315708160400391, 0.008021354675292969, 0.009727001190185547, 0.011432647705078125, 0.013138294219970703, 0.014843940734863281, 0.01654958724975586, 0.018255233764648438, 0.019960880279541016, 0.021666526794433594, 0.023372173309326172, 0.02507781982421875, 0.026783466339111328, 0.028489112854003906, 0.030194759368896484, 0.03190040588378906, 0.03360605239868164, 0.03531169891357422, 0.0370173454284668, 0.038722991943359375, 0.04042863845825195, 0.04213428497314453, 0.04383993148803711, 0.04554557800292969, 0.047251224517822266, 0.048956871032714844, 0.05066251754760742, 0.0523681640625]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 8.0, 8.0, 7.0, 13.0, 18.0, 16.0, 15.0, 18.0, 26.0, 25.0, 32.0, 35.0, 28.0, 35.0, 38.0, 40.0, 39.0, 41.0, 41.0, 39.0, 44.0, 48.0, 41.0, 43.0, 42.0, 23.0, 37.0, 35.0, 23.0, 31.0, 17.0, 12.0, 12.0, 12.0, 13.0, 8.0, 9.0, 9.0, 5.0, 7.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-3.2060248851776123, -3.1178689002990723, -3.0297129154205322, -2.9415571689605713, -2.8534011840820312, -2.765245199203491, -2.677089214324951, -2.5889334678649902, -2.50077748298645, -2.41262149810791, -2.32446551322937, -2.236309766769409, -2.148153781890869, -2.059997797012329, -1.971841812133789, -1.8836859464645386, -1.7955299615859985, -1.7073739767074585, -1.619218111038208, -1.531062126159668, -1.4429062604904175, -1.3547502756118774, -1.266594409942627, -1.178438425064087, -1.0902824401855469, -1.0021264553070068, -0.9139705896377563, -0.8258146047592163, -0.7376587390899658, -0.6495027542114258, -0.5613468289375305, -0.47319090366363525, -0.38503503799438477, -0.2968791127204895, -0.20872317254543304, -0.12056723237037659, -0.03241130709648132, 0.05574461817741394, 0.1439005732536316, 0.23205649852752686, 0.3202124238014221, 0.4083683490753174, 0.49652427434921265, 0.5846801996231079, 0.672836184501648, 0.7609920501708984, 0.8491480350494385, 0.9373039603233337, 1.025459885597229, 1.113615870475769, 1.2017717361450195, 1.2899277210235596, 1.37808358669281, 1.46623957157135, 1.5543954372406006, 1.6425514221191406, 1.7307074069976807, 1.8188633918762207, 1.9070192575454712, 1.9951752424240112, 2.0833311080932617, 2.1714870929718018, 2.259643077850342, 2.3477988243103027, 2.4359548091888428]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 9.0, 3.0, 2.0, 6.0, 10.0, 7.0, 12.0, 8.0, 13.0, 13.0, 15.0, 15.0, 27.0, 21.0, 17.0, 25.0, 34.0, 36.0, 38.0, 32.0, 30.0, 45.0, 34.0, 25.0, 40.0, 41.0, 36.0, 40.0, 43.0, 37.0, 43.0, 31.0, 30.0, 21.0, 28.0, 13.0, 22.0, 16.0, 10.0, 16.0, 12.0, 9.0, 11.0, 4.0, 2.0, 5.0, 2.0, 3.0, 7.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-2.889296293258667, -2.7994768619537354, -2.7096571922302246, -2.619837760925293, -2.5300183296203613, -2.4401988983154297, -2.350379228591919, -2.2605597972869873, -2.1707401275634766, -2.080920696258545, -1.9911011457443237, -1.9012815952301025, -1.811462163925171, -1.7216426134109497, -1.6318230628967285, -1.5420036315917969, -1.4521842002868652, -1.362364649772644, -1.2725452184677124, -1.1827256679534912, -1.0929062366485596, -1.0030866861343384, -0.9132671356201172, -0.8234476447105408, -0.7336281538009644, -0.6438086628913879, -0.5539891719818115, -0.46416962146759033, -0.3743501305580139, -0.2845306396484375, -0.1947110891342163, -0.10489159822463989, -0.015072107315063477, 0.07474739849567413, 0.16456690430641174, 0.25438642501831055, 0.34420591592788696, 0.4340254068374634, 0.5238449573516846, 0.613664448261261, 0.7034839391708374, 0.7933034300804138, 0.8831229209899902, 0.9729424715042114, 1.0627620220184326, 1.1525814533233643, 1.2424010038375854, 1.3322205543518066, 1.4220399856567383, 1.5118595361709595, 1.6016789674758911, 1.6914985179901123, 1.781317949295044, 1.8711374998092651, 1.9609570503234863, 2.050776481628418, 2.1405959129333496, 2.2304153442382812, 2.320235013961792, 2.4100544452667236, 2.4998738765716553, 2.589693546295166, 2.6795129776000977, 2.7693324089050293, 2.85915207862854]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 8.0, 7.0, 15.0, 22.0, 31.0, 61.0, 93.0, 131.0, 192.0, 368.0, 526.0, 889.0, 1463.0, 2423.0, 4079.0, 6518.0, 10578.0, 16701.0, 25341.0, 38160.0, 55041.0, 73009.0, 92736.0, 107830.0, 115988.0, 113222.0, 101614.0, 83342.0, 64220.0, 46331.0, 31785.0, 20837.0, 13406.0, 8508.0, 5086.0, 3108.0, 1880.0, 1192.0, 689.0, 443.0, 258.0, 177.0, 94.0, 64.0, 31.0, 28.0, 12.0, 7.0, 9.0, 6.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.830078125, -1.7742156982421875, -1.718353271484375, -1.6624908447265625, -1.60662841796875, -1.5507659912109375, -1.494903564453125, -1.4390411376953125, -1.3831787109375, -1.3273162841796875, -1.271453857421875, -1.2155914306640625, -1.15972900390625, -1.1038665771484375, -1.048004150390625, -0.9921417236328125, -0.936279296875, -0.8804168701171875, -0.824554443359375, -0.7686920166015625, -0.71282958984375, -0.6569671630859375, -0.601104736328125, -0.5452423095703125, -0.4893798828125, -0.4335174560546875, -0.377655029296875, -0.3217926025390625, -0.26593017578125, -0.2100677490234375, -0.154205322265625, -0.0983428955078125, -0.04248046875, 0.0133819580078125, 0.069244384765625, 0.1251068115234375, 0.18096923828125, 0.2368316650390625, 0.292694091796875, 0.3485565185546875, 0.4044189453125, 0.4602813720703125, 0.516143798828125, 0.5720062255859375, 0.62786865234375, 0.6837310791015625, 0.739593505859375, 0.7954559326171875, 0.851318359375, 0.9071807861328125, 0.963043212890625, 1.0189056396484375, 1.07476806640625, 1.1306304931640625, 1.186492919921875, 1.2423553466796875, 1.2982177734375, 1.3540802001953125, 1.409942626953125, 1.4658050537109375, 1.52166748046875, 1.5775299072265625, 1.633392333984375, 1.6892547607421875, 1.7451171875]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 2.0, 5.0, 1.0, 4.0, 7.0, 7.0, 9.0, 10.0, 15.0, 11.0, 11.0, 11.0, 13.0, 14.0, 23.0, 23.0, 32.0, 32.0, 30.0, 47.0, 33.0, 32.0, 36.0, 38.0, 35.0, 35.0, 32.0, 40.0, 39.0, 44.0, 36.0, 37.0, 18.0, 35.0, 36.0, 19.0, 20.0, 28.0, 20.0, 14.0, 9.0, 9.0, 11.0, 11.0, 6.0, 5.0, 7.0, 3.0, 3.0, 3.0, 3.0, 3.0, 3.0, 0.0, 2.0, 2.0], "bins": [-2.90625, -2.819091796875, -2.73193359375, -2.644775390625, -2.5576171875, -2.470458984375, -2.38330078125, -2.296142578125, -2.208984375, -2.121826171875, -2.03466796875, -1.947509765625, -1.8603515625, -1.773193359375, -1.68603515625, -1.598876953125, -1.51171875, -1.424560546875, -1.33740234375, -1.250244140625, -1.1630859375, -1.075927734375, -0.98876953125, -0.901611328125, -0.814453125, -0.727294921875, -0.64013671875, -0.552978515625, -0.4658203125, -0.378662109375, -0.29150390625, -0.204345703125, -0.1171875, -0.030029296875, 0.05712890625, 0.144287109375, 0.2314453125, 0.318603515625, 0.40576171875, 0.492919921875, 0.580078125, 0.667236328125, 0.75439453125, 0.841552734375, 0.9287109375, 1.015869140625, 1.10302734375, 1.190185546875, 1.27734375, 1.364501953125, 1.45166015625, 1.538818359375, 1.6259765625, 1.713134765625, 1.80029296875, 1.887451171875, 1.974609375, 2.061767578125, 2.14892578125, 2.236083984375, 2.3232421875, 2.410400390625, 2.49755859375, 2.584716796875, 2.671875]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 6.0, 9.0, 12.0, 19.0, 37.0, 27.0, 54.0, 103.0, 137.0, 198.0, 433.0, 608.0, 1019.0, 1625.0, 2822.0, 4776.0, 7733.0, 12609.0, 20563.0, 32721.0, 49823.0, 72416.0, 97059.0, 117344.0, 129252.0, 125953.0, 109994.0, 86592.0, 62173.0, 42034.0, 27201.0, 16969.0, 10320.0, 6306.0, 3794.0, 2260.0, 1396.0, 812.0, 502.0, 279.0, 184.0, 142.0, 76.0, 64.0, 28.0, 20.0, 23.0, 12.0, 7.0, 8.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.384765625, -2.312042236328125, -2.23931884765625, -2.166595458984375, -2.0938720703125, -2.021148681640625, -1.94842529296875, -1.875701904296875, -1.802978515625, -1.730255126953125, -1.65753173828125, -1.584808349609375, -1.5120849609375, -1.439361572265625, -1.36663818359375, -1.293914794921875, -1.22119140625, -1.148468017578125, -1.07574462890625, -1.003021240234375, -0.9302978515625, -0.857574462890625, -0.78485107421875, -0.712127685546875, -0.639404296875, -0.566680908203125, -0.49395751953125, -0.421234130859375, -0.3485107421875, -0.275787353515625, -0.20306396484375, -0.130340576171875, -0.0576171875, 0.015106201171875, 0.08782958984375, 0.160552978515625, 0.2332763671875, 0.305999755859375, 0.37872314453125, 0.451446533203125, 0.524169921875, 0.596893310546875, 0.66961669921875, 0.742340087890625, 0.8150634765625, 0.887786865234375, 0.96051025390625, 1.033233642578125, 1.10595703125, 1.178680419921875, 1.25140380859375, 1.324127197265625, 1.3968505859375, 1.469573974609375, 1.54229736328125, 1.615020751953125, 1.687744140625, 1.760467529296875, 1.83319091796875, 1.905914306640625, 1.9786376953125, 2.051361083984375, 2.12408447265625, 2.196807861328125, 2.26953125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 5.0, 2.0, 4.0, 4.0, 4.0, 6.0, 7.0, 8.0, 9.0, 8.0, 13.0, 14.0, 21.0, 21.0, 20.0, 20.0, 24.0, 25.0, 22.0, 27.0, 22.0, 30.0, 27.0, 40.0, 27.0, 27.0, 38.0, 37.0, 31.0, 34.0, 34.0, 34.0, 34.0, 35.0, 34.0, 33.0, 25.0, 28.0, 17.0, 22.0, 23.0, 24.0, 24.0, 9.0, 12.0, 7.0, 12.0, 9.0, 6.0, 5.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 4.0], "bins": [-1.828125, -1.7725067138671875, -1.716888427734375, -1.6612701416015625, -1.60565185546875, -1.5500335693359375, -1.494415283203125, -1.4387969970703125, -1.3831787109375, -1.3275604248046875, -1.271942138671875, -1.2163238525390625, -1.16070556640625, -1.1050872802734375, -1.049468994140625, -0.9938507080078125, -0.938232421875, -0.8826141357421875, -0.826995849609375, -0.7713775634765625, -0.71575927734375, -0.6601409912109375, -0.604522705078125, -0.5489044189453125, -0.4932861328125, -0.4376678466796875, -0.382049560546875, -0.3264312744140625, -0.27081298828125, -0.2151947021484375, -0.159576416015625, -0.1039581298828125, -0.04833984375, 0.0072784423828125, 0.062896728515625, 0.1185150146484375, 0.17413330078125, 0.2297515869140625, 0.285369873046875, 0.3409881591796875, 0.3966064453125, 0.4522247314453125, 0.507843017578125, 0.5634613037109375, 0.61907958984375, 0.6746978759765625, 0.730316162109375, 0.7859344482421875, 0.841552734375, 0.8971710205078125, 0.952789306640625, 1.0084075927734375, 1.06402587890625, 1.1196441650390625, 1.175262451171875, 1.2308807373046875, 1.2864990234375, 1.3421173095703125, 1.397735595703125, 1.4533538818359375, 1.50897216796875, 1.5645904541015625, 1.620208740234375, 1.6758270263671875, 1.7314453125]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 6.0, 4.0, 2.0, 14.0, 16.0, 20.0, 28.0, 45.0, 50.0, 104.0, 168.0, 247.0, 390.0, 598.0, 931.0, 1410.0, 2425.0, 4102.0, 7358.0, 13140.0, 24064.0, 42508.0, 70913.0, 107746.0, 143779.0, 161609.0, 150870.0, 119354.0, 81516.0, 49835.0, 28635.0, 15505.0, 8801.0, 4873.0, 2902.0, 1669.0, 1056.0, 669.0, 403.0, 265.0, 168.0, 110.0, 96.0, 43.0, 34.0, 26.0, 15.0, 12.0, 9.0, 6.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.3603515625, -1.3173675537109375, -1.274383544921875, -1.2313995361328125, -1.18841552734375, -1.1454315185546875, -1.102447509765625, -1.0594635009765625, -1.0164794921875, -0.9734954833984375, -0.930511474609375, -0.8875274658203125, -0.84454345703125, -0.8015594482421875, -0.758575439453125, -0.7155914306640625, -0.672607421875, -0.6296234130859375, -0.586639404296875, -0.5436553955078125, -0.50067138671875, -0.4576873779296875, -0.414703369140625, -0.3717193603515625, -0.3287353515625, -0.2857513427734375, -0.242767333984375, -0.1997833251953125, -0.15679931640625, -0.1138153076171875, -0.070831298828125, -0.0278472900390625, 0.01513671875, 0.0581207275390625, 0.101104736328125, 0.1440887451171875, 0.18707275390625, 0.2300567626953125, 0.273040771484375, 0.3160247802734375, 0.3590087890625, 0.4019927978515625, 0.444976806640625, 0.4879608154296875, 0.53094482421875, 0.5739288330078125, 0.616912841796875, 0.6598968505859375, 0.702880859375, 0.7458648681640625, 0.788848876953125, 0.8318328857421875, 0.87481689453125, 0.9178009033203125, 0.960784912109375, 1.0037689208984375, 1.0467529296875, 1.0897369384765625, 1.132720947265625, 1.1757049560546875, 1.21868896484375, 1.2616729736328125, 1.304656982421875, 1.3476409912109375, 1.390625]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 4.0, 6.0, 5.0, 6.0, 10.0, 12.0, 9.0, 21.0, 24.0, 33.0, 38.0, 45.0, 52.0, 60.0, 54.0, 64.0, 68.0, 67.0, 59.0, 73.0, 65.0, 40.0, 39.0, 39.0, 14.0, 31.0, 16.0, 19.0, 7.0, 14.0, 1.0, 5.0, 0.0, 2.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020051002502441406, -0.00019547995179891586, -0.00019044987857341766, -0.00018541980534791946, -0.00018038973212242126, -0.00017535965889692307, -0.00017032958567142487, -0.00016529951244592667, -0.00016026943922042847, -0.00015523936599493027, -0.00015020929276943207, -0.00014517921954393387, -0.00014014914631843567, -0.00013511907309293747, -0.00013008899986743927, -0.00012505892664194107, -0.00012002885341644287, -0.00011499878019094467, -0.00010996870696544647, -0.00010493863373994827, -9.990856051445007e-05, -9.487848728895187e-05, -8.984841406345367e-05, -8.481834083795547e-05, -7.978826761245728e-05, -7.475819438695908e-05, -6.972812116146088e-05, -6.469804793596268e-05, -5.966797471046448e-05, -5.463790148496628e-05, -4.960782825946808e-05, -4.457775503396988e-05, -3.954768180847168e-05, -3.451760858297348e-05, -2.948753535747528e-05, -2.445746213197708e-05, -1.9427388906478882e-05, -1.4397315680980682e-05, -9.367242455482483e-06, -4.3371692299842834e-06, 6.92903995513916e-07, 5.7229772210121155e-06, 1.0753050446510315e-05, 1.5783123672008514e-05, 2.0813196897506714e-05, 2.5843270123004913e-05, 3.087334334850311e-05, 3.590341657400131e-05, 4.093348979949951e-05, 4.596356302499771e-05, 5.099363625049591e-05, 5.602370947599411e-05, 6.105378270149231e-05, 6.608385592699051e-05, 7.111392915248871e-05, 7.614400237798691e-05, 8.117407560348511e-05, 8.620414882898331e-05, 9.12342220544815e-05, 9.62642952799797e-05, 0.0001012943685054779, 0.0001063244417309761, 0.0001113545149564743, 0.0001163845881819725, 0.0001214146614074707]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 6.0, 2.0, 6.0, 11.0, 21.0, 29.0, 45.0, 65.0, 99.0, 139.0, 240.0, 394.0, 586.0, 991.0, 1752.0, 3066.0, 5377.0, 10089.0, 18016.0, 33076.0, 56919.0, 90932.0, 129751.0, 158794.0, 160409.0, 135782.0, 97859.0, 62150.0, 36379.0, 20418.0, 11069.0, 5990.0, 3314.0, 1860.0, 1084.0, 724.0, 385.0, 263.0, 162.0, 105.0, 66.0, 51.0, 31.0, 22.0, 12.0, 12.0, 4.0, 3.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.37890625, -1.3345489501953125, -1.290191650390625, -1.2458343505859375, -1.20147705078125, -1.1571197509765625, -1.112762451171875, -1.0684051513671875, -1.0240478515625, -0.9796905517578125, -0.935333251953125, -0.8909759521484375, -0.84661865234375, -0.8022613525390625, -0.757904052734375, -0.7135467529296875, -0.669189453125, -0.6248321533203125, -0.580474853515625, -0.5361175537109375, -0.49176025390625, -0.4474029541015625, -0.403045654296875, -0.3586883544921875, -0.3143310546875, -0.2699737548828125, -0.225616455078125, -0.1812591552734375, -0.13690185546875, -0.0925445556640625, -0.048187255859375, -0.0038299560546875, 0.04052734375, 0.0848846435546875, 0.129241943359375, 0.1735992431640625, 0.21795654296875, 0.2623138427734375, 0.306671142578125, 0.3510284423828125, 0.3953857421875, 0.4397430419921875, 0.484100341796875, 0.5284576416015625, 0.57281494140625, 0.6171722412109375, 0.661529541015625, 0.7058868408203125, 0.750244140625, 0.7946014404296875, 0.838958740234375, 0.8833160400390625, 0.92767333984375, 0.9720306396484375, 1.016387939453125, 1.0607452392578125, 1.1051025390625, 1.1494598388671875, 1.193817138671875, 1.2381744384765625, 1.28253173828125, 1.3268890380859375, 1.371246337890625, 1.4156036376953125, 1.4599609375]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 4.0, 7.0, 7.0, 12.0, 8.0, 13.0, 7.0, 23.0, 20.0, 27.0, 25.0, 25.0, 33.0, 39.0, 54.0, 49.0, 50.0, 46.0, 56.0, 52.0, 78.0, 44.0, 47.0, 44.0, 32.0, 33.0, 29.0, 28.0, 31.0, 24.0, 15.0, 15.0, 9.0, 4.0, 6.0, 5.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.454345703125, -0.4378852844238281, -0.42142486572265625, -0.4049644470214844, -0.3885040283203125, -0.3720436096191406, -0.35558319091796875, -0.3391227722167969, -0.322662353515625, -0.3062019348144531, -0.28974151611328125, -0.2732810974121094, -0.2568206787109375, -0.24036026000976562, -0.22389984130859375, -0.20743942260742188, -0.19097900390625, -0.17451858520507812, -0.15805816650390625, -0.14159774780273438, -0.1251373291015625, -0.10867691040039062, -0.09221649169921875, -0.07575607299804688, -0.059295654296875, -0.042835235595703125, -0.02637481689453125, -0.009914398193359375, 0.0065460205078125, 0.023006439208984375, 0.03946685791015625, 0.055927276611328125, 0.0723876953125, 0.08884811401367188, 0.10530853271484375, 0.12176895141601562, 0.1382293701171875, 0.15468978881835938, 0.17115020751953125, 0.18761062622070312, 0.204071044921875, 0.22053146362304688, 0.23699188232421875, 0.2534523010253906, 0.2699127197265625, 0.2863731384277344, 0.30283355712890625, 0.3192939758300781, 0.33575439453125, 0.3522148132324219, 0.36867523193359375, 0.3851356506347656, 0.4015960693359375, 0.4180564880371094, 0.43451690673828125, 0.4509773254394531, 0.467437744140625, 0.4838981628417969, 0.5003585815429688, 0.5168190002441406, 0.5332794189453125, 0.5497398376464844, 0.5662002563476562, 0.5826606750488281, 0.59912109375]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 6.0, 11.0, 19.0, 16.0, 24.0, 26.0, 31.0, 24.0, 25.0, 31.0, 33.0, 46.0, 34.0, 47.0, 47.0, 61.0, 46.0, 49.0, 46.0, 32.0, 53.0, 38.0, 29.0, 32.0, 29.0, 30.0, 22.0, 19.0, 9.0, 17.0, 11.0, 14.0, 10.0, 8.0, 6.0, 3.0, 4.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.332444906234741, -3.2350804805755615, -3.1377158164978027, -3.040351390838623, -2.9429869651794434, -2.8456223011016846, -2.748257875442505, -2.650893211364746, -2.5535287857055664, -2.4561643600463867, -2.358799695968628, -2.2614352703094482, -2.1640708446502686, -2.0667061805725098, -1.96934175491333, -1.8719772100448608, -1.7746127843856812, -1.677248239517212, -1.5798838138580322, -1.482519268989563, -1.3851547241210938, -1.287790298461914, -1.1904257535934448, -1.0930612087249756, -0.9956967234611511, -0.8983322381973267, -0.8009676933288574, -0.703603208065033, -0.6062387228012085, -0.5088741779327393, -0.4115096926689148, -0.31414514780044556, -0.2167806625366211, -0.11941615492105484, -0.022051647305488586, 0.07531285285949707, 0.17267736792564392, 0.27004188299179077, 0.36740636825561523, 0.4647709131240845, 0.5621353983879089, 0.6594998836517334, 0.7568644285202026, 0.8542289137840271, 0.9515933990478516, 1.0489579439163208, 1.14632248878479, 1.2436869144439697, 1.341051459312439, 1.4384160041809082, 1.535780429840088, 1.6331449747085571, 1.7305095195770264, 1.827873945236206, 1.9252384901046753, 2.0226030349731445, 2.119967460632324, 2.217331886291504, 2.3146965503692627, 2.4120609760284424, 2.509425401687622, 2.606790065765381, 2.7041544914245605, 2.8015189170837402, 2.898883581161499]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 2.0, 3.0, 5.0, 4.0, 6.0, 6.0, 8.0, 13.0, 15.0, 23.0, 14.0, 12.0, 18.0, 31.0, 29.0, 31.0, 25.0, 31.0, 37.0, 39.0, 42.0, 41.0, 51.0, 38.0, 48.0, 35.0, 34.0, 36.0, 37.0, 25.0, 19.0, 36.0, 24.0, 22.0, 35.0, 27.0, 16.0, 23.0, 10.0, 17.0, 6.0, 4.0, 8.0, 4.0, 4.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0], "bins": [-3.7193801403045654, -3.612565279006958, -3.5057501792907715, -3.398935317993164, -3.2921204566955566, -3.185305595397949, -3.078490734100342, -2.9716756343841553, -2.864860773086548, -2.7580459117889404, -2.651230812072754, -2.5444159507751465, -2.437601089477539, -2.3307862281799316, -2.223971366882324, -2.1171562671661377, -2.0103414058685303, -1.9035265445709229, -1.7967115640640259, -1.689896583557129, -1.5830817222595215, -1.476266860961914, -1.369451880455017, -1.2626368999481201, -1.1558220386505127, -1.0490071773529053, -0.9421921968460083, -0.8353772759437561, -0.7285623550415039, -0.6217474341392517, -0.5149325132369995, -0.4081175923347473, -0.3013026714324951, -0.19448775053024292, -0.08767282962799072, 0.019142091274261475, 0.12595701217651367, 0.23277193307876587, 0.33958685398101807, 0.44640177488327026, 0.5532166957855225, 0.6600316166877747, 0.7668465375900269, 0.873661458492279, 0.9804763793945312, 1.0872912406921387, 1.1941062211990356, 1.3009212017059326, 1.40773606300354, 1.5145509243011475, 1.6213659048080444, 1.7281808853149414, 1.8349957466125488, 1.9418106079101562, 2.0486254692077637, 2.15544056892395, 2.2622554302215576, 2.369070291519165, 2.4758853912353516, 2.582700252532959, 2.6895151138305664, 2.796329975128174, 2.9031448364257812, 3.0099599361419678, 3.116774797439575]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 7.0, 11.0, 14.0, 8.0, 18.0, 29.0, 29.0, 47.0, 55.0, 70.0, 84.0, 124.0, 176.0, 228.0, 270.0, 353.0, 491.0, 652.0, 896.0, 1303.0, 2024.0, 3214.0, 4679.0, 1012691.0, 8707.0, 4696.0, 3050.0, 1932.0, 1295.0, 901.0, 624.0, 463.0, 328.0, 238.0, 213.0, 180.0, 123.0, 86.0, 66.0, 57.0, 54.0, 30.0, 22.0, 12.0, 14.0, 7.0, 7.0, 11.0, 10.0, 7.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.585060119628906, -32.50035858154297, -31.415658950805664, -30.330957412719727, -29.246257781982422, -28.161556243896484, -27.076854705810547, -25.99215316772461, -24.907453536987305, -23.822751998901367, -22.738052368164062, -21.653350830078125, -20.568649291992188, -19.483949661254883, -18.399248123168945, -17.31454849243164, -16.229846954345703, -15.145146369934082, -14.060445785522461, -12.975744247436523, -11.891043663024902, -10.806343078613281, -9.721641540527344, -8.636940956115723, -7.552240371704102, -6.4675397872924805, -5.382838726043701, -4.298137664794922, -3.213437080383301, -2.1287364959716797, -1.0440354347229004, 0.040665626525878906, 1.1253700256347656, 2.210070848464966, 3.294771671295166, 4.379472732543945, 5.464173316955566, 6.5488739013671875, 7.633574962615967, 8.718276023864746, 9.802976608276367, 10.887677192687988, 11.97237777709961, 13.057079315185547, 14.141779899597168, 15.226480484008789, 16.311182022094727, 17.39588165283203, 18.48058319091797, 19.565284729003906, 20.64998435974121, 21.73468589782715, 22.819385528564453, 23.90408706665039, 24.988788604736328, 26.073490142822266, 27.15818977355957, 28.242891311645508, 29.327590942382812, 30.41229248046875, 31.496994018554688, 32.581695556640625, 33.6663932800293, 34.751094818115234, 35.83579635620117]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 6.0, 6.0, 12.0, 8.0, 15.0, 26.0, 34.0, 45.0, 73.0, 112.0, 167.0, 251.0, 362.0, 540.0, 814.0, 1219.0, 1864.0, 3126.0, 5898.0, 17159.0, 51365000.0, 54112.0, 9320.0, 4246.0, 2449.0, 1472.0, 932.0, 698.0, 453.0, 327.0, 205.0, 110.0, 88.0, 67.0, 39.0, 31.0, 21.0, 17.0, 7.0, 9.0, 5.0, 6.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-100.8420639038086, -97.9404525756836, -95.0388412475586, -92.1372299194336, -89.23562622070312, -86.33401489257812, -83.43240356445312, -80.53079223632812, -77.62918090820312, -74.72756958007812, -71.82595825195312, -68.92434692382812, -66.02273559570312, -63.12112808227539, -60.219520568847656, -57.317909240722656, -54.416297912597656, -51.514686584472656, -48.613075256347656, -45.71146774291992, -42.80985641479492, -39.90824508666992, -37.00663757324219, -34.10502624511719, -31.203414916992188, -28.301803588867188, -25.40019416809082, -22.498584747314453, -19.596973419189453, -16.695362091064453, -13.793752670288086, -10.892143249511719, -7.9905242919921875, -5.088913917541504, -2.1873035430908203, 0.7143068313598633, 3.615917205810547, 6.5175275802612305, 9.419137954711914, 12.320747375488281, 15.222358703613281, 18.12397003173828, 21.02557945251465, 23.927188873291016, 26.828800201416016, 29.730411529541016, 32.63201904296875, 35.53363037109375, 38.43524169921875, 41.33685302734375, 44.23846435546875, 47.140071868896484, 50.041683197021484, 52.943294525146484, 55.84490203857422, 58.74651336669922, 61.64812469482422, 64.54973602294922, 67.45134735107422, 70.35295867919922, 73.25456237792969, 76.15617370605469, 79.05778503417969, 81.95939636230469, 84.86100769042969]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 2.0, 3.0, 5.0, 2.0, 8.0, 8.0, 5.0, 5.0, 10.0, 7.0, 22.0, 14.0, 20.0, 22.0, 25.0, 39.0, 41.0, 42.0, 54.0, 46.0, 76.0, 71.0, 73.0, 53.0, 66.0, 57.0, 46.0, 45.0, 25.0, 18.0, 14.0, 12.0, 17.0, 11.0, 7.0, 10.0, 8.0, 7.0, 5.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.785274505615234, -43.9940185546875, -42.2027587890625, -40.411502838134766, -38.62024688720703, -36.8289909362793, -35.03773498535156, -33.24647521972656, -31.455219268798828, -29.663963317871094, -27.872705459594727, -26.08144760131836, -24.290191650390625, -22.49893569946289, -20.707677841186523, -18.916419982910156, -17.125164031982422, -15.333907127380371, -13.54265022277832, -11.75139331817627, -9.960136413574219, -8.168879508972168, -6.377622604370117, -4.586365699768066, -2.7951087951660156, -1.0038518905639648, 0.7874050140380859, 2.5786619186401367, 4.3699188232421875, 6.161175727844238, 7.952432632446289, 9.74368953704834, 11.534942626953125, 13.326199531555176, 15.117456436157227, 16.908714294433594, 18.699970245361328, 20.491226196289062, 22.28248405456543, 24.073741912841797, 25.86499786376953, 27.656253814697266, 29.447511672973633, 31.23876953125, 33.030025482177734, 34.82128143310547, 36.61254119873047, 38.4037971496582, 40.19505310058594, 41.98630905151367, 43.777565002441406, 45.568824768066406, 47.36008071899414, 49.151336669921875, 50.942596435546875, 52.73385238647461, 54.525108337402344, 56.31636428833008, 58.10762023925781, 59.89888000488281, 61.69013595581055, 63.48139190673828, 65.27265167236328, 67.06390380859375, 68.85516357421875]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 4.0, 6.0, 8.0, 11.0, 13.0, 10.0, 14.0, 25.0, 17.0, 22.0, 21.0, 26.0, 38.0, 53.0, 64.0, 81.0, 68.0, 74.0, 72.0, 58.0, 43.0, 39.0, 50.0, 21.0, 28.0, 23.0, 22.0, 17.0, 11.0, 12.0, 7.0, 8.0, 11.0, 6.0, 2.0, 2.0, 4.0, 4.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-71.8296127319336, -69.53622436523438, -67.24283599853516, -64.94944763183594, -62.656063079833984, -60.362674713134766, -58.06929016113281, -55.775901794433594, -53.482513427734375, -51.189125061035156, -48.89573669433594, -46.602352142333984, -44.308963775634766, -42.01557540893555, -39.722190856933594, -37.428802490234375, -35.135414123535156, -32.84202575683594, -30.54863929748535, -28.255252838134766, -25.961864471435547, -23.668476104736328, -21.375089645385742, -19.081703186035156, -16.788314819335938, -14.494927406311035, -12.201539993286133, -9.90815258026123, -7.614765167236328, -5.321377754211426, -3.0279903411865234, -0.7346038818359375, 1.5587921142578125, 3.852179527282715, 6.145566940307617, 8.43895435333252, 10.732341766357422, 13.025729179382324, 15.319116592407227, 17.612503051757812, 19.90589141845703, 22.19927978515625, 24.492666244506836, 26.786052703857422, 29.07944107055664, 31.37282943725586, 33.66621398925781, 35.95960235595703, 38.25299072265625, 40.54637908935547, 42.83976745605469, 45.13315200805664, 47.42654037475586, 49.71992874145508, 52.01331329345703, 54.30670166015625, 56.60009002685547, 58.89347839355469, 61.186866760253906, 63.48025131225586, 65.77363586425781, 68.06702423095703, 70.36041259765625, 72.65380096435547, 74.94718933105469]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 4.0, 9.0, 22.0, 28.0, 24.0, 50.0, 68.0, 92.0, 153.0, 227.0, 364.0, 574.0, 836.0, 1418.0, 2298.0, 3831.0, 6481.0, 10984.0, 19054.0, 35694.0, 67903.0, 138862.0, 303686.0, 729133.0, 1695158.0, 639027.0, 273195.0, 127383.0, 62660.0, 32434.0, 17600.0, 9976.0, 5866.0, 3426.0, 2118.0, 1294.0, 861.0, 524.0, 340.0, 232.0, 131.0, 85.0, 64.0, 38.0, 27.0, 21.0, 12.0, 6.0, 5.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.9072265625, -0.8792572021484375, -0.851287841796875, -0.8233184814453125, -0.79534912109375, -0.7673797607421875, -0.739410400390625, -0.7114410400390625, -0.6834716796875, -0.6555023193359375, -0.627532958984375, -0.5995635986328125, -0.57159423828125, -0.5436248779296875, -0.515655517578125, -0.4876861572265625, -0.459716796875, -0.4317474365234375, -0.403778076171875, -0.3758087158203125, -0.34783935546875, -0.3198699951171875, -0.291900634765625, -0.2639312744140625, -0.2359619140625, -0.2079925537109375, -0.180023193359375, -0.1520538330078125, -0.12408447265625, -0.0961151123046875, -0.068145751953125, -0.0401763916015625, -0.01220703125, 0.0157623291015625, 0.043731689453125, 0.0717010498046875, 0.09967041015625, 0.1276397705078125, 0.155609130859375, 0.1835784912109375, 0.2115478515625, 0.2395172119140625, 0.267486572265625, 0.2954559326171875, 0.32342529296875, 0.3513946533203125, 0.379364013671875, 0.4073333740234375, 0.435302734375, 0.4632720947265625, 0.491241455078125, 0.5192108154296875, 0.54718017578125, 0.5751495361328125, 0.603118896484375, 0.6310882568359375, 0.6590576171875, 0.6870269775390625, 0.714996337890625, 0.7429656982421875, 0.77093505859375, 0.7989044189453125, 0.826873779296875, 0.8548431396484375, 0.8828125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 6.0, 4.0, 3.0, 12.0, 8.0, 12.0, 12.0, 23.0, 17.0, 27.0, 29.0, 30.0, 32.0, 46.0, 41.0, 74.0, 61.0, 64.0, 62.0, 48.0, 63.0, 63.0, 37.0, 39.0, 42.0, 20.0, 29.0, 18.0, 17.0, 14.0, 12.0, 5.0, 6.0, 8.0, 5.0, 1.0, 2.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1065673828125, -0.10301971435546875, -0.0994720458984375, -0.09592437744140625, -0.092376708984375, -0.08882904052734375, -0.0852813720703125, -0.08173370361328125, -0.07818603515625, -0.07463836669921875, -0.0710906982421875, -0.06754302978515625, -0.063995361328125, -0.06044769287109375, -0.0569000244140625, -0.05335235595703125, -0.0498046875, -0.04625701904296875, -0.0427093505859375, -0.03916168212890625, -0.035614013671875, -0.03206634521484375, -0.0285186767578125, -0.02497100830078125, -0.02142333984375, -0.01787567138671875, -0.0143280029296875, -0.01078033447265625, -0.007232666015625, -0.00368499755859375, -0.0001373291015625, 0.00341033935546875, 0.0069580078125, 0.01050567626953125, 0.0140533447265625, 0.01760101318359375, 0.021148681640625, 0.02469635009765625, 0.0282440185546875, 0.03179168701171875, 0.03533935546875, 0.03888702392578125, 0.0424346923828125, 0.04598236083984375, 0.049530029296875, 0.05307769775390625, 0.0566253662109375, 0.06017303466796875, 0.063720703125, 0.06726837158203125, 0.0708160400390625, 0.07436370849609375, 0.077911376953125, 0.08145904541015625, 0.0850067138671875, 0.08855438232421875, 0.09210205078125, 0.09564971923828125, 0.0991973876953125, 0.10274505615234375, 0.106292724609375, 0.10984039306640625, 0.1133880615234375, 0.11693572998046875, 0.1204833984375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 8.0, 7.0, 14.0, 28.0, 25.0, 46.0, 94.0, 152.0, 267.0, 640.0, 1350.0, 3433.0, 9784.0, 31683.0, 119044.0, 487176.0, 1902420.0, 1223739.0, 304966.0, 76346.0, 21436.0, 6894.0, 2472.0, 1121.0, 481.0, 285.0, 155.0, 94.0, 35.0, 34.0, 25.0, 15.0, 8.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.95263671875, -0.9195938110351562, -0.8865509033203125, -0.8535079956054688, -0.820465087890625, -0.7874221801757812, -0.7543792724609375, -0.7213363647460938, -0.68829345703125, -0.6552505493164062, -0.6222076416015625, -0.5891647338867188, -0.556121826171875, -0.5230789184570312, -0.4900360107421875, -0.45699310302734375, -0.4239501953125, -0.39090728759765625, -0.3578643798828125, -0.32482147216796875, -0.291778564453125, -0.25873565673828125, -0.2256927490234375, -0.19264984130859375, -0.15960693359375, -0.12656402587890625, -0.0935211181640625, -0.06047821044921875, -0.027435302734375, 0.00560760498046875, 0.0386505126953125, 0.07169342041015625, 0.104736328125, 0.13777923583984375, 0.1708221435546875, 0.20386505126953125, 0.236907958984375, 0.26995086669921875, 0.3029937744140625, 0.33603668212890625, 0.36907958984375, 0.40212249755859375, 0.4351654052734375, 0.46820831298828125, 0.501251220703125, 0.5342941284179688, 0.5673370361328125, 0.6003799438476562, 0.6334228515625, 0.6664657592773438, 0.6995086669921875, 0.7325515747070312, 0.765594482421875, 0.7986373901367188, 0.8316802978515625, 0.8647232055664062, 0.89776611328125, 0.9308090209960938, 0.9638519287109375, 0.9968948364257812, 1.029937744140625, 1.0629806518554688, 1.0960235595703125, 1.1290664672851562, 1.162109375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 6.0, 3.0, 6.0, 9.0, 9.0, 21.0, 19.0, 28.0, 30.0, 34.0, 51.0, 63.0, 87.0, 113.0, 116.0, 155.0, 194.0, 245.0, 300.0, 341.0, 409.0, 308.0, 264.0, 253.0, 204.0, 158.0, 135.0, 126.0, 91.0, 66.0, 62.0, 36.0, 26.0, 26.0, 21.0, 19.0, 13.0, 8.0, 5.0, 4.0, 6.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.26123046875, -0.2534046173095703, -0.24557876586914062, -0.23775291442871094, -0.22992706298828125, -0.22210121154785156, -0.21427536010742188, -0.2064495086669922, -0.1986236572265625, -0.1907978057861328, -0.18297195434570312, -0.17514610290527344, -0.16732025146484375, -0.15949440002441406, -0.15166854858398438, -0.1438426971435547, -0.136016845703125, -0.1281909942626953, -0.12036514282226562, -0.11253929138183594, -0.10471343994140625, -0.09688758850097656, -0.08906173706054688, -0.08123588562011719, -0.0734100341796875, -0.06558418273925781, -0.057758331298828125, -0.04993247985839844, -0.04210662841796875, -0.03428077697753906, -0.026454925537109375, -0.018629074096679688, -0.01080322265625, -0.0029773712158203125, 0.004848480224609375, 0.012674331665039062, 0.02050018310546875, 0.028326034545898438, 0.036151885986328125, 0.04397773742675781, 0.0518035888671875, 0.05962944030761719, 0.06745529174804688, 0.07528114318847656, 0.08310699462890625, 0.09093284606933594, 0.09875869750976562, 0.10658454895019531, 0.114410400390625, 0.12223625183105469, 0.13006210327148438, 0.13788795471191406, 0.14571380615234375, 0.15353965759277344, 0.16136550903320312, 0.1691913604736328, 0.1770172119140625, 0.1848430633544922, 0.19266891479492188, 0.20049476623535156, 0.20832061767578125, 0.21614646911621094, 0.22397232055664062, 0.2317981719970703, 0.2396240234375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 13.0, 15.0, 35.0, 48.0, 84.0, 125.0, 179.0, 144.0, 135.0, 82.0, 59.0, 38.0, 16.0, 14.0, 6.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6010751724243164, -2.4481801986694336, -2.295285224914551, -2.142390251159668, -1.9894952774047852, -1.8366003036499023, -1.6837053298950195, -1.5308103561401367, -1.377915382385254, -1.225020408630371, -1.0721254348754883, -0.9192304611206055, -0.7663354873657227, -0.6134405136108398, -0.46054553985595703, -0.3076505661010742, -0.1547555923461914, -0.0018606185913085938, 0.15103435516357422, 0.30392932891845703, 0.45682430267333984, 0.6097192764282227, 0.7626142501831055, 0.9155092239379883, 1.068404197692871, 1.221299171447754, 1.3741941452026367, 1.5270891189575195, 1.6799840927124023, 1.8328790664672852, 1.985774040222168, 2.138669013977051, 2.2915639877319336, 2.4444589614868164, 2.597353935241699, 2.750248908996582, 2.903143882751465, 3.0560388565063477, 3.2089338302612305, 3.3618288040161133, 3.514723777770996, 3.667618751525879, 3.8205137252807617, 3.9734086990356445, 4.126303672790527, 4.27919864654541, 4.432093620300293, 4.584988594055176, 4.737883567810059, 4.890778541564941, 5.043673515319824, 5.196568489074707, 5.34946346282959, 5.502358436584473, 5.6552534103393555, 5.808148384094238, 5.961043357849121, 6.113938331604004, 6.266833305358887, 6.4197282791137695, 6.572623252868652, 6.725518226623535, 6.878413200378418, 7.031308174133301, 7.184203147888184]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 5.0, 6.0, 12.0, 14.0, 7.0, 23.0, 27.0, 20.0, 27.0, 31.0, 40.0, 42.0, 43.0, 55.0, 47.0, 52.0, 43.0, 42.0, 51.0, 50.0, 39.0, 37.0, 47.0, 43.0, 26.0, 28.0, 24.0, 28.0, 17.0, 19.0, 14.0, 14.0, 9.0, 7.0, 4.0, 4.0, 7.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7236855030059814, -1.6671802997589111, -1.6106750965118408, -1.554169774055481, -1.4976645708084106, -1.4411593675613403, -1.38465416431427, -1.3281488418579102, -1.2716436386108398, -1.2151384353637695, -1.1586332321166992, -1.1021279096603394, -1.045622706413269, -0.9891175031661987, -0.9326122999191284, -0.8761070370674133, -0.819601833820343, -0.7630966305732727, -0.7065913677215576, -0.6500861644744873, -0.5935809016227722, -0.5370756983757019, -0.4805704653263092, -0.4240652322769165, -0.3675599992275238, -0.3110547661781311, -0.2545495331287384, -0.1980443149805069, -0.1415390819311142, -0.08503386378288269, -0.02852863073348999, 0.02797660231590271, 0.08448183536529541, 0.1409870684146881, 0.1974923014640808, 0.2539975047111511, 0.3105027675628662, 0.3670079708099365, 0.4235132038593292, 0.4800184369087219, 0.536523699760437, 0.5930289030075073, 0.6495341658592224, 0.7060393691062927, 0.7625446319580078, 0.8190498352050781, 0.8755550384521484, 0.9320603013038635, 0.9885655045509338, 1.045070767402649, 1.1015759706497192, 1.1580811738967896, 1.2145863771438599, 1.2710916996002197, 1.32759690284729, 1.3841021060943604, 1.4406073093414307, 1.497112512588501, 1.5536177158355713, 1.6101230382919312, 1.6666282415390015, 1.7231334447860718, 1.779638648033142, 1.836143970489502, 1.8926491737365723]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 4.0, 11.0, 5.0, 17.0, 12.0, 17.0, 48.0, 61.0, 80.0, 147.0, 183.0, 313.0, 488.0, 753.0, 1193.0, 2057.0, 3572.0, 6372.0, 12230.0, 25102.0, 53503.0, 119300.0, 247339.0, 286077.0, 154530.0, 69256.0, 32058.0, 15282.0, 8057.0, 4273.0, 2413.0, 1387.0, 871.0, 544.0, 327.0, 217.0, 146.0, 105.0, 73.0, 35.0, 35.0, 27.0, 9.0, 9.0, 10.0, 3.0, 1.0, 2.0, 2.0, 4.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.50146484375, -0.4863433837890625, -0.471221923828125, -0.4561004638671875, -0.44097900390625, -0.4258575439453125, -0.410736083984375, -0.3956146240234375, -0.3804931640625, -0.3653717041015625, -0.350250244140625, -0.3351287841796875, -0.32000732421875, -0.3048858642578125, -0.289764404296875, -0.2746429443359375, -0.259521484375, -0.2444000244140625, -0.229278564453125, -0.2141571044921875, -0.19903564453125, -0.1839141845703125, -0.168792724609375, -0.1536712646484375, -0.1385498046875, -0.1234283447265625, -0.108306884765625, -0.0931854248046875, -0.07806396484375, -0.0629425048828125, -0.047821044921875, -0.0326995849609375, -0.017578125, -0.0024566650390625, 0.012664794921875, 0.0277862548828125, 0.04290771484375, 0.0580291748046875, 0.073150634765625, 0.0882720947265625, 0.1033935546875, 0.1185150146484375, 0.133636474609375, 0.1487579345703125, 0.16387939453125, 0.1790008544921875, 0.194122314453125, 0.2092437744140625, 0.224365234375, 0.2394866943359375, 0.254608154296875, 0.2697296142578125, 0.28485107421875, 0.2999725341796875, 0.315093994140625, 0.3302154541015625, 0.3453369140625, 0.3604583740234375, 0.375579833984375, 0.3907012939453125, 0.40582275390625, 0.4209442138671875, 0.436065673828125, 0.4511871337890625, 0.46630859375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 4.0, 14.0, 9.0, 19.0, 9.0, 17.0, 23.0, 31.0, 32.0, 32.0, 26.0, 46.0, 56.0, 51.0, 67.0, 51.0, 69.0, 69.0, 51.0, 41.0, 48.0, 44.0, 34.0, 26.0, 21.0, 23.0, 21.0, 13.0, 11.0, 9.0, 7.0, 8.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12213134765625, -0.11817455291748047, -0.11421775817871094, -0.1102609634399414, -0.10630416870117188, -0.10234737396240234, -0.09839057922363281, -0.09443378448486328, -0.09047698974609375, -0.08652019500732422, -0.08256340026855469, -0.07860660552978516, -0.07464981079101562, -0.0706930160522461, -0.06673622131347656, -0.06277942657470703, -0.0588226318359375, -0.05486583709716797, -0.05090904235839844, -0.046952247619628906, -0.042995452880859375, -0.039038658142089844, -0.03508186340332031, -0.03112506866455078, -0.02716827392578125, -0.02321147918701172, -0.019254684448242188, -0.015297889709472656, -0.011341094970703125, -0.007384300231933594, -0.0034275054931640625, 0.0005292892456054688, 0.004486083984375, 0.008442878723144531, 0.012399673461914062, 0.016356468200683594, 0.020313262939453125, 0.024270057678222656, 0.028226852416992188, 0.03218364715576172, 0.03614044189453125, 0.04009723663330078, 0.04405403137207031, 0.048010826110839844, 0.051967620849609375, 0.055924415588378906, 0.05988121032714844, 0.06383800506591797, 0.0677947998046875, 0.07175159454345703, 0.07570838928222656, 0.0796651840209961, 0.08362197875976562, 0.08757877349853516, 0.09153556823730469, 0.09549236297607422, 0.09944915771484375, 0.10340595245361328, 0.10736274719238281, 0.11131954193115234, 0.11527633666992188, 0.1192331314086914, 0.12318992614746094, 0.12714672088623047, 0.131103515625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 5.0, 7.0, 4.0, 7.0, 9.0, 7.0, 14.0, 20.0, 35.0, 55.0, 108.0, 229.0, 508.0, 1651.0, 7558.0, 70268.0, 795078.0, 156596.0, 12773.0, 2351.0, 701.0, 263.0, 117.0, 65.0, 39.0, 23.0, 21.0, 10.0, 12.0, 7.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.419921875, -1.3685455322265625, -1.317169189453125, -1.2657928466796875, -1.21441650390625, -1.1630401611328125, -1.111663818359375, -1.0602874755859375, -1.0089111328125, -0.9575347900390625, -0.906158447265625, -0.8547821044921875, -0.80340576171875, -0.7520294189453125, -0.700653076171875, -0.6492767333984375, -0.597900390625, -0.5465240478515625, -0.495147705078125, -0.4437713623046875, -0.39239501953125, -0.3410186767578125, -0.289642333984375, -0.2382659912109375, -0.1868896484375, -0.1355133056640625, -0.084136962890625, -0.0327606201171875, 0.01861572265625, 0.0699920654296875, 0.121368408203125, 0.1727447509765625, 0.22412109375, 0.2754974365234375, 0.326873779296875, 0.3782501220703125, 0.42962646484375, 0.4810028076171875, 0.532379150390625, 0.5837554931640625, 0.6351318359375, 0.6865081787109375, 0.737884521484375, 0.7892608642578125, 0.84063720703125, 0.8920135498046875, 0.943389892578125, 0.9947662353515625, 1.046142578125, 1.0975189208984375, 1.148895263671875, 1.2002716064453125, 1.25164794921875, 1.3030242919921875, 1.354400634765625, 1.4057769775390625, 1.4571533203125, 1.5085296630859375, 1.559906005859375, 1.6112823486328125, 1.66265869140625, 1.7140350341796875, 1.765411376953125, 1.8167877197265625, 1.8681640625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 6.0, 6.0, 5.0, 6.0, 6.0, 9.0, 10.0, 23.0, 13.0, 22.0, 31.0, 27.0, 34.0, 35.0, 33.0, 49.0, 36.0, 45.0, 53.0, 42.0, 48.0, 49.0, 50.0, 41.0, 44.0, 37.0, 29.0, 27.0, 40.0, 26.0, 18.0, 28.0, 17.0, 16.0, 9.0, 10.0, 10.0, 5.0, 11.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.55859375, -0.5385055541992188, -0.5184173583984375, -0.49832916259765625, -0.478240966796875, -0.45815277099609375, -0.4380645751953125, -0.41797637939453125, -0.39788818359375, -0.37779998779296875, -0.3577117919921875, -0.33762359619140625, -0.317535400390625, -0.29744720458984375, -0.2773590087890625, -0.25727081298828125, -0.2371826171875, -0.21709442138671875, -0.1970062255859375, -0.17691802978515625, -0.156829833984375, -0.13674163818359375, -0.1166534423828125, -0.09656524658203125, -0.07647705078125, -0.05638885498046875, -0.0363006591796875, -0.01621246337890625, 0.003875732421875, 0.02396392822265625, 0.0440521240234375, 0.06414031982421875, 0.084228515625, 0.10431671142578125, 0.1244049072265625, 0.14449310302734375, 0.164581298828125, 0.18466949462890625, 0.2047576904296875, 0.22484588623046875, 0.24493408203125, 0.26502227783203125, 0.2851104736328125, 0.30519866943359375, 0.325286865234375, 0.34537506103515625, 0.3654632568359375, 0.38555145263671875, 0.4056396484375, 0.42572784423828125, 0.4458160400390625, 0.46590423583984375, 0.485992431640625, 0.5060806274414062, 0.5261688232421875, 0.5462570190429688, 0.56634521484375, 0.5864334106445312, 0.6065216064453125, 0.6266098022460938, 0.646697998046875, 0.6667861938476562, 0.6868743896484375, 0.7069625854492188, 0.72705078125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 7.0, 10.0, 8.0, 17.0, 27.0, 44.0, 54.0, 101.0, 186.0, 383.0, 919.0, 2797.0, 12926.0, 287798.0, 715955.0, 21086.0, 3950.0, 1202.0, 474.0, 259.0, 134.0, 77.0, 40.0, 30.0, 17.0, 10.0, 7.0, 13.0, 4.0, 7.0, 7.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.017578125, -1.9302978515625, -1.843017578125, -1.7557373046875, -1.66845703125, -1.5811767578125, -1.493896484375, -1.4066162109375, -1.3193359375, -1.2320556640625, -1.144775390625, -1.0574951171875, -0.97021484375, -0.8829345703125, -0.795654296875, -0.7083740234375, -0.62109375, -0.5338134765625, -0.446533203125, -0.3592529296875, -0.27197265625, -0.1846923828125, -0.097412109375, -0.0101318359375, 0.0771484375, 0.1644287109375, 0.251708984375, 0.3389892578125, 0.42626953125, 0.5135498046875, 0.600830078125, 0.6881103515625, 0.775390625, 0.8626708984375, 0.949951171875, 1.0372314453125, 1.12451171875, 1.2117919921875, 1.299072265625, 1.3863525390625, 1.4736328125, 1.5609130859375, 1.648193359375, 1.7354736328125, 1.82275390625, 1.9100341796875, 1.997314453125, 2.0845947265625, 2.171875, 2.2591552734375, 2.346435546875, 2.4337158203125, 2.52099609375, 2.6082763671875, 2.695556640625, 2.7828369140625, 2.8701171875, 2.9573974609375, 3.044677734375, 3.1319580078125, 3.21923828125, 3.3065185546875, 3.393798828125, 3.4810791015625, 3.568359375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 5.0, 2.0, 4.0, 5.0, 11.0, 6.0, 4.0, 15.0, 18.0, 16.0, 18.0, 24.0, 24.0, 29.0, 41.0, 47.0, 67.0, 57.0, 58.0, 65.0, 56.0, 48.0, 59.0, 66.0, 46.0, 42.0, 43.0, 25.0, 21.0, 14.0, 9.0, 14.0, 11.0, 4.0, 5.0, 5.0, 6.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.0001304149627685547, -0.00012676697224378586, -0.00012311898171901703, -0.0001194709911942482, -0.00011582300066947937, -0.00011217501014471054, -0.00010852701961994171, -0.00010487902909517288, -0.00010123103857040405, -9.758304804563522e-05, -9.39350575208664e-05, -9.028706699609756e-05, -8.663907647132874e-05, -8.29910859465599e-05, -7.934309542179108e-05, -7.569510489702225e-05, -7.204711437225342e-05, -6.839912384748459e-05, -6.475113332271576e-05, -6.110314279794693e-05, -5.74551522731781e-05, -5.380716174840927e-05, -5.015917122364044e-05, -4.651118069887161e-05, -4.286319017410278e-05, -3.9215199649333954e-05, -3.5567209124565125e-05, -3.1919218599796295e-05, -2.8271228075027466e-05, -2.4623237550258636e-05, -2.0975247025489807e-05, -1.7327256500720978e-05, -1.3679265975952148e-05, -1.0031275451183319e-05, -6.38328492641449e-06, -2.7352944016456604e-06, 9.126961231231689e-07, 4.560686647891998e-06, 8.208677172660828e-06, 1.1856667697429657e-05, 1.5504658222198486e-05, 1.9152648746967316e-05, 2.2800639271736145e-05, 2.6448629796504974e-05, 3.0096620321273804e-05, 3.374461084604263e-05, 3.739260137081146e-05, 4.104059189558029e-05, 4.468858242034912e-05, 4.833657294511795e-05, 5.198456346988678e-05, 5.563255399465561e-05, 5.928054451942444e-05, 6.292853504419327e-05, 6.65765255689621e-05, 7.022451609373093e-05, 7.387250661849976e-05, 7.752049714326859e-05, 8.116848766803741e-05, 8.481647819280624e-05, 8.846446871757507e-05, 9.21124592423439e-05, 9.576044976711273e-05, 9.940844029188156e-05, 0.00010305643081665039]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 7.0, 6.0, 9.0, 18.0, 42.0, 53.0, 87.0, 152.0, 235.0, 358.0, 691.0, 1502.0, 3195.0, 8214.0, 26567.0, 150852.0, 696719.0, 122857.0, 23626.0, 7363.0, 3019.0, 1370.0, 711.0, 350.0, 216.0, 127.0, 61.0, 49.0, 34.0, 21.0, 13.0, 15.0, 7.0, 6.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6416015625, -1.592529296875, -1.54345703125, -1.494384765625, -1.4453125, -1.396240234375, -1.34716796875, -1.298095703125, -1.2490234375, -1.199951171875, -1.15087890625, -1.101806640625, -1.052734375, -1.003662109375, -0.95458984375, -0.905517578125, -0.8564453125, -0.807373046875, -0.75830078125, -0.709228515625, -0.66015625, -0.611083984375, -0.56201171875, -0.512939453125, -0.4638671875, -0.414794921875, -0.36572265625, -0.316650390625, -0.267578125, -0.218505859375, -0.16943359375, -0.120361328125, -0.0712890625, -0.022216796875, 0.02685546875, 0.075927734375, 0.125, 0.174072265625, 0.22314453125, 0.272216796875, 0.3212890625, 0.370361328125, 0.41943359375, 0.468505859375, 0.517578125, 0.566650390625, 0.61572265625, 0.664794921875, 0.7138671875, 0.762939453125, 0.81201171875, 0.861083984375, 0.91015625, 0.959228515625, 1.00830078125, 1.057373046875, 1.1064453125, 1.155517578125, 1.20458984375, 1.253662109375, 1.302734375, 1.351806640625, 1.40087890625, 1.449951171875, 1.4990234375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 4.0, 5.0, 12.0, 10.0, 13.0, 26.0, 23.0, 53.0, 63.0, 69.0, 103.0, 112.0, 114.0, 91.0, 81.0, 55.0, 47.0, 26.0, 37.0, 14.0, 9.0, 8.0, 3.0, 8.0, 6.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9072265625, -0.8820877075195312, -0.8569488525390625, -0.8318099975585938, -0.806671142578125, -0.7815322875976562, -0.7563934326171875, -0.7312545776367188, -0.70611572265625, -0.6809768676757812, -0.6558380126953125, -0.6306991577148438, -0.605560302734375, -0.5804214477539062, -0.5552825927734375, -0.5301437377929688, -0.5050048828125, -0.47986602783203125, -0.4547271728515625, -0.42958831787109375, -0.404449462890625, -0.37931060791015625, -0.3541717529296875, -0.32903289794921875, -0.30389404296875, -0.27875518798828125, -0.2536163330078125, -0.22847747802734375, -0.203338623046875, -0.17819976806640625, -0.1530609130859375, -0.12792205810546875, -0.102783203125, -0.07764434814453125, -0.0525054931640625, -0.02736663818359375, -0.002227783203125, 0.02291107177734375, 0.0480499267578125, 0.07318878173828125, 0.09832763671875, 0.12346649169921875, 0.1486053466796875, 0.17374420166015625, 0.198883056640625, 0.22402191162109375, 0.2491607666015625, 0.27429962158203125, 0.2994384765625, 0.32457733154296875, 0.3497161865234375, 0.37485504150390625, 0.399993896484375, 0.42513275146484375, 0.4502716064453125, 0.47541046142578125, 0.50054931640625, 0.5256881713867188, 0.5508270263671875, 0.5759658813476562, 0.601104736328125, 0.6262435913085938, 0.6513824462890625, 0.6765213012695312, 0.70166015625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 16.0, 16.0, 28.0, 53.0, 101.0, 177.0, 188.0, 178.0, 114.0, 55.0, 25.0, 20.0, 10.0, 5.0, 4.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.138835430145264, -6.857891082763672, -6.57694673538208, -6.296002388000488, -6.0150580406188965, -5.734113693237305, -5.453169345855713, -5.172224998474121, -4.891280651092529, -4.6103363037109375, -4.329391956329346, -4.048447608947754, -3.767503261566162, -3.4865589141845703, -3.2056145668029785, -2.9246702194213867, -2.643725872039795, -2.362781524658203, -2.0818371772766113, -1.8008928298950195, -1.5199484825134277, -1.239004135131836, -0.9580597877502441, -0.6771154403686523, -0.39617109298706055, -0.11522674560546875, 0.16571760177612305, 0.44666194915771484, 0.7276062965393066, 1.0085506439208984, 1.2894949913024902, 1.570439338684082, 1.8513832092285156, 2.1323275566101074, 2.413271903991699, 2.694216251373291, 2.975160598754883, 3.2561049461364746, 3.5370492935180664, 3.817993640899658, 4.09893798828125, 4.379882335662842, 4.660826683044434, 4.941771030426025, 5.222715377807617, 5.503659725189209, 5.784604072570801, 6.065548419952393, 6.346492767333984, 6.627437114715576, 6.908381462097168, 7.18932580947876, 7.470270156860352, 7.751214504241943, 8.032158851623535, 8.313102722167969, 8.594047546386719, 8.874992370605469, 9.155936241149902, 9.436880111694336, 9.717824935913086, 9.998769760131836, 10.27971363067627, 10.560657501220703, 10.841602325439453]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 9.0, 4.0, 5.0, 4.0, 6.0, 6.0, 10.0, 9.0, 14.0, 26.0, 38.0, 52.0, 123.0, 144.0, 156.0, 131.0, 105.0, 62.0, 36.0, 21.0, 7.0, 11.0, 6.0, 3.0, 6.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.944893836975098, -10.583532333374023, -10.222169876098633, -9.860808372497559, -9.499445915222168, -9.138084411621094, -8.776721954345703, -8.415360450744629, -8.053998947143555, -7.692636966705322, -7.33127498626709, -6.969913482666016, -6.608551025390625, -6.247189521789551, -5.885827541351318, -5.524465560913086, -5.163103103637695, -4.801741123199463, -4.4403791427612305, -4.079017639160156, -3.7176554203033447, -3.3562934398651123, -2.994931697845459, -2.6335697174072266, -2.272207736968994, -1.9108457565307617, -1.5494838953018188, -1.188122034072876, -0.8267600536346436, -0.46539807319641113, -0.10403633117675781, 0.2573256492614746, 0.618687629699707, 0.9800495505332947, 1.3414114713668823, 1.7027733325958252, 2.0641353130340576, 2.42549729347229, 2.7868590354919434, 3.148221015930176, 3.509582996368408, 3.8709449768066406, 4.232306957244873, 4.5936689376831055, 4.95503044128418, 5.31639289855957, 5.6777544021606445, 6.039116382598877, 6.400478363037109, 6.761840343475342, 7.123202323913574, 7.484563827514648, 7.845926284790039, 8.207287788391113, 8.568649291992188, 8.930011749267578, 9.291374206542969, 9.652735710144043, 10.014098167419434, 10.375459671020508, 10.736822128295898, 11.098183631896973, 11.459545135498047, 11.820907592773438, 12.182269096374512]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 5.0, 1.0, 7.0, 5.0, 4.0, 27.0, 30.0, 34.0, 58.0, 114.0, 179.0, 345.0, 670.0, 1447.0, 3190.0, 7744.0, 20552.0, 63818.0, 274274.0, 3227346.0, 459404.0, 90018.0, 27526.0, 9934.0, 3998.0, 1826.0, 844.0, 369.0, 193.0, 130.0, 59.0, 45.0, 21.0, 27.0, 13.0, 10.0, 3.0, 3.0, 3.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.154296875, -2.086181640625, -2.01806640625, -1.949951171875, -1.8818359375, -1.813720703125, -1.74560546875, -1.677490234375, -1.609375, -1.541259765625, -1.47314453125, -1.405029296875, -1.3369140625, -1.268798828125, -1.20068359375, -1.132568359375, -1.064453125, -0.996337890625, -0.92822265625, -0.860107421875, -0.7919921875, -0.723876953125, -0.65576171875, -0.587646484375, -0.51953125, -0.451416015625, -0.38330078125, -0.315185546875, -0.2470703125, -0.178955078125, -0.11083984375, -0.042724609375, 0.025390625, 0.093505859375, 0.16162109375, 0.229736328125, 0.2978515625, 0.365966796875, 0.43408203125, 0.502197265625, 0.5703125, 0.638427734375, 0.70654296875, 0.774658203125, 0.8427734375, 0.910888671875, 0.97900390625, 1.047119140625, 1.115234375, 1.183349609375, 1.25146484375, 1.319580078125, 1.3876953125, 1.455810546875, 1.52392578125, 1.592041015625, 1.66015625, 1.728271484375, 1.79638671875, 1.864501953125, 1.9326171875, 2.000732421875, 2.06884765625, 2.136962890625, 2.205078125]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 7.0, 2.0, 9.0, 5.0, 8.0, 10.0, 15.0, 20.0, 18.0, 21.0, 21.0, 30.0, 32.0, 38.0, 44.0, 47.0, 50.0, 61.0, 56.0, 51.0, 56.0, 41.0, 47.0, 36.0, 42.0, 32.0, 34.0, 32.0, 26.0, 23.0, 22.0, 14.0, 14.0, 9.0, 4.0, 10.0, 5.0, 2.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.119384765625, -0.11568450927734375, -0.1119842529296875, -0.10828399658203125, -0.104583740234375, -0.10088348388671875, -0.0971832275390625, -0.09348297119140625, -0.08978271484375, -0.08608245849609375, -0.0823822021484375, -0.07868194580078125, -0.074981689453125, -0.07128143310546875, -0.0675811767578125, -0.06388092041015625, -0.0601806640625, -0.05648040771484375, -0.0527801513671875, -0.04907989501953125, -0.045379638671875, -0.04167938232421875, -0.0379791259765625, -0.03427886962890625, -0.03057861328125, -0.02687835693359375, -0.0231781005859375, -0.01947784423828125, -0.015777587890625, -0.01207733154296875, -0.0083770751953125, -0.00467681884765625, -0.0009765625, 0.00272369384765625, 0.0064239501953125, 0.01012420654296875, 0.013824462890625, 0.01752471923828125, 0.0212249755859375, 0.02492523193359375, 0.02862548828125, 0.03232574462890625, 0.0360260009765625, 0.03972625732421875, 0.043426513671875, 0.04712677001953125, 0.0508270263671875, 0.05452728271484375, 0.0582275390625, 0.06192779541015625, 0.0656280517578125, 0.06932830810546875, 0.073028564453125, 0.07672882080078125, 0.0804290771484375, 0.08412933349609375, 0.08782958984375, 0.09152984619140625, 0.0952301025390625, 0.09893035888671875, 0.102630615234375, 0.10633087158203125, 0.1100311279296875, 0.11373138427734375, 0.117431640625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 6.0, 4.0, 5.0, 11.0, 10.0, 11.0, 27.0, 51.0, 69.0, 148.0, 228.0, 422.0, 748.0, 1520.0, 3412.0, 8244.0, 22807.0, 70942.0, 274230.0, 2603905.0, 960583.0, 170946.0, 48161.0, 16194.0, 6268.0, 2629.0, 1264.0, 623.0, 346.0, 184.0, 111.0, 70.0, 37.0, 27.0, 14.0, 13.0, 7.0, 5.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3837890625, -1.3280792236328125, -1.272369384765625, -1.2166595458984375, -1.16094970703125, -1.1052398681640625, -1.049530029296875, -0.9938201904296875, -0.9381103515625, -0.8824005126953125, -0.826690673828125, -0.7709808349609375, -0.71527099609375, -0.6595611572265625, -0.603851318359375, -0.5481414794921875, -0.492431640625, -0.4367218017578125, -0.381011962890625, -0.3253021240234375, -0.26959228515625, -0.2138824462890625, -0.158172607421875, -0.1024627685546875, -0.0467529296875, 0.0089569091796875, 0.064666748046875, 0.1203765869140625, 0.17608642578125, 0.2317962646484375, 0.287506103515625, 0.3432159423828125, 0.39892578125, 0.4546356201171875, 0.510345458984375, 0.5660552978515625, 0.62176513671875, 0.6774749755859375, 0.733184814453125, 0.7888946533203125, 0.8446044921875, 0.9003143310546875, 0.956024169921875, 1.0117340087890625, 1.06744384765625, 1.1231536865234375, 1.178863525390625, 1.2345733642578125, 1.290283203125, 1.3459930419921875, 1.401702880859375, 1.4574127197265625, 1.51312255859375, 1.5688323974609375, 1.624542236328125, 1.6802520751953125, 1.7359619140625, 1.7916717529296875, 1.847381591796875, 1.9030914306640625, 1.95880126953125, 2.0145111083984375, 2.070220947265625, 2.1259307861328125, 2.181640625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 3.0, 4.0, 6.0, 14.0, 15.0, 26.0, 25.0, 30.0, 41.0, 76.0, 70.0, 133.0, 184.0, 242.0, 489.0, 1256.0, 567.0, 287.0, 172.0, 125.0, 84.0, 64.0, 41.0, 34.0, 28.0, 13.0, 14.0, 10.0, 4.0, 5.0, 7.0, 3.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2166748046875, -0.2082080841064453, -0.19974136352539062, -0.19127464294433594, -0.18280792236328125, -0.17434120178222656, -0.16587448120117188, -0.1574077606201172, -0.1489410400390625, -0.1404743194580078, -0.13200759887695312, -0.12354087829589844, -0.11507415771484375, -0.10660743713378906, -0.09814071655273438, -0.08967399597167969, -0.081207275390625, -0.07274055480957031, -0.06427383422851562, -0.05580711364746094, -0.04734039306640625, -0.03887367248535156, -0.030406951904296875, -0.021940231323242188, -0.0134735107421875, -0.0050067901611328125, 0.003459930419921875, 0.011926651000976562, 0.02039337158203125, 0.028860092163085938, 0.037326812744140625, 0.04579353332519531, 0.05426025390625, 0.06272697448730469, 0.07119369506835938, 0.07966041564941406, 0.08812713623046875, 0.09659385681152344, 0.10506057739257812, 0.11352729797363281, 0.1219940185546875, 0.1304607391357422, 0.13892745971679688, 0.14739418029785156, 0.15586090087890625, 0.16432762145996094, 0.17279434204101562, 0.1812610626220703, 0.189727783203125, 0.1981945037841797, 0.20666122436523438, 0.21512794494628906, 0.22359466552734375, 0.23206138610839844, 0.24052810668945312, 0.2489948272705078, 0.2574615478515625, 0.2659282684326172, 0.2743949890136719, 0.28286170959472656, 0.29132843017578125, 0.29979515075683594, 0.3082618713378906, 0.3167285919189453, 0.3251953125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 6.0, 4.0, 6.0, 21.0, 50.0, 79.0, 160.0, 210.0, 177.0, 131.0, 87.0, 39.0, 14.0, 8.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6224756240844727, -3.515925407409668, -3.4093754291534424, -3.3028252124786377, -3.196275234222412, -3.0897250175476074, -2.9831748008728027, -2.876624822616577, -2.7700748443603516, -2.663524627685547, -2.5569746494293213, -2.4504244327545166, -2.343874454498291, -2.2373242378234863, -2.1307740211486816, -2.024224042892456, -1.9176738262176514, -1.8111237287521362, -1.704573631286621, -1.5980234146118164, -1.4914734363555908, -1.3849232196807861, -1.278373122215271, -1.1718230247497559, -1.0652729272842407, -0.9587228298187256, -0.8521727323532104, -0.7456225752830505, -0.6390724778175354, -0.5325223803520203, -0.42597222328186035, -0.3194221258163452, -0.21287226676940918, -0.10632215440273285, 0.00022795796394348145, 0.106778085231781, 0.21332818269729614, 0.3198782801628113, 0.4264284372329712, 0.5329785346984863, 0.6395286321640015, 0.7460787296295166, 0.8526288270950317, 0.9591789841651917, 1.0657291412353516, 1.1722791194915771, 1.2788293361663818, 1.385379433631897, 1.491929531097412, 1.5984796285629272, 1.7050297260284424, 1.811579942703247, 1.9181299209594727, 2.0246801376342773, 2.131230354309082, 2.2377803325653076, 2.344330310821533, 2.450880527496338, 2.5574305057525635, 2.663980722427368, 2.7705307006835938, 2.8770809173583984, 2.983631134033203, 3.0901811122894287, 3.1967313289642334]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 6.0, 6.0, 7.0, 15.0, 15.0, 26.0, 26.0, 39.0, 44.0, 50.0, 58.0, 65.0, 60.0, 68.0, 64.0, 67.0, 65.0, 57.0, 51.0, 60.0, 42.0, 25.0, 24.0, 14.0, 15.0, 10.0, 7.0, 7.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7708759307861328, -1.7244644165039062, -1.6780530214309692, -1.6316415071487427, -1.5852301120758057, -1.538818597793579, -1.492407202720642, -1.4459956884384155, -1.3995842933654785, -1.353172779083252, -1.306761384010315, -1.2603498697280884, -1.2139384746551514, -1.1675269603729248, -1.1211155652999878, -1.0747040510177612, -1.0282926559448242, -0.9818812012672424, -0.9354697465896606, -0.8890582919120789, -0.8426468372344971, -0.7962353825569153, -0.7498239278793335, -0.7034124135971069, -0.6570008993148804, -0.6105894446372986, -0.5641779899597168, -0.517766535282135, -0.4713550806045532, -0.42494362592697144, -0.37853214144706726, -0.3321206867694855, -0.2857092618942261, -0.2392978072166443, -0.1928863525390625, -0.14647488296031952, -0.10006342828273773, -0.053651973605155945, -0.007240504026412964, 0.03917095065116882, 0.08558240532875061, 0.1319938600063324, 0.17840531468391418, 0.22481678426265717, 0.27122825384140015, 0.31763970851898193, 0.3640511631965637, 0.4104626178741455, 0.4568740725517273, 0.5032855272293091, 0.5496969819068909, 0.5961084365844727, 0.6425198912620544, 0.6889313459396362, 0.7353428602218628, 0.7817542552947998, 0.8281657695770264, 0.8745772242546082, 0.9209886789321899, 0.9674001336097717, 1.0138115882873535, 1.06022310256958, 1.106634497642517, 1.1530460119247437, 1.1994574069976807]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 8.0, 12.0, 22.0, 16.0, 44.0, 72.0, 99.0, 179.0, 322.0, 644.0, 1367.0, 2904.0, 6581.0, 16364.0, 46668.0, 138617.0, 339872.0, 310901.0, 118494.0, 40144.0, 14415.0, 5758.0, 2545.0, 1186.0, 562.0, 318.0, 185.0, 93.0, 51.0, 41.0, 24.0, 13.0, 13.0, 8.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.142578125, -1.0985107421875, -1.054443359375, -1.0103759765625, -0.96630859375, -0.9222412109375, -0.878173828125, -0.8341064453125, -0.7900390625, -0.7459716796875, -0.701904296875, -0.6578369140625, -0.61376953125, -0.5697021484375, -0.525634765625, -0.4815673828125, -0.4375, -0.3934326171875, -0.349365234375, -0.3052978515625, -0.26123046875, -0.2171630859375, -0.173095703125, -0.1290283203125, -0.0849609375, -0.0408935546875, 0.003173828125, 0.0472412109375, 0.09130859375, 0.1353759765625, 0.179443359375, 0.2235107421875, 0.267578125, 0.3116455078125, 0.355712890625, 0.3997802734375, 0.44384765625, 0.4879150390625, 0.531982421875, 0.5760498046875, 0.6201171875, 0.6641845703125, 0.708251953125, 0.7523193359375, 0.79638671875, 0.8404541015625, 0.884521484375, 0.9285888671875, 0.97265625, 1.0167236328125, 1.060791015625, 1.1048583984375, 1.14892578125, 1.1929931640625, 1.237060546875, 1.2811279296875, 1.3251953125, 1.3692626953125, 1.413330078125, 1.4573974609375, 1.50146484375, 1.5455322265625, 1.589599609375, 1.6336669921875, 1.677734375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 4.0, 5.0, 4.0, 11.0, 5.0, 9.0, 17.0, 14.0, 31.0, 33.0, 41.0, 34.0, 43.0, 52.0, 64.0, 76.0, 66.0, 67.0, 68.0, 57.0, 40.0, 49.0, 45.0, 33.0, 33.0, 33.0, 22.0, 14.0, 7.0, 5.0, 10.0, 8.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1259765625, -0.12131118774414062, -0.11664581298828125, -0.11198043823242188, -0.1073150634765625, -0.10264968872070312, -0.09798431396484375, -0.09331893920898438, -0.088653564453125, -0.08398818969726562, -0.07932281494140625, -0.07465744018554688, -0.0699920654296875, -0.06532669067382812, -0.06066131591796875, -0.055995941162109375, -0.05133056640625, -0.046665191650390625, -0.04199981689453125, -0.037334442138671875, -0.0326690673828125, -0.028003692626953125, -0.02333831787109375, -0.018672943115234375, -0.014007568359375, -0.009342193603515625, -0.00467681884765625, -1.1444091796875e-05, 0.0046539306640625, 0.009319305419921875, 0.01398468017578125, 0.018650054931640625, 0.0233154296875, 0.027980804443359375, 0.03264617919921875, 0.037311553955078125, 0.0419769287109375, 0.046642303466796875, 0.05130767822265625, 0.055973052978515625, 0.060638427734375, 0.06530380249023438, 0.06996917724609375, 0.07463455200195312, 0.0792999267578125, 0.08396530151367188, 0.08863067626953125, 0.09329605102539062, 0.09796142578125, 0.10262680053710938, 0.10729217529296875, 0.11195755004882812, 0.1166229248046875, 0.12128829956054688, 0.12595367431640625, 0.13061904907226562, 0.135284423828125, 0.13994979858398438, 0.14461517333984375, 0.14928054809570312, 0.1539459228515625, 0.15861129760742188, 0.16327667236328125, 0.16794204711914062, 0.172607421875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 5.0, 5.0, 5.0, 15.0, 22.0, 67.0, 119.0, 280.0, 733.0, 2408.0, 10168.0, 65147.0, 586997.0, 337671.0, 35779.0, 6466.0, 1673.0, 584.0, 221.0, 95.0, 38.0, 24.0, 13.0, 9.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3515625, -2.284088134765625, -2.21661376953125, -2.149139404296875, -2.0816650390625, -2.014190673828125, -1.94671630859375, -1.879241943359375, -1.811767578125, -1.744293212890625, -1.67681884765625, -1.609344482421875, -1.5418701171875, -1.474395751953125, -1.40692138671875, -1.339447021484375, -1.27197265625, -1.204498291015625, -1.13702392578125, -1.069549560546875, -1.0020751953125, -0.934600830078125, -0.86712646484375, -0.799652099609375, -0.732177734375, -0.664703369140625, -0.59722900390625, -0.529754638671875, -0.4622802734375, -0.394805908203125, -0.32733154296875, -0.259857177734375, -0.1923828125, -0.124908447265625, -0.05743408203125, 0.010040283203125, 0.0775146484375, 0.144989013671875, 0.21246337890625, 0.279937744140625, 0.347412109375, 0.414886474609375, 0.48236083984375, 0.549835205078125, 0.6173095703125, 0.684783935546875, 0.75225830078125, 0.819732666015625, 0.88720703125, 0.954681396484375, 1.02215576171875, 1.089630126953125, 1.1571044921875, 1.224578857421875, 1.29205322265625, 1.359527587890625, 1.427001953125, 1.494476318359375, 1.56195068359375, 1.629425048828125, 1.6968994140625, 1.764373779296875, 1.83184814453125, 1.899322509765625, 1.966796875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 5.0, 4.0, 4.0, 2.0, 9.0, 10.0, 12.0, 15.0, 20.0, 20.0, 19.0, 28.0, 29.0, 30.0, 31.0, 45.0, 42.0, 47.0, 51.0, 53.0, 61.0, 41.0, 49.0, 45.0, 36.0, 48.0, 33.0, 28.0, 33.0, 24.0, 19.0, 24.0, 23.0, 12.0, 10.0, 6.0, 6.0, 8.0, 5.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.59375, -0.57537841796875, -0.5570068359375, -0.53863525390625, -0.520263671875, -0.50189208984375, -0.4835205078125, -0.46514892578125, -0.44677734375, -0.42840576171875, -0.4100341796875, -0.39166259765625, -0.373291015625, -0.35491943359375, -0.3365478515625, -0.31817626953125, -0.2998046875, -0.28143310546875, -0.2630615234375, -0.24468994140625, -0.226318359375, -0.20794677734375, -0.1895751953125, -0.17120361328125, -0.15283203125, -0.13446044921875, -0.1160888671875, -0.09771728515625, -0.079345703125, -0.06097412109375, -0.0426025390625, -0.02423095703125, -0.005859375, 0.01251220703125, 0.0308837890625, 0.04925537109375, 0.067626953125, 0.08599853515625, 0.1043701171875, 0.12274169921875, 0.14111328125, 0.15948486328125, 0.1778564453125, 0.19622802734375, 0.214599609375, 0.23297119140625, 0.2513427734375, 0.26971435546875, 0.2880859375, 0.30645751953125, 0.3248291015625, 0.34320068359375, 0.361572265625, 0.37994384765625, 0.3983154296875, 0.41668701171875, 0.43505859375, 0.45343017578125, 0.4718017578125, 0.49017333984375, 0.508544921875, 0.52691650390625, 0.5452880859375, 0.56365966796875, 0.58203125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 5.0, 2.0, 0.0, 1.0, 4.0, 8.0, 9.0, 9.0, 23.0, 62.0, 118.0, 534.0, 2831.0, 26616.0, 684348.0, 318634.0, 13068.0, 1709.0, 385.0, 105.0, 41.0, 18.0, 8.0, 8.0, 4.0, 4.0, 3.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7734375, -3.6427001953125, -3.511962890625, -3.3812255859375, -3.25048828125, -3.1197509765625, -2.989013671875, -2.8582763671875, -2.7275390625, -2.5968017578125, -2.466064453125, -2.3353271484375, -2.20458984375, -2.0738525390625, -1.943115234375, -1.8123779296875, -1.681640625, -1.5509033203125, -1.420166015625, -1.2894287109375, -1.15869140625, -1.0279541015625, -0.897216796875, -0.7664794921875, -0.6357421875, -0.5050048828125, -0.374267578125, -0.2435302734375, -0.11279296875, 0.0179443359375, 0.148681640625, 0.2794189453125, 0.41015625, 0.5408935546875, 0.671630859375, 0.8023681640625, 0.93310546875, 1.0638427734375, 1.194580078125, 1.3253173828125, 1.4560546875, 1.5867919921875, 1.717529296875, 1.8482666015625, 1.97900390625, 2.1097412109375, 2.240478515625, 2.3712158203125, 2.501953125, 2.6326904296875, 2.763427734375, 2.8941650390625, 3.02490234375, 3.1556396484375, 3.286376953125, 3.4171142578125, 3.5478515625, 3.6785888671875, 3.809326171875, 3.9400634765625, 4.07080078125, 4.2015380859375, 4.332275390625, 4.4630126953125, 4.59375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 5.0, 7.0, 7.0, 12.0, 22.0, 27.0, 21.0, 37.0, 45.0, 60.0, 90.0, 95.0, 85.0, 86.0, 86.0, 76.0, 51.0, 57.0, 27.0, 18.0, 24.0, 18.0, 9.0, 11.0, 7.0, 7.0, 5.0, 2.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00022125244140625, -0.00021431222558021545, -0.0002073720097541809, -0.00020043179392814636, -0.00019349157810211182, -0.00018655136227607727, -0.00017961114645004272, -0.00017267093062400818, -0.00016573071479797363, -0.0001587904989719391, -0.00015185028314590454, -0.00014491006731987, -0.00013796985149383545, -0.0001310296356678009, -0.00012408941984176636, -0.00011714920401573181, -0.00011020898818969727, -0.00010326877236366272, -9.632855653762817e-05, -8.938834071159363e-05, -8.244812488555908e-05, -7.550790905952454e-05, -6.856769323348999e-05, -6.162747740745544e-05, -5.46872615814209e-05, -4.774704575538635e-05, -4.080682992935181e-05, -3.386661410331726e-05, -2.6926398277282715e-05, -1.998618245124817e-05, -1.3045966625213623e-05, -6.105750799179077e-06, 8.344650268554688e-07, 7.774680852890015e-06, 1.471489667892456e-05, 2.1655112504959106e-05, 2.8595328330993652e-05, 3.55355441570282e-05, 4.2475759983062744e-05, 4.941597580909729e-05, 5.6356191635131836e-05, 6.329640746116638e-05, 7.023662328720093e-05, 7.717683911323547e-05, 8.411705493927002e-05, 9.105727076530457e-05, 9.799748659133911e-05, 0.00010493770241737366, 0.0001118779182434082, 0.00011881813406944275, 0.0001257583498954773, 0.00013269856572151184, 0.0001396387815475464, 0.00014657899737358093, 0.00015351921319961548, 0.00016045942902565002, 0.00016739964485168457, 0.00017433986067771912, 0.00018128007650375366, 0.0001882202923297882, 0.00019516050815582275, 0.0002021007239818573, 0.00020904093980789185, 0.0002159811556339264, 0.00022292137145996094]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 2.0, 6.0, 6.0, 14.0, 9.0, 25.0, 23.0, 37.0, 42.0, 62.0, 104.0, 150.0, 193.0, 289.0, 464.0, 743.0, 1442.0, 2544.0, 4940.0, 10801.0, 26903.0, 79660.0, 254237.0, 400389.0, 174203.0, 54572.0, 19544.0, 8225.0, 3845.0, 2030.0, 1188.0, 667.0, 388.0, 243.0, 162.0, 117.0, 79.0, 54.0, 38.0, 33.0, 21.0, 16.0, 14.0, 7.0, 9.0, 5.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0], "bins": [-1.3603515625, -1.3195343017578125, -1.278717041015625, -1.2378997802734375, -1.19708251953125, -1.1562652587890625, -1.115447998046875, -1.0746307373046875, -1.0338134765625, -0.9929962158203125, -0.952178955078125, -0.9113616943359375, -0.87054443359375, -0.8297271728515625, -0.788909912109375, -0.7480926513671875, -0.707275390625, -0.6664581298828125, -0.625640869140625, -0.5848236083984375, -0.54400634765625, -0.5031890869140625, -0.462371826171875, -0.4215545654296875, -0.3807373046875, -0.3399200439453125, -0.299102783203125, -0.2582855224609375, -0.21746826171875, -0.1766510009765625, -0.135833740234375, -0.0950164794921875, -0.05419921875, -0.0133819580078125, 0.027435302734375, 0.0682525634765625, 0.10906982421875, 0.1498870849609375, 0.190704345703125, 0.2315216064453125, 0.2723388671875, 0.3131561279296875, 0.353973388671875, 0.3947906494140625, 0.43560791015625, 0.4764251708984375, 0.517242431640625, 0.5580596923828125, 0.598876953125, 0.6396942138671875, 0.680511474609375, 0.7213287353515625, 0.76214599609375, 0.8029632568359375, 0.843780517578125, 0.8845977783203125, 0.9254150390625, 0.9662322998046875, 1.007049560546875, 1.0478668212890625, 1.08868408203125, 1.1295013427734375, 1.170318603515625, 1.2111358642578125, 1.251953125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 8.0, 7.0, 12.0, 10.0, 12.0, 22.0, 23.0, 25.0, 32.0, 49.0, 77.0, 60.0, 77.0, 84.0, 79.0, 77.0, 62.0, 72.0, 52.0, 41.0, 30.0, 26.0, 16.0, 10.0, 6.0, 7.0, 11.0, 6.0, 1.0, 3.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.96533203125, -0.936798095703125, -0.90826416015625, -0.879730224609375, -0.8511962890625, -0.822662353515625, -0.79412841796875, -0.765594482421875, -0.737060546875, -0.708526611328125, -0.67999267578125, -0.651458740234375, -0.6229248046875, -0.594390869140625, -0.56585693359375, -0.537322998046875, -0.5087890625, -0.480255126953125, -0.45172119140625, -0.423187255859375, -0.3946533203125, -0.366119384765625, -0.33758544921875, -0.309051513671875, -0.280517578125, -0.251983642578125, -0.22344970703125, -0.194915771484375, -0.1663818359375, -0.137847900390625, -0.10931396484375, -0.080780029296875, -0.05224609375, -0.023712158203125, 0.00482177734375, 0.033355712890625, 0.0618896484375, 0.090423583984375, 0.11895751953125, 0.147491455078125, 0.176025390625, 0.204559326171875, 0.23309326171875, 0.261627197265625, 0.2901611328125, 0.318695068359375, 0.34722900390625, 0.375762939453125, 0.404296875, 0.432830810546875, 0.46136474609375, 0.489898681640625, 0.5184326171875, 0.546966552734375, 0.57550048828125, 0.604034423828125, 0.632568359375, 0.661102294921875, 0.68963623046875, 0.718170166015625, 0.7467041015625, 0.775238037109375, 0.80377197265625, 0.832305908203125, 0.86083984375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 6.0, 16.0, 24.0, 65.0, 125.0, 204.0, 253.0, 169.0, 74.0, 39.0, 15.0, 6.0, 7.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.233915328979492, -13.805442810058594, -13.376970291137695, -12.948497772216797, -12.520026206970215, -12.091553688049316, -11.663081169128418, -11.23460865020752, -10.806136131286621, -10.377663612365723, -9.949191093444824, -9.520719528198242, -9.092247009277344, -8.663774490356445, -8.235301971435547, -7.806829452514648, -7.378357410430908, -6.94988489151001, -6.5214128494262695, -6.092940330505371, -5.664467811584473, -5.235995292663574, -4.807523250579834, -4.3790507316589355, -3.950578451156616, -3.522106170654297, -3.0936336517333984, -2.665161371231079, -2.2366890907287598, -1.8082165718078613, -1.379744291305542, -0.9512717723846436, -0.5227994918823242, -0.09432712197303772, 0.3341452479362488, 0.7626175880432129, 1.1910899877548218, 1.6195623874664307, 2.04803466796875, 2.4765071868896484, 2.9049794673919678, 3.333451747894287, 3.7619242668151855, 4.190396308898926, 4.618868827819824, 5.047341346740723, 5.475813865661621, 5.9042863845825195, 6.33275842666626, 6.761230945587158, 7.189702987670898, 7.618175506591797, 8.046648025512695, 8.475120544433594, 8.903593063354492, 9.33206558227539, 9.760537147521973, 10.189009666442871, 10.61748218536377, 11.045953750610352, 11.47442626953125, 11.902898788452148, 12.331371307373047, 12.759843826293945, 13.188316345214844]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 4.0, 6.0, 8.0, 6.0, 8.0, 21.0, 14.0, 45.0, 55.0, 79.0, 104.0, 137.0, 123.0, 116.0, 90.0, 65.0, 46.0, 25.0, 19.0, 16.0, 7.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.942750930786133, -13.600939750671387, -13.259129524230957, -12.917318344116211, -12.575507164001465, -12.233696937561035, -11.891885757446289, -11.55007553100586, -11.208264350891113, -10.866453170776367, -10.524642944335938, -10.182831764221191, -9.841020584106445, -9.499210357666016, -9.15739917755127, -8.815587997436523, -8.473777770996094, -8.131966590881348, -7.79015588760376, -7.448345184326172, -7.106534481048584, -6.764723777770996, -6.42291259765625, -6.081101894378662, -5.739290237426758, -5.39747953414917, -5.055668354034424, -4.713857650756836, -4.372046947479248, -4.03023624420166, -3.688425064086914, -3.346614360809326, -3.0048041343688965, -2.6629931926727295, -2.3211824893951416, -1.9793715476989746, -1.6375607252120972, -1.2957499027252197, -0.9539389610290527, -0.6121282577514648, -0.27031731605529785, 0.07149353623390198, 0.4133043885231018, 0.755115270614624, 1.0969260931015015, 1.438736915588379, 1.780547857284546, 2.122358560562134, 2.464169502258301, 2.8059804439544678, 3.1477911472320557, 3.4896020889282227, 3.8314127922058105, 4.173223495483398, 4.5150346755981445, 4.856845378875732, 5.19865608215332, 5.540466785430908, 5.882277965545654, 6.224088668823242, 6.56589937210083, 6.907710075378418, 7.249521255493164, 7.591331958770752, 7.933143138885498]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 5.0, 5.0, 6.0, 5.0, 3.0, 7.0, 6.0, 9.0, 12.0, 5.0, 15.0, 26.0, 15.0, 24.0, 30.0, 25.0, 41.0, 71.0, 87.0, 161.0, 360.0, 875.0, 2371.0, 8356.0, 35493.0, 235821.0, 3476082.0, 371697.0, 48182.0, 10387.0, 2663.0, 868.0, 288.0, 137.0, 70.0, 35.0, 21.0, 7.0, 6.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0], "bins": [-6.0703125, -5.937164306640625, -5.80401611328125, -5.670867919921875, -5.5377197265625, -5.404571533203125, -5.27142333984375, -5.138275146484375, -5.005126953125, -4.871978759765625, -4.73883056640625, -4.605682373046875, -4.4725341796875, -4.339385986328125, -4.20623779296875, -4.073089599609375, -3.93994140625, -3.806793212890625, -3.67364501953125, -3.540496826171875, -3.4073486328125, -3.274200439453125, -3.14105224609375, -3.007904052734375, -2.874755859375, -2.741607666015625, -2.60845947265625, -2.475311279296875, -2.3421630859375, -2.209014892578125, -2.07586669921875, -1.942718505859375, -1.8095703125, -1.676422119140625, -1.54327392578125, -1.410125732421875, -1.2769775390625, -1.143829345703125, -1.01068115234375, -0.877532958984375, -0.744384765625, -0.611236572265625, -0.47808837890625, -0.344940185546875, -0.2117919921875, -0.078643798828125, 0.05450439453125, 0.187652587890625, 0.32080078125, 0.453948974609375, 0.58709716796875, 0.720245361328125, 0.8533935546875, 0.986541748046875, 1.11968994140625, 1.252838134765625, 1.385986328125, 1.519134521484375, 1.65228271484375, 1.785430908203125, 1.9185791015625, 2.051727294921875, 2.18487548828125, 2.318023681640625, 2.451171875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 7.0, 4.0, 6.0, 13.0, 14.0, 27.0, 22.0, 32.0, 44.0, 51.0, 50.0, 65.0, 76.0, 83.0, 81.0, 69.0, 64.0, 57.0, 46.0, 54.0, 38.0, 28.0, 19.0, 19.0, 13.0, 11.0, 2.0, 3.0, 5.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.178955078125, -0.17319679260253906, -0.16743850708007812, -0.1616802215576172, -0.15592193603515625, -0.1501636505126953, -0.14440536499023438, -0.13864707946777344, -0.1328887939453125, -0.12713050842285156, -0.12137222290039062, -0.11561393737792969, -0.10985565185546875, -0.10409736633300781, -0.09833908081054688, -0.09258079528808594, -0.086822509765625, -0.08106422424316406, -0.07530593872070312, -0.06954765319824219, -0.06378936767578125, -0.05803108215332031, -0.052272796630859375, -0.04651451110839844, -0.0407562255859375, -0.03499794006347656, -0.029239654541015625, -0.023481369018554688, -0.01772308349609375, -0.011964797973632812, -0.006206512451171875, -0.0004482269287109375, 0.00531005859375, 0.011068344116210938, 0.016826629638671875, 0.022584915161132812, 0.02834320068359375, 0.03410148620605469, 0.039859771728515625, 0.04561805725097656, 0.0513763427734375, 0.05713462829589844, 0.06289291381835938, 0.06865119934082031, 0.07440948486328125, 0.08016777038574219, 0.08592605590820312, 0.09168434143066406, 0.097442626953125, 0.10320091247558594, 0.10895919799804688, 0.11471748352050781, 0.12047576904296875, 0.1262340545654297, 0.13199234008789062, 0.13775062561035156, 0.1435089111328125, 0.14926719665527344, 0.15502548217773438, 0.1607837677001953, 0.16654205322265625, 0.1723003387451172, 0.17805862426757812, 0.18381690979003906, 0.1895751953125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 6.0, 12.0, 7.0, 16.0, 22.0, 24.0, 70.0, 127.0, 278.0, 669.0, 2028.0, 10512.0, 105595.0, 3096962.0, 921044.0, 48478.0, 5977.0, 1455.0, 501.0, 191.0, 127.0, 58.0, 43.0, 24.0, 17.0, 10.0, 12.0, 6.0, 4.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.83984375, -5.67694091796875, -5.5140380859375, -5.35113525390625, -5.188232421875, -5.02532958984375, -4.8624267578125, -4.69952392578125, -4.53662109375, -4.37371826171875, -4.2108154296875, -4.04791259765625, -3.885009765625, -3.72210693359375, -3.5592041015625, -3.39630126953125, -3.2333984375, -3.07049560546875, -2.9075927734375, -2.74468994140625, -2.581787109375, -2.41888427734375, -2.2559814453125, -2.09307861328125, -1.93017578125, -1.76727294921875, -1.6043701171875, -1.44146728515625, -1.278564453125, -1.11566162109375, -0.9527587890625, -0.78985595703125, -0.626953125, -0.46405029296875, -0.3011474609375, -0.13824462890625, 0.024658203125, 0.18756103515625, 0.3504638671875, 0.51336669921875, 0.67626953125, 0.83917236328125, 1.0020751953125, 1.16497802734375, 1.327880859375, 1.49078369140625, 1.6536865234375, 1.81658935546875, 1.9794921875, 2.14239501953125, 2.3052978515625, 2.46820068359375, 2.631103515625, 2.79400634765625, 2.9569091796875, 3.11981201171875, 3.28271484375, 3.44561767578125, 3.6085205078125, 3.77142333984375, 3.934326171875, 4.09722900390625, 4.2601318359375, 4.42303466796875, 4.5859375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 7.0, 6.0, 8.0, 8.0, 24.0, 35.0, 42.0, 87.0, 75.0, 136.0, 214.0, 260.0, 505.0, 1111.0, 598.0, 354.0, 213.0, 126.0, 88.0, 56.0, 34.0, 34.0, 22.0, 10.0, 6.0, 3.0, 7.0, 3.0, 4.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.457763671875, -0.4428291320800781, -0.42789459228515625, -0.4129600524902344, -0.3980255126953125, -0.3830909729003906, -0.36815643310546875, -0.3532218933105469, -0.338287353515625, -0.3233528137207031, -0.30841827392578125, -0.2934837341308594, -0.2785491943359375, -0.2636146545410156, -0.24868011474609375, -0.23374557495117188, -0.21881103515625, -0.20387649536132812, -0.18894195556640625, -0.17400741577148438, -0.1590728759765625, -0.14413833618164062, -0.12920379638671875, -0.11426925659179688, -0.099334716796875, -0.08440017700195312, -0.06946563720703125, -0.054531097412109375, -0.0395965576171875, -0.024662017822265625, -0.00972747802734375, 0.005207061767578125, 0.0201416015625, 0.035076141357421875, 0.05001068115234375, 0.06494522094726562, 0.0798797607421875, 0.09481430053710938, 0.10974884033203125, 0.12468338012695312, 0.139617919921875, 0.15455245971679688, 0.16948699951171875, 0.18442153930664062, 0.1993560791015625, 0.21429061889648438, 0.22922515869140625, 0.24415969848632812, 0.25909423828125, 0.2740287780761719, 0.28896331787109375, 0.3038978576660156, 0.3188323974609375, 0.3337669372558594, 0.34870147705078125, 0.3636360168457031, 0.378570556640625, 0.3935050964355469, 0.40843963623046875, 0.4233741760253906, 0.4383087158203125, 0.4532432556152344, 0.46817779541015625, 0.4831123352050781, 0.498046875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 11.0, 14.0, 27.0, 38.0, 78.0, 126.0, 152.0, 134.0, 137.0, 108.0, 73.0, 47.0, 17.0, 17.0, 8.0, 9.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.803281307220459, -2.6787705421447754, -2.554259777069092, -2.429749011993408, -2.3052380084991455, -2.180727243423462, -2.0562164783477783, -1.9317057132720947, -1.8071949481964111, -1.6826841831207275, -1.5581732988357544, -1.4336625337600708, -1.3091517686843872, -1.184640884399414, -1.0601301193237305, -0.9356193542480469, -0.8111084699630737, -0.6865976452827454, -0.5620868802070618, -0.4375760555267334, -0.3130652606487274, -0.18855446577072144, -0.06404364109039307, 0.06046712398529053, 0.1849779486656189, 0.3094887435436249, 0.43399953842163086, 0.5585103631019592, 0.6830211877822876, 0.8075319528579712, 0.9320427775382996, 1.056553602218628, 1.1810643672943115, 1.3055751323699951, 1.4300860166549683, 1.5545967817306519, 1.6791075468063354, 1.8036184310913086, 1.9281291961669922, 2.052639961242676, 2.1771507263183594, 2.301661491394043, 2.4261722564697266, 2.55068302154541, 2.675194025039673, 2.7997047901153564, 2.92421555519104, 3.0487263202667236, 3.1732373237609863, 3.29774808883667, 3.4222588539123535, 3.546769618988037, 3.6712806224823, 3.7957913875579834, 3.920302152633667, 4.04481315612793, 4.169323444366455, 4.293834209442139, 4.418344974517822, 4.542855739593506, 4.6673665046691895, 4.791877269744873, 4.916388511657715, 5.040899276733398, 5.165410041809082]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [5.0, 2.0, 1.0, 3.0, 1.0, 5.0, 4.0, 4.0, 10.0, 12.0, 5.0, 11.0, 8.0, 14.0, 18.0, 21.0, 16.0, 22.0, 29.0, 28.0, 37.0, 44.0, 28.0, 44.0, 27.0, 40.0, 42.0, 40.0, 39.0, 47.0, 45.0, 38.0, 32.0, 30.0, 48.0, 25.0, 29.0, 25.0, 15.0, 19.0, 20.0, 11.0, 16.0, 10.0, 7.0, 8.0, 10.0, 4.0, 6.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.284921407699585, -1.2372956275939941, -1.1896699666976929, -1.142044186592102, -1.0944185256958008, -1.04679274559021, -0.9991669654846191, -0.9515412449836731, -0.903915524482727, -0.856289803981781, -0.808664083480835, -0.7610383033752441, -0.7134125828742981, -0.665786862373352, -0.6181610822677612, -0.5705353617668152, -0.5229096412658691, -0.4752839207649231, -0.42765817046165466, -0.38003242015838623, -0.3324066996574402, -0.28478097915649414, -0.2371552288532257, -0.18952947854995728, -0.14190375804901123, -0.09427802264690399, -0.04665228724479675, 0.0009734481573104858, 0.048599183559417725, 0.09622491896152496, 0.1438506543636322, 0.19147640466690063, 0.23910212516784668, 0.2867278456687927, 0.33435359597206116, 0.3819793462753296, 0.42960506677627563, 0.4772307872772217, 0.5248565673828125, 0.5724822878837585, 0.6201080083847046, 0.6677337288856506, 0.7153594493865967, 0.7629852294921875, 0.8106109499931335, 0.8582366704940796, 0.9058624505996704, 0.9534881711006165, 1.0011138916015625, 1.0487396717071533, 1.0963653326034546, 1.1439911127090454, 1.1916167736053467, 1.2392425537109375, 1.2868683338165283, 1.3344941139221191, 1.3821197748184204, 1.4297455549240112, 1.4773712158203125, 1.5249969959259033, 1.5726227760314941, 1.6202484369277954, 1.6678742170333862, 1.7154998779296875, 1.7631256580352783]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 7.0, 8.0, 17.0, 17.0, 38.0, 46.0, 72.0, 95.0, 193.0, 301.0, 553.0, 915.0, 1787.0, 3391.0, 6541.0, 13271.0, 27643.0, 58033.0, 123631.0, 230337.0, 267058.0, 162197.0, 79374.0, 37199.0, 17597.0, 8774.0, 4362.0, 2284.0, 1136.0, 651.0, 400.0, 207.0, 147.0, 100.0, 54.0, 38.0, 28.0, 20.0, 15.0, 10.0, 6.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.25390625, -1.2123870849609375, -1.170867919921875, -1.1293487548828125, -1.08782958984375, -1.0463104248046875, -1.004791259765625, -0.9632720947265625, -0.9217529296875, -0.8802337646484375, -0.838714599609375, -0.7971954345703125, -0.75567626953125, -0.7141571044921875, -0.672637939453125, -0.6311187744140625, -0.589599609375, -0.5480804443359375, -0.506561279296875, -0.4650421142578125, -0.42352294921875, -0.3820037841796875, -0.340484619140625, -0.2989654541015625, -0.2574462890625, -0.2159271240234375, -0.174407958984375, -0.1328887939453125, -0.09136962890625, -0.0498504638671875, -0.008331298828125, 0.0331878662109375, 0.07470703125, 0.1162261962890625, 0.157745361328125, 0.1992645263671875, 0.24078369140625, 0.2823028564453125, 0.323822021484375, 0.3653411865234375, 0.4068603515625, 0.4483795166015625, 0.489898681640625, 0.5314178466796875, 0.57293701171875, 0.6144561767578125, 0.655975341796875, 0.6974945068359375, 0.739013671875, 0.7805328369140625, 0.822052001953125, 0.8635711669921875, 0.90509033203125, 0.9466094970703125, 0.988128662109375, 1.0296478271484375, 1.0711669921875, 1.1126861572265625, 1.154205322265625, 1.1957244873046875, 1.23724365234375, 1.2787628173828125, 1.320281982421875, 1.3618011474609375, 1.4033203125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 8.0, 7.0, 14.0, 19.0, 29.0, 22.0, 42.0, 34.0, 48.0, 58.0, 63.0, 47.0, 70.0, 71.0, 62.0, 68.0, 65.0, 59.0, 43.0, 31.0, 32.0, 27.0, 27.0, 13.0, 9.0, 8.0, 5.0, 4.0, 4.0, 8.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.139892578125, -0.1343555450439453, -0.12881851196289062, -0.12328147888183594, -0.11774444580078125, -0.11220741271972656, -0.10667037963867188, -0.10113334655761719, -0.0955963134765625, -0.09005928039550781, -0.08452224731445312, -0.07898521423339844, -0.07344818115234375, -0.06791114807128906, -0.062374114990234375, -0.05683708190917969, -0.051300048828125, -0.04576301574707031, -0.040225982666015625, -0.03468894958496094, -0.02915191650390625, -0.023614883422851562, -0.018077850341796875, -0.012540817260742188, -0.0070037841796875, -0.0014667510986328125, 0.004070281982421875, 0.009607315063476562, 0.01514434814453125, 0.020681381225585938, 0.026218414306640625, 0.03175544738769531, 0.03729248046875, 0.04282951354980469, 0.048366546630859375, 0.05390357971191406, 0.05944061279296875, 0.06497764587402344, 0.07051467895507812, 0.07605171203613281, 0.0815887451171875, 0.08712577819824219, 0.09266281127929688, 0.09819984436035156, 0.10373687744140625, 0.10927391052246094, 0.11481094360351562, 0.12034797668457031, 0.125885009765625, 0.1314220428466797, 0.13695907592773438, 0.14249610900878906, 0.14803314208984375, 0.15357017517089844, 0.15910720825195312, 0.1646442413330078, 0.1701812744140625, 0.1757183074951172, 0.18125534057617188, 0.18679237365722656, 0.19232940673828125, 0.19786643981933594, 0.20340347290039062, 0.2089405059814453, 0.2144775390625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 2.0, 5.0, 2.0, 12.0, 9.0, 14.0, 17.0, 38.0, 31.0, 57.0, 80.0, 101.0, 173.0, 251.0, 392.0, 674.0, 1262.0, 2303.0, 4648.0, 10496.0, 25808.0, 69729.0, 190902.0, 360590.0, 235863.0, 87959.0, 32339.0, 12816.0, 5561.0, 2794.0, 1424.0, 790.0, 479.0, 302.0, 181.0, 156.0, 90.0, 54.0, 46.0, 31.0, 20.0, 14.0, 15.0, 18.0, 6.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.462890625, -1.409912109375, -1.35693359375, -1.303955078125, -1.2509765625, -1.197998046875, -1.14501953125, -1.092041015625, -1.0390625, -0.986083984375, -0.93310546875, -0.880126953125, -0.8271484375, -0.774169921875, -0.72119140625, -0.668212890625, -0.615234375, -0.562255859375, -0.50927734375, -0.456298828125, -0.4033203125, -0.350341796875, -0.29736328125, -0.244384765625, -0.19140625, -0.138427734375, -0.08544921875, -0.032470703125, 0.0205078125, 0.073486328125, 0.12646484375, 0.179443359375, 0.232421875, 0.285400390625, 0.33837890625, 0.391357421875, 0.4443359375, 0.497314453125, 0.55029296875, 0.603271484375, 0.65625, 0.709228515625, 0.76220703125, 0.815185546875, 0.8681640625, 0.921142578125, 0.97412109375, 1.027099609375, 1.080078125, 1.133056640625, 1.18603515625, 1.239013671875, 1.2919921875, 1.344970703125, 1.39794921875, 1.450927734375, 1.50390625, 1.556884765625, 1.60986328125, 1.662841796875, 1.7158203125, 1.768798828125, 1.82177734375, 1.874755859375, 1.927734375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 5.0, 8.0, 13.0, 8.0, 15.0, 17.0, 16.0, 17.0, 26.0, 35.0, 28.0, 40.0, 42.0, 40.0, 43.0, 44.0, 57.0, 43.0, 38.0, 42.0, 47.0, 48.0, 44.0, 42.0, 37.0, 49.0, 30.0, 24.0, 19.0, 21.0, 10.0, 12.0, 7.0, 12.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.9111328125, -0.8824920654296875, -0.853851318359375, -0.8252105712890625, -0.79656982421875, -0.7679290771484375, -0.739288330078125, -0.7106475830078125, -0.6820068359375, -0.6533660888671875, -0.624725341796875, -0.5960845947265625, -0.56744384765625, -0.5388031005859375, -0.510162353515625, -0.4815216064453125, -0.452880859375, -0.4242401123046875, -0.395599365234375, -0.3669586181640625, -0.33831787109375, -0.3096771240234375, -0.281036376953125, -0.2523956298828125, -0.2237548828125, -0.1951141357421875, -0.166473388671875, -0.1378326416015625, -0.10919189453125, -0.0805511474609375, -0.051910400390625, -0.0232696533203125, 0.00537109375, 0.0340118408203125, 0.062652587890625, 0.0912933349609375, 0.11993408203125, 0.1485748291015625, 0.177215576171875, 0.2058563232421875, 0.2344970703125, 0.2631378173828125, 0.291778564453125, 0.3204193115234375, 0.34906005859375, 0.3777008056640625, 0.406341552734375, 0.4349822998046875, 0.463623046875, 0.4922637939453125, 0.520904541015625, 0.5495452880859375, 0.57818603515625, 0.6068267822265625, 0.635467529296875, 0.6641082763671875, 0.6927490234375, 0.7213897705078125, 0.750030517578125, 0.7786712646484375, 0.80731201171875, 0.8359527587890625, 0.864593505859375, 0.8932342529296875, 0.921875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 6.0, 4.0, 4.0, 15.0, 22.0, 36.0, 33.0, 54.0, 77.0, 104.0, 144.0, 230.0, 340.0, 520.0, 835.0, 1447.0, 2450.0, 4175.0, 7578.0, 15057.0, 30673.0, 65633.0, 141703.0, 254368.0, 254358.0, 140672.0, 65007.0, 30202.0, 14573.0, 7748.0, 4218.0, 2332.0, 1403.0, 856.0, 520.0, 403.0, 228.0, 183.0, 100.0, 66.0, 55.0, 32.0, 21.0, 18.0, 18.0, 13.0, 9.0, 7.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0], "bins": [-1.052734375, -1.0217666625976562, -0.9907989501953125, -0.9598312377929688, -0.928863525390625, -0.8978958129882812, -0.8669281005859375, -0.8359603881835938, -0.80499267578125, -0.7740249633789062, -0.7430572509765625, -0.7120895385742188, -0.681121826171875, -0.6501541137695312, -0.6191864013671875, -0.5882186889648438, -0.5572509765625, -0.5262832641601562, -0.4953155517578125, -0.46434783935546875, -0.433380126953125, -0.40241241455078125, -0.3714447021484375, -0.34047698974609375, -0.30950927734375, -0.27854156494140625, -0.2475738525390625, -0.21660614013671875, -0.185638427734375, -0.15467071533203125, -0.1237030029296875, -0.09273529052734375, -0.061767578125, -0.03079986572265625, 0.0001678466796875, 0.03113555908203125, 0.062103271484375, 0.09307098388671875, 0.1240386962890625, 0.15500640869140625, 0.18597412109375, 0.21694183349609375, 0.2479095458984375, 0.27887725830078125, 0.309844970703125, 0.34081268310546875, 0.3717803955078125, 0.40274810791015625, 0.4337158203125, 0.46468353271484375, 0.4956512451171875, 0.5266189575195312, 0.557586669921875, 0.5885543823242188, 0.6195220947265625, 0.6504898071289062, 0.68145751953125, 0.7124252319335938, 0.7433929443359375, 0.7743606567382812, 0.805328369140625, 0.8362960815429688, 0.8672637939453125, 0.8982315063476562, 0.92919921875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 3.0, 8.0, 1.0, 7.0, 9.0, 3.0, 5.0, 12.0, 15.0, 17.0, 38.0, 37.0, 57.0, 67.0, 80.0, 84.0, 94.0, 102.0, 81.0, 83.0, 51.0, 40.0, 28.0, 23.0, 20.0, 11.0, 12.0, 7.0, 3.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.00030303001403808594, -0.00029450468719005585, -0.00028597936034202576, -0.00027745403349399567, -0.0002689287066459656, -0.0002604033797979355, -0.0002518780529499054, -0.0002433527261018753, -0.00023482739925384521, -0.00022630207240581512, -0.00021777674555778503, -0.00020925141870975494, -0.00020072609186172485, -0.00019220076501369476, -0.00018367543816566467, -0.00017515011131763458, -0.0001666247844696045, -0.0001580994576215744, -0.0001495741307735443, -0.00014104880392551422, -0.00013252347707748413, -0.00012399815022945404, -0.00011547282338142395, -0.00010694749653339386, -9.842216968536377e-05, -8.989684283733368e-05, -8.137151598930359e-05, -7.28461891412735e-05, -6.432086229324341e-05, -5.579553544521332e-05, -4.727020859718323e-05, -3.874488174915314e-05, -3.0219554901123047e-05, -2.1694228053092957e-05, -1.3168901205062866e-05, -4.643574357032776e-06, 3.8817524909973145e-06, 1.2407079339027405e-05, 2.0932406187057495e-05, 2.9457733035087585e-05, 3.7983059883117676e-05, 4.6508386731147766e-05, 5.5033713579177856e-05, 6.355904042720795e-05, 7.208436727523804e-05, 8.060969412326813e-05, 8.913502097129822e-05, 9.766034781932831e-05, 0.0001061856746673584, 0.00011471100151538849, 0.00012323632836341858, 0.00013176165521144867, 0.00014028698205947876, 0.00014881230890750885, 0.00015733763575553894, 0.00016586296260356903, 0.00017438828945159912, 0.0001829136162996292, 0.0001914389431476593, 0.0001999642699956894, 0.00020848959684371948, 0.00021701492369174957, 0.00022554025053977966, 0.00023406557738780975, 0.00024259090423583984]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 2.0, 3.0, 7.0, 4.0, 3.0, 9.0, 9.0, 5.0, 10.0, 16.0, 21.0, 34.0, 55.0, 67.0, 95.0, 151.0, 235.0, 366.0, 606.0, 1033.0, 2016.0, 4152.0, 9402.0, 23214.0, 62877.0, 193724.0, 406974.0, 224642.0, 72652.0, 25912.0, 10436.0, 4612.0, 2267.0, 1169.0, 629.0, 372.0, 248.0, 193.0, 111.0, 67.0, 51.0, 28.0, 26.0, 18.0, 14.0, 10.0, 5.0, 4.0, 2.0, 1.0, 6.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.5576171875, -1.5112152099609375, -1.464813232421875, -1.4184112548828125, -1.37200927734375, -1.3256072998046875, -1.279205322265625, -1.2328033447265625, -1.1864013671875, -1.1399993896484375, -1.093597412109375, -1.0471954345703125, -1.00079345703125, -0.9543914794921875, -0.907989501953125, -0.8615875244140625, -0.815185546875, -0.7687835693359375, -0.722381591796875, -0.6759796142578125, -0.62957763671875, -0.5831756591796875, -0.536773681640625, -0.4903717041015625, -0.4439697265625, -0.3975677490234375, -0.351165771484375, -0.3047637939453125, -0.25836181640625, -0.2119598388671875, -0.165557861328125, -0.1191558837890625, -0.07275390625, -0.0263519287109375, 0.020050048828125, 0.0664520263671875, 0.11285400390625, 0.1592559814453125, 0.205657958984375, 0.2520599365234375, 0.2984619140625, 0.3448638916015625, 0.391265869140625, 0.4376678466796875, 0.48406982421875, 0.5304718017578125, 0.576873779296875, 0.6232757568359375, 0.669677734375, 0.7160797119140625, 0.762481689453125, 0.8088836669921875, 0.85528564453125, 0.9016876220703125, 0.948089599609375, 0.9944915771484375, 1.0408935546875, 1.0872955322265625, 1.133697509765625, 1.1800994873046875, 1.22650146484375, 1.2729034423828125, 1.319305419921875, 1.3657073974609375, 1.412109375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0, 2.0, 4.0, 5.0, 3.0, 5.0, 7.0, 6.0, 13.0, 8.0, 16.0, 12.0, 18.0, 15.0, 25.0, 23.0, 37.0, 38.0, 48.0, 48.0, 41.0, 45.0, 56.0, 64.0, 58.0, 40.0, 56.0, 43.0, 40.0, 35.0, 28.0, 21.0, 30.0, 15.0, 17.0, 12.0, 14.0, 12.0, 11.0, 3.0, 7.0, 11.0, 3.0, 3.0, 2.0, 6.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.72509765625, -0.7052001953125, -0.685302734375, -0.6654052734375, -0.6455078125, -0.6256103515625, -0.605712890625, -0.5858154296875, -0.56591796875, -0.5460205078125, -0.526123046875, -0.5062255859375, -0.486328125, -0.4664306640625, -0.446533203125, -0.4266357421875, -0.40673828125, -0.3868408203125, -0.366943359375, -0.3470458984375, -0.3271484375, -0.3072509765625, -0.287353515625, -0.2674560546875, -0.24755859375, -0.2276611328125, -0.207763671875, -0.1878662109375, -0.16796875, -0.1480712890625, -0.128173828125, -0.1082763671875, -0.08837890625, -0.0684814453125, -0.048583984375, -0.0286865234375, -0.0087890625, 0.0111083984375, 0.031005859375, 0.0509033203125, 0.07080078125, 0.0906982421875, 0.110595703125, 0.1304931640625, 0.150390625, 0.1702880859375, 0.190185546875, 0.2100830078125, 0.22998046875, 0.2498779296875, 0.269775390625, 0.2896728515625, 0.3095703125, 0.3294677734375, 0.349365234375, 0.3692626953125, 0.38916015625, 0.4090576171875, 0.428955078125, 0.4488525390625, 0.46875, 0.4886474609375, 0.508544921875, 0.5284423828125, 0.54833984375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 7.0, 11.0, 34.0, 46.0, 67.0, 124.0, 154.0, 160.0, 162.0, 95.0, 60.0, 30.0, 19.0, 14.0, 7.0, 10.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.917552947998047, -18.394878387451172, -17.872203826904297, -17.349529266357422, -16.826854705810547, -16.30417823791504, -15.781503677368164, -15.258829116821289, -14.736154556274414, -14.213479995727539, -13.690805435180664, -13.168129920959473, -12.645455360412598, -12.122780799865723, -11.600105285644531, -11.077430725097656, -10.554756164550781, -10.032081604003906, -9.509407043457031, -8.98673152923584, -8.464056968688965, -7.94138240814209, -7.418707370758057, -6.896032333374023, -6.373357772827148, -5.850683212280273, -5.32800817489624, -4.805333137512207, -4.282658576965332, -3.759983777999878, -3.237308979034424, -2.7146341800689697, -2.191957473754883, -1.6692826747894287, -1.1466078758239746, -0.6239330768585205, -0.1012582778930664, 0.4214165210723877, 0.9440913200378418, 1.466766119003296, 1.98944091796875, 2.512115716934204, 3.034790515899658, 3.5574653148651123, 4.080140113830566, 4.602814674377441, 5.125489711761475, 5.648164749145508, 6.170839309692383, 6.693513870239258, 7.216188907623291, 7.738863945007324, 8.2615385055542, 8.784213066101074, 9.306888580322266, 9.82956314086914, 10.352237701416016, 10.87491226196289, 11.397586822509766, 11.920262336730957, 12.442936897277832, 12.965611457824707, 13.488286972045898, 14.010961532592773, 14.533636093139648]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 6.0, 4.0, 5.0, 9.0, 7.0, 15.0, 13.0, 13.0, 14.0, 21.0, 35.0, 31.0, 28.0, 27.0, 36.0, 43.0, 41.0, 50.0, 45.0, 44.0, 59.0, 41.0, 34.0, 53.0, 31.0, 51.0, 26.0, 30.0, 30.0, 24.0, 28.0, 19.0, 15.0, 14.0, 13.0, 12.0, 8.0, 7.0, 8.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-6.531903266906738, -6.315352439880371, -6.098801612854004, -5.882250785827637, -5.6656999588012695, -5.449149131774902, -5.232598781585693, -5.016047954559326, -4.799497127532959, -4.582946300506592, -4.366395473480225, -4.149844646453857, -3.9332940578460693, -3.716743230819702, -3.500192642211914, -3.283641815185547, -3.0670909881591797, -2.8505401611328125, -2.6339893341064453, -2.4174387454986572, -2.20088791847229, -1.9843370914459229, -1.7677863836288452, -1.5512356758117676, -1.3346848487854004, -1.1181340217590332, -0.9015833139419556, -0.6850325465202332, -0.46848177909851074, -0.25193095207214355, -0.03538024425506592, 0.18117046356201172, 0.3977212905883789, 0.6142720580101013, 0.8308228254318237, 1.0473735332489014, 1.2639243602752686, 1.4804751873016357, 1.6970258951187134, 1.913576602935791, 2.130127429962158, 2.3466782569885254, 2.5632290840148926, 2.7797796726226807, 2.996330499649048, 3.212881326675415, 3.429431915283203, 3.6459827423095703, 3.8625335693359375, 4.079084396362305, 4.295635223388672, 4.512186050415039, 4.728736877441406, 4.945287704467773, 5.161838054656982, 5.37838888168335, 5.594939708709717, 5.811490535736084, 6.028041362762451, 6.244592189788818, 6.461142539978027, 6.6776933670043945, 6.894244194030762, 7.110795021057129, 7.327345848083496]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 6.0, 3.0, 18.0, 25.0, 27.0, 47.0, 100.0, 159.0, 258.0, 506.0, 954.0, 2121.0, 4511.0, 11053.0, 30474.0, 96740.0, 429237.0, 3167746.0, 329401.0, 79087.0, 25016.0, 9355.0, 3782.0, 1684.0, 785.0, 442.0, 271.0, 156.0, 101.0, 66.0, 39.0, 30.0, 21.0, 18.0, 19.0, 10.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.509765625, -2.424468994140625, -2.33917236328125, -2.253875732421875, -2.1685791015625, -2.083282470703125, -1.99798583984375, -1.912689208984375, -1.827392578125, -1.742095947265625, -1.65679931640625, -1.571502685546875, -1.4862060546875, -1.400909423828125, -1.31561279296875, -1.230316162109375, -1.14501953125, -1.059722900390625, -0.97442626953125, -0.889129638671875, -0.8038330078125, -0.718536376953125, -0.63323974609375, -0.547943115234375, -0.462646484375, -0.377349853515625, -0.29205322265625, -0.206756591796875, -0.1214599609375, -0.036163330078125, 0.04913330078125, 0.134429931640625, 0.2197265625, 0.305023193359375, 0.39031982421875, 0.475616455078125, 0.5609130859375, 0.646209716796875, 0.73150634765625, 0.816802978515625, 0.902099609375, 0.987396240234375, 1.07269287109375, 1.157989501953125, 1.2432861328125, 1.328582763671875, 1.41387939453125, 1.499176025390625, 1.58447265625, 1.669769287109375, 1.75506591796875, 1.840362548828125, 1.9256591796875, 2.010955810546875, 2.09625244140625, 2.181549072265625, 2.266845703125, 2.352142333984375, 2.43743896484375, 2.522735595703125, 2.6080322265625, 2.693328857421875, 2.77862548828125, 2.863922119140625, 2.94921875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 5.0, 4.0, 10.0, 6.0, 18.0, 22.0, 21.0, 27.0, 32.0, 39.0, 54.0, 47.0, 68.0, 73.0, 75.0, 75.0, 74.0, 66.0, 50.0, 54.0, 47.0, 34.0, 26.0, 30.0, 16.0, 11.0, 10.0, 3.0, 8.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2022705078125, -0.1944751739501953, -0.18667984008789062, -0.17888450622558594, -0.17108917236328125, -0.16329383850097656, -0.15549850463867188, -0.1477031707763672, -0.1399078369140625, -0.1321125030517578, -0.12431716918945312, -0.11652183532714844, -0.10872650146484375, -0.10093116760253906, -0.09313583374023438, -0.08534049987792969, -0.077545166015625, -0.06974983215332031, -0.061954498291015625, -0.05415916442871094, -0.04636383056640625, -0.03856849670410156, -0.030773162841796875, -0.022977828979492188, -0.0151824951171875, -0.0073871612548828125, 0.000408172607421875, 0.008203506469726562, 0.01599884033203125, 0.023794174194335938, 0.031589508056640625, 0.03938484191894531, 0.04718017578125, 0.05497550964355469, 0.06277084350585938, 0.07056617736816406, 0.07836151123046875, 0.08615684509277344, 0.09395217895507812, 0.10174751281738281, 0.1095428466796875, 0.11733818054199219, 0.12513351440429688, 0.13292884826660156, 0.14072418212890625, 0.14851951599121094, 0.15631484985351562, 0.1641101837158203, 0.171905517578125, 0.1797008514404297, 0.18749618530273438, 0.19529151916503906, 0.20308685302734375, 0.21088218688964844, 0.21867752075195312, 0.2264728546142578, 0.2342681884765625, 0.2420635223388672, 0.24985885620117188, 0.25765419006347656, 0.26544952392578125, 0.27324485778808594, 0.2810401916503906, 0.2888355255126953, 0.296630859375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 7.0, 3.0, 8.0, 6.0, 13.0, 32.0, 26.0, 76.0, 112.0, 183.0, 360.0, 674.0, 1489.0, 3830.0, 11677.0, 42086.0, 194183.0, 2325618.0, 1397393.0, 163727.0, 36315.0, 10173.0, 3522.0, 1380.0, 608.0, 342.0, 178.0, 105.0, 58.0, 47.0, 26.0, 8.0, 7.0, 5.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.234375, -3.1298828125, -3.025390625, -2.9208984375, -2.81640625, -2.7119140625, -2.607421875, -2.5029296875, -2.3984375, -2.2939453125, -2.189453125, -2.0849609375, -1.98046875, -1.8759765625, -1.771484375, -1.6669921875, -1.5625, -1.4580078125, -1.353515625, -1.2490234375, -1.14453125, -1.0400390625, -0.935546875, -0.8310546875, -0.7265625, -0.6220703125, -0.517578125, -0.4130859375, -0.30859375, -0.2041015625, -0.099609375, 0.0048828125, 0.109375, 0.2138671875, 0.318359375, 0.4228515625, 0.52734375, 0.6318359375, 0.736328125, 0.8408203125, 0.9453125, 1.0498046875, 1.154296875, 1.2587890625, 1.36328125, 1.4677734375, 1.572265625, 1.6767578125, 1.78125, 1.8857421875, 1.990234375, 2.0947265625, 2.19921875, 2.3037109375, 2.408203125, 2.5126953125, 2.6171875, 2.7216796875, 2.826171875, 2.9306640625, 3.03515625, 3.1396484375, 3.244140625, 3.3486328125, 3.453125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 3.0, 16.0, 17.0, 18.0, 20.0, 29.0, 32.0, 59.0, 83.0, 122.0, 160.0, 274.0, 527.0, 1325.0, 525.0, 291.0, 180.0, 110.0, 88.0, 44.0, 52.0, 23.0, 21.0, 19.0, 16.0, 5.0, 4.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.76904296875, -0.7485885620117188, -0.7281341552734375, -0.7076797485351562, -0.687225341796875, -0.6667709350585938, -0.6463165283203125, -0.6258621215820312, -0.60540771484375, -0.5849533081054688, -0.5644989013671875, -0.5440444946289062, -0.523590087890625, -0.5031356811523438, -0.4826812744140625, -0.46222686767578125, -0.4417724609375, -0.42131805419921875, -0.4008636474609375, -0.38040924072265625, -0.359954833984375, -0.33950042724609375, -0.3190460205078125, -0.29859161376953125, -0.27813720703125, -0.25768280029296875, -0.2372283935546875, -0.21677398681640625, -0.196319580078125, -0.17586517333984375, -0.1554107666015625, -0.13495635986328125, -0.114501953125, -0.09404754638671875, -0.0735931396484375, -0.05313873291015625, -0.032684326171875, -0.01222991943359375, 0.0082244873046875, 0.02867889404296875, 0.04913330078125, 0.06958770751953125, 0.0900421142578125, 0.11049652099609375, 0.130950927734375, 0.15140533447265625, 0.1718597412109375, 0.19231414794921875, 0.2127685546875, 0.23322296142578125, 0.2536773681640625, 0.27413177490234375, 0.294586181640625, 0.31504058837890625, 0.3354949951171875, 0.35594940185546875, 0.37640380859375, 0.39685821533203125, 0.4173126220703125, 0.43776702880859375, 0.458221435546875, 0.47867584228515625, 0.4991302490234375, 0.5195846557617188, 0.5400390625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 8.0, 9.0, 17.0, 26.0, 33.0, 58.0, 71.0, 87.0, 134.0, 116.0, 123.0, 90.0, 72.0, 58.0, 36.0, 23.0, 9.0, 8.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.39105749130249, -4.252893447875977, -4.114729404449463, -3.9765655994415283, -3.8384017944335938, -3.70023775100708, -3.5620737075805664, -3.4239096641540527, -3.285745859146118, -3.1475818157196045, -3.00941801071167, -2.8712539672851562, -2.7330899238586426, -2.594926118850708, -2.4567620754241943, -2.3185982704162598, -2.180434226989746, -2.0422701835632324, -1.9041063785552979, -1.7659423351287842, -1.62777841091156, -1.489614486694336, -1.3514504432678223, -1.2132865190505981, -1.075122594833374, -0.9369586706161499, -0.798794686794281, -0.6606307029724121, -0.522466778755188, -0.38430285453796387, -0.24613887071609497, -0.10797488689422607, 0.03018951416015625, 0.16835346817970276, 0.30651742219924927, 0.4446813762187958, 0.5828453302383423, 0.7210092544555664, 0.8591732382774353, 0.9973372220993042, 1.1355011463165283, 1.2736650705337524, 1.4118289947509766, 1.5499930381774902, 1.6881569623947144, 1.8263208866119385, 1.9644849300384521, 2.1026487350463867, 2.2408127784729004, 2.378976821899414, 2.5171406269073486, 2.6553046703338623, 2.793468475341797, 2.9316325187683105, 3.069796562194824, 3.207960605621338, 3.3461244106292725, 3.484288454055786, 3.6224522590637207, 3.7606163024902344, 3.898780345916748, 4.036944389343262, 4.175107955932617, 4.313271999359131, 4.4514360427856445]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 2.0, 2.0, 7.0, 2.0, 6.0, 8.0, 7.0, 13.0, 14.0, 19.0, 17.0, 19.0, 25.0, 29.0, 24.0, 36.0, 27.0, 30.0, 36.0, 45.0, 35.0, 46.0, 25.0, 45.0, 22.0, 38.0, 43.0, 45.0, 33.0, 33.0, 28.0, 24.0, 31.0, 21.0, 31.0, 16.0, 23.0, 16.0, 14.0, 14.0, 11.0, 12.0, 5.0, 12.0, 5.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-2.2567543983459473, -2.1906564235687256, -2.124558448791504, -2.0584607124328613, -1.9923627376556396, -1.926264762878418, -1.8601667881011963, -1.7940688133239746, -1.7279709577560425, -1.6618729829788208, -1.5957751274108887, -1.529677152633667, -1.4635791778564453, -1.3974813222885132, -1.3313833475112915, -1.2652854919433594, -1.1991875171661377, -1.133089542388916, -1.0669916868209839, -1.0008937120437622, -0.9347957968711853, -0.8686978816986084, -0.8025999069213867, -0.7365019917488098, -0.6704040765762329, -0.604306161403656, -0.5382082462310791, -0.4721102714538574, -0.4060123562812805, -0.3399144411087036, -0.2738164961338043, -0.20771855115890503, -0.14162087440490723, -0.07552294433116913, -0.00942501425743103, 0.05667291581630707, 0.12277084589004517, 0.18886876106262207, 0.25496670603752136, 0.32106465101242065, 0.38716256618499756, 0.45326048135757446, 0.5193583965301514, 0.585456371307373, 0.65155428647995, 0.7176522016525269, 0.7837501764297485, 0.8498480916023254, 0.9159460067749023, 0.9820439219474792, 1.0481418371200562, 1.1142398118972778, 1.18033766746521, 1.2464356422424316, 1.3125336170196533, 1.378631591796875, 1.4447294473648071, 1.5108274221420288, 1.576925277709961, 1.6430232524871826, 1.7091212272644043, 1.7752190828323364, 1.841317057609558, 1.9074149131774902, 1.973512887954712]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 9.0, 10.0, 12.0, 26.0, 40.0, 51.0, 76.0, 128.0, 233.0, 396.0, 813.0, 1746.0, 3866.0, 9168.0, 22739.0, 55774.0, 131062.0, 258224.0, 285212.0, 160384.0, 70023.0, 28282.0, 11417.0, 4620.0, 2095.0, 1001.0, 493.0, 253.0, 145.0, 103.0, 48.0, 37.0, 28.0, 13.0, 9.0, 1.0, 8.0, 8.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6826171875, -1.6318206787109375, -1.581024169921875, -1.5302276611328125, -1.47943115234375, -1.4286346435546875, -1.377838134765625, -1.3270416259765625, -1.2762451171875, -1.2254486083984375, -1.174652099609375, -1.1238555908203125, -1.07305908203125, -1.0222625732421875, -0.971466064453125, -0.9206695556640625, -0.869873046875, -0.8190765380859375, -0.768280029296875, -0.7174835205078125, -0.66668701171875, -0.6158905029296875, -0.565093994140625, -0.5142974853515625, -0.4635009765625, -0.4127044677734375, -0.361907958984375, -0.3111114501953125, -0.26031494140625, -0.2095184326171875, -0.158721923828125, -0.1079254150390625, -0.05712890625, -0.0063323974609375, 0.044464111328125, 0.0952606201171875, 0.14605712890625, 0.1968536376953125, 0.247650146484375, 0.2984466552734375, 0.3492431640625, 0.4000396728515625, 0.450836181640625, 0.5016326904296875, 0.55242919921875, 0.6032257080078125, 0.654022216796875, 0.7048187255859375, 0.755615234375, 0.8064117431640625, 0.857208251953125, 0.9080047607421875, 0.95880126953125, 1.0095977783203125, 1.060394287109375, 1.1111907958984375, 1.1619873046875, 1.2127838134765625, 1.263580322265625, 1.3143768310546875, 1.36517333984375, 1.4159698486328125, 1.466766357421875, 1.5175628662109375, 1.568359375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 9.0, 13.0, 9.0, 14.0, 31.0, 18.0, 48.0, 52.0, 50.0, 73.0, 72.0, 60.0, 74.0, 75.0, 75.0, 75.0, 51.0, 50.0, 34.0, 32.0, 32.0, 20.0, 11.0, 10.0, 7.0, 1.0, 1.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.274658203125, -0.265350341796875, -0.25604248046875, -0.246734619140625, -0.2374267578125, -0.228118896484375, -0.21881103515625, -0.209503173828125, -0.2001953125, -0.190887451171875, -0.18157958984375, -0.172271728515625, -0.1629638671875, -0.153656005859375, -0.14434814453125, -0.135040283203125, -0.125732421875, -0.116424560546875, -0.10711669921875, -0.097808837890625, -0.0885009765625, -0.079193115234375, -0.06988525390625, -0.060577392578125, -0.05126953125, -0.041961669921875, -0.03265380859375, -0.023345947265625, -0.0140380859375, -0.004730224609375, 0.00457763671875, 0.013885498046875, 0.023193359375, 0.032501220703125, 0.04180908203125, 0.051116943359375, 0.0604248046875, 0.069732666015625, 0.07904052734375, 0.088348388671875, 0.09765625, 0.106964111328125, 0.11627197265625, 0.125579833984375, 0.1348876953125, 0.144195556640625, 0.15350341796875, 0.162811279296875, 0.172119140625, 0.181427001953125, 0.19073486328125, 0.200042724609375, 0.2093505859375, 0.218658447265625, 0.22796630859375, 0.237274169921875, 0.24658203125, 0.255889892578125, 0.26519775390625, 0.274505615234375, 0.2838134765625, 0.293121337890625, 0.30242919921875, 0.311737060546875, 0.321044921875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 10.0, 7.0, 13.0, 16.0, 28.0, 23.0, 39.0, 53.0, 71.0, 142.0, 198.0, 292.0, 439.0, 740.0, 1256.0, 2448.0, 5258.0, 12116.0, 30489.0, 78471.0, 196893.0, 355433.0, 217205.0, 87722.0, 33870.0, 13332.0, 5692.0, 2698.0, 1377.0, 828.0, 451.0, 301.0, 219.0, 128.0, 85.0, 64.0, 41.0, 39.0, 25.0, 12.0, 8.0, 10.0, 8.0, 7.0, 0.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.009765625, -1.9498748779296875, -1.889984130859375, -1.8300933837890625, -1.77020263671875, -1.7103118896484375, -1.650421142578125, -1.5905303955078125, -1.5306396484375, -1.4707489013671875, -1.410858154296875, -1.3509674072265625, -1.29107666015625, -1.2311859130859375, -1.171295166015625, -1.1114044189453125, -1.051513671875, -0.9916229248046875, -0.931732177734375, -0.8718414306640625, -0.81195068359375, -0.7520599365234375, -0.692169189453125, -0.6322784423828125, -0.5723876953125, -0.5124969482421875, -0.452606201171875, -0.3927154541015625, -0.33282470703125, -0.2729339599609375, -0.213043212890625, -0.1531524658203125, -0.09326171875, -0.0333709716796875, 0.026519775390625, 0.0864105224609375, 0.14630126953125, 0.2061920166015625, 0.266082763671875, 0.3259735107421875, 0.3858642578125, 0.4457550048828125, 0.505645751953125, 0.5655364990234375, 0.62542724609375, 0.6853179931640625, 0.745208740234375, 0.8050994873046875, 0.864990234375, 0.9248809814453125, 0.984771728515625, 1.0446624755859375, 1.10455322265625, 1.1644439697265625, 1.224334716796875, 1.2842254638671875, 1.3441162109375, 1.4040069580078125, 1.463897705078125, 1.5237884521484375, 1.58367919921875, 1.6435699462890625, 1.703460693359375, 1.7633514404296875, 1.8232421875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 8.0, 12.0, 9.0, 15.0, 18.0, 22.0, 27.0, 24.0, 30.0, 30.0, 37.0, 46.0, 36.0, 40.0, 41.0, 54.0, 51.0, 52.0, 54.0, 61.0, 42.0, 35.0, 38.0, 39.0, 34.0, 32.0, 22.0, 24.0, 14.0, 18.0, 6.0, 7.0, 7.0, 1.0, 4.0, 7.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4599609375, -1.4151763916015625, -1.370391845703125, -1.3256072998046875, -1.28082275390625, -1.2360382080078125, -1.191253662109375, -1.1464691162109375, -1.1016845703125, -1.0569000244140625, -1.012115478515625, -0.9673309326171875, -0.92254638671875, -0.8777618408203125, -0.832977294921875, -0.7881927490234375, -0.743408203125, -0.6986236572265625, -0.653839111328125, -0.6090545654296875, -0.56427001953125, -0.5194854736328125, -0.474700927734375, -0.4299163818359375, -0.3851318359375, -0.3403472900390625, -0.295562744140625, -0.2507781982421875, -0.20599365234375, -0.1612091064453125, -0.116424560546875, -0.0716400146484375, -0.02685546875, 0.0179290771484375, 0.062713623046875, 0.1074981689453125, 0.15228271484375, 0.1970672607421875, 0.241851806640625, 0.2866363525390625, 0.3314208984375, 0.3762054443359375, 0.420989990234375, 0.4657745361328125, 0.51055908203125, 0.5553436279296875, 0.600128173828125, 0.6449127197265625, 0.689697265625, 0.7344818115234375, 0.779266357421875, 0.8240509033203125, 0.86883544921875, 0.9136199951171875, 0.958404541015625, 1.0031890869140625, 1.0479736328125, 1.0927581787109375, 1.137542724609375, 1.1823272705078125, 1.22711181640625, 1.2718963623046875, 1.316680908203125, 1.3614654541015625, 1.40625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 6.0, 4.0, 11.0, 12.0, 19.0, 19.0, 23.0, 27.0, 49.0, 81.0, 163.0, 314.0, 612.0, 1444.0, 4132.0, 13269.0, 50032.0, 214454.0, 497665.0, 200223.0, 46898.0, 12450.0, 3980.0, 1373.0, 569.0, 304.0, 173.0, 76.0, 65.0, 34.0, 18.0, 7.0, 13.0, 4.0, 7.0, 5.0, 5.0, 5.0, 5.0, 0.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.3798828125, -1.33306884765625, -1.2862548828125, -1.23944091796875, -1.192626953125, -1.14581298828125, -1.0989990234375, -1.05218505859375, -1.00537109375, -0.95855712890625, -0.9117431640625, -0.86492919921875, -0.818115234375, -0.77130126953125, -0.7244873046875, -0.67767333984375, -0.630859375, -0.58404541015625, -0.5372314453125, -0.49041748046875, -0.443603515625, -0.39678955078125, -0.3499755859375, -0.30316162109375, -0.25634765625, -0.20953369140625, -0.1627197265625, -0.11590576171875, -0.069091796875, -0.02227783203125, 0.0245361328125, 0.07135009765625, 0.1181640625, 0.16497802734375, 0.2117919921875, 0.25860595703125, 0.305419921875, 0.35223388671875, 0.3990478515625, 0.44586181640625, 0.49267578125, 0.53948974609375, 0.5863037109375, 0.63311767578125, 0.679931640625, 0.72674560546875, 0.7735595703125, 0.82037353515625, 0.8671875, 0.91400146484375, 0.9608154296875, 1.00762939453125, 1.054443359375, 1.10125732421875, 1.1480712890625, 1.19488525390625, 1.24169921875, 1.28851318359375, 1.3353271484375, 1.38214111328125, 1.428955078125, 1.47576904296875, 1.5225830078125, 1.56939697265625, 1.6162109375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 3.0, 1.0, 4.0, 6.0, 10.0, 15.0, 10.0, 18.0, 13.0, 25.0, 34.0, 37.0, 42.0, 58.0, 57.0, 79.0, 64.0, 67.0, 83.0, 69.0, 54.0, 56.0, 36.0, 40.0, 35.0, 19.0, 17.0, 12.0, 12.0, 10.0, 4.0, 5.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019812583923339844, -0.00019153952598571777, -0.0001849532127380371, -0.00017836689949035645, -0.00017178058624267578, -0.00016519427299499512, -0.00015860795974731445, -0.0001520216464996338, -0.00014543533325195312, -0.00013884902000427246, -0.0001322627067565918, -0.00012567639350891113, -0.00011909008026123047, -0.0001125037670135498, -0.00010591745376586914, -9.933114051818848e-05, -9.274482727050781e-05, -8.615851402282715e-05, -7.957220077514648e-05, -7.298588752746582e-05, -6.639957427978516e-05, -5.981326103210449e-05, -5.322694778442383e-05, -4.6640634536743164e-05, -4.00543212890625e-05, -3.3468008041381836e-05, -2.6881694793701172e-05, -2.0295381546020508e-05, -1.3709068298339844e-05, -7.12275505065918e-06, -5.364418029785156e-07, 6.0498714447021484e-06, 1.2636184692382812e-05, 1.9222497940063477e-05, 2.580881118774414e-05, 3.2395124435424805e-05, 3.898143768310547e-05, 4.556775093078613e-05, 5.21540641784668e-05, 5.874037742614746e-05, 6.532669067382812e-05, 7.191300392150879e-05, 7.849931716918945e-05, 8.508563041687012e-05, 9.167194366455078e-05, 9.825825691223145e-05, 0.00010484457015991211, 0.00011143088340759277, 0.00011801719665527344, 0.0001246035099029541, 0.00013118982315063477, 0.00013777613639831543, 0.0001443624496459961, 0.00015094876289367676, 0.00015753507614135742, 0.00016412138938903809, 0.00017070770263671875, 0.00017729401588439941, 0.00018388032913208008, 0.00019046664237976074, 0.0001970529556274414, 0.00020363926887512207, 0.00021022558212280273, 0.0002168118953704834, 0.00022339820861816406]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 8.0, 4.0, 6.0, 10.0, 22.0, 30.0, 35.0, 84.0, 157.0, 284.0, 539.0, 1546.0, 4476.0, 17330.0, 94001.0, 608911.0, 269043.0, 38915.0, 8718.0, 2637.0, 914.0, 435.0, 184.0, 111.0, 51.0, 38.0, 17.0, 19.0, 12.0, 7.0, 5.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.046875, -1.970367431640625, -1.89385986328125, -1.817352294921875, -1.7408447265625, -1.664337158203125, -1.58782958984375, -1.511322021484375, -1.434814453125, -1.358306884765625, -1.28179931640625, -1.205291748046875, -1.1287841796875, -1.052276611328125, -0.97576904296875, -0.899261474609375, -0.82275390625, -0.746246337890625, -0.66973876953125, -0.593231201171875, -0.5167236328125, -0.440216064453125, -0.36370849609375, -0.287200927734375, -0.210693359375, -0.134185791015625, -0.05767822265625, 0.018829345703125, 0.0953369140625, 0.171844482421875, 0.24835205078125, 0.324859619140625, 0.4013671875, 0.477874755859375, 0.55438232421875, 0.630889892578125, 0.7073974609375, 0.783905029296875, 0.86041259765625, 0.936920166015625, 1.013427734375, 1.089935302734375, 1.16644287109375, 1.242950439453125, 1.3194580078125, 1.395965576171875, 1.47247314453125, 1.548980712890625, 1.62548828125, 1.701995849609375, 1.77850341796875, 1.855010986328125, 1.9315185546875, 2.008026123046875, 2.08453369140625, 2.161041259765625, 2.237548828125, 2.314056396484375, 2.39056396484375, 2.467071533203125, 2.5435791015625, 2.620086669921875, 2.69659423828125, 2.773101806640625, 2.849609375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 8.0, 5.0, 2.0, 9.0, 9.0, 4.0, 12.0, 11.0, 16.0, 16.0, 23.0, 28.0, 29.0, 47.0, 50.0, 43.0, 65.0, 62.0, 70.0, 76.0, 59.0, 71.0, 42.0, 43.0, 34.0, 35.0, 27.0, 18.0, 11.0, 15.0, 12.0, 11.0, 4.0, 10.0, 10.0, 4.0, 2.0, 2.0, 7.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.83544921875, -0.8112869262695312, -0.7871246337890625, -0.7629623413085938, -0.738800048828125, -0.7146377563476562, -0.6904754638671875, -0.6663131713867188, -0.64215087890625, -0.6179885864257812, -0.5938262939453125, -0.5696640014648438, -0.545501708984375, -0.5213394165039062, -0.4971771240234375, -0.47301483154296875, -0.4488525390625, -0.42469024658203125, -0.4005279541015625, -0.37636566162109375, -0.352203369140625, -0.32804107666015625, -0.3038787841796875, -0.27971649169921875, -0.25555419921875, -0.23139190673828125, -0.2072296142578125, -0.18306732177734375, -0.158905029296875, -0.13474273681640625, -0.1105804443359375, -0.08641815185546875, -0.062255859375, -0.03809356689453125, -0.0139312744140625, 0.01023101806640625, 0.034393310546875, 0.05855560302734375, 0.0827178955078125, 0.10688018798828125, 0.13104248046875, 0.15520477294921875, 0.1793670654296875, 0.20352935791015625, 0.227691650390625, 0.25185394287109375, 0.2760162353515625, 0.30017852783203125, 0.3243408203125, 0.34850311279296875, 0.3726654052734375, 0.39682769775390625, 0.420989990234375, 0.44515228271484375, 0.4693145751953125, 0.49347686767578125, 0.51763916015625, 0.5418014526367188, 0.5659637451171875, 0.5901260375976562, 0.614288330078125, 0.6384506225585938, 0.6626129150390625, 0.6867752075195312, 0.7109375]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 10.0, 15.0, 14.0, 26.0, 41.0, 42.0, 78.0, 113.0, 132.0, 120.0, 112.0, 114.0, 62.0, 35.0, 30.0, 19.0, 8.0, 8.0, 8.0, 4.0, 6.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-22.54735565185547, -22.070571899414062, -21.593786239624023, -21.117002487182617, -20.64021873474121, -20.163433074951172, -19.686649322509766, -19.20986557006836, -18.733081817626953, -18.256298065185547, -17.779512405395508, -17.3027286529541, -16.825944900512695, -16.349159240722656, -15.87237548828125, -15.395591735839844, -14.918806076049805, -14.442021369934082, -13.965237617492676, -13.488452911376953, -13.011669158935547, -12.534884452819824, -12.058099746704102, -11.581315994262695, -11.104531288146973, -10.62774658203125, -10.150962829589844, -9.674178123474121, -9.197393417358398, -8.720609664916992, -8.24382495880127, -7.767040729522705, -7.290256023406982, -6.813471794128418, -6.336687088012695, -5.859902858734131, -5.383118629455566, -4.906334400177002, -4.4295501708984375, -3.952765464782715, -3.4759812355041504, -2.999197006225586, -2.5224125385284424, -2.045628070831299, -1.5688438415527344, -1.09205961227417, -0.6152751445770264, -0.1384906768798828, 0.33829355239868164, 0.8150779008865356, 1.2918622493743896, 1.7686465978622437, 2.2454309463500977, 2.722215175628662, 3.1989996433258057, 3.675784111022949, 4.152568340301514, 4.629352569580078, 5.106137275695801, 5.582921504974365, 6.05970573425293, 6.536489963531494, 7.013274192810059, 7.490058898925781, 7.966843128204346]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 7.0, 11.0, 6.0, 13.0, 14.0, 17.0, 34.0, 32.0, 16.0, 41.0, 32.0, 43.0, 48.0, 43.0, 58.0, 47.0, 46.0, 47.0, 55.0, 47.0, 50.0, 41.0, 40.0, 36.0, 31.0, 30.0, 22.0, 21.0, 20.0, 14.0, 9.0, 6.0, 5.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.256166458129883, -9.924861907958984, -9.593558311462402, -9.262253761291504, -8.930950164794922, -8.599645614624023, -8.268341064453125, -7.937036991119385, -7.6057329177856445, -7.274428844451904, -6.943124771118164, -6.611820220947266, -6.280516147613525, -5.949212074279785, -5.617907524108887, -5.2866034507751465, -4.955299377441406, -4.623995304107666, -4.292691230773926, -3.9613866806030273, -3.630082607269287, -3.298778533935547, -2.9674742221832275, -2.636169910430908, -2.304865837097168, -1.9735616445541382, -1.6422574520111084, -1.3109532594680786, -0.9796490669250488, -0.648344874382019, -0.31704068183898926, 0.014263629913330078, 0.3455677032470703, 0.6768718957901001, 1.0081760883331299, 1.3394802808761597, 1.6707844734191895, 2.0020885467529297, 2.333392858505249, 2.6646971702575684, 2.9960012435913086, 3.327305316925049, 3.658609628677368, 3.9899139404296875, 4.321218013763428, 4.652522087097168, 4.983826637268066, 5.315130710601807, 5.646434783935547, 5.977738857269287, 6.309042930603027, 6.640347480773926, 6.971651554107666, 7.302955627441406, 7.634260177612305, 7.965564250946045, 8.296868324279785, 8.628172874450684, 8.959476470947266, 9.290781021118164, 9.622085571289062, 9.953389167785645, 10.284693717956543, 10.615997314453125, 10.947301864624023]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 7.0, 9.0, 11.0, 19.0, 41.0, 46.0, 105.0, 176.0, 327.0, 609.0, 1110.0, 2200.0, 4634.0, 10249.0, 25061.0, 72537.0, 306028.0, 3396387.0, 266353.0, 66913.0, 23561.0, 9402.0, 4262.0, 1994.0, 1089.0, 469.0, 284.0, 138.0, 98.0, 62.0, 30.0, 19.0, 20.0, 14.0, 6.0, 1.0, 6.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.23828125, -2.17138671875, -2.1044921875, -2.03759765625, -1.970703125, -1.90380859375, -1.8369140625, -1.77001953125, -1.703125, -1.63623046875, -1.5693359375, -1.50244140625, -1.435546875, -1.36865234375, -1.3017578125, -1.23486328125, -1.16796875, -1.10107421875, -1.0341796875, -0.96728515625, -0.900390625, -0.83349609375, -0.7666015625, -0.69970703125, -0.6328125, -0.56591796875, -0.4990234375, -0.43212890625, -0.365234375, -0.29833984375, -0.2314453125, -0.16455078125, -0.09765625, -0.03076171875, 0.0361328125, 0.10302734375, 0.169921875, 0.23681640625, 0.3037109375, 0.37060546875, 0.4375, 0.50439453125, 0.5712890625, 0.63818359375, 0.705078125, 0.77197265625, 0.8388671875, 0.90576171875, 0.97265625, 1.03955078125, 1.1064453125, 1.17333984375, 1.240234375, 1.30712890625, 1.3740234375, 1.44091796875, 1.5078125, 1.57470703125, 1.6416015625, 1.70849609375, 1.775390625, 1.84228515625, 1.9091796875, 1.97607421875, 2.04296875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 5.0, 5.0, 11.0, 15.0, 15.0, 20.0, 17.0, 29.0, 31.0, 41.0, 53.0, 42.0, 65.0, 62.0, 64.0, 69.0, 72.0, 51.0, 58.0, 52.0, 36.0, 46.0, 32.0, 30.0, 17.0, 12.0, 24.0, 8.0, 9.0, 6.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.287109375, -0.2772979736328125, -0.267486572265625, -0.2576751708984375, -0.24786376953125, -0.2380523681640625, -0.228240966796875, -0.2184295654296875, -0.2086181640625, -0.1988067626953125, -0.188995361328125, -0.1791839599609375, -0.16937255859375, -0.1595611572265625, -0.149749755859375, -0.1399383544921875, -0.130126953125, -0.1203155517578125, -0.110504150390625, -0.1006927490234375, -0.09088134765625, -0.0810699462890625, -0.071258544921875, -0.0614471435546875, -0.0516357421875, -0.0418243408203125, -0.032012939453125, -0.0222015380859375, -0.01239013671875, -0.0025787353515625, 0.007232666015625, 0.0170440673828125, 0.02685546875, 0.0366668701171875, 0.046478271484375, 0.0562896728515625, 0.06610107421875, 0.0759124755859375, 0.085723876953125, 0.0955352783203125, 0.1053466796875, 0.1151580810546875, 0.124969482421875, 0.1347808837890625, 0.14459228515625, 0.1544036865234375, 0.164215087890625, 0.1740264892578125, 0.183837890625, 0.1936492919921875, 0.203460693359375, 0.2132720947265625, 0.22308349609375, 0.2328948974609375, 0.242706298828125, 0.2525177001953125, 0.2623291015625, 0.2721405029296875, 0.281951904296875, 0.2917633056640625, 0.30157470703125, 0.3113861083984375, 0.321197509765625, 0.3310089111328125, 0.3408203125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 8.0, 7.0, 11.0, 30.0, 21.0, 50.0, 75.0, 108.0, 162.0, 270.0, 421.0, 733.0, 1415.0, 3048.0, 7361.0, 21330.0, 77663.0, 419681.0, 3301274.0, 275599.0, 57569.0, 16493.0, 5699.0, 2431.0, 1258.0, 606.0, 389.0, 209.0, 124.0, 89.0, 48.0, 35.0, 21.0, 9.0, 11.0, 9.0, 5.0, 6.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0], "bins": [-2.888671875, -2.8046875, -2.720703125, -2.63671875, -2.552734375, -2.46875, -2.384765625, -2.30078125, -2.216796875, -2.1328125, -2.048828125, -1.96484375, -1.880859375, -1.796875, -1.712890625, -1.62890625, -1.544921875, -1.4609375, -1.376953125, -1.29296875, -1.208984375, -1.125, -1.041015625, -0.95703125, -0.873046875, -0.7890625, -0.705078125, -0.62109375, -0.537109375, -0.453125, -0.369140625, -0.28515625, -0.201171875, -0.1171875, -0.033203125, 0.05078125, 0.134765625, 0.21875, 0.302734375, 0.38671875, 0.470703125, 0.5546875, 0.638671875, 0.72265625, 0.806640625, 0.890625, 0.974609375, 1.05859375, 1.142578125, 1.2265625, 1.310546875, 1.39453125, 1.478515625, 1.5625, 1.646484375, 1.73046875, 1.814453125, 1.8984375, 1.982421875, 2.06640625, 2.150390625, 2.234375, 2.318359375, 2.40234375, 2.486328125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 0.0, 5.0, 6.0, 3.0, 14.0, 13.0, 16.0, 17.0, 45.0, 49.0, 87.0, 99.0, 216.0, 472.0, 1883.0, 537.0, 245.0, 126.0, 75.0, 42.0, 43.0, 27.0, 19.0, 13.0, 7.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8427734375, -0.8183517456054688, -0.7939300537109375, -0.7695083618164062, -0.745086669921875, -0.7206649780273438, -0.6962432861328125, -0.6718215942382812, -0.64739990234375, -0.6229782104492188, -0.5985565185546875, -0.5741348266601562, -0.549713134765625, -0.5252914428710938, -0.5008697509765625, -0.47644805908203125, -0.4520263671875, -0.42760467529296875, -0.4031829833984375, -0.37876129150390625, -0.354339599609375, -0.32991790771484375, -0.3054962158203125, -0.28107452392578125, -0.25665283203125, -0.23223114013671875, -0.2078094482421875, -0.18338775634765625, -0.158966064453125, -0.13454437255859375, -0.1101226806640625, -0.08570098876953125, -0.061279296875, -0.03685760498046875, -0.0124359130859375, 0.01198577880859375, 0.036407470703125, 0.06082916259765625, 0.0852508544921875, 0.10967254638671875, 0.13409423828125, 0.15851593017578125, 0.1829376220703125, 0.20735931396484375, 0.231781005859375, 0.25620269775390625, 0.2806243896484375, 0.30504608154296875, 0.3294677734375, 0.35388946533203125, 0.3783111572265625, 0.40273284912109375, 0.427154541015625, 0.45157623291015625, 0.4759979248046875, 0.5004196166992188, 0.52484130859375, 0.5492630004882812, 0.5736846923828125, 0.5981063842773438, 0.622528076171875, 0.6469497680664062, 0.6713714599609375, 0.6957931518554688, 0.72021484375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 10.0, 7.0, 10.0, 20.0, 23.0, 77.0, 82.0, 122.0, 167.0, 140.0, 121.0, 85.0, 67.0, 40.0, 14.0, 12.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5741477012634277, -2.4107587337493896, -2.2473697662353516, -2.0839810371398926, -1.9205920696258545, -1.7572031021118164, -1.5938142538070679, -1.4304254055023193, -1.2670364379882812, -1.1036474704742432, -0.9402586221694946, -0.7768697142601013, -0.613480806350708, -0.4500918984413147, -0.2867029905319214, -0.12331414222717285, 0.040074825286865234, 0.20346373319625854, 0.36685264110565186, 0.5302415490150452, 0.6936304569244385, 0.8570193648338318, 1.020408272743225, 1.1837971210479736, 1.3471860885620117, 1.5105750560760498, 1.6739639043807983, 1.8373527526855469, 2.000741720199585, 2.164130687713623, 2.327519416809082, 2.49090838432312, 2.6542978286743164, 2.8176867961883545, 2.9810757637023926, 3.1444644927978516, 3.3078534603118896, 3.4712424278259277, 3.6346311569213867, 3.798020124435425, 3.961409091949463, 4.124797821044922, 4.288187026977539, 4.451575756072998, 4.614964485168457, 4.778353691101074, 4.941742420196533, 5.105131149291992, 5.268520355224609, 5.431909084320068, 5.5952982902526855, 5.7586870193481445, 5.922076225280762, 6.085464954376221, 6.24885368347168, 6.412242889404297, 6.575631618499756, 6.739020347595215, 6.902409553527832, 7.065798282623291, 7.22918701171875, 7.392576217651367, 7.555964946746826, 7.719353675842285, 7.882742881774902]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 4.0, 4.0, 3.0, 4.0, 5.0, 7.0, 11.0, 10.0, 11.0, 5.0, 14.0, 18.0, 17.0, 22.0, 20.0, 20.0, 25.0, 33.0, 31.0, 37.0, 45.0, 27.0, 34.0, 38.0, 45.0, 41.0, 36.0, 38.0, 47.0, 51.0, 38.0, 32.0, 23.0, 29.0, 22.0, 22.0, 22.0, 26.0, 17.0, 15.0, 13.0, 8.0, 8.0, 5.0, 7.0, 8.0, 3.0, 2.0, 4.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8588041067123413, -1.795504093170166, -1.7322039604187012, -1.6689039468765259, -1.6056039333343506, -1.5423039197921753, -1.47900390625, -1.4157037734985352, -1.3524037599563599, -1.2891037464141846, -1.2258036136627197, -1.1625036001205444, -1.0992035865783691, -1.0359035730361938, -0.9726034998893738, -0.9093034267425537, -0.8460034132003784, -0.7827033996582031, -0.7194033265113831, -0.656103253364563, -0.5928032398223877, -0.5295032262802124, -0.46620315313339233, -0.40290310978889465, -0.339603066444397, -0.2763030230998993, -0.2130029797554016, -0.14970293641090393, -0.08640289306640625, -0.02310284972190857, 0.04019719362258911, 0.10349723696708679, 0.16679716110229492, 0.2300972044467926, 0.2933972477912903, 0.35669729113578796, 0.41999733448028564, 0.4832973778247833, 0.546597421169281, 0.6098974943161011, 0.6731975078582764, 0.7364975214004517, 0.7997975945472717, 0.8630976676940918, 0.9263976812362671, 0.9896976947784424, 1.0529978275299072, 1.1162978410720825, 1.1795978546142578, 1.242897868156433, 1.3061978816986084, 1.3694980144500732, 1.4327980279922485, 1.4960980415344238, 1.5593981742858887, 1.622698187828064, 1.6859982013702393, 1.7492982149124146, 1.8125982284545898, 1.8758983612060547, 1.93919837474823, 2.0024983882904053, 2.06579852104187, 2.129098415374756, 2.1923985481262207]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 9.0, 12.0, 5.0, 25.0, 11.0, 29.0, 50.0, 55.0, 85.0, 109.0, 211.0, 277.0, 440.0, 782.0, 1224.0, 2217.0, 3974.0, 7314.0, 13738.0, 26232.0, 48920.0, 90617.0, 160449.0, 236616.0, 197884.0, 117991.0, 64784.0, 34537.0, 18280.0, 9525.0, 5054.0, 2972.0, 1605.0, 891.0, 535.0, 349.0, 241.0, 161.0, 102.0, 96.0, 37.0, 33.0, 17.0, 17.0, 11.0, 13.0, 7.0, 6.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.1005859375, -1.0679473876953125, -1.035308837890625, -1.0026702880859375, -0.97003173828125, -0.9373931884765625, -0.904754638671875, -0.8721160888671875, -0.8394775390625, -0.8068389892578125, -0.774200439453125, -0.7415618896484375, -0.70892333984375, -0.6762847900390625, -0.643646240234375, -0.6110076904296875, -0.578369140625, -0.5457305908203125, -0.513092041015625, -0.4804534912109375, -0.44781494140625, -0.4151763916015625, -0.382537841796875, -0.3498992919921875, -0.3172607421875, -0.2846221923828125, -0.251983642578125, -0.2193450927734375, -0.18670654296875, -0.1540679931640625, -0.121429443359375, -0.0887908935546875, -0.05615234375, -0.0235137939453125, 0.009124755859375, 0.0417633056640625, 0.07440185546875, 0.1070404052734375, 0.139678955078125, 0.1723175048828125, 0.2049560546875, 0.2375946044921875, 0.270233154296875, 0.3028717041015625, 0.33551025390625, 0.3681488037109375, 0.400787353515625, 0.4334259033203125, 0.466064453125, 0.4987030029296875, 0.531341552734375, 0.5639801025390625, 0.59661865234375, 0.6292572021484375, 0.661895751953125, 0.6945343017578125, 0.7271728515625, 0.7598114013671875, 0.792449951171875, 0.8250885009765625, 0.85772705078125, 0.8903656005859375, 0.923004150390625, 0.9556427001953125, 0.98828125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 8.0, 5.0, 14.0, 14.0, 19.0, 18.0, 31.0, 30.0, 44.0, 52.0, 62.0, 52.0, 58.0, 67.0, 76.0, 68.0, 65.0, 61.0, 56.0, 52.0, 36.0, 27.0, 21.0, 26.0, 14.0, 8.0, 8.0, 9.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.306640625, -0.2961235046386719, -0.28560638427734375, -0.2750892639160156, -0.2645721435546875, -0.2540550231933594, -0.24353790283203125, -0.23302078247070312, -0.222503662109375, -0.21198654174804688, -0.20146942138671875, -0.19095230102539062, -0.1804351806640625, -0.16991806030273438, -0.15940093994140625, -0.14888381958007812, -0.13836669921875, -0.12784957885742188, -0.11733245849609375, -0.10681533813476562, -0.0962982177734375, -0.08578109741210938, -0.07526397705078125, -0.06474685668945312, -0.054229736328125, -0.043712615966796875, -0.03319549560546875, -0.022678375244140625, -0.0121612548828125, -0.001644134521484375, 0.00887298583984375, 0.019390106201171875, 0.0299072265625, 0.040424346923828125, 0.05094146728515625, 0.061458587646484375, 0.0719757080078125, 0.08249282836914062, 0.09300994873046875, 0.10352706909179688, 0.114044189453125, 0.12456130981445312, 0.13507843017578125, 0.14559555053710938, 0.1561126708984375, 0.16662979125976562, 0.17714691162109375, 0.18766403198242188, 0.19818115234375, 0.20869827270507812, 0.21921539306640625, 0.22973251342773438, 0.2402496337890625, 0.2507667541503906, 0.26128387451171875, 0.2718009948730469, 0.282318115234375, 0.2928352355957031, 0.30335235595703125, 0.3138694763183594, 0.3243865966796875, 0.3349037170410156, 0.34542083740234375, 0.3559379577636719, 0.366455078125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 7.0, 11.0, 10.0, 13.0, 21.0, 25.0, 31.0, 67.0, 92.0, 108.0, 146.0, 231.0, 348.0, 479.0, 799.0, 1391.0, 2551.0, 4982.0, 10211.0, 22973.0, 54588.0, 128219.0, 265986.0, 290615.0, 148823.0, 64146.0, 27104.0, 11931.0, 5713.0, 2888.0, 1499.0, 864.0, 548.0, 351.0, 224.0, 154.0, 112.0, 90.0, 61.0, 37.0, 26.0, 14.0, 26.0, 13.0, 8.0, 7.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.271484375, -1.2305908203125, -1.189697265625, -1.1488037109375, -1.10791015625, -1.0670166015625, -1.026123046875, -0.9852294921875, -0.9443359375, -0.9034423828125, -0.862548828125, -0.8216552734375, -0.78076171875, -0.7398681640625, -0.698974609375, -0.6580810546875, -0.6171875, -0.5762939453125, -0.535400390625, -0.4945068359375, -0.45361328125, -0.4127197265625, -0.371826171875, -0.3309326171875, -0.2900390625, -0.2491455078125, -0.208251953125, -0.1673583984375, -0.12646484375, -0.0855712890625, -0.044677734375, -0.0037841796875, 0.037109375, 0.0780029296875, 0.118896484375, 0.1597900390625, 0.20068359375, 0.2415771484375, 0.282470703125, 0.3233642578125, 0.3642578125, 0.4051513671875, 0.446044921875, 0.4869384765625, 0.52783203125, 0.5687255859375, 0.609619140625, 0.6505126953125, 0.69140625, 0.7322998046875, 0.773193359375, 0.8140869140625, 0.85498046875, 0.8958740234375, 0.936767578125, 0.9776611328125, 1.0185546875, 1.0594482421875, 1.100341796875, 1.1412353515625, 1.18212890625, 1.2230224609375, 1.263916015625, 1.3048095703125, 1.345703125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 3.0, 2.0, 9.0, 7.0, 5.0, 10.0, 19.0, 16.0, 20.0, 31.0, 28.0, 37.0, 41.0, 50.0, 54.0, 52.0, 60.0, 54.0, 68.0, 49.0, 57.0, 48.0, 52.0, 49.0, 38.0, 29.0, 25.0, 15.0, 19.0, 17.0, 7.0, 7.0, 10.0, 6.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.576171875, -1.5267333984375, -1.477294921875, -1.4278564453125, -1.37841796875, -1.3289794921875, -1.279541015625, -1.2301025390625, -1.1806640625, -1.1312255859375, -1.081787109375, -1.0323486328125, -0.98291015625, -0.9334716796875, -0.884033203125, -0.8345947265625, -0.78515625, -0.7357177734375, -0.686279296875, -0.6368408203125, -0.58740234375, -0.5379638671875, -0.488525390625, -0.4390869140625, -0.3896484375, -0.3402099609375, -0.290771484375, -0.2413330078125, -0.19189453125, -0.1424560546875, -0.093017578125, -0.0435791015625, 0.005859375, 0.0552978515625, 0.104736328125, 0.1541748046875, 0.20361328125, 0.2530517578125, 0.302490234375, 0.3519287109375, 0.4013671875, 0.4508056640625, 0.500244140625, 0.5496826171875, 0.59912109375, 0.6485595703125, 0.697998046875, 0.7474365234375, 0.796875, 0.8463134765625, 0.895751953125, 0.9451904296875, 0.99462890625, 1.0440673828125, 1.093505859375, 1.1429443359375, 1.1923828125, 1.2418212890625, 1.291259765625, 1.3406982421875, 1.39013671875, 1.4395751953125, 1.489013671875, 1.5384521484375, 1.587890625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 5.0, 3.0, 9.0, 20.0, 10.0, 15.0, 47.0, 50.0, 70.0, 117.0, 199.0, 410.0, 783.0, 1637.0, 3992.0, 10378.0, 31236.0, 116039.0, 406911.0, 346078.0, 90076.0, 25523.0, 8501.0, 3420.0, 1454.0, 718.0, 361.0, 188.0, 100.0, 83.0, 38.0, 30.0, 18.0, 7.0, 15.0, 7.0, 6.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.0625, -1.0329132080078125, -1.003326416015625, -0.9737396240234375, -0.94415283203125, -0.9145660400390625, -0.884979248046875, -0.8553924560546875, -0.8258056640625, -0.7962188720703125, -0.766632080078125, -0.7370452880859375, -0.70745849609375, -0.6778717041015625, -0.648284912109375, -0.6186981201171875, -0.589111328125, -0.5595245361328125, -0.529937744140625, -0.5003509521484375, -0.47076416015625, -0.4411773681640625, -0.411590576171875, -0.3820037841796875, -0.3524169921875, -0.3228302001953125, -0.293243408203125, -0.2636566162109375, -0.23406982421875, -0.2044830322265625, -0.174896240234375, -0.1453094482421875, -0.11572265625, -0.0861358642578125, -0.056549072265625, -0.0269622802734375, 0.00262451171875, 0.0322113037109375, 0.061798095703125, 0.0913848876953125, 0.1209716796875, 0.1505584716796875, 0.180145263671875, 0.2097320556640625, 0.23931884765625, 0.2689056396484375, 0.298492431640625, 0.3280792236328125, 0.357666015625, 0.3872528076171875, 0.416839599609375, 0.4464263916015625, 0.47601318359375, 0.5055999755859375, 0.535186767578125, 0.5647735595703125, 0.5943603515625, 0.6239471435546875, 0.653533935546875, 0.6831207275390625, 0.71270751953125, 0.7422943115234375, 0.771881103515625, 0.8014678955078125, 0.8310546875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 4.0, 6.0, 9.0, 8.0, 5.0, 16.0, 13.0, 19.0, 21.0, 38.0, 50.0, 50.0, 71.0, 71.0, 111.0, 108.0, 70.0, 68.0, 42.0, 39.0, 32.0, 37.0, 23.0, 12.0, 17.0, 9.0, 11.0, 7.0, 5.0, 5.0, 5.0, 4.0, 3.0, 4.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00014328956604003906, -0.00013795122504234314, -0.00013261288404464722, -0.0001272745430469513, -0.00012193620204925537, -0.00011659786105155945, -0.00011125952005386353, -0.0001059211790561676, -0.00010058283805847168, -9.524449706077576e-05, -8.990615606307983e-05, -8.456781506538391e-05, -7.922947406768799e-05, -7.389113306999207e-05, -6.855279207229614e-05, -6.321445107460022e-05, -5.78761100769043e-05, -5.2537769079208374e-05, -4.719942808151245e-05, -4.186108708381653e-05, -3.6522746086120605e-05, -3.118440508842468e-05, -2.584606409072876e-05, -2.0507723093032837e-05, -1.5169382095336914e-05, -9.831041097640991e-06, -4.492700099945068e-06, 8.456408977508545e-07, 6.183981895446777e-06, 1.15223228931427e-05, 1.6860663890838623e-05, 2.2199004888534546e-05, 2.753734588623047e-05, 3.287568688392639e-05, 3.8214027881622314e-05, 4.355236887931824e-05, 4.889070987701416e-05, 5.422905087471008e-05, 5.9567391872406006e-05, 6.490573287010193e-05, 7.024407386779785e-05, 7.558241486549377e-05, 8.09207558631897e-05, 8.625909686088562e-05, 9.159743785858154e-05, 9.693577885627747e-05, 0.00010227411985397339, 0.00010761246085166931, 0.00011295080184936523, 0.00011828914284706116, 0.00012362748384475708, 0.000128965824842453, 0.00013430416584014893, 0.00013964250683784485, 0.00014498084783554077, 0.0001503191888332367, 0.00015565752983093262, 0.00016099587082862854, 0.00016633421182632446, 0.00017167255282402039, 0.0001770108938217163, 0.00018234923481941223, 0.00018768757581710815, 0.00019302591681480408, 0.0001983642578125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 3.0, 6.0, 9.0, 15.0, 24.0, 36.0, 61.0, 86.0, 152.0, 302.0, 694.0, 1549.0, 4246.0, 14501.0, 66421.0, 476423.0, 408560.0, 56150.0, 12737.0, 3813.0, 1485.0, 589.0, 273.0, 185.0, 91.0, 49.0, 39.0, 20.0, 16.0, 4.0, 4.0, 5.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-1.8330078125, -1.78594970703125, -1.7388916015625, -1.69183349609375, -1.644775390625, -1.59771728515625, -1.5506591796875, -1.50360107421875, -1.45654296875, -1.40948486328125, -1.3624267578125, -1.31536865234375, -1.268310546875, -1.22125244140625, -1.1741943359375, -1.12713623046875, -1.080078125, -1.03302001953125, -0.9859619140625, -0.93890380859375, -0.891845703125, -0.84478759765625, -0.7977294921875, -0.75067138671875, -0.70361328125, -0.65655517578125, -0.6094970703125, -0.56243896484375, -0.515380859375, -0.46832275390625, -0.4212646484375, -0.37420654296875, -0.3271484375, -0.28009033203125, -0.2330322265625, -0.18597412109375, -0.138916015625, -0.09185791015625, -0.0447998046875, 0.00225830078125, 0.04931640625, 0.09637451171875, 0.1434326171875, 0.19049072265625, 0.237548828125, 0.28460693359375, 0.3316650390625, 0.37872314453125, 0.42578125, 0.47283935546875, 0.5198974609375, 0.56695556640625, 0.614013671875, 0.66107177734375, 0.7081298828125, 0.75518798828125, 0.80224609375, 0.84930419921875, 0.8963623046875, 0.94342041015625, 0.990478515625, 1.03753662109375, 1.0845947265625, 1.13165283203125, 1.1787109375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 8.0, 4.0, 8.0, 14.0, 11.0, 14.0, 16.0, 22.0, 28.0, 46.0, 56.0, 79.0, 76.0, 90.0, 105.0, 64.0, 80.0, 44.0, 48.0, 38.0, 25.0, 26.0, 18.0, 13.0, 17.0, 13.0, 4.0, 4.0, 4.0, 5.0, 2.0, 3.0, 4.0, 4.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6572265625, -0.6347732543945312, -0.6123199462890625, -0.5898666381835938, -0.567413330078125, -0.5449600219726562, -0.5225067138671875, -0.5000534057617188, -0.47760009765625, -0.45514678955078125, -0.4326934814453125, -0.41024017333984375, -0.387786865234375, -0.36533355712890625, -0.3428802490234375, -0.32042694091796875, -0.2979736328125, -0.27552032470703125, -0.2530670166015625, -0.23061370849609375, -0.208160400390625, -0.18570709228515625, -0.1632537841796875, -0.14080047607421875, -0.11834716796875, -0.09589385986328125, -0.0734405517578125, -0.05098724365234375, -0.028533935546875, -0.00608062744140625, 0.0163726806640625, 0.03882598876953125, 0.061279296875, 0.08373260498046875, 0.1061859130859375, 0.12863922119140625, 0.151092529296875, 0.17354583740234375, 0.1959991455078125, 0.21845245361328125, 0.24090576171875, 0.26335906982421875, 0.2858123779296875, 0.30826568603515625, 0.330718994140625, 0.35317230224609375, 0.3756256103515625, 0.39807891845703125, 0.4205322265625, 0.44298553466796875, 0.4654388427734375, 0.48789215087890625, 0.510345458984375, 0.5327987670898438, 0.5552520751953125, 0.5777053833007812, 0.60015869140625, 0.6226119995117188, 0.6450653076171875, 0.6675186157226562, 0.689971923828125, 0.7124252319335938, 0.7348785400390625, 0.7573318481445312, 0.77978515625]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 12.0, 13.0, 5.0, 20.0, 16.0, 21.0, 32.0, 49.0, 60.0, 76.0, 85.0, 69.0, 87.0, 92.0, 77.0, 70.0, 62.0, 36.0, 26.0, 25.0, 17.0, 16.0, 10.0, 7.0, 7.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-9.764694213867188, -9.511588096618652, -9.2584810256958, -9.005374908447266, -8.752267837524414, -8.499161720275879, -8.246055603027344, -7.99294900894165, -7.739842414855957, -7.486735820770264, -7.23362922668457, -6.980523109436035, -6.727416515350342, -6.474309921264648, -6.221203804016113, -5.96809720993042, -5.714990615844727, -5.461884021759033, -5.20877742767334, -4.955671310424805, -4.702564716339111, -4.449458122253418, -4.196352005004883, -3.9432454109191895, -3.690138816833496, -3.4370322227478027, -3.1839258670806885, -2.930819511413574, -2.677712917327881, -2.4246063232421875, -2.1714999675750732, -1.9183934926986694, -1.6652874946594238, -1.41218101978302, -1.1590745449066162, -0.9059680700302124, -0.6528615951538086, -0.3997551202774048, -0.14664864540100098, 0.10645782947540283, 0.35956430435180664, 0.6126707792282104, 0.8657772541046143, 1.118883728981018, 1.3719902038574219, 1.6250966787338257, 1.8782031536102295, 2.1313095092773438, 2.384416103363037, 2.6375226974487305, 2.8906290531158447, 3.143735408782959, 3.3968420028686523, 3.6499485969543457, 3.90305495262146, 4.156161308288574, 4.409267902374268, 4.662374496459961, 4.915480613708496, 5.1685872077941895, 5.421693801879883, 5.674800395965576, 5.9279069900512695, 6.181013107299805, 6.434119701385498]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 8.0, 5.0, 10.0, 20.0, 14.0, 16.0, 24.0, 27.0, 26.0, 29.0, 35.0, 37.0, 36.0, 53.0, 55.0, 42.0, 61.0, 64.0, 46.0, 51.0, 44.0, 45.0, 42.0, 25.0, 29.0, 24.0, 19.0, 24.0, 20.0, 19.0, 11.0, 1.0, 11.0, 7.0, 7.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-9.38187026977539, -9.132511138916016, -8.88315200805664, -8.633792877197266, -8.384432792663574, -8.1350736618042, -7.885714530944824, -7.636355400085449, -7.386996269226074, -7.137637138366699, -6.888277530670166, -6.638918399810791, -6.389559268951416, -6.140199661254883, -5.890840530395508, -5.641481399536133, -5.392122268676758, -5.142763137817383, -4.89340353012085, -4.644044399261475, -4.3946852684021, -4.145325660705566, -3.8959665298461914, -3.6466073989868164, -3.397247791290283, -3.147888422012329, -2.898529291152954, -2.649169921875, -2.399810791015625, -2.150451421737671, -1.9010921716690063, -1.6517329216003418, -1.4023737907409668, -1.1530145406723022, -0.9036552906036377, -0.6542959809303284, -0.4049367308616638, -0.1555774211883545, 0.09378182888031006, 0.3431410789489746, 0.5925003290176392, 0.8418595790863037, 1.0912188291549683, 1.3405780792236328, 1.589937448501587, 1.8392966985702515, 2.088655948638916, 2.338015079498291, 2.587374448776245, 2.836733818054199, 3.086092948913574, 3.3354523181915283, 3.5848114490509033, 3.8341708183288574, 4.083529949188232, 4.332889556884766, 4.582248687744141, 4.831607818603516, 5.080967426300049, 5.330326557159424, 5.579685688018799, 5.829045295715332, 6.078404426574707, 6.327763557434082, 6.577122688293457]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 7.0, 7.0, 12.0, 15.0, 35.0, 40.0, 58.0, 101.0, 128.0, 225.0, 306.0, 526.0, 801.0, 1347.0, 2309.0, 3898.0, 7030.0, 13576.0, 28378.0, 66807.0, 229780.0, 3295247.0, 383446.0, 89629.0, 35104.0, 16280.0, 8379.0, 4433.0, 2475.0, 1493.0, 879.0, 549.0, 311.0, 217.0, 152.0, 88.0, 65.0, 36.0, 34.0, 17.0, 15.0, 11.0, 8.0, 10.0, 7.0, 2.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-1.4072265625, -1.365386962890625, -1.32354736328125, -1.281707763671875, -1.2398681640625, -1.198028564453125, -1.15618896484375, -1.114349365234375, -1.072509765625, -1.030670166015625, -0.98883056640625, -0.946990966796875, -0.9051513671875, -0.863311767578125, -0.82147216796875, -0.779632568359375, -0.73779296875, -0.695953369140625, -0.65411376953125, -0.612274169921875, -0.5704345703125, -0.528594970703125, -0.48675537109375, -0.444915771484375, -0.403076171875, -0.361236572265625, -0.31939697265625, -0.277557373046875, -0.2357177734375, -0.193878173828125, -0.15203857421875, -0.110198974609375, -0.068359375, -0.026519775390625, 0.01531982421875, 0.057159423828125, 0.0989990234375, 0.140838623046875, 0.18267822265625, 0.224517822265625, 0.266357421875, 0.308197021484375, 0.35003662109375, 0.391876220703125, 0.4337158203125, 0.475555419921875, 0.51739501953125, 0.559234619140625, 0.60107421875, 0.642913818359375, 0.68475341796875, 0.726593017578125, 0.7684326171875, 0.810272216796875, 0.85211181640625, 0.893951416015625, 0.935791015625, 0.977630615234375, 1.01947021484375, 1.061309814453125, 1.1031494140625, 1.144989013671875, 1.18682861328125, 1.228668212890625, 1.2705078125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 8.0, 2.0, 12.0, 13.0, 14.0, 15.0, 14.0, 14.0, 23.0, 32.0, 38.0, 38.0, 37.0, 44.0, 55.0, 48.0, 60.0, 53.0, 62.0, 60.0, 53.0, 51.0, 48.0, 34.0, 31.0, 21.0, 41.0, 22.0, 17.0, 10.0, 9.0, 11.0, 1.0, 7.0, 5.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.294921875, -0.28580474853515625, -0.2766876220703125, -0.26757049560546875, -0.258453369140625, -0.24933624267578125, -0.2402191162109375, -0.23110198974609375, -0.22198486328125, -0.21286773681640625, -0.2037506103515625, -0.19463348388671875, -0.185516357421875, -0.17639923095703125, -0.1672821044921875, -0.15816497802734375, -0.1490478515625, -0.13993072509765625, -0.1308135986328125, -0.12169647216796875, -0.112579345703125, -0.10346221923828125, -0.0943450927734375, -0.08522796630859375, -0.07611083984375, -0.06699371337890625, -0.0578765869140625, -0.04875946044921875, -0.039642333984375, -0.03052520751953125, -0.0214080810546875, -0.01229095458984375, -0.003173828125, 0.00594329833984375, 0.0150604248046875, 0.02417755126953125, 0.033294677734375, 0.04241180419921875, 0.0515289306640625, 0.06064605712890625, 0.06976318359375, 0.07888031005859375, 0.0879974365234375, 0.09711456298828125, 0.106231689453125, 0.11534881591796875, 0.1244659423828125, 0.13358306884765625, 0.1427001953125, 0.15181732177734375, 0.1609344482421875, 0.17005157470703125, 0.179168701171875, 0.18828582763671875, 0.1974029541015625, 0.20652008056640625, 0.21563720703125, 0.22475433349609375, 0.2338714599609375, 0.24298858642578125, 0.252105712890625, 0.26122283935546875, 0.2703399658203125, 0.27945709228515625, 0.28857421875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 3.0, 6.0, 6.0, 4.0, 4.0, 9.0, 18.0, 22.0, 27.0, 24.0, 45.0, 53.0, 69.0, 101.0, 156.0, 236.0, 393.0, 630.0, 1251.0, 2740.0, 7205.0, 21475.0, 79549.0, 481514.0, 3298108.0, 228276.0, 49121.0, 14319.0, 4857.0, 1921.0, 869.0, 451.0, 249.0, 151.0, 109.0, 87.0, 62.0, 33.0, 35.0, 17.0, 19.0, 15.0, 12.0, 6.0, 4.0, 7.0, 7.0, 4.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-2.234375, -2.167327880859375, -2.10028076171875, -2.033233642578125, -1.9661865234375, -1.899139404296875, -1.83209228515625, -1.765045166015625, -1.697998046875, -1.630950927734375, -1.56390380859375, -1.496856689453125, -1.4298095703125, -1.362762451171875, -1.29571533203125, -1.228668212890625, -1.16162109375, -1.094573974609375, -1.02752685546875, -0.960479736328125, -0.8934326171875, -0.826385498046875, -0.75933837890625, -0.692291259765625, -0.625244140625, -0.558197021484375, -0.49114990234375, -0.424102783203125, -0.3570556640625, -0.290008544921875, -0.22296142578125, -0.155914306640625, -0.0888671875, -0.021820068359375, 0.04522705078125, 0.112274169921875, 0.1793212890625, 0.246368408203125, 0.31341552734375, 0.380462646484375, 0.447509765625, 0.514556884765625, 0.58160400390625, 0.648651123046875, 0.7156982421875, 0.782745361328125, 0.84979248046875, 0.916839599609375, 0.98388671875, 1.050933837890625, 1.11798095703125, 1.185028076171875, 1.2520751953125, 1.319122314453125, 1.38616943359375, 1.453216552734375, 1.520263671875, 1.587310791015625, 1.65435791015625, 1.721405029296875, 1.7884521484375, 1.855499267578125, 1.92254638671875, 1.989593505859375, 2.056640625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 6.0, 7.0, 15.0, 10.0, 26.0, 36.0, 49.0, 74.0, 135.0, 265.0, 649.0, 1899.0, 420.0, 180.0, 111.0, 64.0, 42.0, 23.0, 23.0, 17.0, 8.0, 8.0, 6.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.79248046875, -0.77001953125, -0.74755859375, -0.72509765625, -0.70263671875, -0.68017578125, -0.65771484375, -0.63525390625, -0.61279296875, -0.59033203125, -0.56787109375, -0.54541015625, -0.52294921875, -0.50048828125, -0.47802734375, -0.45556640625, -0.43310546875, -0.41064453125, -0.38818359375, -0.36572265625, -0.34326171875, -0.32080078125, -0.29833984375, -0.27587890625, -0.25341796875, -0.23095703125, -0.20849609375, -0.18603515625, -0.16357421875, -0.14111328125, -0.11865234375, -0.09619140625, -0.07373046875, -0.05126953125, -0.02880859375, -0.00634765625, 0.01611328125, 0.03857421875, 0.06103515625, 0.08349609375, 0.10595703125, 0.12841796875, 0.15087890625, 0.17333984375, 0.19580078125, 0.21826171875, 0.24072265625, 0.26318359375, 0.28564453125, 0.30810546875, 0.33056640625, 0.35302734375, 0.37548828125, 0.39794921875, 0.42041015625, 0.44287109375, 0.46533203125, 0.48779296875, 0.51025390625, 0.53271484375, 0.55517578125, 0.57763671875, 0.60009765625, 0.62255859375, 0.64501953125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 6.0, 10.0, 20.0, 26.0, 27.0, 59.0, 80.0, 79.0, 110.0, 109.0, 120.0, 112.0, 77.0, 63.0, 31.0, 31.0, 17.0, 7.0, 3.0, 4.0, 2.0, 5.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8730950355529785, -3.7584071159362793, -3.64371919631958, -3.5290310382843018, -3.4143431186676025, -3.2996551990509033, -3.184967041015625, -3.070279121398926, -2.9555912017822266, -2.8409032821655273, -2.726215362548828, -2.61152720451355, -2.4968392848968506, -2.3821513652801514, -2.267463207244873, -2.152775287628174, -2.0380873680114746, -1.9233994483947754, -1.8087114095687866, -1.6940233707427979, -1.5793354511260986, -1.4646475315093994, -1.3499594926834106, -1.2352714538574219, -1.1205835342407227, -1.0058956146240234, -0.8912075757980347, -0.7765195965766907, -0.6618316173553467, -0.5471436381340027, -0.4324556589126587, -0.3177676796913147, -0.2030797004699707, -0.08839172124862671, 0.026296257972717285, 0.14098423719406128, 0.2556722164154053, 0.37036019563674927, 0.48504817485809326, 0.5997361540794373, 0.7144241333007812, 0.8291121125221252, 0.9438000917434692, 1.058488130569458, 1.1731760501861572, 1.2878639698028564, 1.4025520086288452, 1.517240047454834, 1.6319279670715332, 1.7466158866882324, 1.8613039255142212, 1.97599196434021, 2.090679883956909, 2.2053678035736084, 2.3200559616088867, 2.434743881225586, 2.549431800842285, 2.6641197204589844, 2.7788076400756836, 2.893495798110962, 3.008183717727661, 3.1228716373443604, 3.2375597953796387, 3.352247714996338, 3.466935634613037]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 5.0, 6.0, 4.0, 8.0, 9.0, 15.0, 12.0, 18.0, 15.0, 24.0, 22.0, 35.0, 30.0, 38.0, 29.0, 42.0, 45.0, 37.0, 57.0, 44.0, 39.0, 49.0, 40.0, 43.0, 39.0, 38.0, 39.0, 25.0, 29.0, 29.0, 20.0, 23.0, 28.0, 10.0, 12.0, 7.0, 10.0, 14.0, 2.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.218714714050293, -2.155890703201294, -2.093066453933716, -2.030242443084717, -1.9674183130264282, -1.9045941829681396, -1.8417701721191406, -1.778946042060852, -1.7161219120025635, -1.653297781944275, -1.5904737710952759, -1.5276496410369873, -1.4648255109786987, -1.4020013809204102, -1.3391773700714111, -1.2763532400131226, -1.2135292291641235, -1.150705099105835, -1.087881088256836, -1.0250569581985474, -0.9622328281402588, -0.899408757686615, -0.8365846872329712, -0.7737605571746826, -0.7109364867210388, -0.648112416267395, -0.5852882862091064, -0.5224642157554626, -0.45964011549949646, -0.3968160152435303, -0.3339919447898865, -0.2711678445339203, -0.20834362506866455, -0.14551952481269836, -0.08269543945789337, -0.01987135410308838, 0.04295274615287781, 0.105776846408844, 0.1686009168624878, 0.23142501711845398, 0.29424911737442017, 0.35707321763038635, 0.41989731788635254, 0.48272138833999634, 0.5455454587936401, 0.6083695888519287, 0.6711936593055725, 0.7340177297592163, 0.7968418598175049, 0.8596659302711487, 0.9224900603294373, 0.985314130783081, 1.0481382608413696, 1.1109623908996582, 1.1737864017486572, 1.2366105318069458, 1.2994346618652344, 1.362258791923523, 1.425082802772522, 1.4879069328308105, 1.5507310628890991, 1.6135551929473877, 1.6763792037963867, 1.7392033338546753, 1.8020273447036743]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 6.0, 11.0, 10.0, 21.0, 26.0, 50.0, 68.0, 106.0, 199.0, 294.0, 504.0, 859.0, 1412.0, 2591.0, 4413.0, 7886.0, 14408.0, 26783.0, 50833.0, 94775.0, 165326.0, 236595.0, 191957.0, 114149.0, 62350.0, 33142.0, 17736.0, 9537.0, 5421.0, 2934.0, 1653.0, 984.0, 563.0, 380.0, 208.0, 135.0, 90.0, 48.0, 30.0, 25.0, 13.0, 6.0, 8.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.0625, -1.0318450927734375, -1.001190185546875, -0.9705352783203125, -0.93988037109375, -0.9092254638671875, -0.878570556640625, -0.8479156494140625, -0.8172607421875, -0.7866058349609375, -0.755950927734375, -0.7252960205078125, -0.69464111328125, -0.6639862060546875, -0.633331298828125, -0.6026763916015625, -0.572021484375, -0.5413665771484375, -0.510711669921875, -0.4800567626953125, -0.44940185546875, -0.4187469482421875, -0.388092041015625, -0.3574371337890625, -0.3267822265625, -0.2961273193359375, -0.265472412109375, -0.2348175048828125, -0.20416259765625, -0.1735076904296875, -0.142852783203125, -0.1121978759765625, -0.08154296875, -0.0508880615234375, -0.020233154296875, 0.0104217529296875, 0.04107666015625, 0.0717315673828125, 0.102386474609375, 0.1330413818359375, 0.1636962890625, 0.1943511962890625, 0.225006103515625, 0.2556610107421875, 0.28631591796875, 0.3169708251953125, 0.347625732421875, 0.3782806396484375, 0.408935546875, 0.4395904541015625, 0.470245361328125, 0.5009002685546875, 0.53155517578125, 0.5622100830078125, 0.592864990234375, 0.6235198974609375, 0.6541748046875, 0.6848297119140625, 0.715484619140625, 0.7461395263671875, 0.77679443359375, 0.8074493408203125, 0.838104248046875, 0.8687591552734375, 0.8994140625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 0.0, 2.0, 3.0, 7.0, 9.0, 12.0, 10.0, 11.0, 16.0, 18.0, 23.0, 21.0, 29.0, 37.0, 41.0, 37.0, 47.0, 51.0, 52.0, 58.0, 64.0, 56.0, 48.0, 51.0, 42.0, 44.0, 29.0, 35.0, 31.0, 33.0, 21.0, 13.0, 15.0, 7.0, 9.0, 8.0, 5.0, 9.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.266845703125, -0.25774383544921875, -0.2486419677734375, -0.23954010009765625, -0.230438232421875, -0.22133636474609375, -0.2122344970703125, -0.20313262939453125, -0.19403076171875, -0.18492889404296875, -0.1758270263671875, -0.16672515869140625, -0.157623291015625, -0.14852142333984375, -0.1394195556640625, -0.13031768798828125, -0.1212158203125, -0.11211395263671875, -0.1030120849609375, -0.09391021728515625, -0.084808349609375, -0.07570648193359375, -0.0666046142578125, -0.05750274658203125, -0.04840087890625, -0.03929901123046875, -0.0301971435546875, -0.02109527587890625, -0.011993408203125, -0.00289154052734375, 0.0062103271484375, 0.01531219482421875, 0.0244140625, 0.03351593017578125, 0.0426177978515625, 0.05171966552734375, 0.060821533203125, 0.06992340087890625, 0.0790252685546875, 0.08812713623046875, 0.09722900390625, 0.10633087158203125, 0.1154327392578125, 0.12453460693359375, 0.133636474609375, 0.14273834228515625, 0.1518402099609375, 0.16094207763671875, 0.1700439453125, 0.17914581298828125, 0.1882476806640625, 0.19734954833984375, 0.206451416015625, 0.21555328369140625, 0.2246551513671875, 0.23375701904296875, 0.24285888671875, 0.25196075439453125, 0.2610626220703125, 0.27016448974609375, 0.279266357421875, 0.28836822509765625, 0.2974700927734375, 0.30657196044921875, 0.315673828125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 4.0, 6.0, 10.0, 11.0, 10.0, 15.0, 16.0, 40.0, 65.0, 95.0, 135.0, 228.0, 437.0, 982.0, 2081.0, 5383.0, 19286.0, 85943.0, 371386.0, 424772.0, 103597.0, 23265.0, 6257.0, 2310.0, 963.0, 501.0, 308.0, 171.0, 93.0, 65.0, 49.0, 20.0, 14.0, 11.0, 10.0, 10.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.314453125, -2.250274658203125, -2.18609619140625, -2.121917724609375, -2.0577392578125, -1.993560791015625, -1.92938232421875, -1.865203857421875, -1.801025390625, -1.736846923828125, -1.67266845703125, -1.608489990234375, -1.5443115234375, -1.480133056640625, -1.41595458984375, -1.351776123046875, -1.28759765625, -1.223419189453125, -1.15924072265625, -1.095062255859375, -1.0308837890625, -0.966705322265625, -0.90252685546875, -0.838348388671875, -0.774169921875, -0.709991455078125, -0.64581298828125, -0.581634521484375, -0.5174560546875, -0.453277587890625, -0.38909912109375, -0.324920654296875, -0.2607421875, -0.196563720703125, -0.13238525390625, -0.068206787109375, -0.0040283203125, 0.060150146484375, 0.12432861328125, 0.188507080078125, 0.252685546875, 0.316864013671875, 0.38104248046875, 0.445220947265625, 0.5093994140625, 0.573577880859375, 0.63775634765625, 0.701934814453125, 0.76611328125, 0.830291748046875, 0.89447021484375, 0.958648681640625, 1.0228271484375, 1.087005615234375, 1.15118408203125, 1.215362548828125, 1.279541015625, 1.343719482421875, 1.40789794921875, 1.472076416015625, 1.5362548828125, 1.600433349609375, 1.66461181640625, 1.728790283203125, 1.79296875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 9.0, 6.0, 12.0, 11.0, 9.0, 16.0, 22.0, 29.0, 25.0, 35.0, 27.0, 26.0, 40.0, 43.0, 44.0, 36.0, 53.0, 47.0, 43.0, 55.0, 47.0, 60.0, 32.0, 39.0, 33.0, 33.0, 26.0, 23.0, 27.0, 18.0, 16.0, 6.0, 13.0, 10.0, 6.0, 4.0, 3.0, 8.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.380859375, -1.342926025390625, -1.30499267578125, -1.267059326171875, -1.2291259765625, -1.191192626953125, -1.15325927734375, -1.115325927734375, -1.077392578125, -1.039459228515625, -1.00152587890625, -0.963592529296875, -0.9256591796875, -0.887725830078125, -0.84979248046875, -0.811859130859375, -0.77392578125, -0.735992431640625, -0.69805908203125, -0.660125732421875, -0.6221923828125, -0.584259033203125, -0.54632568359375, -0.508392333984375, -0.470458984375, -0.432525634765625, -0.39459228515625, -0.356658935546875, -0.3187255859375, -0.280792236328125, -0.24285888671875, -0.204925537109375, -0.1669921875, -0.129058837890625, -0.09112548828125, -0.053192138671875, -0.0152587890625, 0.022674560546875, 0.06060791015625, 0.098541259765625, 0.136474609375, 0.174407958984375, 0.21234130859375, 0.250274658203125, 0.2882080078125, 0.326141357421875, 0.36407470703125, 0.402008056640625, 0.43994140625, 0.477874755859375, 0.51580810546875, 0.553741455078125, 0.5916748046875, 0.629608154296875, 0.66754150390625, 0.705474853515625, 0.743408203125, 0.781341552734375, 0.81927490234375, 0.857208251953125, 0.8951416015625, 0.933074951171875, 0.97100830078125, 1.008941650390625, 1.046875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 6.0, 2.0, 15.0, 16.0, 10.0, 22.0, 44.0, 85.0, 138.0, 250.0, 480.0, 982.0, 2170.0, 5784.0, 20680.0, 103201.0, 544406.0, 302450.0, 49282.0, 11687.0, 3784.0, 1547.0, 687.0, 363.0, 195.0, 118.0, 62.0, 42.0, 21.0, 8.0, 9.0, 6.0, 6.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0849609375, -1.0508270263671875, -1.016693115234375, -0.9825592041015625, -0.94842529296875, -0.9142913818359375, -0.880157470703125, -0.8460235595703125, -0.8118896484375, -0.7777557373046875, -0.743621826171875, -0.7094879150390625, -0.67535400390625, -0.6412200927734375, -0.607086181640625, -0.5729522705078125, -0.538818359375, -0.5046844482421875, -0.470550537109375, -0.4364166259765625, -0.40228271484375, -0.3681488037109375, -0.334014892578125, -0.2998809814453125, -0.2657470703125, -0.2316131591796875, -0.197479248046875, -0.1633453369140625, -0.12921142578125, -0.0950775146484375, -0.060943603515625, -0.0268096923828125, 0.00732421875, 0.0414581298828125, 0.075592041015625, 0.1097259521484375, 0.14385986328125, 0.1779937744140625, 0.212127685546875, 0.2462615966796875, 0.2803955078125, 0.3145294189453125, 0.348663330078125, 0.3827972412109375, 0.41693115234375, 0.4510650634765625, 0.485198974609375, 0.5193328857421875, 0.553466796875, 0.5876007080078125, 0.621734619140625, 0.6558685302734375, 0.69000244140625, 0.7241363525390625, 0.758270263671875, 0.7924041748046875, 0.8265380859375, 0.8606719970703125, 0.894805908203125, 0.9289398193359375, 0.96307373046875, 0.9972076416015625, 1.031341552734375, 1.0654754638671875, 1.099609375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 5.0, 5.0, 8.0, 10.0, 16.0, 23.0, 32.0, 38.0, 51.0, 66.0, 106.0, 149.0, 148.0, 103.0, 62.0, 49.0, 29.0, 26.0, 26.0, 15.0, 11.0, 5.0, 9.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000270843505859375, -0.00026203691959381104, -0.00025323033332824707, -0.0002444237470626831, -0.00023561716079711914, -0.00022681057453155518, -0.0002180039882659912, -0.00020919740200042725, -0.00020039081573486328, -0.00019158422946929932, -0.00018277764320373535, -0.0001739710569381714, -0.00016516447067260742, -0.00015635788440704346, -0.0001475512981414795, -0.00013874471187591553, -0.00012993812561035156, -0.0001211315393447876, -0.00011232495307922363, -0.00010351836681365967, -9.47117805480957e-05, -8.590519428253174e-05, -7.709860801696777e-05, -6.829202175140381e-05, -5.9485435485839844e-05, -5.067884922027588e-05, -4.1872262954711914e-05, -3.306567668914795e-05, -2.4259090423583984e-05, -1.545250415802002e-05, -6.645917892456055e-06, 2.16066837310791e-06, 1.0967254638671875e-05, 1.977384090423584e-05, 2.8580427169799805e-05, 3.738701343536377e-05, 4.6193599700927734e-05, 5.50001859664917e-05, 6.380677223205566e-05, 7.261335849761963e-05, 8.14199447631836e-05, 9.022653102874756e-05, 9.903311729431152e-05, 0.00010783970355987549, 0.00011664628982543945, 0.00012545287609100342, 0.00013425946235656738, 0.00014306604862213135, 0.0001518726348876953, 0.00016067922115325928, 0.00016948580741882324, 0.0001782923936843872, 0.00018709897994995117, 0.00019590556621551514, 0.0002047121524810791, 0.00021351873874664307, 0.00022232532501220703, 0.000231131911277771, 0.00023993849754333496, 0.0002487450838088989, 0.0002575516700744629, 0.00026635825634002686, 0.0002751648426055908, 0.0002839714288711548, 0.00029277801513671875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 2.0, 3.0, 0.0, 4.0, 6.0, 8.0, 10.0, 16.0, 20.0, 32.0, 61.0, 66.0, 96.0, 149.0, 240.0, 407.0, 695.0, 1147.0, 2361.0, 5235.0, 13612.0, 42864.0, 170127.0, 528159.0, 206334.0, 49746.0, 15512.0, 5875.0, 2583.0, 1302.0, 737.0, 421.0, 261.0, 148.0, 99.0, 68.0, 53.0, 28.0, 21.0, 17.0, 15.0, 4.0, 11.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.99755859375, -0.96783447265625, -0.9381103515625, -0.90838623046875, -0.878662109375, -0.84893798828125, -0.8192138671875, -0.78948974609375, -0.759765625, -0.73004150390625, -0.7003173828125, -0.67059326171875, -0.640869140625, -0.61114501953125, -0.5814208984375, -0.55169677734375, -0.52197265625, -0.49224853515625, -0.4625244140625, -0.43280029296875, -0.403076171875, -0.37335205078125, -0.3436279296875, -0.31390380859375, -0.2841796875, -0.25445556640625, -0.2247314453125, -0.19500732421875, -0.165283203125, -0.13555908203125, -0.1058349609375, -0.07611083984375, -0.04638671875, -0.01666259765625, 0.0130615234375, 0.04278564453125, 0.072509765625, 0.10223388671875, 0.1319580078125, 0.16168212890625, 0.19140625, 0.22113037109375, 0.2508544921875, 0.28057861328125, 0.310302734375, 0.34002685546875, 0.3697509765625, 0.39947509765625, 0.42919921875, 0.45892333984375, 0.4886474609375, 0.51837158203125, 0.548095703125, 0.57781982421875, 0.6075439453125, 0.63726806640625, 0.6669921875, 0.69671630859375, 0.7264404296875, 0.75616455078125, 0.785888671875, 0.81561279296875, 0.8453369140625, 0.87506103515625, 0.90478515625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 4.0, 7.0, 7.0, 9.0, 9.0, 7.0, 17.0, 18.0, 32.0, 25.0, 46.0, 58.0, 52.0, 84.0, 85.0, 94.0, 100.0, 64.0, 49.0, 44.0, 39.0, 30.0, 19.0, 22.0, 15.0, 9.0, 9.0, 6.0, 8.0, 6.0, 5.0, 6.0, 6.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48291015625, -0.46387481689453125, -0.4448394775390625, -0.42580413818359375, -0.406768798828125, -0.38773345947265625, -0.3686981201171875, -0.34966278076171875, -0.33062744140625, -0.31159210205078125, -0.2925567626953125, -0.27352142333984375, -0.254486083984375, -0.23545074462890625, -0.2164154052734375, -0.19738006591796875, -0.1783447265625, -0.15930938720703125, -0.1402740478515625, -0.12123870849609375, -0.102203369140625, -0.08316802978515625, -0.0641326904296875, -0.04509735107421875, -0.02606201171875, -0.00702667236328125, 0.0120086669921875, 0.03104400634765625, 0.050079345703125, 0.06911468505859375, 0.0881500244140625, 0.10718536376953125, 0.126220703125, 0.14525604248046875, 0.1642913818359375, 0.18332672119140625, 0.202362060546875, 0.22139739990234375, 0.2404327392578125, 0.25946807861328125, 0.27850341796875, 0.29753875732421875, 0.3165740966796875, 0.33560943603515625, 0.354644775390625, 0.37368011474609375, 0.3927154541015625, 0.41175079345703125, 0.4307861328125, 0.44982147216796875, 0.4688568115234375, 0.48789215087890625, 0.506927490234375, 0.5259628295898438, 0.5449981689453125, 0.5640335083007812, 0.58306884765625, 0.6021041870117188, 0.6211395263671875, 0.6401748657226562, 0.659210205078125, 0.6782455444335938, 0.6972808837890625, 0.7163162231445312, 0.7353515625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 7.0, 10.0, 22.0, 42.0, 88.0, 128.0, 182.0, 175.0, 133.0, 92.0, 55.0, 31.0, 14.0, 10.0, 6.0, 7.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.520613670349121, -15.065470695495605, -14.610326766967773, -14.155183792114258, -13.700040817260742, -13.244897842407227, -12.789754867553711, -12.334610939025879, -11.879467964172363, -11.424324989318848, -10.969181060791016, -10.5140380859375, -10.058895111083984, -9.603752136230469, -9.148609161376953, -8.693465232849121, -8.238322257995605, -7.78317928314209, -7.328035831451416, -6.872892379760742, -6.417749404907227, -5.962606430053711, -5.507462978363037, -5.052319526672363, -4.597176551818848, -4.142033576965332, -3.686890125274658, -3.2317469120025635, -2.7766036987304688, -2.321460485458374, -1.8663172721862793, -1.4111740589141846, -0.9560298919677734, -0.5008866786956787, -0.045743465423583984, 0.40939974784851074, 0.8645429611206055, 1.3196861743927002, 1.774829387664795, 2.2299726009368896, 2.6851158142089844, 3.140259027481079, 3.595402240753174, 4.050545692443848, 4.505688667297363, 4.960831642150879, 5.415975093841553, 5.871118545532227, 6.326261520385742, 6.781404495239258, 7.236547946929932, 7.6916913986206055, 8.146834373474121, 8.601977348327637, 9.057121276855469, 9.512264251708984, 9.9674072265625, 10.422550201416016, 10.877693176269531, 11.332837104797363, 11.787980079650879, 12.243123054504395, 12.698266983032227, 13.153409957885742, 13.608552932739258]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 5.0, 8.0, 7.0, 7.0, 22.0, 23.0, 29.0, 30.0, 29.0, 38.0, 35.0, 50.0, 46.0, 47.0, 58.0, 59.0, 52.0, 42.0, 45.0, 42.0, 50.0, 39.0, 42.0, 32.0, 38.0, 19.0, 25.0, 16.0, 13.0, 14.0, 8.0, 10.0, 4.0, 4.0, 4.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-8.976999282836914, -8.7401762008667, -8.503352165222168, -8.266529083251953, -8.029705047607422, -7.792881965637207, -7.556058883666992, -7.319235324859619, -7.082411766052246, -6.845588207244873, -6.6087646484375, -6.371941566467285, -6.135118007659912, -5.898294448852539, -5.661471366882324, -5.424647808074951, -5.187824249267578, -4.951000690460205, -4.714177131652832, -4.477354049682617, -4.240530490875244, -4.003706932067871, -3.766883611679077, -3.530060291290283, -3.29323673248291, -3.056413173675537, -2.819589853286743, -2.582766532897949, -2.345942974090576, -2.109119415283203, -1.8722960948944092, -1.6354726552963257, -1.3986496925354004, -1.161826252937317, -0.9250028133392334, -0.6881793737411499, -0.4513559341430664, -0.2145324945449829, 0.022290945053100586, 0.2591143846511841, 0.4959378242492676, 0.7327612638473511, 0.9695847034454346, 1.206408143043518, 1.4432315826416016, 1.680055022239685, 1.9168784618377686, 2.1537017822265625, 2.3905253410339355, 2.6273488998413086, 2.8641722202301025, 3.1009955406188965, 3.3378190994262695, 3.5746426582336426, 3.8114659786224365, 4.0482892990112305, 4.2851128578186035, 4.521936416625977, 4.758759498596191, 4.9955830574035645, 5.2324066162109375, 5.4692301750183105, 5.706053733825684, 5.942876815795898, 6.1797003746032715]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 5.0, 2.0, 10.0, 12.0, 16.0, 20.0, 32.0, 48.0, 72.0, 144.0, 177.0, 259.0, 409.0, 649.0, 1021.0, 1821.0, 3090.0, 5489.0, 10221.0, 20260.0, 42768.0, 100648.0, 333836.0, 2997929.0, 457720.0, 120514.0, 48947.0, 22467.0, 11194.0, 6124.0, 3348.0, 1912.0, 1118.0, 701.0, 447.0, 287.0, 187.0, 139.0, 65.0, 63.0, 33.0, 21.0, 18.0, 18.0, 7.0, 8.0, 4.0, 5.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0234375, -0.9863433837890625, -0.949249267578125, -0.9121551513671875, -0.87506103515625, -0.8379669189453125, -0.800872802734375, -0.7637786865234375, -0.7266845703125, -0.6895904541015625, -0.652496337890625, -0.6154022216796875, -0.57830810546875, -0.5412139892578125, -0.504119873046875, -0.4670257568359375, -0.429931640625, -0.3928375244140625, -0.355743408203125, -0.3186492919921875, -0.28155517578125, -0.2444610595703125, -0.207366943359375, -0.1702728271484375, -0.1331787109375, -0.0960845947265625, -0.058990478515625, -0.0218963623046875, 0.01519775390625, 0.0522918701171875, 0.089385986328125, 0.1264801025390625, 0.16357421875, 0.2006683349609375, 0.237762451171875, 0.2748565673828125, 0.31195068359375, 0.3490447998046875, 0.386138916015625, 0.4232330322265625, 0.4603271484375, 0.4974212646484375, 0.534515380859375, 0.5716094970703125, 0.60870361328125, 0.6457977294921875, 0.682891845703125, 0.7199859619140625, 0.757080078125, 0.7941741943359375, 0.831268310546875, 0.8683624267578125, 0.90545654296875, 0.9425506591796875, 0.979644775390625, 1.0167388916015625, 1.0538330078125, 1.0909271240234375, 1.128021240234375, 1.1651153564453125, 1.20220947265625, 1.2393035888671875, 1.276397705078125, 1.3134918212890625, 1.3505859375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 3.0, 5.0, 11.0, 11.0, 6.0, 12.0, 19.0, 23.0, 24.0, 39.0, 44.0, 37.0, 56.0, 35.0, 49.0, 55.0, 64.0, 64.0, 59.0, 56.0, 48.0, 44.0, 37.0, 41.0, 30.0, 22.0, 23.0, 21.0, 18.0, 16.0, 8.0, 5.0, 7.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.28662109375, -0.2770729064941406, -0.26752471923828125, -0.2579765319824219, -0.2484283447265625, -0.23888015747070312, -0.22933197021484375, -0.21978378295898438, -0.210235595703125, -0.20068740844726562, -0.19113922119140625, -0.18159103393554688, -0.1720428466796875, -0.16249465942382812, -0.15294647216796875, -0.14339828491210938, -0.13385009765625, -0.12430191040039062, -0.11475372314453125, -0.10520553588867188, -0.0956573486328125, -0.08610916137695312, -0.07656097412109375, -0.06701278686523438, -0.057464599609375, -0.047916412353515625, -0.03836822509765625, -0.028820037841796875, -0.0192718505859375, -0.009723663330078125, -0.00017547607421875, 0.009372711181640625, 0.0189208984375, 0.028469085693359375, 0.03801727294921875, 0.047565460205078125, 0.0571136474609375, 0.06666183471679688, 0.07621002197265625, 0.08575820922851562, 0.095306396484375, 0.10485458374023438, 0.11440277099609375, 0.12395095825195312, 0.1334991455078125, 0.14304733276367188, 0.15259552001953125, 0.16214370727539062, 0.17169189453125, 0.18124008178710938, 0.19078826904296875, 0.20033645629882812, 0.2098846435546875, 0.21943283081054688, 0.22898101806640625, 0.23852920532226562, 0.248077392578125, 0.2576255798339844, 0.26717376708984375, 0.2767219543457031, 0.2862701416015625, 0.2958183288574219, 0.30536651611328125, 0.3149147033691406, 0.324462890625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 5.0, 2.0, 8.0, 6.0, 15.0, 19.0, 19.0, 28.0, 39.0, 45.0, 92.0, 150.0, 226.0, 328.0, 629.0, 1131.0, 2244.0, 5358.0, 13962.0, 42728.0, 158700.0, 1052343.0, 2586674.0, 239519.0, 59573.0, 18077.0, 6558.0, 2774.0, 1284.0, 658.0, 399.0, 249.0, 151.0, 110.0, 64.0, 40.0, 27.0, 18.0, 6.0, 13.0, 4.0, 7.0, 2.0, 5.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.607421875, -1.557403564453125, -1.50738525390625, -1.457366943359375, -1.4073486328125, -1.357330322265625, -1.30731201171875, -1.257293701171875, -1.207275390625, -1.157257080078125, -1.10723876953125, -1.057220458984375, -1.0072021484375, -0.957183837890625, -0.90716552734375, -0.857147216796875, -0.80712890625, -0.757110595703125, -0.70709228515625, -0.657073974609375, -0.6070556640625, -0.557037353515625, -0.50701904296875, -0.457000732421875, -0.406982421875, -0.356964111328125, -0.30694580078125, -0.256927490234375, -0.2069091796875, -0.156890869140625, -0.10687255859375, -0.056854248046875, -0.0068359375, 0.043182373046875, 0.09320068359375, 0.143218994140625, 0.1932373046875, 0.243255615234375, 0.29327392578125, 0.343292236328125, 0.393310546875, 0.443328857421875, 0.49334716796875, 0.543365478515625, 0.5933837890625, 0.643402099609375, 0.69342041015625, 0.743438720703125, 0.79345703125, 0.843475341796875, 0.89349365234375, 0.943511962890625, 0.9935302734375, 1.043548583984375, 1.09356689453125, 1.143585205078125, 1.193603515625, 1.243621826171875, 1.29364013671875, 1.343658447265625, 1.3936767578125, 1.443695068359375, 1.49371337890625, 1.543731689453125, 1.59375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 13.0, 20.0, 21.0, 24.0, 44.0, 54.0, 128.0, 167.0, 283.0, 708.0, 1473.0, 490.0, 226.0, 157.0, 96.0, 68.0, 32.0, 21.0, 18.0, 10.0, 8.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0146484375, -0.98748779296875, -0.9603271484375, -0.93316650390625, -0.906005859375, -0.87884521484375, -0.8516845703125, -0.82452392578125, -0.79736328125, -0.77020263671875, -0.7430419921875, -0.71588134765625, -0.688720703125, -0.66156005859375, -0.6343994140625, -0.60723876953125, -0.580078125, -0.55291748046875, -0.5257568359375, -0.49859619140625, -0.471435546875, -0.44427490234375, -0.4171142578125, -0.38995361328125, -0.36279296875, -0.33563232421875, -0.3084716796875, -0.28131103515625, -0.254150390625, -0.22698974609375, -0.1998291015625, -0.17266845703125, -0.1455078125, -0.11834716796875, -0.0911865234375, -0.06402587890625, -0.036865234375, -0.00970458984375, 0.0174560546875, 0.04461669921875, 0.07177734375, 0.09893798828125, 0.1260986328125, 0.15325927734375, 0.180419921875, 0.20758056640625, 0.2347412109375, 0.26190185546875, 0.2890625, 0.31622314453125, 0.3433837890625, 0.37054443359375, 0.397705078125, 0.42486572265625, 0.4520263671875, 0.47918701171875, 0.50634765625, 0.53350830078125, 0.5606689453125, 0.58782958984375, 0.614990234375, 0.64215087890625, 0.6693115234375, 0.69647216796875, 0.7236328125]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 7.0, 10.0, 17.0, 26.0, 42.0, 54.0, 98.0, 137.0, 129.0, 141.0, 115.0, 90.0, 55.0, 27.0, 25.0, 16.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.70355224609375, -6.525900840759277, -6.348249435424805, -6.170597553253174, -5.992946147918701, -5.8152947425842285, -5.637643337249756, -5.459991455078125, -5.282340049743652, -5.10468864440918, -4.927037239074707, -4.749385356903076, -4.5717339515686035, -4.394082546234131, -4.216431140899658, -4.038779258728027, -3.861128091812134, -3.683476686477661, -3.5058250427246094, -3.3281736373901367, -3.150521993637085, -2.9728705883026123, -2.7952189445495605, -2.617567539215088, -2.4399161338806152, -2.2622647285461426, -2.084613084793091, -1.9069616794586182, -1.7293100357055664, -1.5516586303710938, -1.3740071058273315, -1.1963555812835693, -1.0187039375305176, -0.8410524129867554, -0.6634008884429932, -0.48574942350387573, -0.3080978989601135, -0.13044637441635132, 0.04720509052276611, 0.22485661506652832, 0.4025081396102905, 0.5801596641540527, 0.7578111886978149, 0.9354626536369324, 1.1131141185760498, 1.2907657623291016, 1.4684171676635742, 1.6460686922073364, 1.8237202167510986, 2.0013716220855713, 2.179023265838623, 2.3566746711730957, 2.5343263149261475, 2.71197772026062, 2.889629364013672, 3.0672807693481445, 3.244932174682617, 3.42258358001709, 3.6002352237701416, 3.7778866291046143, 3.955538272857666, 4.133189678192139, 4.310841083526611, 4.488492965698242, 4.666144371032715]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 7.0, 11.0, 13.0, 13.0, 7.0, 11.0, 10.0, 22.0, 18.0, 24.0, 22.0, 37.0, 32.0, 36.0, 24.0, 41.0, 51.0, 41.0, 37.0, 42.0, 39.0, 49.0, 47.0, 45.0, 48.0, 41.0, 27.0, 30.0, 36.0, 13.0, 25.0, 19.0, 16.0, 10.0, 13.0, 7.0, 7.0, 8.0, 7.0, 8.0, 3.0, 3.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.328500747680664, -2.255256414413452, -2.1820120811462402, -2.1087677478790283, -2.0355234146118164, -1.9622790813446045, -1.8890347480773926, -1.8157904148101807, -1.7425460815429688, -1.6693017482757568, -1.596057415008545, -1.522813081741333, -1.449568748474121, -1.3763244152069092, -1.3030800819396973, -1.2298357486724854, -1.1565914154052734, -1.0833470821380615, -1.0101027488708496, -0.9368584156036377, -0.8636140823364258, -0.7903697490692139, -0.717125415802002, -0.64388108253479, -0.5706367492675781, -0.4973924160003662, -0.4241480827331543, -0.3509037494659424, -0.27765941619873047, -0.20441508293151855, -0.13117074966430664, -0.05792641639709473, 0.015317916870117188, 0.0885622501373291, 0.16180658340454102, 0.23505091667175293, 0.30829524993896484, 0.38153958320617676, 0.45478391647338867, 0.5280282497406006, 0.6012725830078125, 0.6745169162750244, 0.7477612495422363, 0.8210055828094482, 0.8942499160766602, 0.9674942493438721, 1.040738582611084, 1.113982915878296, 1.1872272491455078, 1.2604715824127197, 1.3337159156799316, 1.4069602489471436, 1.4802045822143555, 1.5534489154815674, 1.6266932487487793, 1.6999375820159912, 1.7731819152832031, 1.846426248550415, 1.919670581817627, 1.9929149150848389, 2.066159248352051, 2.1394035816192627, 2.2126479148864746, 2.2858922481536865, 2.3591365814208984]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 5.0, 5.0, 10.0, 4.0, 10.0, 16.0, 13.0, 23.0, 33.0, 48.0, 80.0, 99.0, 213.0, 254.0, 485.0, 862.0, 1494.0, 2695.0, 5158.0, 9709.0, 18898.0, 37329.0, 75751.0, 160081.0, 330113.0, 212899.0, 95783.0, 46927.0, 23625.0, 12035.0, 6166.0, 3339.0, 1817.0, 1009.0, 618.0, 340.0, 209.0, 131.0, 81.0, 44.0, 37.0, 35.0, 23.0, 13.0, 8.0, 9.0, 5.0, 9.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.27734375, -1.235687255859375, -1.19403076171875, -1.152374267578125, -1.1107177734375, -1.069061279296875, -1.02740478515625, -0.985748291015625, -0.944091796875, -0.902435302734375, -0.86077880859375, -0.819122314453125, -0.7774658203125, -0.735809326171875, -0.69415283203125, -0.652496337890625, -0.61083984375, -0.569183349609375, -0.52752685546875, -0.485870361328125, -0.4442138671875, -0.402557373046875, -0.36090087890625, -0.319244384765625, -0.277587890625, -0.235931396484375, -0.19427490234375, -0.152618408203125, -0.1109619140625, -0.069305419921875, -0.02764892578125, 0.014007568359375, 0.0556640625, 0.097320556640625, 0.13897705078125, 0.180633544921875, 0.2222900390625, 0.263946533203125, 0.30560302734375, 0.347259521484375, 0.388916015625, 0.430572509765625, 0.47222900390625, 0.513885498046875, 0.5555419921875, 0.597198486328125, 0.63885498046875, 0.680511474609375, 0.72216796875, 0.763824462890625, 0.80548095703125, 0.847137451171875, 0.8887939453125, 0.930450439453125, 0.97210693359375, 1.013763427734375, 1.055419921875, 1.097076416015625, 1.13873291015625, 1.180389404296875, 1.2220458984375, 1.263702392578125, 1.30535888671875, 1.347015380859375, 1.388671875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 3.0, 3.0, 11.0, 8.0, 17.0, 10.0, 16.0, 16.0, 36.0, 34.0, 40.0, 35.0, 37.0, 47.0, 49.0, 58.0, 60.0, 53.0, 51.0, 58.0, 56.0, 50.0, 30.0, 40.0, 34.0, 28.0, 22.0, 20.0, 22.0, 12.0, 12.0, 9.0, 6.0, 7.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.300048828125, -0.2907257080078125, -0.281402587890625, -0.2720794677734375, -0.26275634765625, -0.2534332275390625, -0.244110107421875, -0.2347869873046875, -0.2254638671875, -0.2161407470703125, -0.206817626953125, -0.1974945068359375, -0.18817138671875, -0.1788482666015625, -0.169525146484375, -0.1602020263671875, -0.15087890625, -0.1415557861328125, -0.132232666015625, -0.1229095458984375, -0.11358642578125, -0.1042633056640625, -0.094940185546875, -0.0856170654296875, -0.0762939453125, -0.0669708251953125, -0.057647705078125, -0.0483245849609375, -0.03900146484375, -0.0296783447265625, -0.020355224609375, -0.0110321044921875, -0.001708984375, 0.0076141357421875, 0.016937255859375, 0.0262603759765625, 0.03558349609375, 0.0449066162109375, 0.054229736328125, 0.0635528564453125, 0.0728759765625, 0.0821990966796875, 0.091522216796875, 0.1008453369140625, 0.11016845703125, 0.1194915771484375, 0.128814697265625, 0.1381378173828125, 0.1474609375, 0.1567840576171875, 0.166107177734375, 0.1754302978515625, 0.18475341796875, 0.1940765380859375, 0.203399658203125, 0.2127227783203125, 0.2220458984375, 0.2313690185546875, 0.240692138671875, 0.2500152587890625, 0.25933837890625, 0.2686614990234375, 0.277984619140625, 0.2873077392578125, 0.296630859375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 8.0, 9.0, 8.0, 14.0, 15.0, 19.0, 28.0, 48.0, 66.0, 112.0, 149.0, 211.0, 337.0, 594.0, 941.0, 1614.0, 2978.0, 5778.0, 12424.0, 29934.0, 80594.0, 233004.0, 411738.0, 166342.0, 58951.0, 22466.0, 9480.0, 4593.0, 2435.0, 1378.0, 808.0, 497.0, 307.0, 213.0, 137.0, 77.0, 79.0, 47.0, 25.0, 19.0, 26.0, 16.0, 9.0, 4.0, 8.0, 5.0, 6.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.3447265625, -1.3004150390625, -1.256103515625, -1.2117919921875, -1.16748046875, -1.1231689453125, -1.078857421875, -1.0345458984375, -0.990234375, -0.9459228515625, -0.901611328125, -0.8572998046875, -0.81298828125, -0.7686767578125, -0.724365234375, -0.6800537109375, -0.6357421875, -0.5914306640625, -0.547119140625, -0.5028076171875, -0.45849609375, -0.4141845703125, -0.369873046875, -0.3255615234375, -0.28125, -0.2369384765625, -0.192626953125, -0.1483154296875, -0.10400390625, -0.0596923828125, -0.015380859375, 0.0289306640625, 0.0732421875, 0.1175537109375, 0.161865234375, 0.2061767578125, 0.25048828125, 0.2947998046875, 0.339111328125, 0.3834228515625, 0.427734375, 0.4720458984375, 0.516357421875, 0.5606689453125, 0.60498046875, 0.6492919921875, 0.693603515625, 0.7379150390625, 0.7822265625, 0.8265380859375, 0.870849609375, 0.9151611328125, 0.95947265625, 1.0037841796875, 1.048095703125, 1.0924072265625, 1.13671875, 1.1810302734375, 1.225341796875, 1.2696533203125, 1.31396484375, 1.3582763671875, 1.402587890625, 1.4468994140625, 1.4912109375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 5.0, 5.0, 7.0, 5.0, 17.0, 6.0, 14.0, 11.0, 26.0, 27.0, 23.0, 32.0, 31.0, 28.0, 34.0, 44.0, 47.0, 51.0, 43.0, 49.0, 64.0, 44.0, 46.0, 43.0, 41.0, 44.0, 26.0, 30.0, 24.0, 22.0, 27.0, 18.0, 19.0, 15.0, 7.0, 7.0, 7.0, 7.0, 5.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.4072265625, -1.365264892578125, -1.32330322265625, -1.281341552734375, -1.2393798828125, -1.197418212890625, -1.15545654296875, -1.113494873046875, -1.071533203125, -1.029571533203125, -0.98760986328125, -0.945648193359375, -0.9036865234375, -0.861724853515625, -0.81976318359375, -0.777801513671875, -0.73583984375, -0.693878173828125, -0.65191650390625, -0.609954833984375, -0.5679931640625, -0.526031494140625, -0.48406982421875, -0.442108154296875, -0.400146484375, -0.358184814453125, -0.31622314453125, -0.274261474609375, -0.2322998046875, -0.190338134765625, -0.14837646484375, -0.106414794921875, -0.064453125, -0.022491455078125, 0.01947021484375, 0.061431884765625, 0.1033935546875, 0.145355224609375, 0.18731689453125, 0.229278564453125, 0.271240234375, 0.313201904296875, 0.35516357421875, 0.397125244140625, 0.4390869140625, 0.481048583984375, 0.52301025390625, 0.564971923828125, 0.60693359375, 0.648895263671875, 0.69085693359375, 0.732818603515625, 0.7747802734375, 0.816741943359375, 0.85870361328125, 0.900665283203125, 0.942626953125, 0.984588623046875, 1.02655029296875, 1.068511962890625, 1.1104736328125, 1.152435302734375, 1.19439697265625, 1.236358642578125, 1.2783203125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 3.0, 5.0, 5.0, 12.0, 24.0, 30.0, 33.0, 42.0, 71.0, 92.0, 191.0, 315.0, 600.0, 1217.0, 2908.0, 7879.0, 25420.0, 107452.0, 484019.0, 325487.0, 65907.0, 16843.0, 5638.0, 2209.0, 985.0, 440.0, 276.0, 137.0, 86.0, 67.0, 56.0, 21.0, 20.0, 15.0, 9.0, 11.0, 9.0, 8.0, 2.0, 5.0, 1.0, 2.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.97509765625, -0.9424209594726562, -0.9097442626953125, -0.8770675659179688, -0.844390869140625, -0.8117141723632812, -0.7790374755859375, -0.7463607788085938, -0.71368408203125, -0.6810073852539062, -0.6483306884765625, -0.6156539916992188, -0.582977294921875, -0.5503005981445312, -0.5176239013671875, -0.48494720458984375, -0.4522705078125, -0.41959381103515625, -0.3869171142578125, -0.35424041748046875, -0.321563720703125, -0.28888702392578125, -0.2562103271484375, -0.22353363037109375, -0.19085693359375, -0.15818023681640625, -0.1255035400390625, -0.09282684326171875, -0.060150146484375, -0.02747344970703125, 0.0052032470703125, 0.03787994384765625, 0.070556640625, 0.10323333740234375, 0.1359100341796875, 0.16858673095703125, 0.201263427734375, 0.23394012451171875, 0.2666168212890625, 0.29929351806640625, 0.33197021484375, 0.36464691162109375, 0.3973236083984375, 0.43000030517578125, 0.462677001953125, 0.49535369873046875, 0.5280303955078125, 0.5607070922851562, 0.5933837890625, 0.6260604858398438, 0.6587371826171875, 0.6914138793945312, 0.724090576171875, 0.7567672729492188, 0.7894439697265625, 0.8221206665039062, 0.85479736328125, 0.8874740600585938, 0.9201507568359375, 0.9528274536132812, 0.985504150390625, 1.0181808471679688, 1.0508575439453125, 1.0835342407226562, 1.1162109375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 7.0, 0.0, 3.0, 5.0, 9.0, 12.0, 19.0, 29.0, 23.0, 20.0, 34.0, 51.0, 81.0, 112.0, 138.0, 139.0, 84.0, 64.0, 38.0, 26.0, 25.0, 16.0, 17.0, 7.0, 6.0, 9.0, 6.0, 6.0, 5.0, 4.0, 1.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.00028443336486816406, -0.00027688220143318176, -0.00026933103799819946, -0.00026177987456321716, -0.00025422871112823486, -0.00024667754769325256, -0.00023912638425827026, -0.00023157522082328796, -0.00022402405738830566, -0.00021647289395332336, -0.00020892173051834106, -0.00020137056708335876, -0.00019381940364837646, -0.00018626824021339417, -0.00017871707677841187, -0.00017116591334342957, -0.00016361474990844727, -0.00015606358647346497, -0.00014851242303848267, -0.00014096125960350037, -0.00013341009616851807, -0.00012585893273353577, -0.00011830776929855347, -0.00011075660586357117, -0.00010320544242858887, -9.565427899360657e-05, -8.810311555862427e-05, -8.055195212364197e-05, -7.300078868865967e-05, -6.544962525367737e-05, -5.789846181869507e-05, -5.034729838371277e-05, -4.279613494873047e-05, -3.524497151374817e-05, -2.769380807876587e-05, -2.014264464378357e-05, -1.259148120880127e-05, -5.04031777381897e-06, 2.51084566116333e-06, 1.006200909614563e-05, 1.761317253112793e-05, 2.516433596611023e-05, 3.271549940109253e-05, 4.026666283607483e-05, 4.781782627105713e-05, 5.536898970603943e-05, 6.292015314102173e-05, 7.047131657600403e-05, 7.802248001098633e-05, 8.557364344596863e-05, 9.312480688095093e-05, 0.00010067597031593323, 0.00010822713375091553, 0.00011577829718589783, 0.00012332946062088013, 0.00013088062405586243, 0.00013843178749084473, 0.00014598295092582703, 0.00015353411436080933, 0.00016108527779579163, 0.00016863644123077393, 0.00017618760466575623, 0.00018373876810073853, 0.00019128993153572083, 0.00019884109497070312]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 2.0, 2.0, 1.0, 7.0, 13.0, 16.0, 12.0, 32.0, 47.0, 84.0, 143.0, 350.0, 729.0, 1837.0, 5427.0, 23033.0, 171576.0, 681462.0, 136332.0, 19590.0, 4771.0, 1718.0, 704.0, 304.0, 143.0, 72.0, 52.0, 27.0, 24.0, 15.0, 8.0, 8.0, 5.0, 2.0, 4.0, 1.0, 4.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.708984375, -1.6645355224609375, -1.620086669921875, -1.5756378173828125, -1.53118896484375, -1.4867401123046875, -1.442291259765625, -1.3978424072265625, -1.3533935546875, -1.3089447021484375, -1.264495849609375, -1.2200469970703125, -1.17559814453125, -1.1311492919921875, -1.086700439453125, -1.0422515869140625, -0.997802734375, -0.9533538818359375, -0.908905029296875, -0.8644561767578125, -0.82000732421875, -0.7755584716796875, -0.731109619140625, -0.6866607666015625, -0.6422119140625, -0.5977630615234375, -0.553314208984375, -0.5088653564453125, -0.46441650390625, -0.4199676513671875, -0.375518798828125, -0.3310699462890625, -0.28662109375, -0.2421722412109375, -0.197723388671875, -0.1532745361328125, -0.10882568359375, -0.0643768310546875, -0.019927978515625, 0.0245208740234375, 0.0689697265625, 0.1134185791015625, 0.157867431640625, 0.2023162841796875, 0.24676513671875, 0.2912139892578125, 0.335662841796875, 0.3801116943359375, 0.424560546875, 0.4690093994140625, 0.513458251953125, 0.5579071044921875, 0.60235595703125, 0.6468048095703125, 0.691253662109375, 0.7357025146484375, 0.7801513671875, 0.8246002197265625, 0.869049072265625, 0.9134979248046875, 0.95794677734375, 1.0023956298828125, 1.046844482421875, 1.0912933349609375, 1.1357421875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 9.0, 8.0, 4.0, 7.0, 16.0, 22.0, 33.0, 36.0, 52.0, 70.0, 99.0, 108.0, 109.0, 111.0, 82.0, 64.0, 50.0, 35.0, 21.0, 20.0, 14.0, 7.0, 6.0, 8.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.73974609375, -0.7137374877929688, -0.6877288818359375, -0.6617202758789062, -0.635711669921875, -0.6097030639648438, -0.5836944580078125, -0.5576858520507812, -0.53167724609375, -0.5056686401367188, -0.4796600341796875, -0.45365142822265625, -0.427642822265625, -0.40163421630859375, -0.3756256103515625, -0.34961700439453125, -0.3236083984375, -0.29759979248046875, -0.2715911865234375, -0.24558258056640625, -0.219573974609375, -0.19356536865234375, -0.1675567626953125, -0.14154815673828125, -0.11553955078125, -0.08953094482421875, -0.0635223388671875, -0.03751373291015625, -0.011505126953125, 0.01450347900390625, 0.0405120849609375, 0.06652069091796875, 0.092529296875, 0.11853790283203125, 0.1445465087890625, 0.17055511474609375, 0.196563720703125, 0.22257232666015625, 0.2485809326171875, 0.27458953857421875, 0.30059814453125, 0.32660675048828125, 0.3526153564453125, 0.37862396240234375, 0.404632568359375, 0.43064117431640625, 0.4566497802734375, 0.48265838623046875, 0.5086669921875, 0.5346755981445312, 0.5606842041015625, 0.5866928100585938, 0.612701416015625, 0.6387100219726562, 0.6647186279296875, 0.6907272338867188, 0.71673583984375, 0.7427444458007812, 0.7687530517578125, 0.7947616577148438, 0.820770263671875, 0.8467788696289062, 0.8727874755859375, 0.8987960815429688, 0.9248046875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 10.0, 12.0, 23.0, 31.0, 49.0, 89.0, 122.0, 146.0, 150.0, 127.0, 93.0, 65.0, 43.0, 19.0, 11.0, 8.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.568193435668945, -12.103687286376953, -11.639181137084961, -11.174674987792969, -10.710168838500977, -10.245662689208984, -9.781156539916992, -9.316650390625, -8.852144241333008, -8.387638092041016, -7.923131942749023, -7.458625793457031, -6.994119644165039, -6.529613494873047, -6.065107345581055, -5.6006011962890625, -5.13609504699707, -4.671588897705078, -4.207082748413086, -3.7425765991210938, -3.2780704498291016, -2.8135643005371094, -2.349058151245117, -1.884552001953125, -1.4200458526611328, -0.9555397033691406, -0.49103355407714844, -0.02652740478515625, 0.43797874450683594, 0.9024848937988281, 1.3669910430908203, 1.8314971923828125, 2.2960033416748047, 2.760509490966797, 3.225015640258789, 3.6895217895507812, 4.154027938842773, 4.618534088134766, 5.083040237426758, 5.54754638671875, 6.012052536010742, 6.476558685302734, 6.941064834594727, 7.405570983886719, 7.870077133178711, 8.334583282470703, 8.799089431762695, 9.263595581054688, 9.72810173034668, 10.192607879638672, 10.657114028930664, 11.121620178222656, 11.586126327514648, 12.05063247680664, 12.515138626098633, 12.979644775390625, 13.444150924682617, 13.90865707397461, 14.373163223266602, 14.837669372558594, 15.302175521850586, 15.766681671142578, 16.23118782043457, 16.695693969726562, 17.160200119018555]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 4.0, 4.0, 7.0, 4.0, 3.0, 9.0, 8.0, 10.0, 12.0, 14.0, 15.0, 14.0, 24.0, 23.0, 24.0, 26.0, 28.0, 33.0, 39.0, 49.0, 36.0, 38.0, 46.0, 32.0, 50.0, 43.0, 44.0, 41.0, 41.0, 42.0, 27.0, 31.0, 28.0, 24.0, 23.0, 24.0, 17.0, 15.0, 14.0, 12.0, 10.0, 5.0, 3.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-7.7632293701171875, -7.544877529144287, -7.3265252113342285, -7.108173370361328, -6.889821529388428, -6.671469688415527, -6.453117370605469, -6.234765529632568, -6.016413688659668, -5.798061847686768, -5.579709529876709, -5.361357688903809, -5.143005847930908, -4.924654006958008, -4.706301689147949, -4.487949848175049, -4.26959753036499, -4.05124568939209, -3.8328936100006104, -3.614541530609131, -3.3961896896362305, -3.177837610244751, -2.9594855308532715, -2.741133689880371, -2.5227816104888916, -2.304429531097412, -2.0860776901245117, -1.8677256107330322, -1.6493736505508423, -1.4310216903686523, -1.2126696109771729, -0.9943176507949829, -0.7759652137756348, -0.5576132535934448, -0.3392612338066101, -0.12090921401977539, 0.09744274616241455, 0.3157947063446045, 0.534146785736084, 0.7524987459182739, 0.9708507061004639, 1.1892026662826538, 1.4075546264648438, 1.6259067058563232, 1.8442586660385132, 2.062610626220703, 2.2809627056121826, 2.499314785003662, 2.7176666259765625, 2.936018705368042, 3.1543705463409424, 3.372722625732422, 3.5910744667053223, 3.8094265460968018, 4.027778625488281, 4.246130466461182, 4.464482307434082, 4.682834148406982, 4.901186466217041, 5.119538307189941, 5.337890148162842, 5.556241989135742, 5.774594306945801, 5.992946147918701, 6.21129846572876]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 4.0, 3.0, 7.0, 11.0, 21.0, 27.0, 42.0, 67.0, 118.0, 204.0, 291.0, 491.0, 832.0, 1698.0, 3442.0, 7775.0, 21233.0, 73711.0, 608630.0, 3302131.0, 123130.0, 30664.0, 10772.0, 4350.0, 2003.0, 1059.0, 618.0, 357.0, 243.0, 128.0, 65.0, 60.0, 39.0, 21.0, 10.0, 10.0, 5.0, 12.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9443359375, -1.8819427490234375, -1.819549560546875, -1.7571563720703125, -1.69476318359375, -1.6323699951171875, -1.569976806640625, -1.5075836181640625, -1.4451904296875, -1.3827972412109375, -1.320404052734375, -1.2580108642578125, -1.19561767578125, -1.1332244873046875, -1.070831298828125, -1.0084381103515625, -0.946044921875, -0.8836517333984375, -0.821258544921875, -0.7588653564453125, -0.69647216796875, -0.6340789794921875, -0.571685791015625, -0.5092926025390625, -0.4468994140625, -0.3845062255859375, -0.322113037109375, -0.2597198486328125, -0.19732666015625, -0.1349334716796875, -0.072540283203125, -0.0101470947265625, 0.05224609375, 0.1146392822265625, 0.177032470703125, 0.2394256591796875, 0.30181884765625, 0.3642120361328125, 0.426605224609375, 0.4889984130859375, 0.5513916015625, 0.6137847900390625, 0.676177978515625, 0.7385711669921875, 0.80096435546875, 0.8633575439453125, 0.925750732421875, 0.9881439208984375, 1.050537109375, 1.1129302978515625, 1.175323486328125, 1.2377166748046875, 1.30010986328125, 1.3625030517578125, 1.424896240234375, 1.4872894287109375, 1.5496826171875, 1.6120758056640625, 1.674468994140625, 1.7368621826171875, 1.79925537109375, 1.8616485595703125, 1.924041748046875, 1.9864349365234375, 2.048828125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 6.0, 4.0, 8.0, 12.0, 15.0, 11.0, 15.0, 27.0, 18.0, 24.0, 36.0, 38.0, 42.0, 39.0, 51.0, 55.0, 49.0, 57.0, 55.0, 43.0, 57.0, 47.0, 40.0, 37.0, 36.0, 30.0, 28.0, 33.0, 17.0, 17.0, 17.0, 12.0, 8.0, 4.0, 8.0, 3.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.273681640625, -0.2638587951660156, -0.25403594970703125, -0.24421310424804688, -0.2343902587890625, -0.22456741333007812, -0.21474456787109375, -0.20492172241210938, -0.195098876953125, -0.18527603149414062, -0.17545318603515625, -0.16563034057617188, -0.1558074951171875, -0.14598464965820312, -0.13616180419921875, -0.12633895874023438, -0.11651611328125, -0.10669326782226562, -0.09687042236328125, -0.08704757690429688, -0.0772247314453125, -0.06740188598632812, -0.05757904052734375, -0.047756195068359375, -0.037933349609375, -0.028110504150390625, -0.01828765869140625, -0.008464813232421875, 0.0013580322265625, 0.011180877685546875, 0.02100372314453125, 0.030826568603515625, 0.0406494140625, 0.050472259521484375, 0.06029510498046875, 0.07011795043945312, 0.0799407958984375, 0.08976364135742188, 0.09958648681640625, 0.10940933227539062, 0.119232177734375, 0.12905502319335938, 0.13887786865234375, 0.14870071411132812, 0.1585235595703125, 0.16834640502929688, 0.17816925048828125, 0.18799209594726562, 0.19781494140625, 0.20763778686523438, 0.21746063232421875, 0.22728347778320312, 0.2371063232421875, 0.24692916870117188, 0.25675201416015625, 0.2665748596191406, 0.276397705078125, 0.2862205505371094, 0.29604339599609375, 0.3058662414550781, 0.3156890869140625, 0.3255119323730469, 0.33533477783203125, 0.3451576232910156, 0.35498046875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 4.0, 9.0, 3.0, 12.0, 11.0, 12.0, 16.0, 20.0, 18.0, 20.0, 38.0, 32.0, 48.0, 73.0, 115.0, 203.0, 458.0, 1231.0, 4519.0, 24424.0, 263881.0, 3739768.0, 138681.0, 15603.0, 3211.0, 969.0, 373.0, 167.0, 93.0, 62.0, 46.0, 27.0, 23.0, 28.0, 17.0, 11.0, 10.0, 12.0, 7.0, 3.0, 4.0, 4.0, 8.0, 4.0, 0.0, 3.0, 2.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.4609375, -3.350677490234375, -3.24041748046875, -3.130157470703125, -3.0198974609375, -2.909637451171875, -2.79937744140625, -2.689117431640625, -2.578857421875, -2.468597412109375, -2.35833740234375, -2.248077392578125, -2.1378173828125, -2.027557373046875, -1.91729736328125, -1.807037353515625, -1.69677734375, -1.586517333984375, -1.47625732421875, -1.365997314453125, -1.2557373046875, -1.145477294921875, -1.03521728515625, -0.924957275390625, -0.814697265625, -0.704437255859375, -0.59417724609375, -0.483917236328125, -0.3736572265625, -0.263397216796875, -0.15313720703125, -0.042877197265625, 0.0673828125, 0.177642822265625, 0.28790283203125, 0.398162841796875, 0.5084228515625, 0.618682861328125, 0.72894287109375, 0.839202880859375, 0.949462890625, 1.059722900390625, 1.16998291015625, 1.280242919921875, 1.3905029296875, 1.500762939453125, 1.61102294921875, 1.721282958984375, 1.83154296875, 1.941802978515625, 2.05206298828125, 2.162322998046875, 2.2725830078125, 2.382843017578125, 2.49310302734375, 2.603363037109375, 2.713623046875, 2.823883056640625, 2.93414306640625, 3.044403076171875, 3.1546630859375, 3.264923095703125, 3.37518310546875, 3.485443115234375, 3.595703125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 7.0, 13.0, 23.0, 27.0, 47.0, 93.0, 222.0, 714.0, 2199.0, 427.0, 152.0, 70.0, 43.0, 23.0, 9.0, 3.0, 6.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.05078125, -2.0074310302734375, -1.964080810546875, -1.9207305908203125, -1.87738037109375, -1.8340301513671875, -1.790679931640625, -1.7473297119140625, -1.7039794921875, -1.6606292724609375, -1.617279052734375, -1.5739288330078125, -1.53057861328125, -1.4872283935546875, -1.443878173828125, -1.4005279541015625, -1.357177734375, -1.3138275146484375, -1.270477294921875, -1.2271270751953125, -1.18377685546875, -1.1404266357421875, -1.097076416015625, -1.0537261962890625, -1.0103759765625, -0.9670257568359375, -0.923675537109375, -0.8803253173828125, -0.83697509765625, -0.7936248779296875, -0.750274658203125, -0.7069244384765625, -0.66357421875, -0.6202239990234375, -0.576873779296875, -0.5335235595703125, -0.49017333984375, -0.4468231201171875, -0.403472900390625, -0.3601226806640625, -0.3167724609375, -0.2734222412109375, -0.230072021484375, -0.1867218017578125, -0.14337158203125, -0.1000213623046875, -0.056671142578125, -0.0133209228515625, 0.030029296875, 0.0733795166015625, 0.116729736328125, 0.1600799560546875, 0.20343017578125, 0.2467803955078125, 0.290130615234375, 0.3334808349609375, 0.3768310546875, 0.4201812744140625, 0.463531494140625, 0.5068817138671875, 0.55023193359375, 0.5935821533203125, 0.636932373046875, 0.6802825927734375, 0.7236328125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 6.0, 11.0, 13.0, 23.0, 25.0, 27.0, 37.0, 51.0, 58.0, 76.0, 103.0, 104.0, 87.0, 71.0, 77.0, 57.0, 53.0, 33.0, 17.0, 21.0, 11.0, 17.0, 3.0, 6.0, 7.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.384737014770508, -4.266667366027832, -4.1485981941223145, -4.030529022216797, -3.912459373474121, -3.7943899631500244, -3.6763205528259277, -3.558251142501831, -3.4401817321777344, -3.3221123218536377, -3.204042911529541, -3.0859735012054443, -2.9679040908813477, -2.849834680557251, -2.7317652702331543, -2.6136958599090576, -2.495626449584961, -2.3775570392608643, -2.2594876289367676, -2.141418218612671, -2.023348808288574, -1.9052793979644775, -1.7872099876403809, -1.6691405773162842, -1.5510711669921875, -1.4330017566680908, -1.3149323463439941, -1.1968629360198975, -1.0787935256958008, -0.9607241153717041, -0.8426547050476074, -0.7245852947235107, -0.6065158843994141, -0.4884464740753174, -0.3703770637512207, -0.252307653427124, -0.13423824310302734, -0.016168832778930664, 0.10190057754516602, 0.2199699878692627, 0.3380393981933594, 0.45610880851745605, 0.5741782188415527, 0.6922476291656494, 0.8103170394897461, 0.9283864498138428, 1.0464558601379395, 1.1645252704620361, 1.2825946807861328, 1.4006640911102295, 1.5187335014343262, 1.6368029117584229, 1.7548723220825195, 1.8729417324066162, 1.991011142730713, 2.1090805530548096, 2.2271499633789062, 2.345219373703003, 2.4632887840270996, 2.5813581943511963, 2.699427604675293, 2.8174970149993896, 2.9355664253234863, 3.053635835647583, 3.1717052459716797]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 6.0, 10.0, 9.0, 10.0, 8.0, 11.0, 19.0, 25.0, 21.0, 28.0, 31.0, 26.0, 32.0, 37.0, 44.0, 41.0, 37.0, 40.0, 47.0, 50.0, 33.0, 40.0, 46.0, 37.0, 39.0, 35.0, 36.0, 30.0, 28.0, 29.0, 16.0, 18.0, 20.0, 14.0, 9.0, 7.0, 8.0, 10.0, 6.0, 3.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.79723858833313, -2.7152867317199707, -2.6333351135253906, -2.5513832569122314, -2.4694314002990723, -2.387479782104492, -2.305527925491333, -2.223576068878174, -2.1416244506835938, -2.0596725940704346, -1.9777209758758545, -1.8957691192626953, -1.8138173818588257, -1.731865644454956, -1.6499137878417969, -1.5679620504379272, -1.4860103130340576, -1.404058575630188, -1.3221068382263184, -1.2401549816131592, -1.1582032442092896, -1.07625150680542, -0.9942997097969055, -0.9123479127883911, -0.8303961753845215, -0.7484444379806519, -0.6664926409721375, -0.584540843963623, -0.5025891065597534, -0.4206373393535614, -0.3386855721473694, -0.256733775138855, -0.17478227615356445, -0.09283050894737244, -0.01087874174118042, 0.0710730254650116, 0.1530247926712036, 0.23497655987739563, 0.31692832708358765, 0.39888012409210205, 0.4808318614959717, 0.5627835988998413, 0.6447353959083557, 0.7266871929168701, 0.8086389303207397, 0.8905906677246094, 0.9725424647331238, 1.0544942617416382, 1.1364459991455078, 1.2183977365493774, 1.300349473953247, 1.3823013305664062, 1.4642530679702759, 1.5462048053741455, 1.6281566619873047, 1.7101083993911743, 1.792060136795044, 1.8740118741989136, 1.9559636116027832, 2.0379154682159424, 2.1198673248291016, 2.2018189430236816, 2.283770799636841, 2.36572265625, 2.44767427444458]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 4.0, 9.0, 17.0, 22.0, 26.0, 39.0, 73.0, 130.0, 173.0, 316.0, 488.0, 815.0, 1405.0, 2474.0, 4315.0, 7932.0, 13951.0, 25189.0, 45497.0, 81517.0, 147583.0, 257024.0, 207140.0, 111903.0, 61963.0, 34668.0, 19259.0, 10646.0, 5964.0, 3370.0, 1882.0, 1084.0, 644.0, 403.0, 236.0, 157.0, 86.0, 58.0, 27.0, 25.0, 17.0, 13.0, 8.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1591796875, -1.1215057373046875, -1.083831787109375, -1.0461578369140625, -1.00848388671875, -0.9708099365234375, -0.933135986328125, -0.8954620361328125, -0.8577880859375, -0.8201141357421875, -0.782440185546875, -0.7447662353515625, -0.70709228515625, -0.6694183349609375, -0.631744384765625, -0.5940704345703125, -0.556396484375, -0.5187225341796875, -0.481048583984375, -0.4433746337890625, -0.40570068359375, -0.3680267333984375, -0.330352783203125, -0.2926788330078125, -0.2550048828125, -0.2173309326171875, -0.179656982421875, -0.1419830322265625, -0.10430908203125, -0.0666351318359375, -0.028961181640625, 0.0087127685546875, 0.04638671875, 0.0840606689453125, 0.121734619140625, 0.1594085693359375, 0.19708251953125, 0.2347564697265625, 0.272430419921875, 0.3101043701171875, 0.3477783203125, 0.3854522705078125, 0.423126220703125, 0.4608001708984375, 0.49847412109375, 0.5361480712890625, 0.573822021484375, 0.6114959716796875, 0.649169921875, 0.6868438720703125, 0.724517822265625, 0.7621917724609375, 0.79986572265625, 0.8375396728515625, 0.875213623046875, 0.9128875732421875, 0.9505615234375, 0.9882354736328125, 1.025909423828125, 1.0635833740234375, 1.10125732421875, 1.1389312744140625, 1.176605224609375, 1.2142791748046875, 1.251953125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 5.0, 10.0, 6.0, 18.0, 4.0, 14.0, 12.0, 21.0, 24.0, 31.0, 32.0, 34.0, 41.0, 47.0, 39.0, 42.0, 46.0, 47.0, 47.0, 58.0, 44.0, 49.0, 47.0, 46.0, 39.0, 34.0, 24.0, 30.0, 20.0, 25.0, 12.0, 12.0, 11.0, 12.0, 9.0, 6.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.314697265625, -0.30466461181640625, -0.2946319580078125, -0.28459930419921875, -0.274566650390625, -0.26453399658203125, -0.2545013427734375, -0.24446868896484375, -0.23443603515625, -0.22440338134765625, -0.2143707275390625, -0.20433807373046875, -0.194305419921875, -0.18427276611328125, -0.1742401123046875, -0.16420745849609375, -0.1541748046875, -0.14414215087890625, -0.1341094970703125, -0.12407684326171875, -0.114044189453125, -0.10401153564453125, -0.0939788818359375, -0.08394622802734375, -0.07391357421875, -0.06388092041015625, -0.0538482666015625, -0.04381561279296875, -0.033782958984375, -0.02375030517578125, -0.0137176513671875, -0.00368499755859375, 0.00634765625, 0.01638031005859375, 0.0264129638671875, 0.03644561767578125, 0.046478271484375, 0.05651092529296875, 0.0665435791015625, 0.07657623291015625, 0.08660888671875, 0.09664154052734375, 0.1066741943359375, 0.11670684814453125, 0.126739501953125, 0.13677215576171875, 0.1468048095703125, 0.15683746337890625, 0.1668701171875, 0.17690277099609375, 0.1869354248046875, 0.19696807861328125, 0.207000732421875, 0.21703338623046875, 0.2270660400390625, 0.23709869384765625, 0.24713134765625, 0.25716400146484375, 0.2671966552734375, 0.27722930908203125, 0.287261962890625, 0.29729461669921875, 0.3073272705078125, 0.31735992431640625, 0.327392578125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 6.0, 9.0, 12.0, 13.0, 31.0, 34.0, 63.0, 105.0, 129.0, 249.0, 403.0, 798.0, 1720.0, 5199.0, 20650.0, 99850.0, 494620.0, 339361.0, 64362.0, 14161.0, 3809.0, 1397.0, 665.0, 330.0, 208.0, 126.0, 84.0, 52.0, 37.0, 23.0, 17.0, 13.0, 5.0, 5.0, 6.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.63671875, -2.56109619140625, -2.4854736328125, -2.40985107421875, -2.334228515625, -2.25860595703125, -2.1829833984375, -2.10736083984375, -2.03173828125, -1.95611572265625, -1.8804931640625, -1.80487060546875, -1.729248046875, -1.65362548828125, -1.5780029296875, -1.50238037109375, -1.4267578125, -1.35113525390625, -1.2755126953125, -1.19989013671875, -1.124267578125, -1.04864501953125, -0.9730224609375, -0.89739990234375, -0.82177734375, -0.74615478515625, -0.6705322265625, -0.59490966796875, -0.519287109375, -0.44366455078125, -0.3680419921875, -0.29241943359375, -0.216796875, -0.14117431640625, -0.0655517578125, 0.01007080078125, 0.085693359375, 0.16131591796875, 0.2369384765625, 0.31256103515625, 0.38818359375, 0.46380615234375, 0.5394287109375, 0.61505126953125, 0.690673828125, 0.76629638671875, 0.8419189453125, 0.91754150390625, 0.9931640625, 1.06878662109375, 1.1444091796875, 1.22003173828125, 1.295654296875, 1.37127685546875, 1.4468994140625, 1.52252197265625, 1.59814453125, 1.67376708984375, 1.7493896484375, 1.82501220703125, 1.900634765625, 1.97625732421875, 2.0518798828125, 2.12750244140625, 2.203125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 4.0, 5.0, 8.0, 9.0, 8.0, 16.0, 13.0, 23.0, 23.0, 29.0, 22.0, 28.0, 42.0, 41.0, 54.0, 41.0, 48.0, 53.0, 38.0, 55.0, 48.0, 50.0, 47.0, 40.0, 36.0, 26.0, 26.0, 34.0, 25.0, 15.0, 23.0, 16.0, 15.0, 14.0, 6.0, 3.0, 7.0, 1.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.5185546875, -1.4734039306640625, -1.428253173828125, -1.3831024169921875, -1.33795166015625, -1.2928009033203125, -1.247650146484375, -1.2024993896484375, -1.1573486328125, -1.1121978759765625, -1.067047119140625, -1.0218963623046875, -0.97674560546875, -0.9315948486328125, -0.886444091796875, -0.8412933349609375, -0.796142578125, -0.7509918212890625, -0.705841064453125, -0.6606903076171875, -0.61553955078125, -0.5703887939453125, -0.525238037109375, -0.4800872802734375, -0.4349365234375, -0.3897857666015625, -0.344635009765625, -0.2994842529296875, -0.25433349609375, -0.2091827392578125, -0.164031982421875, -0.1188812255859375, -0.07373046875, -0.0285797119140625, 0.016571044921875, 0.0617218017578125, 0.10687255859375, 0.1520233154296875, 0.197174072265625, 0.2423248291015625, 0.2874755859375, 0.3326263427734375, 0.377777099609375, 0.4229278564453125, 0.46807861328125, 0.5132293701171875, 0.558380126953125, 0.6035308837890625, 0.648681640625, 0.6938323974609375, 0.738983154296875, 0.7841339111328125, 0.82928466796875, 0.8744354248046875, 0.919586181640625, 0.9647369384765625, 1.0098876953125, 1.0550384521484375, 1.100189208984375, 1.1453399658203125, 1.19049072265625, 1.2356414794921875, 1.280792236328125, 1.3259429931640625, 1.37109375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 7.0, 10.0, 13.0, 16.0, 24.0, 30.0, 38.0, 90.0, 136.0, 221.0, 375.0, 703.0, 1369.0, 2788.0, 6824.0, 22326.0, 128390.0, 724379.0, 126090.0, 22053.0, 6836.0, 2807.0, 1377.0, 719.0, 365.0, 205.0, 132.0, 84.0, 59.0, 27.0, 23.0, 12.0, 7.0, 8.0, 6.0, 2.0, 3.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0, -1.9402923583984375, -1.880584716796875, -1.8208770751953125, -1.76116943359375, -1.7014617919921875, -1.641754150390625, -1.5820465087890625, -1.5223388671875, -1.4626312255859375, -1.402923583984375, -1.3432159423828125, -1.28350830078125, -1.2238006591796875, -1.164093017578125, -1.1043853759765625, -1.044677734375, -0.9849700927734375, -0.925262451171875, -0.8655548095703125, -0.80584716796875, -0.7461395263671875, -0.686431884765625, -0.6267242431640625, -0.5670166015625, -0.5073089599609375, -0.447601318359375, -0.3878936767578125, -0.32818603515625, -0.2684783935546875, -0.208770751953125, -0.1490631103515625, -0.08935546875, -0.0296478271484375, 0.030059814453125, 0.0897674560546875, 0.14947509765625, 0.2091827392578125, 0.268890380859375, 0.3285980224609375, 0.3883056640625, 0.4480133056640625, 0.507720947265625, 0.5674285888671875, 0.62713623046875, 0.6868438720703125, 0.746551513671875, 0.8062591552734375, 0.865966796875, 0.9256744384765625, 0.985382080078125, 1.0450897216796875, 1.10479736328125, 1.1645050048828125, 1.224212646484375, 1.2839202880859375, 1.3436279296875, 1.4033355712890625, 1.463043212890625, 1.5227508544921875, 1.58245849609375, 1.6421661376953125, 1.701873779296875, 1.7615814208984375, 1.8212890625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 4.0, 4.0, 12.0, 19.0, 14.0, 25.0, 43.0, 45.0, 64.0, 141.0, 167.0, 153.0, 103.0, 63.0, 42.0, 34.0, 15.0, 9.0, 10.0, 8.0, 3.0, 5.0, 1.0, 3.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0002982616424560547, -0.0002878643572330475, -0.0002774670720100403, -0.0002670697867870331, -0.0002566725015640259, -0.0002462752163410187, -0.00023587793111801147, -0.00022548064589500427, -0.00021508336067199707, -0.00020468607544898987, -0.00019428879022598267, -0.00018389150500297546, -0.00017349421977996826, -0.00016309693455696106, -0.00015269964933395386, -0.00014230236411094666, -0.00013190507888793945, -0.00012150779366493225, -0.00011111050844192505, -0.00010071322321891785, -9.031593799591064e-05, -7.991865277290344e-05, -6.952136754989624e-05, -5.912408232688904e-05, -4.8726797103881836e-05, -3.8329511880874634e-05, -2.793222665786743e-05, -1.753494143486023e-05, -7.137656211853027e-06, 3.259629011154175e-06, 1.3656914234161377e-05, 2.405419945716858e-05, 3.445148468017578e-05, 4.4848769903182983e-05, 5.5246055126190186e-05, 6.564334034919739e-05, 7.604062557220459e-05, 8.643791079521179e-05, 9.6835196018219e-05, 0.0001072324812412262, 0.0001176297664642334, 0.0001280270516872406, 0.0001384243369102478, 0.000148821622133255, 0.0001592189073562622, 0.0001696161925792694, 0.0001800134778022766, 0.0001904107630252838, 0.00020080804824829102, 0.00021120533347129822, 0.00022160261869430542, 0.00023199990391731262, 0.00024239718914031982, 0.000252794474363327, 0.00026319175958633423, 0.00027358904480934143, 0.00028398633003234863, 0.00029438361525535583, 0.00030478090047836304, 0.00031517818570137024, 0.00032557547092437744, 0.00033597275614738464, 0.00034637004137039185, 0.00035676732659339905, 0.00036716461181640625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 8.0, 11.0, 15.0, 21.0, 35.0, 45.0, 64.0, 116.0, 212.0, 413.0, 869.0, 1893.0, 4809.0, 14490.0, 65329.0, 661263.0, 252655.0, 31559.0, 8927.0, 3171.0, 1381.0, 591.0, 285.0, 154.0, 88.0, 49.0, 38.0, 24.0, 17.0, 14.0, 8.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.146484375, -2.08477783203125, -2.0230712890625, -1.96136474609375, -1.899658203125, -1.83795166015625, -1.7762451171875, -1.71453857421875, -1.65283203125, -1.59112548828125, -1.5294189453125, -1.46771240234375, -1.406005859375, -1.34429931640625, -1.2825927734375, -1.22088623046875, -1.1591796875, -1.09747314453125, -1.0357666015625, -0.97406005859375, -0.912353515625, -0.85064697265625, -0.7889404296875, -0.72723388671875, -0.66552734375, -0.60382080078125, -0.5421142578125, -0.48040771484375, -0.418701171875, -0.35699462890625, -0.2952880859375, -0.23358154296875, -0.171875, -0.11016845703125, -0.0484619140625, 0.01324462890625, 0.074951171875, 0.13665771484375, 0.1983642578125, 0.26007080078125, 0.32177734375, 0.38348388671875, 0.4451904296875, 0.50689697265625, 0.568603515625, 0.63031005859375, 0.6920166015625, 0.75372314453125, 0.8154296875, 0.87713623046875, 0.9388427734375, 1.00054931640625, 1.062255859375, 1.12396240234375, 1.1856689453125, 1.24737548828125, 1.30908203125, 1.37078857421875, 1.4324951171875, 1.49420166015625, 1.555908203125, 1.61761474609375, 1.6793212890625, 1.74102783203125, 1.802734375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 5.0, 3.0, 11.0, 3.0, 4.0, 12.0, 17.0, 25.0, 48.0, 67.0, 113.0, 173.0, 200.0, 112.0, 70.0, 44.0, 20.0, 13.0, 8.0, 7.0, 9.0, 4.0, 6.0, 3.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6416015625, -1.5917816162109375, -1.541961669921875, -1.4921417236328125, -1.44232177734375, -1.3925018310546875, -1.342681884765625, -1.2928619384765625, -1.2430419921875, -1.1932220458984375, -1.143402099609375, -1.0935821533203125, -1.04376220703125, -0.9939422607421875, -0.944122314453125, -0.8943023681640625, -0.844482421875, -0.7946624755859375, -0.744842529296875, -0.6950225830078125, -0.64520263671875, -0.5953826904296875, -0.545562744140625, -0.4957427978515625, -0.4459228515625, -0.3961029052734375, -0.346282958984375, -0.2964630126953125, -0.24664306640625, -0.1968231201171875, -0.147003173828125, -0.0971832275390625, -0.04736328125, 0.0024566650390625, 0.052276611328125, 0.1020965576171875, 0.15191650390625, 0.2017364501953125, 0.251556396484375, 0.3013763427734375, 0.3511962890625, 0.4010162353515625, 0.450836181640625, 0.5006561279296875, 0.55047607421875, 0.6002960205078125, 0.650115966796875, 0.6999359130859375, 0.749755859375, 0.7995758056640625, 0.849395751953125, 0.8992156982421875, 0.94903564453125, 0.9988555908203125, 1.048675537109375, 1.0984954833984375, 1.1483154296875, 1.1981353759765625, 1.247955322265625, 1.2977752685546875, 1.34759521484375, 1.3974151611328125, 1.447235107421875, 1.4970550537109375, 1.546875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 6.0, 1.0, 7.0, 13.0, 14.0, 44.0, 65.0, 113.0, 136.0, 176.0, 131.0, 136.0, 71.0, 38.0, 26.0, 14.0, 9.0, 8.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.22884750366211, -16.671518325805664, -16.11418914794922, -15.55686092376709, -14.999532699584961, -14.442203521728516, -13.88487434387207, -13.327546119689941, -12.770217895507812, -12.212888717651367, -11.655560493469238, -11.098231315612793, -10.540903091430664, -9.983573913574219, -9.426244735717773, -8.868916511535645, -8.3115873336792, -7.754258632659912, -7.196929931640625, -6.63960075378418, -6.082272529602051, -5.5249433517456055, -4.967614650726318, -4.410285949707031, -3.852957248687744, -3.295628547668457, -2.73829984664917, -2.1809709072113037, -1.6236422061920166, -1.0663135051727295, -0.5089845657348633, 0.04834413528442383, 0.6056728363037109, 1.163001537322998, 1.7203303575515747, 2.2776591777801514, 2.8349878787994385, 3.3923165798187256, 3.949645519256592, 4.506974220275879, 5.064302921295166, 5.621631622314453, 6.17896032333374, 6.736289024353027, 7.293618202209473, 7.850946426391602, 8.408275604248047, 8.965604782104492, 9.522933006286621, 10.080262184143066, 10.637590408325195, 11.19491958618164, 11.75224781036377, 12.309576988220215, 12.866905212402344, 13.424234390258789, 13.981563568115234, 14.53889274597168, 15.096220970153809, 15.653550148010254, 16.210878372192383, 16.768207550048828, 17.325536727905273, 17.88286590576172, 18.44019317626953]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 7.0, 5.0, 6.0, 12.0, 14.0, 12.0, 19.0, 21.0, 21.0, 29.0, 35.0, 27.0, 29.0, 28.0, 44.0, 55.0, 45.0, 56.0, 40.0, 49.0, 63.0, 44.0, 48.0, 30.0, 41.0, 35.0, 40.0, 27.0, 26.0, 17.0, 9.0, 12.0, 13.0, 8.0, 11.0, 7.0, 3.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.818575382232666, -6.551798343658447, -6.2850213050842285, -6.018243789672852, -5.751466751098633, -5.484689712524414, -5.217912673950195, -4.951135635375977, -4.684358596801758, -4.417581558227539, -4.15080451965332, -3.8840272426605225, -3.6172499656677246, -3.350472927093506, -3.083695888519287, -2.8169188499450684, -2.5501413345336914, -2.2833642959594727, -2.016587018966675, -1.749809980392456, -1.4830328226089478, -1.2162556648254395, -0.9494786262512207, -0.6827014684677124, -0.4159243106842041, -0.1491471827030182, 0.11762994527816772, 0.38440704345703125, 0.6511842012405396, 0.9179613590240479, 1.1847383975982666, 1.451515555381775, 1.7182931900024414, 1.9850703477859497, 2.251847505569458, 2.5186245441436768, 2.7854018211364746, 3.0521788597106934, 3.318955898284912, 3.585732936859131, 3.8525102138519287, 4.119287490844727, 4.386064529418945, 4.652841567993164, 4.919618606567383, 5.186395645141602, 5.45317268371582, 5.719950199127197, 5.986727237701416, 6.253504276275635, 6.5202813148498535, 6.7870588302612305, 7.053835868835449, 7.320612907409668, 7.587389945983887, 7.8541669845581055, 8.120944023132324, 8.387721061706543, 8.654498100280762, 8.92127513885498, 9.1880521774292, 9.454830169677734, 9.721607208251953, 9.988384246826172, 10.25516128540039]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 7.0, 7.0, 7.0, 19.0, 24.0, 19.0, 39.0, 36.0, 75.0, 82.0, 140.0, 182.0, 255.0, 374.0, 571.0, 869.0, 1409.0, 2142.0, 3649.0, 6495.0, 11973.0, 23978.0, 52815.0, 138798.0, 646692.0, 2874239.0, 269839.0, 85203.0, 35997.0, 16911.0, 8854.0, 4779.0, 2827.0, 1671.0, 1105.0, 658.0, 464.0, 347.0, 203.0, 131.0, 113.0, 77.0, 56.0, 41.0, 28.0, 27.0, 10.0, 14.0, 9.0, 6.0, 4.0, 5.0, 2.0, 3.0, 2.0, 3.0, 2.0, 3.0], "bins": [-1.2802734375, -1.23931884765625, -1.1983642578125, -1.15740966796875, -1.116455078125, -1.07550048828125, -1.0345458984375, -0.99359130859375, -0.95263671875, -0.91168212890625, -0.8707275390625, -0.82977294921875, -0.788818359375, -0.74786376953125, -0.7069091796875, -0.66595458984375, -0.625, -0.58404541015625, -0.5430908203125, -0.50213623046875, -0.461181640625, -0.42022705078125, -0.3792724609375, -0.33831787109375, -0.29736328125, -0.25640869140625, -0.2154541015625, -0.17449951171875, -0.133544921875, -0.09259033203125, -0.0516357421875, -0.01068115234375, 0.0302734375, 0.07122802734375, 0.1121826171875, 0.15313720703125, 0.194091796875, 0.23504638671875, 0.2760009765625, 0.31695556640625, 0.35791015625, 0.39886474609375, 0.4398193359375, 0.48077392578125, 0.521728515625, 0.56268310546875, 0.6036376953125, 0.64459228515625, 0.685546875, 0.72650146484375, 0.7674560546875, 0.80841064453125, 0.849365234375, 0.89031982421875, 0.9312744140625, 0.97222900390625, 1.01318359375, 1.05413818359375, 1.0950927734375, 1.13604736328125, 1.177001953125, 1.21795654296875, 1.2589111328125, 1.29986572265625, 1.3408203125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 8.0, 4.0, 1.0, 4.0, 10.0, 8.0, 6.0, 14.0, 16.0, 19.0, 28.0, 27.0, 27.0, 36.0, 28.0, 23.0, 32.0, 38.0, 51.0, 38.0, 38.0, 58.0, 43.0, 52.0, 31.0, 47.0, 35.0, 33.0, 29.0, 19.0, 34.0, 25.0, 25.0, 18.0, 19.0, 14.0, 12.0, 12.0, 6.0, 7.0, 11.0, 6.0, 3.0, 5.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.2958984375, -0.2869071960449219, -0.27791595458984375, -0.2689247131347656, -0.2599334716796875, -0.2509422302246094, -0.24195098876953125, -0.23295974731445312, -0.223968505859375, -0.21497726440429688, -0.20598602294921875, -0.19699478149414062, -0.1880035400390625, -0.17901229858398438, -0.17002105712890625, -0.16102981567382812, -0.15203857421875, -0.14304733276367188, -0.13405609130859375, -0.12506484985351562, -0.1160736083984375, -0.10708236694335938, -0.09809112548828125, -0.08909988403320312, -0.080108642578125, -0.07111740112304688, -0.06212615966796875, -0.053134918212890625, -0.0441436767578125, -0.035152435302734375, -0.02616119384765625, -0.017169952392578125, -0.0081787109375, 0.000812530517578125, 0.00980377197265625, 0.018795013427734375, 0.0277862548828125, 0.036777496337890625, 0.04576873779296875, 0.054759979248046875, 0.063751220703125, 0.07274246215820312, 0.08173370361328125, 0.09072494506835938, 0.0997161865234375, 0.10870742797851562, 0.11769866943359375, 0.12668991088867188, 0.13568115234375, 0.14467239379882812, 0.15366363525390625, 0.16265487670898438, 0.1716461181640625, 0.18063735961914062, 0.18962860107421875, 0.19861984252929688, 0.207611083984375, 0.21660232543945312, 0.22559356689453125, 0.23458480834960938, 0.2435760498046875, 0.2525672912597656, 0.26155853271484375, 0.2705497741699219, 0.279541015625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 0.0, 6.0, 6.0, 2.0, 10.0, 18.0, 15.0, 18.0, 27.0, 25.0, 39.0, 57.0, 76.0, 103.0, 234.0, 405.0, 837.0, 1967.0, 4950.0, 15036.0, 56481.0, 308427.0, 3306762.0, 404907.0, 66257.0, 17634.0, 5777.0, 2201.0, 904.0, 444.0, 217.0, 134.0, 83.0, 55.0, 44.0, 32.0, 21.0, 16.0, 12.0, 10.0, 5.0, 9.0, 7.0, 6.0, 6.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2578125, -2.183929443359375, -2.11004638671875, -2.036163330078125, -1.9622802734375, -1.888397216796875, -1.81451416015625, -1.740631103515625, -1.666748046875, -1.592864990234375, -1.51898193359375, -1.445098876953125, -1.3712158203125, -1.297332763671875, -1.22344970703125, -1.149566650390625, -1.07568359375, -1.001800537109375, -0.92791748046875, -0.854034423828125, -0.7801513671875, -0.706268310546875, -0.63238525390625, -0.558502197265625, -0.484619140625, -0.410736083984375, -0.33685302734375, -0.262969970703125, -0.1890869140625, -0.115203857421875, -0.04132080078125, 0.032562255859375, 0.1064453125, 0.180328369140625, 0.25421142578125, 0.328094482421875, 0.4019775390625, 0.475860595703125, 0.54974365234375, 0.623626708984375, 0.697509765625, 0.771392822265625, 0.84527587890625, 0.919158935546875, 0.9930419921875, 1.066925048828125, 1.14080810546875, 1.214691162109375, 1.28857421875, 1.362457275390625, 1.43634033203125, 1.510223388671875, 1.5841064453125, 1.657989501953125, 1.73187255859375, 1.805755615234375, 1.879638671875, 1.953521728515625, 2.02740478515625, 2.101287841796875, 2.1751708984375, 2.249053955078125, 2.32293701171875, 2.396820068359375, 2.470703125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 2.0, 2.0, 13.0, 9.0, 16.0, 22.0, 26.0, 55.0, 74.0, 102.0, 235.0, 470.0, 1548.0, 812.0, 280.0, 154.0, 89.0, 62.0, 35.0, 22.0, 15.0, 12.0, 8.0, 7.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.4501953125, -1.411712646484375, -1.37322998046875, -1.334747314453125, -1.2962646484375, -1.257781982421875, -1.21929931640625, -1.180816650390625, -1.142333984375, -1.103851318359375, -1.06536865234375, -1.026885986328125, -0.9884033203125, -0.949920654296875, -0.91143798828125, -0.872955322265625, -0.83447265625, -0.795989990234375, -0.75750732421875, -0.719024658203125, -0.6805419921875, -0.642059326171875, -0.60357666015625, -0.565093994140625, -0.526611328125, -0.488128662109375, -0.44964599609375, -0.411163330078125, -0.3726806640625, -0.334197998046875, -0.29571533203125, -0.257232666015625, -0.21875, -0.180267333984375, -0.14178466796875, -0.103302001953125, -0.0648193359375, -0.026336669921875, 0.01214599609375, 0.050628662109375, 0.089111328125, 0.127593994140625, 0.16607666015625, 0.204559326171875, 0.2430419921875, 0.281524658203125, 0.32000732421875, 0.358489990234375, 0.39697265625, 0.435455322265625, 0.47393798828125, 0.512420654296875, 0.5509033203125, 0.589385986328125, 0.62786865234375, 0.666351318359375, 0.704833984375, 0.743316650390625, 0.78179931640625, 0.820281982421875, 0.8587646484375, 0.897247314453125, 0.93572998046875, 0.974212646484375, 1.0126953125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 4.0, 6.0, 21.0, 25.0, 50.0, 107.0, 149.0, 147.0, 161.0, 133.0, 86.0, 39.0, 45.0, 15.0, 9.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.4707231521606445, -6.197763442993164, -5.924803256988525, -5.651843547821045, -5.378883361816406, -5.105923652648926, -4.832963943481445, -4.560004234313965, -4.287044048309326, -4.014084339141846, -3.741124153137207, -3.4681644439697266, -3.195204496383667, -2.9222445487976074, -2.649284839630127, -2.3763248920440674, -2.103364944458008, -1.8304049968719482, -1.5574451684951782, -1.2844853401184082, -1.0115253925323486, -0.7385654449462891, -0.46560561656951904, -0.19264578819274902, 0.08031415939331055, 0.35327404737472534, 0.6262339353561401, 0.8991938233375549, 1.1721537113189697, 1.4451136589050293, 1.7180734872817993, 1.9910333156585693, 2.263993263244629, 2.5369532108306885, 2.809913158416748, 3.0828728675842285, 3.355832815170288, 3.6287927627563477, 3.901752471923828, 4.174712181091309, 4.447672367095947, 4.720632076263428, 4.993592262268066, 5.266551971435547, 5.539511680603027, 5.812471866607666, 6.0854315757751465, 6.358391761779785, 6.631351470947266, 6.904311180114746, 7.177271366119385, 7.450231075286865, 7.723191261291504, 7.996150970458984, 8.269110679626465, 8.542070388793945, 8.815031051635742, 9.087990760803223, 9.360950469970703, 9.6339111328125, 9.90687084197998, 10.179830551147461, 10.452790260314941, 10.725749969482422, 10.998709678649902]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 10.0, 4.0, 7.0, 5.0, 7.0, 20.0, 14.0, 15.0, 19.0, 21.0, 21.0, 31.0, 20.0, 27.0, 36.0, 39.0, 49.0, 44.0, 45.0, 44.0, 20.0, 41.0, 47.0, 38.0, 38.0, 27.0, 37.0, 37.0, 34.0, 26.0, 31.0, 29.0, 18.0, 20.0, 14.0, 15.0, 9.0, 10.0, 8.0, 8.0, 10.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-3.436687707901001, -3.3341846466064453, -3.2316815853118896, -3.129178524017334, -3.0266754627227783, -2.9241724014282227, -2.821669101715088, -2.7191660404205322, -2.6166629791259766, -2.514159917831421, -2.4116568565368652, -2.3091537952423096, -2.206650733947754, -2.104147434234619, -2.0016446113586426, -1.8991413116455078, -1.7966383695602417, -1.694135308265686, -1.5916322469711304, -1.4891290664672852, -1.3866260051727295, -1.2841229438781738, -1.1816198825836182, -1.0791168212890625, -0.9766137003898621, -0.8741106390953064, -0.771607518196106, -0.6691044569015503, -0.5666013956069946, -0.4640982747077942, -0.3615952134132385, -0.2590920925140381, -0.15658903121948242, -0.05408594757318497, 0.04841713607311249, 0.15092021226882935, 0.2534233033657074, 0.35592639446258545, 0.4584294557571411, 0.5609325766563416, 0.6634356379508972, 0.7659386992454529, 0.8684418201446533, 0.970944881439209, 1.0734479427337646, 1.1759510040283203, 1.278454065322876, 1.3809572458267212, 1.4834603071212769, 1.5859633684158325, 1.6884664297103882, 1.7909696102142334, 1.893472671508789, 1.9959757328033447, 2.0984787940979004, 2.200981855392456, 2.3034849166870117, 2.4059879779815674, 2.508491039276123, 2.6109941005706787, 2.7134971618652344, 2.816000461578369, 2.9185032844543457, 3.0210065841674805, 3.123509645462036]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 5.0, 6.0, 12.0, 10.0, 18.0, 27.0, 38.0, 64.0, 78.0, 90.0, 171.0, 275.0, 398.0, 627.0, 1062.0, 1749.0, 2962.0, 5016.0, 8764.0, 15011.0, 26555.0, 49558.0, 107664.0, 345392.0, 288608.0, 92520.0, 44214.0, 24380.0, 13813.0, 7833.0, 4614.0, 2735.0, 1550.0, 980.0, 609.0, 397.0, 269.0, 144.0, 107.0, 68.0, 40.0, 39.0, 17.0, 23.0, 6.0, 12.0, 8.0, 5.0, 6.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.255859375, -1.2138824462890625, -1.171905517578125, -1.1299285888671875, -1.08795166015625, -1.0459747314453125, -1.003997802734375, -0.9620208740234375, -0.9200439453125, -0.8780670166015625, -0.836090087890625, -0.7941131591796875, -0.75213623046875, -0.7101593017578125, -0.668182373046875, -0.6262054443359375, -0.584228515625, -0.5422515869140625, -0.500274658203125, -0.4582977294921875, -0.41632080078125, -0.3743438720703125, -0.332366943359375, -0.2903900146484375, -0.2484130859375, -0.2064361572265625, -0.164459228515625, -0.1224822998046875, -0.08050537109375, -0.0385284423828125, 0.003448486328125, 0.0454254150390625, 0.08740234375, 0.1293792724609375, 0.171356201171875, 0.2133331298828125, 0.25531005859375, 0.2972869873046875, 0.339263916015625, 0.3812408447265625, 0.4232177734375, 0.4651947021484375, 0.507171630859375, 0.5491485595703125, 0.59112548828125, 0.6331024169921875, 0.675079345703125, 0.7170562744140625, 0.759033203125, 0.8010101318359375, 0.842987060546875, 0.8849639892578125, 0.92694091796875, 0.9689178466796875, 1.010894775390625, 1.0528717041015625, 1.0948486328125, 1.1368255615234375, 1.178802490234375, 1.2207794189453125, 1.26275634765625, 1.3047332763671875, 1.346710205078125, 1.3886871337890625, 1.4306640625]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 3.0, 4.0, 3.0, 4.0, 7.0, 10.0, 9.0, 17.0, 14.0, 20.0, 25.0, 31.0, 31.0, 36.0, 34.0, 39.0, 30.0, 48.0, 43.0, 53.0, 48.0, 44.0, 41.0, 48.0, 45.0, 44.0, 43.0, 32.0, 40.0, 16.0, 16.0, 16.0, 26.0, 10.0, 14.0, 19.0, 9.0, 7.0, 10.0, 4.0, 5.0, 4.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.319091796875, -0.3090667724609375, -0.299041748046875, -0.2890167236328125, -0.27899169921875, -0.2689666748046875, -0.258941650390625, -0.2489166259765625, -0.2388916015625, -0.2288665771484375, -0.218841552734375, -0.2088165283203125, -0.19879150390625, -0.1887664794921875, -0.178741455078125, -0.1687164306640625, -0.15869140625, -0.1486663818359375, -0.138641357421875, -0.1286163330078125, -0.11859130859375, -0.1085662841796875, -0.098541259765625, -0.0885162353515625, -0.0784912109375, -0.0684661865234375, -0.058441162109375, -0.0484161376953125, -0.03839111328125, -0.0283660888671875, -0.018341064453125, -0.0083160400390625, 0.001708984375, 0.0117340087890625, 0.021759033203125, 0.0317840576171875, 0.04180908203125, 0.0518341064453125, 0.061859130859375, 0.0718841552734375, 0.0819091796875, 0.0919342041015625, 0.101959228515625, 0.1119842529296875, 0.12200927734375, 0.1320343017578125, 0.142059326171875, 0.1520843505859375, 0.162109375, 0.1721343994140625, 0.182159423828125, 0.1921844482421875, 0.20220947265625, 0.2122344970703125, 0.222259521484375, 0.2322845458984375, 0.2423095703125, 0.2523345947265625, 0.262359619140625, 0.2723846435546875, 0.28240966796875, 0.2924346923828125, 0.302459716796875, 0.3124847412109375, 0.322509765625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 6.0, 8.0, 22.0, 22.0, 18.0, 46.0, 51.0, 81.0, 120.0, 175.0, 273.0, 443.0, 743.0, 1455.0, 3277.0, 9105.0, 33275.0, 208636.0, 683593.0, 79651.0, 17353.0, 5495.0, 2160.0, 1026.0, 579.0, 326.0, 232.0, 110.0, 91.0, 50.0, 40.0, 27.0, 23.0, 19.0, 8.0, 4.0, 4.0, 3.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.20703125, -2.123016357421875, -2.03900146484375, -1.954986572265625, -1.8709716796875, -1.786956787109375, -1.70294189453125, -1.618927001953125, -1.534912109375, -1.450897216796875, -1.36688232421875, -1.282867431640625, -1.1988525390625, -1.114837646484375, -1.03082275390625, -0.946807861328125, -0.86279296875, -0.778778076171875, -0.69476318359375, -0.610748291015625, -0.5267333984375, -0.442718505859375, -0.35870361328125, -0.274688720703125, -0.190673828125, -0.106658935546875, -0.02264404296875, 0.061370849609375, 0.1453857421875, 0.229400634765625, 0.31341552734375, 0.397430419921875, 0.4814453125, 0.565460205078125, 0.64947509765625, 0.733489990234375, 0.8175048828125, 0.901519775390625, 0.98553466796875, 1.069549560546875, 1.153564453125, 1.237579345703125, 1.32159423828125, 1.405609130859375, 1.4896240234375, 1.573638916015625, 1.65765380859375, 1.741668701171875, 1.82568359375, 1.909698486328125, 1.99371337890625, 2.077728271484375, 2.1617431640625, 2.245758056640625, 2.32977294921875, 2.413787841796875, 2.497802734375, 2.581817626953125, 2.66583251953125, 2.749847412109375, 2.8338623046875, 2.917877197265625, 3.00189208984375, 3.085906982421875, 3.169921875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 6.0, 7.0, 15.0, 12.0, 9.0, 20.0, 25.0, 24.0, 47.0, 46.0, 62.0, 57.0, 60.0, 68.0, 62.0, 83.0, 69.0, 71.0, 52.0, 45.0, 40.0, 32.0, 25.0, 17.0, 14.0, 8.0, 9.0, 2.0, 2.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9150390625, -1.8502960205078125, -1.785552978515625, -1.7208099365234375, -1.65606689453125, -1.5913238525390625, -1.526580810546875, -1.4618377685546875, -1.3970947265625, -1.3323516845703125, -1.267608642578125, -1.2028656005859375, -1.13812255859375, -1.0733795166015625, -1.008636474609375, -0.9438934326171875, -0.879150390625, -0.8144073486328125, -0.749664306640625, -0.6849212646484375, -0.62017822265625, -0.5554351806640625, -0.490692138671875, -0.4259490966796875, -0.3612060546875, -0.2964630126953125, -0.231719970703125, -0.1669769287109375, -0.10223388671875, -0.0374908447265625, 0.027252197265625, 0.0919952392578125, 0.15673828125, 0.2214813232421875, 0.286224365234375, 0.3509674072265625, 0.41571044921875, 0.4804534912109375, 0.545196533203125, 0.6099395751953125, 0.6746826171875, 0.7394256591796875, 0.804168701171875, 0.8689117431640625, 0.93365478515625, 0.9983978271484375, 1.063140869140625, 1.1278839111328125, 1.192626953125, 1.2573699951171875, 1.322113037109375, 1.3868560791015625, 1.45159912109375, 1.5163421630859375, 1.581085205078125, 1.6458282470703125, 1.7105712890625, 1.7753143310546875, 1.840057373046875, 1.9048004150390625, 1.96954345703125, 2.0342864990234375, 2.099029541015625, 2.1637725830078125, 2.228515625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 9.0, 17.0, 12.0, 9.0, 20.0, 19.0, 48.0, 79.0, 100.0, 214.0, 309.0, 608.0, 1186.0, 2485.0, 6240.0, 17371.0, 54147.0, 327639.0, 527928.0, 73462.0, 22606.0, 7917.0, 3146.0, 1378.0, 690.0, 338.0, 214.0, 122.0, 83.0, 58.0, 40.0, 22.0, 13.0, 11.0, 3.0, 6.0, 2.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.96044921875, -0.9274673461914062, -0.8944854736328125, -0.8615036010742188, -0.828521728515625, -0.7955398559570312, -0.7625579833984375, -0.7295761108398438, -0.69659423828125, -0.6636123657226562, -0.6306304931640625, -0.5976486206054688, -0.564666748046875, -0.5316848754882812, -0.4987030029296875, -0.46572113037109375, -0.4327392578125, -0.39975738525390625, -0.3667755126953125, -0.33379364013671875, -0.300811767578125, -0.26782989501953125, -0.2348480224609375, -0.20186614990234375, -0.16888427734375, -0.13590240478515625, -0.1029205322265625, -0.06993865966796875, -0.036956787109375, -0.00397491455078125, 0.0290069580078125, 0.06198883056640625, 0.094970703125, 0.12795257568359375, 0.1609344482421875, 0.19391632080078125, 0.226898193359375, 0.25988006591796875, 0.2928619384765625, 0.32584381103515625, 0.35882568359375, 0.39180755615234375, 0.4247894287109375, 0.45777130126953125, 0.490753173828125, 0.5237350463867188, 0.5567169189453125, 0.5896987915039062, 0.6226806640625, 0.6556625366210938, 0.6886444091796875, 0.7216262817382812, 0.754608154296875, 0.7875900268554688, 0.8205718994140625, 0.8535537719726562, 0.88653564453125, 0.9195175170898438, 0.9524993896484375, 0.9854812622070312, 1.018463134765625, 1.0514450073242188, 1.0844268798828125, 1.1174087524414062, 1.150390625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 3.0, 9.0, 16.0, 19.0, 22.0, 21.0, 29.0, 38.0, 120.0, 163.0, 211.0, 125.0, 59.0, 45.0, 25.0, 13.0, 15.0, 14.0, 10.0, 9.0, 9.0, 4.0, 5.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00024175643920898438, -0.00023318827152252197, -0.00022462010383605957, -0.00021605193614959717, -0.00020748376846313477, -0.00019891560077667236, -0.00019034743309020996, -0.00018177926540374756, -0.00017321109771728516, -0.00016464293003082275, -0.00015607476234436035, -0.00014750659465789795, -0.00013893842697143555, -0.00013037025928497314, -0.00012180209159851074, -0.00011323392391204834, -0.00010466575622558594, -9.609758853912354e-05, -8.752942085266113e-05, -7.896125316619873e-05, -7.039308547973633e-05, -6.182491779327393e-05, -5.3256750106811523e-05, -4.468858242034912e-05, -3.612041473388672e-05, -2.7552247047424316e-05, -1.8984079360961914e-05, -1.0415911674499512e-05, -1.8477439880371094e-06, 6.720423698425293e-06, 1.5288591384887695e-05, 2.3856759071350098e-05, 3.24249267578125e-05, 4.09930944442749e-05, 4.9561262130737305e-05, 5.812942981719971e-05, 6.669759750366211e-05, 7.526576519012451e-05, 8.383393287658691e-05, 9.240210056304932e-05, 0.00010097026824951172, 0.00010953843593597412, 0.00011810660362243652, 0.00012667477130889893, 0.00013524293899536133, 0.00014381110668182373, 0.00015237927436828613, 0.00016094744205474854, 0.00016951560974121094, 0.00017808377742767334, 0.00018665194511413574, 0.00019522011280059814, 0.00020378828048706055, 0.00021235644817352295, 0.00022092461585998535, 0.00022949278354644775, 0.00023806095123291016, 0.00024662911891937256, 0.00025519728660583496, 0.00026376545429229736, 0.00027233362197875977, 0.00028090178966522217, 0.00028946995735168457, 0.00029803812503814697, 0.0003066062927246094]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 4.0, 14.0, 10.0, 20.0, 29.0, 38.0, 55.0, 68.0, 111.0, 223.0, 354.0, 820.0, 2097.0, 6449.0, 26698.0, 163076.0, 732529.0, 91163.0, 17094.0, 4608.0, 1607.0, 641.0, 340.0, 161.0, 123.0, 76.0, 45.0, 33.0, 22.0, 14.0, 13.0, 10.0, 5.0, 1.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.189453125, -1.1459808349609375, -1.102508544921875, -1.0590362548828125, -1.01556396484375, -0.9720916748046875, -0.928619384765625, -0.8851470947265625, -0.8416748046875, -0.7982025146484375, -0.754730224609375, -0.7112579345703125, -0.66778564453125, -0.6243133544921875, -0.580841064453125, -0.5373687744140625, -0.493896484375, -0.4504241943359375, -0.406951904296875, -0.3634796142578125, -0.32000732421875, -0.2765350341796875, -0.233062744140625, -0.1895904541015625, -0.1461181640625, -0.1026458740234375, -0.059173583984375, -0.0157012939453125, 0.02777099609375, 0.0712432861328125, 0.114715576171875, 0.1581878662109375, 0.20166015625, 0.2451324462890625, 0.288604736328125, 0.3320770263671875, 0.37554931640625, 0.4190216064453125, 0.462493896484375, 0.5059661865234375, 0.5494384765625, 0.5929107666015625, 0.636383056640625, 0.6798553466796875, 0.72332763671875, 0.7667999267578125, 0.810272216796875, 0.8537445068359375, 0.897216796875, 0.9406890869140625, 0.984161376953125, 1.0276336669921875, 1.07110595703125, 1.1145782470703125, 1.158050537109375, 1.2015228271484375, 1.2449951171875, 1.2884674072265625, 1.331939697265625, 1.3754119873046875, 1.41888427734375, 1.4623565673828125, 1.505828857421875, 1.5493011474609375, 1.5927734375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 1.0, 6.0, 11.0, 6.0, 12.0, 11.0, 10.0, 21.0, 12.0, 34.0, 29.0, 65.0, 107.0, 171.0, 144.0, 120.0, 58.0, 45.0, 22.0, 24.0, 23.0, 11.0, 13.0, 11.0, 12.0, 7.0, 4.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.72998046875, -0.7029800415039062, -0.6759796142578125, -0.6489791870117188, -0.621978759765625, -0.5949783325195312, -0.5679779052734375, -0.5409774780273438, -0.51397705078125, -0.48697662353515625, -0.4599761962890625, -0.43297576904296875, -0.405975341796875, -0.37897491455078125, -0.3519744873046875, -0.32497406005859375, -0.2979736328125, -0.27097320556640625, -0.2439727783203125, -0.21697235107421875, -0.189971923828125, -0.16297149658203125, -0.1359710693359375, -0.10897064208984375, -0.08197021484375, -0.05496978759765625, -0.0279693603515625, -0.00096893310546875, 0.026031494140625, 0.05303192138671875, 0.0800323486328125, 0.10703277587890625, 0.134033203125, 0.16103363037109375, 0.1880340576171875, 0.21503448486328125, 0.242034912109375, 0.26903533935546875, 0.2960357666015625, 0.32303619384765625, 0.35003662109375, 0.37703704833984375, 0.4040374755859375, 0.43103790283203125, 0.458038330078125, 0.48503875732421875, 0.5120391845703125, 0.5390396118164062, 0.5660400390625, 0.5930404663085938, 0.6200408935546875, 0.6470413208007812, 0.674041748046875, 0.7010421752929688, 0.7280426025390625, 0.7550430297851562, 0.78204345703125, 0.8090438842773438, 0.8360443115234375, 0.8630447387695312, 0.890045166015625, 0.9170455932617188, 0.9440460205078125, 0.9710464477539062, 0.998046875]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 14.0, 32.0, 77.0, 119.0, 147.0, 168.0, 160.0, 114.0, 71.0, 41.0, 29.0, 15.0, 4.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.95413589477539, -19.363948822021484, -18.773759841918945, -18.183570861816406, -17.5933837890625, -17.003196716308594, -16.413007736206055, -15.822819709777832, -15.23263168334961, -14.642443656921387, -14.052255630493164, -13.462067604064941, -12.871879577636719, -12.281691551208496, -11.691503524780273, -11.10131549835205, -10.511127471923828, -9.920939445495605, -9.330751419067383, -8.74056339263916, -8.150375366210938, -7.560187339782715, -6.969999313354492, -6.3798112869262695, -5.789623260498047, -5.199435234069824, -4.609247207641602, -4.019059181213379, -3.4288711547851562, -2.8386831283569336, -2.248495101928711, -1.6583070755004883, -1.0681190490722656, -0.47793102264404297, 0.11225700378417969, 0.7024450302124023, 1.292633056640625, 1.8828210830688477, 2.4730091094970703, 3.063197135925293, 3.6533851623535156, 4.243573188781738, 4.833761215209961, 5.423949241638184, 6.014137268066406, 6.604325294494629, 7.194513320922852, 7.784701347351074, 8.374889373779297, 8.96507740020752, 9.555265426635742, 10.145453453063965, 10.735641479492188, 11.32582950592041, 11.916017532348633, 12.506205558776855, 13.096393585205078, 13.6865816116333, 14.276769638061523, 14.866957664489746, 15.457145690917969, 16.047332763671875, 16.637521743774414, 17.227710723876953, 17.81789779663086]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 2.0, 10.0, 13.0, 13.0, 19.0, 12.0, 26.0, 38.0, 28.0, 33.0, 45.0, 39.0, 56.0, 61.0, 59.0, 58.0, 55.0, 56.0, 58.0, 52.0, 46.0, 40.0, 34.0, 23.0, 32.0, 25.0, 15.0, 14.0, 9.0, 14.0, 4.0, 3.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.687544345855713, -7.378377914428711, -7.069211959838867, -6.760046005249023, -6.4508795738220215, -6.1417131423950195, -5.832547187805176, -5.523381233215332, -5.21421480178833, -4.905048370361328, -4.595882415771484, -4.286716461181641, -3.9775500297546387, -3.668383836746216, -3.359217643737793, -3.05005145072937, -2.7408852577209473, -2.4317190647125244, -2.1225528717041016, -1.8133866786956787, -1.5042204856872559, -1.195054292678833, -0.8858880996704102, -0.5767219066619873, -0.26755571365356445, 0.0416104793548584, 0.35077667236328125, 0.6599428653717041, 0.969109058380127, 1.2782752513885498, 1.5874414443969727, 1.8966076374053955, 2.2057743072509766, 2.5149405002593994, 2.8241066932678223, 3.133272886276245, 3.442439079284668, 3.751605272293091, 4.060771465301514, 4.369937896728516, 4.679103851318359, 4.988269805908203, 5.297436237335205, 5.606602668762207, 5.915768623352051, 6.2249345779418945, 6.5341010093688965, 6.843267440795898, 7.152433395385742, 7.461599349975586, 7.770765781402588, 8.07993221282959, 8.389098167419434, 8.698264122009277, 9.007431030273438, 9.316596984863281, 9.625762939453125, 9.934928894042969, 10.244094848632812, 10.553261756896973, 10.862427711486816, 11.17159366607666, 11.48076057434082, 11.789926528930664, 12.099092483520508]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 4.0, 10.0, 6.0, 8.0, 21.0, 25.0, 46.0, 69.0, 77.0, 144.0, 215.0, 331.0, 470.0, 851.0, 1440.0, 2439.0, 4368.0, 8142.0, 16451.0, 34704.0, 87291.0, 355615.0, 3170024.0, 354212.0, 86857.0, 34845.0, 16322.0, 8365.0, 4505.0, 2555.0, 1375.0, 859.0, 538.0, 368.0, 259.0, 136.0, 103.0, 75.0, 36.0, 39.0, 23.0, 23.0, 11.0, 8.0, 8.0, 8.0, 4.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.203125, -1.15594482421875, -1.1087646484375, -1.06158447265625, -1.014404296875, -0.96722412109375, -0.9200439453125, -0.87286376953125, -0.82568359375, -0.77850341796875, -0.7313232421875, -0.68414306640625, -0.636962890625, -0.58978271484375, -0.5426025390625, -0.49542236328125, -0.4482421875, -0.40106201171875, -0.3538818359375, -0.30670166015625, -0.259521484375, -0.21234130859375, -0.1651611328125, -0.11798095703125, -0.07080078125, -0.02362060546875, 0.0235595703125, 0.07073974609375, 0.117919921875, 0.16510009765625, 0.2122802734375, 0.25946044921875, 0.306640625, 0.35382080078125, 0.4010009765625, 0.44818115234375, 0.495361328125, 0.54254150390625, 0.5897216796875, 0.63690185546875, 0.68408203125, 0.73126220703125, 0.7784423828125, 0.82562255859375, 0.872802734375, 0.91998291015625, 0.9671630859375, 1.01434326171875, 1.0615234375, 1.10870361328125, 1.1558837890625, 1.20306396484375, 1.250244140625, 1.29742431640625, 1.3446044921875, 1.39178466796875, 1.43896484375, 1.48614501953125, 1.5333251953125, 1.58050537109375, 1.627685546875, 1.67486572265625, 1.7220458984375, 1.76922607421875, 1.81640625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 11.0, 9.0, 12.0, 14.0, 13.0, 13.0, 17.0, 21.0, 30.0, 32.0, 33.0, 37.0, 31.0, 45.0, 39.0, 36.0, 47.0, 56.0, 47.0, 45.0, 47.0, 48.0, 36.0, 32.0, 34.0, 36.0, 35.0, 16.0, 26.0, 18.0, 14.0, 17.0, 16.0, 4.0, 9.0, 7.0, 7.0, 8.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27001953125, -0.2587852478027344, -0.24755096435546875, -0.23631668090820312, -0.2250823974609375, -0.21384811401367188, -0.20261383056640625, -0.19137954711914062, -0.180145263671875, -0.16891098022460938, -0.15767669677734375, -0.14644241333007812, -0.1352081298828125, -0.12397384643554688, -0.11273956298828125, -0.10150527954101562, -0.09027099609375, -0.07903671264648438, -0.06780242919921875, -0.056568145751953125, -0.0453338623046875, -0.034099578857421875, -0.02286529541015625, -0.011631011962890625, -0.000396728515625, 0.010837554931640625, 0.02207183837890625, 0.033306121826171875, 0.0445404052734375, 0.055774688720703125, 0.06700897216796875, 0.07824325561523438, 0.0894775390625, 0.10071182250976562, 0.11194610595703125, 0.12318038940429688, 0.1344146728515625, 0.14564895629882812, 0.15688323974609375, 0.16811752319335938, 0.179351806640625, 0.19058609008789062, 0.20182037353515625, 0.21305465698242188, 0.2242889404296875, 0.23552322387695312, 0.24675750732421875, 0.2579917907714844, 0.26922607421875, 0.2804603576660156, 0.29169464111328125, 0.3029289245605469, 0.3141632080078125, 0.3253974914550781, 0.33663177490234375, 0.3478660583496094, 0.359100341796875, 0.3703346252441406, 0.38156890869140625, 0.3928031921386719, 0.4040374755859375, 0.4152717590332031, 0.42650604248046875, 0.4377403259277344, 0.448974609375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 10.0, 13.0, 15.0, 13.0, 21.0, 14.0, 16.0, 21.0, 30.0, 31.0, 36.0, 48.0, 72.0, 100.0, 219.0, 727.0, 7667.0, 2933730.0, 1243796.0, 6461.0, 633.0, 186.0, 105.0, 76.0, 41.0, 35.0, 32.0, 25.0, 20.0, 25.0, 15.0, 16.0, 5.0, 10.0, 4.0, 3.0, 6.0, 5.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.015625, -10.70068359375, -10.3857421875, -10.07080078125, -9.755859375, -9.44091796875, -9.1259765625, -8.81103515625, -8.49609375, -8.18115234375, -7.8662109375, -7.55126953125, -7.236328125, -6.92138671875, -6.6064453125, -6.29150390625, -5.9765625, -5.66162109375, -5.3466796875, -5.03173828125, -4.716796875, -4.40185546875, -4.0869140625, -3.77197265625, -3.45703125, -3.14208984375, -2.8271484375, -2.51220703125, -2.197265625, -1.88232421875, -1.5673828125, -1.25244140625, -0.9375, -0.62255859375, -0.3076171875, 0.00732421875, 0.322265625, 0.63720703125, 0.9521484375, 1.26708984375, 1.58203125, 1.89697265625, 2.2119140625, 2.52685546875, 2.841796875, 3.15673828125, 3.4716796875, 3.78662109375, 4.1015625, 4.41650390625, 4.7314453125, 5.04638671875, 5.361328125, 5.67626953125, 5.9912109375, 6.30615234375, 6.62109375, 6.93603515625, 7.2509765625, 7.56591796875, 7.880859375, 8.19580078125, 8.5107421875, 8.82568359375, 9.140625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 14.0, 21.0, 50.0, 165.0, 1589.0, 1984.0, 179.0, 48.0, 22.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.13671875, -5.029754638671875, -4.92279052734375, -4.815826416015625, -4.7088623046875, -4.601898193359375, -4.49493408203125, -4.387969970703125, -4.281005859375, -4.174041748046875, -4.06707763671875, -3.960113525390625, -3.8531494140625, -3.746185302734375, -3.63922119140625, -3.532257080078125, -3.42529296875, -3.318328857421875, -3.21136474609375, -3.104400634765625, -2.9974365234375, -2.890472412109375, -2.78350830078125, -2.676544189453125, -2.569580078125, -2.462615966796875, -2.35565185546875, -2.248687744140625, -2.1417236328125, -2.034759521484375, -1.92779541015625, -1.820831298828125, -1.7138671875, -1.606903076171875, -1.49993896484375, -1.392974853515625, -1.2860107421875, -1.179046630859375, -1.07208251953125, -0.965118408203125, -0.858154296875, -0.751190185546875, -0.64422607421875, -0.537261962890625, -0.4302978515625, -0.323333740234375, -0.21636962890625, -0.109405517578125, -0.00244140625, 0.104522705078125, 0.21148681640625, 0.318450927734375, 0.4254150390625, 0.532379150390625, 0.63934326171875, 0.746307373046875, 0.853271484375, 0.960235595703125, 1.06719970703125, 1.174163818359375, 1.2811279296875, 1.388092041015625, 1.49505615234375, 1.602020263671875, 1.708984375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 5.0, 4.0, 6.0, 9.0, 20.0, 19.0, 23.0, 32.0, 39.0, 84.0, 81.0, 121.0, 129.0, 129.0, 97.0, 77.0, 51.0, 36.0, 13.0, 8.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-13.661874771118164, -13.368433952331543, -13.074994087219238, -12.781553268432617, -12.488113403320312, -12.194672584533691, -11.90123176574707, -11.607791900634766, -11.314351081848145, -11.020910263061523, -10.727470397949219, -10.434029579162598, -10.140588760375977, -9.847148895263672, -9.55370807647705, -9.26026725769043, -8.966827392578125, -8.673386573791504, -8.3799467086792, -8.086505889892578, -7.793065547943115, -7.499625205993652, -7.206184387207031, -6.912744045257568, -6.6193037033081055, -6.325863361358643, -6.03242301940918, -5.738982200622559, -5.445541858673096, -5.152101516723633, -4.858660697937012, -4.565220355987549, -4.271780490875244, -3.9783401489257812, -3.6848995685577393, -3.3914589881896973, -3.0980186462402344, -2.8045783042907715, -2.5111377239227295, -2.2176971435546875, -1.9242568016052246, -1.6308163404464722, -1.3373758792877197, -1.0439354181289673, -0.7504949569702148, -0.4570544958114624, -0.16361403465270996, 0.12982654571533203, 0.4232668876647949, 0.7167073488235474, 1.0101478099822998, 1.3035882711410522, 1.5970287322998047, 1.8904691934585571, 2.1839096546173096, 2.4773502349853516, 2.7707905769348145, 3.0642309188842773, 3.3576714992523193, 3.6511120796203613, 3.944552421569824, 4.237992763519287, 4.53143310546875, 4.824873924255371, 5.118314266204834]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 5.0, 5.0, 3.0, 7.0, 6.0, 7.0, 14.0, 9.0, 21.0, 15.0, 18.0, 25.0, 23.0, 31.0, 36.0, 38.0, 49.0, 33.0, 44.0, 43.0, 46.0, 37.0, 53.0, 41.0, 34.0, 39.0, 33.0, 38.0, 35.0, 35.0, 35.0, 24.0, 20.0, 18.0, 11.0, 14.0, 13.0, 10.0, 10.0, 10.0, 3.0, 7.0, 4.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.15170955657959, -4.997504234313965, -4.843299388885498, -4.689094066619873, -4.534888744354248, -4.380683422088623, -4.226478576660156, -4.072273254394531, -3.9180679321289062, -3.7638628482818604, -3.6096575260162354, -3.4554524421691895, -3.3012471199035645, -3.1470420360565186, -2.9928369522094727, -2.8386316299438477, -2.6844265460968018, -2.530221462249756, -2.376016139984131, -2.221811056137085, -2.06760573387146, -1.913400650024414, -1.7591954469680786, -1.6049902439117432, -1.4507850408554077, -1.2965798377990723, -1.1423746347427368, -0.9881694912910461, -0.8339642882347107, -0.6797590851783752, -0.5255539417266846, -0.3713487386703491, -0.21714353561401367, -0.06293834745883942, 0.09126684069633484, 0.2454720139503479, 0.39967721700668335, 0.5538824200630188, 0.7080875635147095, 0.8622927665710449, 1.0164979696273804, 1.1707031726837158, 1.3249083757400513, 1.4791135787963867, 1.6333186626434326, 1.7875239849090576, 1.9417290687561035, 2.0959343910217285, 2.2501394748687744, 2.4043445587158203, 2.5585498809814453, 2.712754964828491, 2.866960287094116, 3.021165370941162, 3.175370693206787, 3.329575777053833, 3.483780860900879, 3.637985944747925, 3.79219126701355, 3.9463963508605957, 4.100601673126221, 4.254806995391846, 4.4090118408203125, 4.5632171630859375, 4.7174224853515625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 7.0, 14.0, 20.0, 34.0, 44.0, 59.0, 93.0, 140.0, 239.0, 354.0, 480.0, 825.0, 1437.0, 2375.0, 4574.0, 8775.0, 17375.0, 37077.0, 91417.0, 340365.0, 368025.0, 97359.0, 38899.0, 18353.0, 9109.0, 4703.0, 2628.0, 1455.0, 852.0, 515.0, 348.0, 218.0, 127.0, 94.0, 59.0, 45.0, 15.0, 18.0, 11.0, 7.0, 7.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5322265625, -1.48284912109375, -1.4334716796875, -1.38409423828125, -1.334716796875, -1.28533935546875, -1.2359619140625, -1.18658447265625, -1.13720703125, -1.08782958984375, -1.0384521484375, -0.98907470703125, -0.939697265625, -0.89031982421875, -0.8409423828125, -0.79156494140625, -0.7421875, -0.69281005859375, -0.6434326171875, -0.59405517578125, -0.544677734375, -0.49530029296875, -0.4459228515625, -0.39654541015625, -0.34716796875, -0.29779052734375, -0.2484130859375, -0.19903564453125, -0.149658203125, -0.10028076171875, -0.0509033203125, -0.00152587890625, 0.0478515625, 0.09722900390625, 0.1466064453125, 0.19598388671875, 0.245361328125, 0.29473876953125, 0.3441162109375, 0.39349365234375, 0.44287109375, 0.49224853515625, 0.5416259765625, 0.59100341796875, 0.640380859375, 0.68975830078125, 0.7391357421875, 0.78851318359375, 0.837890625, 0.88726806640625, 0.9366455078125, 0.98602294921875, 1.035400390625, 1.08477783203125, 1.1341552734375, 1.18353271484375, 1.23291015625, 1.28228759765625, 1.3316650390625, 1.38104248046875, 1.430419921875, 1.47979736328125, 1.5291748046875, 1.57855224609375, 1.6279296875]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 3.0, 11.0, 4.0, 8.0, 7.0, 20.0, 13.0, 22.0, 21.0, 23.0, 18.0, 22.0, 19.0, 21.0, 34.0, 34.0, 39.0, 43.0, 36.0, 44.0, 41.0, 51.0, 44.0, 31.0, 44.0, 34.0, 36.0, 32.0, 33.0, 35.0, 26.0, 15.0, 26.0, 20.0, 21.0, 9.0, 7.0, 11.0, 9.0, 10.0, 6.0, 4.0, 6.0, 2.0, 1.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.354736328125, -0.34264373779296875, -0.3305511474609375, -0.31845855712890625, -0.306365966796875, -0.29427337646484375, -0.2821807861328125, -0.27008819580078125, -0.25799560546875, -0.24590301513671875, -0.2338104248046875, -0.22171783447265625, -0.209625244140625, -0.19753265380859375, -0.1854400634765625, -0.17334747314453125, -0.1612548828125, -0.14916229248046875, -0.1370697021484375, -0.12497711181640625, -0.112884521484375, -0.10079193115234375, -0.0886993408203125, -0.07660675048828125, -0.06451416015625, -0.05242156982421875, -0.0403289794921875, -0.02823638916015625, -0.016143798828125, -0.00405120849609375, 0.0080413818359375, 0.02013397216796875, 0.0322265625, 0.04431915283203125, 0.0564117431640625, 0.06850433349609375, 0.080596923828125, 0.09268951416015625, 0.1047821044921875, 0.11687469482421875, 0.12896728515625, 0.14105987548828125, 0.1531524658203125, 0.16524505615234375, 0.177337646484375, 0.18943023681640625, 0.2015228271484375, 0.21361541748046875, 0.2257080078125, 0.23780059814453125, 0.2498931884765625, 0.26198577880859375, 0.274078369140625, 0.28617095947265625, 0.2982635498046875, 0.31035614013671875, 0.32244873046875, 0.33454132080078125, 0.3466339111328125, 0.35872650146484375, 0.370819091796875, 0.38291168212890625, 0.3950042724609375, 0.40709686279296875, 0.419189453125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 4.0, 12.0, 16.0, 17.0, 20.0, 44.0, 43.0, 78.0, 126.0, 181.0, 237.0, 383.0, 594.0, 1007.0, 1763.0, 3260.0, 6588.0, 14895.0, 35084.0, 122378.0, 698531.0, 103224.0, 32458.0, 13827.0, 6341.0, 3082.0, 1760.0, 945.0, 587.0, 370.0, 207.0, 143.0, 115.0, 73.0, 46.0, 34.0, 18.0, 13.0, 9.0, 12.0, 6.0, 10.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-2.2578125, -2.18603515625, -2.1142578125, -2.04248046875, -1.970703125, -1.89892578125, -1.8271484375, -1.75537109375, -1.68359375, -1.61181640625, -1.5400390625, -1.46826171875, -1.396484375, -1.32470703125, -1.2529296875, -1.18115234375, -1.109375, -1.03759765625, -0.9658203125, -0.89404296875, -0.822265625, -0.75048828125, -0.6787109375, -0.60693359375, -0.53515625, -0.46337890625, -0.3916015625, -0.31982421875, -0.248046875, -0.17626953125, -0.1044921875, -0.03271484375, 0.0390625, 0.11083984375, 0.1826171875, 0.25439453125, 0.326171875, 0.39794921875, 0.4697265625, 0.54150390625, 0.61328125, 0.68505859375, 0.7568359375, 0.82861328125, 0.900390625, 0.97216796875, 1.0439453125, 1.11572265625, 1.1875, 1.25927734375, 1.3310546875, 1.40283203125, 1.474609375, 1.54638671875, 1.6181640625, 1.68994140625, 1.76171875, 1.83349609375, 1.9052734375, 1.97705078125, 2.048828125, 2.12060546875, 2.1923828125, 2.26416015625, 2.3359375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 2.0, 8.0, 8.0, 11.0, 11.0, 16.0, 32.0, 35.0, 44.0, 55.0, 75.0, 83.0, 85.0, 73.0, 93.0, 95.0, 64.0, 52.0, 32.0, 33.0, 27.0, 16.0, 15.0, 5.0, 9.0, 10.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.296875, -3.19476318359375, -3.0926513671875, -2.99053955078125, -2.888427734375, -2.78631591796875, -2.6842041015625, -2.58209228515625, -2.47998046875, -2.37786865234375, -2.2757568359375, -2.17364501953125, -2.071533203125, -1.96942138671875, -1.8673095703125, -1.76519775390625, -1.6630859375, -1.56097412109375, -1.4588623046875, -1.35675048828125, -1.254638671875, -1.15252685546875, -1.0504150390625, -0.94830322265625, -0.84619140625, -0.74407958984375, -0.6419677734375, -0.53985595703125, -0.437744140625, -0.33563232421875, -0.2335205078125, -0.13140869140625, -0.029296875, 0.07281494140625, 0.1749267578125, 0.27703857421875, 0.379150390625, 0.48126220703125, 0.5833740234375, 0.68548583984375, 0.78759765625, 0.88970947265625, 0.9918212890625, 1.09393310546875, 1.196044921875, 1.29815673828125, 1.4002685546875, 1.50238037109375, 1.6044921875, 1.70660400390625, 1.8087158203125, 1.91082763671875, 2.012939453125, 2.11505126953125, 2.2171630859375, 2.31927490234375, 2.42138671875, 2.52349853515625, 2.6256103515625, 2.72772216796875, 2.829833984375, 2.93194580078125, 3.0340576171875, 3.13616943359375, 3.23828125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 8.0, 9.0, 18.0, 34.0, 56.0, 120.0, 230.0, 540.0, 1509.0, 6238.0, 33867.0, 496001.0, 468692.0, 32643.0, 6014.0, 1515.0, 502.0, 275.0, 127.0, 62.0, 39.0, 29.0, 9.0, 5.0, 2.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.62109375, -1.56878662109375, -1.5164794921875, -1.46417236328125, -1.411865234375, -1.35955810546875, -1.3072509765625, -1.25494384765625, -1.20263671875, -1.15032958984375, -1.0980224609375, -1.04571533203125, -0.993408203125, -0.94110107421875, -0.8887939453125, -0.83648681640625, -0.7841796875, -0.73187255859375, -0.6795654296875, -0.62725830078125, -0.574951171875, -0.52264404296875, -0.4703369140625, -0.41802978515625, -0.36572265625, -0.31341552734375, -0.2611083984375, -0.20880126953125, -0.156494140625, -0.10418701171875, -0.0518798828125, 0.00042724609375, 0.052734375, 0.10504150390625, 0.1573486328125, 0.20965576171875, 0.261962890625, 0.31427001953125, 0.3665771484375, 0.41888427734375, 0.47119140625, 0.52349853515625, 0.5758056640625, 0.62811279296875, 0.680419921875, 0.73272705078125, 0.7850341796875, 0.83734130859375, 0.8896484375, 0.94195556640625, 0.9942626953125, 1.04656982421875, 1.098876953125, 1.15118408203125, 1.2034912109375, 1.25579833984375, 1.30810546875, 1.36041259765625, 1.4127197265625, 1.46502685546875, 1.517333984375, 1.56964111328125, 1.6219482421875, 1.67425537109375, 1.7265625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 2.0, 6.0, 4.0, 4.0, 3.0, 7.0, 8.0, 8.0, 16.0, 20.0, 26.0, 42.0, 118.0, 239.0, 257.0, 96.0, 51.0, 20.0, 11.0, 16.0, 13.0, 6.0, 13.0, 2.0, 7.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00022721290588378906, -0.0002173297107219696, -0.00020744651556015015, -0.0001975633203983307, -0.00018768012523651123, -0.00017779693007469177, -0.00016791373491287231, -0.00015803053975105286, -0.0001481473445892334, -0.00013826414942741394, -0.00012838095426559448, -0.00011849775910377502, -0.00010861456394195557, -9.873136878013611e-05, -8.884817361831665e-05, -7.896497845649719e-05, -6.908178329467773e-05, -5.9198588132858276e-05, -4.931539297103882e-05, -3.943219780921936e-05, -2.9549002647399902e-05, -1.9665807485580444e-05, -9.782612323760986e-06, 1.0058283805847168e-07, 9.98377799987793e-06, 1.9866973161697388e-05, 2.9750168323516846e-05, 3.9633363485336304e-05, 4.951655864715576e-05, 5.939975380897522e-05, 6.928294897079468e-05, 7.916614413261414e-05, 8.90493392944336e-05, 9.893253445625305e-05, 0.00010881572961807251, 0.00011869892477989197, 0.00012858211994171143, 0.00013846531510353088, 0.00014834851026535034, 0.0001582317054271698, 0.00016811490058898926, 0.00017799809575080872, 0.00018788129091262817, 0.00019776448607444763, 0.0002076476812362671, 0.00021753087639808655, 0.000227414071559906, 0.00023729726672172546, 0.0002471804618835449, 0.0002570636570453644, 0.00026694685220718384, 0.0002768300473690033, 0.00028671324253082275, 0.0002965964376926422, 0.00030647963285446167, 0.00031636282801628113, 0.0003262460231781006, 0.00033612921833992004, 0.0003460124135017395, 0.00035589560866355896, 0.0003657788038253784, 0.0003756619989871979, 0.00038554519414901733, 0.0003954283893108368, 0.00040531158447265625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 9.0, 8.0, 12.0, 27.0, 18.0, 53.0, 82.0, 157.0, 261.0, 453.0, 827.0, 1892.0, 5069.0, 16722.0, 67964.0, 583696.0, 308076.0, 44558.0, 11862.0, 3796.0, 1437.0, 669.0, 349.0, 194.0, 149.0, 84.0, 51.0, 28.0, 18.0, 6.0, 11.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.111328125, -1.0741119384765625, -1.036895751953125, -0.9996795654296875, -0.96246337890625, -0.9252471923828125, -0.888031005859375, -0.8508148193359375, -0.8135986328125, -0.7763824462890625, -0.739166259765625, -0.7019500732421875, -0.66473388671875, -0.6275177001953125, -0.590301513671875, -0.5530853271484375, -0.515869140625, -0.4786529541015625, -0.441436767578125, -0.4042205810546875, -0.36700439453125, -0.3297882080078125, -0.292572021484375, -0.2553558349609375, -0.2181396484375, -0.1809234619140625, -0.143707275390625, -0.1064910888671875, -0.06927490234375, -0.0320587158203125, 0.005157470703125, 0.0423736572265625, 0.07958984375, 0.1168060302734375, 0.154022216796875, 0.1912384033203125, 0.22845458984375, 0.2656707763671875, 0.302886962890625, 0.3401031494140625, 0.3773193359375, 0.4145355224609375, 0.451751708984375, 0.4889678955078125, 0.52618408203125, 0.5634002685546875, 0.600616455078125, 0.6378326416015625, 0.675048828125, 0.7122650146484375, 0.749481201171875, 0.7866973876953125, 0.82391357421875, 0.8611297607421875, 0.898345947265625, 0.9355621337890625, 0.9727783203125, 1.0099945068359375, 1.047210693359375, 1.0844268798828125, 1.12164306640625, 1.1588592529296875, 1.196075439453125, 1.2332916259765625, 1.2705078125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 2.0, 4.0, 7.0, 11.0, 14.0, 17.0, 25.0, 31.0, 57.0, 94.0, 105.0, 202.0, 156.0, 93.0, 48.0, 36.0, 23.0, 16.0, 15.0, 11.0, 3.0, 5.0, 3.0, 3.0, 2.0, 4.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75244140625, -0.7193222045898438, -0.6862030029296875, -0.6530838012695312, -0.619964599609375, -0.5868453979492188, -0.5537261962890625, -0.5206069946289062, -0.48748779296875, -0.45436859130859375, -0.4212493896484375, -0.38813018798828125, -0.355010986328125, -0.32189178466796875, -0.2887725830078125, -0.25565338134765625, -0.2225341796875, -0.18941497802734375, -0.1562957763671875, -0.12317657470703125, -0.090057373046875, -0.05693817138671875, -0.0238189697265625, 0.00930023193359375, 0.04241943359375, 0.07553863525390625, 0.1086578369140625, 0.14177703857421875, 0.174896240234375, 0.20801544189453125, 0.2411346435546875, 0.27425384521484375, 0.307373046875, 0.34049224853515625, 0.3736114501953125, 0.40673065185546875, 0.439849853515625, 0.47296905517578125, 0.5060882568359375, 0.5392074584960938, 0.57232666015625, 0.6054458618164062, 0.6385650634765625, 0.6716842651367188, 0.704803466796875, 0.7379226684570312, 0.7710418701171875, 0.8041610717773438, 0.8372802734375, 0.8703994750976562, 0.9035186767578125, 0.9366378784179688, 0.969757080078125, 1.0028762817382812, 1.0359954833984375, 1.0691146850585938, 1.10223388671875, 1.1353530883789062, 1.1684722900390625, 1.2015914916992188, 1.234710693359375, 1.2678298950195312, 1.3009490966796875, 1.3340682983398438, 1.3671875]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 9.0, 10.0, 28.0, 23.0, 47.0, 47.0, 65.0, 98.0, 105.0, 110.0, 112.0, 92.0, 87.0, 50.0, 46.0, 27.0, 15.0, 13.0, 10.0, 7.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.717826843261719, -12.30018424987793, -11.882542610168457, -11.464900016784668, -11.047258377075195, -10.629615783691406, -10.211973190307617, -9.794331550598145, -9.376689910888672, -8.959047317504883, -8.54140567779541, -8.123763084411621, -7.706121444702148, -7.288478851318359, -6.8708367347717285, -6.453194618225098, -6.035552024841309, -5.617909908294678, -5.200267791748047, -4.782625198364258, -4.364983558654785, -3.947341203689575, -3.5296988487243652, -3.1120567321777344, -2.6944146156311035, -2.2767724990844727, -1.8591302633285522, -1.4414880275726318, -1.023845911026001, -0.6062037944793701, -0.18856143951416016, 0.2290806770324707, 0.6467218399047852, 1.064363956451416, 1.4820061922073364, 1.8996484279632568, 2.3172905445098877, 2.7349326610565186, 3.1525750160217285, 3.5702171325683594, 3.9878592491149902, 4.405501365661621, 4.823143482208252, 5.240785598754883, 5.658428192138672, 6.0760698318481445, 6.493712425231934, 6.9113545417785645, 7.328996658325195, 7.746638774871826, 8.164280891418457, 8.581923484802246, 8.999565124511719, 9.417207717895508, 9.834850311279297, 10.25249195098877, 10.670133590698242, 11.087776184082031, 11.505417823791504, 11.923060417175293, 12.340702056884766, 12.758344650268555, 13.175987243652344, 13.593628883361816, 14.011271476745605]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 6.0, 9.0, 11.0, 13.0, 13.0, 15.0, 20.0, 32.0, 27.0, 37.0, 47.0, 35.0, 40.0, 43.0, 55.0, 49.0, 58.0, 58.0, 53.0, 51.0, 39.0, 38.0, 37.0, 33.0, 28.0, 32.0, 27.0, 13.0, 22.0, 12.0, 13.0, 13.0, 8.0, 4.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.63415813446045, -8.311763763427734, -7.9893693923950195, -7.666975021362305, -7.34458065032959, -7.022186279296875, -6.69979190826416, -6.377397537231445, -6.0550031661987305, -5.732608795166016, -5.410214424133301, -5.087820053100586, -4.765425682067871, -4.443031311035156, -4.120636940002441, -3.7982425689697266, -3.4758481979370117, -3.153453826904297, -2.831059455871582, -2.508665084838867, -2.1862707138061523, -1.8638763427734375, -1.5414819717407227, -1.2190876007080078, -0.896693229675293, -0.5742988586425781, -0.2519044876098633, 0.07048988342285156, 0.3928842544555664, 0.7152786254882812, 1.037672996520996, 1.360067367553711, 1.6824626922607422, 2.004857063293457, 2.327251434326172, 2.6496458053588867, 2.9720401763916016, 3.2944345474243164, 3.6168289184570312, 3.939223289489746, 4.261617660522461, 4.584012031555176, 4.906406402587891, 5.2288007736206055, 5.55119514465332, 5.873589515686035, 6.19598388671875, 6.518378257751465, 6.84077262878418, 7.1631669998168945, 7.485561370849609, 7.807955741882324, 8.130350112915039, 8.452744483947754, 8.775138854980469, 9.097533226013184, 9.419927597045898, 9.742321968078613, 10.064716339111328, 10.387110710144043, 10.709505081176758, 11.031899452209473, 11.354293823242188, 11.676688194274902, 11.999082565307617]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 4.0, 7.0, 13.0, 13.0, 22.0, 18.0, 22.0, 38.0, 53.0, 78.0, 132.0, 289.0, 537.0, 1172.0, 2827.0, 8314.0, 34808.0, 411061.0, 3636189.0, 76673.0, 14332.0, 4384.0, 1672.0, 735.0, 361.0, 186.0, 99.0, 68.0, 44.0, 32.0, 23.0, 18.0, 16.0, 11.0, 5.0, 7.0, 2.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.48046875, -5.32025146484375, -5.1600341796875, -4.99981689453125, -4.839599609375, -4.67938232421875, -4.5191650390625, -4.35894775390625, -4.19873046875, -4.03851318359375, -3.8782958984375, -3.71807861328125, -3.557861328125, -3.39764404296875, -3.2374267578125, -3.07720947265625, -2.9169921875, -2.75677490234375, -2.5965576171875, -2.43634033203125, -2.276123046875, -2.11590576171875, -1.9556884765625, -1.79547119140625, -1.63525390625, -1.47503662109375, -1.3148193359375, -1.15460205078125, -0.994384765625, -0.83416748046875, -0.6739501953125, -0.51373291015625, -0.353515625, -0.19329833984375, -0.0330810546875, 0.12713623046875, 0.287353515625, 0.44757080078125, 0.6077880859375, 0.76800537109375, 0.92822265625, 1.08843994140625, 1.2486572265625, 1.40887451171875, 1.569091796875, 1.72930908203125, 1.8895263671875, 2.04974365234375, 2.2099609375, 2.37017822265625, 2.5303955078125, 2.69061279296875, 2.850830078125, 3.01104736328125, 3.1712646484375, 3.33148193359375, 3.49169921875, 3.65191650390625, 3.8121337890625, 3.97235107421875, 4.132568359375, 4.29278564453125, 4.4530029296875, 4.61322021484375, 4.7734375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 1.0, 5.0, 7.0, 4.0, 6.0, 15.0, 18.0, 15.0, 16.0, 19.0, 19.0, 28.0, 27.0, 33.0, 27.0, 48.0, 42.0, 47.0, 46.0, 50.0, 48.0, 34.0, 62.0, 49.0, 49.0, 46.0, 31.0, 33.0, 28.0, 26.0, 27.0, 21.0, 17.0, 14.0, 8.0, 15.0, 5.0, 6.0, 7.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.361083984375, -0.3464317321777344, -0.33177947998046875, -0.3171272277832031, -0.3024749755859375, -0.2878227233886719, -0.27317047119140625, -0.2585182189941406, -0.243865966796875, -0.22921371459960938, -0.21456146240234375, -0.19990921020507812, -0.1852569580078125, -0.17060470581054688, -0.15595245361328125, -0.14130020141601562, -0.12664794921875, -0.11199569702148438, -0.09734344482421875, -0.08269119262695312, -0.0680389404296875, -0.053386688232421875, -0.03873443603515625, -0.024082183837890625, -0.009429931640625, 0.005222320556640625, 0.01987457275390625, 0.034526824951171875, 0.0491790771484375, 0.06383132934570312, 0.07848358154296875, 0.09313583374023438, 0.1077880859375, 0.12244033813476562, 0.13709259033203125, 0.15174484252929688, 0.1663970947265625, 0.18104934692382812, 0.19570159912109375, 0.21035385131835938, 0.225006103515625, 0.23965835571289062, 0.25431060791015625, 0.2689628601074219, 0.2836151123046875, 0.2982673645019531, 0.31291961669921875, 0.3275718688964844, 0.34222412109375, 0.3568763732910156, 0.37152862548828125, 0.3861808776855469, 0.4008331298828125, 0.4154853820800781, 0.43013763427734375, 0.4447898864746094, 0.459442138671875, 0.4740943908691406, 0.48874664306640625, 0.5033988952636719, 0.5180511474609375, 0.5327033996582031, 0.5473556518554688, 0.5620079040527344, 0.57666015625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 4.0, 11.0, 6.0, 16.0, 18.0, 24.0, 45.0, 33.0, 40.0, 82.0, 113.0, 131.0, 165.0, 298.0, 526.0, 910.0, 2185.0, 6852.0, 42302.0, 2925485.0, 1168339.0, 35683.0, 6529.0, 2028.0, 955.0, 461.0, 264.0, 208.0, 166.0, 90.0, 76.0, 76.0, 44.0, 31.0, 17.0, 16.0, 11.0, 20.0, 9.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.86328125, -6.66119384765625, -6.4591064453125, -6.25701904296875, -6.054931640625, -5.85284423828125, -5.6507568359375, -5.44866943359375, -5.24658203125, -5.04449462890625, -4.8424072265625, -4.64031982421875, -4.438232421875, -4.23614501953125, -4.0340576171875, -3.83197021484375, -3.6298828125, -3.42779541015625, -3.2257080078125, -3.02362060546875, -2.821533203125, -2.61944580078125, -2.4173583984375, -2.21527099609375, -2.01318359375, -1.81109619140625, -1.6090087890625, -1.40692138671875, -1.204833984375, -1.00274658203125, -0.8006591796875, -0.59857177734375, -0.396484375, -0.19439697265625, 0.0076904296875, 0.20977783203125, 0.411865234375, 0.61395263671875, 0.8160400390625, 1.01812744140625, 1.22021484375, 1.42230224609375, 1.6243896484375, 1.82647705078125, 2.028564453125, 2.23065185546875, 2.4327392578125, 2.63482666015625, 2.8369140625, 3.03900146484375, 3.2410888671875, 3.44317626953125, 3.645263671875, 3.84735107421875, 4.0494384765625, 4.25152587890625, 4.45361328125, 4.65570068359375, 4.8577880859375, 5.05987548828125, 5.261962890625, 5.46405029296875, 5.6661376953125, 5.86822509765625, 6.0703125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 2.0, 16.0, 24.0, 59.0, 115.0, 364.0, 2601.0, 603.0, 154.0, 51.0, 45.0, 13.0, 13.0, 6.0, 5.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.33203125, -3.24114990234375, -3.1502685546875, -3.05938720703125, -2.968505859375, -2.87762451171875, -2.7867431640625, -2.69586181640625, -2.60498046875, -2.51409912109375, -2.4232177734375, -2.33233642578125, -2.241455078125, -2.15057373046875, -2.0596923828125, -1.96881103515625, -1.8779296875, -1.78704833984375, -1.6961669921875, -1.60528564453125, -1.514404296875, -1.42352294921875, -1.3326416015625, -1.24176025390625, -1.15087890625, -1.05999755859375, -0.9691162109375, -0.87823486328125, -0.787353515625, -0.69647216796875, -0.6055908203125, -0.51470947265625, -0.423828125, -0.33294677734375, -0.2420654296875, -0.15118408203125, -0.060302734375, 0.03057861328125, 0.1214599609375, 0.21234130859375, 0.30322265625, 0.39410400390625, 0.4849853515625, 0.57586669921875, 0.666748046875, 0.75762939453125, 0.8485107421875, 0.93939208984375, 1.0302734375, 1.12115478515625, 1.2120361328125, 1.30291748046875, 1.393798828125, 1.48468017578125, 1.5755615234375, 1.66644287109375, 1.75732421875, 1.84820556640625, 1.9390869140625, 2.02996826171875, 2.120849609375, 2.21173095703125, 2.3026123046875, 2.39349365234375, 2.484375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 11.0, 17.0, 38.0, 69.0, 107.0, 168.0, 182.0, 139.0, 86.0, 65.0, 51.0, 33.0, 11.0, 10.0, 7.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.422357082366943, -7.0340962409973145, -6.6458353996276855, -6.257574558258057, -5.869313716888428, -5.481052875518799, -5.092791557312012, -4.704530715942383, -4.316269874572754, -3.928009033203125, -3.539748191833496, -3.151487350463867, -2.7632265090942383, -2.3749656677246094, -1.9867045879364014, -1.5984437465667725, -1.2101831436157227, -0.8219223022460938, -0.43366140127182007, -0.04540050029754639, 0.3428603410720825, 0.7311211824417114, 1.1193821430206299, 1.5076429843902588, 1.8959038257598877, 2.2841646671295166, 2.6724255084991455, 3.0606865882873535, 3.4489474296569824, 3.8372082710266113, 4.22546911239624, 4.613729953765869, 5.00199031829834, 5.390251159667969, 5.778512001037598, 6.166772842407227, 6.5550336837768555, 6.943294525146484, 7.331555366516113, 7.719816207885742, 8.108077049255371, 8.496337890625, 8.884598731994629, 9.272859573364258, 9.661120414733887, 10.049381256103516, 10.437642097473145, 10.825902938842773, 11.214164733886719, 11.602425575256348, 11.990686416625977, 12.378947257995605, 12.767208099365234, 13.155468940734863, 13.543729782104492, 13.931990623474121, 14.32025146484375, 14.708512306213379, 15.096773147583008, 15.485033988952637, 15.873294830322266, 16.26155662536621, 16.649816513061523, 17.03807830810547, 17.42633819580078]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 5.0, 5.0, 5.0, 9.0, 5.0, 9.0, 14.0, 10.0, 13.0, 10.0, 30.0, 24.0, 18.0, 28.0, 38.0, 32.0, 26.0, 45.0, 38.0, 39.0, 47.0, 38.0, 43.0, 41.0, 46.0, 53.0, 45.0, 36.0, 29.0, 26.0, 37.0, 19.0, 30.0, 16.0, 18.0, 11.0, 16.0, 5.0, 10.0, 7.0, 3.0, 3.0, 4.0, 6.0, 3.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-5.564762592315674, -5.40660285949707, -5.248443126678467, -5.090283393859863, -4.932123184204102, -4.773963451385498, -4.6158037185668945, -4.457643985748291, -4.2994842529296875, -4.141324520111084, -3.9831647872924805, -3.825004816055298, -3.6668450832366943, -3.508685350418091, -3.350525379180908, -3.1923656463623047, -3.034205913543701, -2.8760461807250977, -2.717886447906494, -2.5597264766693115, -2.401566743850708, -2.2434070110321045, -2.085247039794922, -1.9270873069763184, -1.7689275741577148, -1.6107678413391113, -1.4526079893112183, -1.2944481372833252, -1.1362884044647217, -0.9781286120414734, -0.8199688196182251, -0.661808967590332, -0.5036487579345703, -0.345488965511322, -0.18732917308807373, -0.02916938066482544, 0.12899041175842285, 0.28715020418167114, 0.44530999660491943, 0.6034698486328125, 0.761629581451416, 0.9197893738746643, 1.0779491662979126, 1.2361090183258057, 1.3942687511444092, 1.5524284839630127, 1.7105883359909058, 1.8687481880187988, 2.0269079208374023, 2.185067653656006, 2.3432273864746094, 2.501387357711792, 2.6595470905303955, 2.817706823348999, 2.9758667945861816, 3.134026527404785, 3.2921862602233887, 3.450345993041992, 3.6085057258605957, 3.7666656970977783, 3.924825429916382, 4.0829854011535645, 4.241145133972168, 4.3993048667907715, 4.557464599609375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 5.0, 7.0, 8.0, 16.0, 21.0, 27.0, 30.0, 45.0, 74.0, 110.0, 155.0, 211.0, 304.0, 467.0, 723.0, 1098.0, 1759.0, 2596.0, 4435.0, 7400.0, 13188.0, 24764.0, 49185.0, 104526.0, 235272.0, 317457.0, 144454.0, 66780.0, 32234.0, 16835.0, 9485.0, 5553.0, 3257.0, 2144.0, 1345.0, 840.0, 566.0, 349.0, 258.0, 164.0, 124.0, 86.0, 52.0, 48.0, 34.0, 23.0, 17.0, 10.0, 4.0, 6.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.8037109375, -1.74591064453125, -1.6881103515625, -1.63031005859375, -1.572509765625, -1.51470947265625, -1.4569091796875, -1.39910888671875, -1.34130859375, -1.28350830078125, -1.2257080078125, -1.16790771484375, -1.110107421875, -1.05230712890625, -0.9945068359375, -0.93670654296875, -0.87890625, -0.82110595703125, -0.7633056640625, -0.70550537109375, -0.647705078125, -0.58990478515625, -0.5321044921875, -0.47430419921875, -0.41650390625, -0.35870361328125, -0.3009033203125, -0.24310302734375, -0.185302734375, -0.12750244140625, -0.0697021484375, -0.01190185546875, 0.0458984375, 0.10369873046875, 0.1614990234375, 0.21929931640625, 0.277099609375, 0.33489990234375, 0.3927001953125, 0.45050048828125, 0.50830078125, 0.56610107421875, 0.6239013671875, 0.68170166015625, 0.739501953125, 0.79730224609375, 0.8551025390625, 0.91290283203125, 0.970703125, 1.02850341796875, 1.0863037109375, 1.14410400390625, 1.201904296875, 1.25970458984375, 1.3175048828125, 1.37530517578125, 1.43310546875, 1.49090576171875, 1.5487060546875, 1.60650634765625, 1.664306640625, 1.72210693359375, 1.7799072265625, 1.83770751953125, 1.8955078125]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 3.0, 9.0, 8.0, 12.0, 13.0, 15.0, 10.0, 13.0, 17.0, 19.0, 12.0, 26.0, 31.0, 32.0, 25.0, 31.0, 34.0, 33.0, 31.0, 40.0, 34.0, 58.0, 37.0, 46.0, 37.0, 43.0, 32.0, 30.0, 29.0, 31.0, 28.0, 21.0, 18.0, 13.0, 19.0, 18.0, 12.0, 17.0, 15.0, 11.0, 7.0, 6.0, 7.0, 2.0, 6.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.44921875, -0.4343414306640625, -0.419464111328125, -0.4045867919921875, -0.38970947265625, -0.3748321533203125, -0.359954833984375, -0.3450775146484375, -0.3302001953125, -0.3153228759765625, -0.300445556640625, -0.2855682373046875, -0.27069091796875, -0.2558135986328125, -0.240936279296875, -0.2260589599609375, -0.211181640625, -0.1963043212890625, -0.181427001953125, -0.1665496826171875, -0.15167236328125, -0.1367950439453125, -0.121917724609375, -0.1070404052734375, -0.0921630859375, -0.0772857666015625, -0.062408447265625, -0.0475311279296875, -0.03265380859375, -0.0177764892578125, -0.002899169921875, 0.0119781494140625, 0.02685546875, 0.0417327880859375, 0.056610107421875, 0.0714874267578125, 0.08636474609375, 0.1012420654296875, 0.116119384765625, 0.1309967041015625, 0.1458740234375, 0.1607513427734375, 0.175628662109375, 0.1905059814453125, 0.20538330078125, 0.2202606201171875, 0.235137939453125, 0.2500152587890625, 0.264892578125, 0.2797698974609375, 0.294647216796875, 0.3095245361328125, 0.32440185546875, 0.3392791748046875, 0.354156494140625, 0.3690338134765625, 0.3839111328125, 0.3987884521484375, 0.413665771484375, 0.4285430908203125, 0.44342041015625, 0.4582977294921875, 0.473175048828125, 0.4880523681640625, 0.5029296875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 7.0, 3.0, 9.0, 5.0, 17.0, 20.0, 19.0, 30.0, 33.0, 61.0, 66.0, 89.0, 116.0, 194.0, 213.0, 336.0, 515.0, 925.0, 1875.0, 4373.0, 12140.0, 43093.0, 216695.0, 628377.0, 101968.0, 23220.0, 7463.0, 3009.0, 1435.0, 772.0, 420.0, 281.0, 217.0, 143.0, 111.0, 61.0, 51.0, 57.0, 32.0, 29.0, 16.0, 19.0, 15.0, 8.0, 7.0, 5.0, 2.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.861328125, -3.737884521484375, -3.61444091796875, -3.490997314453125, -3.3675537109375, -3.244110107421875, -3.12066650390625, -2.997222900390625, -2.873779296875, -2.750335693359375, -2.62689208984375, -2.503448486328125, -2.3800048828125, -2.256561279296875, -2.13311767578125, -2.009674072265625, -1.88623046875, -1.762786865234375, -1.63934326171875, -1.515899658203125, -1.3924560546875, -1.269012451171875, -1.14556884765625, -1.022125244140625, -0.898681640625, -0.775238037109375, -0.65179443359375, -0.528350830078125, -0.4049072265625, -0.281463623046875, -0.15802001953125, -0.034576416015625, 0.0888671875, 0.212310791015625, 0.33575439453125, 0.459197998046875, 0.5826416015625, 0.706085205078125, 0.82952880859375, 0.952972412109375, 1.076416015625, 1.199859619140625, 1.32330322265625, 1.446746826171875, 1.5701904296875, 1.693634033203125, 1.81707763671875, 1.940521240234375, 2.06396484375, 2.187408447265625, 2.31085205078125, 2.434295654296875, 2.5577392578125, 2.681182861328125, 2.80462646484375, 2.928070068359375, 3.051513671875, 3.174957275390625, 3.29840087890625, 3.421844482421875, 3.5452880859375, 3.668731689453125, 3.79217529296875, 3.915618896484375, 4.0390625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 8.0, 2.0, 5.0, 5.0, 11.0, 12.0, 16.0, 16.0, 20.0, 29.0, 37.0, 46.0, 49.0, 54.0, 80.0, 64.0, 74.0, 54.0, 69.0, 64.0, 54.0, 45.0, 37.0, 44.0, 20.0, 22.0, 17.0, 17.0, 13.0, 9.0, 4.0, 3.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.21484375, -4.08587646484375, -3.9569091796875, -3.82794189453125, -3.698974609375, -3.57000732421875, -3.4410400390625, -3.31207275390625, -3.18310546875, -3.05413818359375, -2.9251708984375, -2.79620361328125, -2.667236328125, -2.53826904296875, -2.4093017578125, -2.28033447265625, -2.1513671875, -2.02239990234375, -1.8934326171875, -1.76446533203125, -1.635498046875, -1.50653076171875, -1.3775634765625, -1.24859619140625, -1.11962890625, -0.99066162109375, -0.8616943359375, -0.73272705078125, -0.603759765625, -0.47479248046875, -0.3458251953125, -0.21685791015625, -0.087890625, 0.04107666015625, 0.1700439453125, 0.29901123046875, 0.427978515625, 0.55694580078125, 0.6859130859375, 0.81488037109375, 0.94384765625, 1.07281494140625, 1.2017822265625, 1.33074951171875, 1.459716796875, 1.58868408203125, 1.7176513671875, 1.84661865234375, 1.9755859375, 2.10455322265625, 2.2335205078125, 2.36248779296875, 2.491455078125, 2.62042236328125, 2.7493896484375, 2.87835693359375, 3.00732421875, 3.13629150390625, 3.2652587890625, 3.39422607421875, 3.523193359375, 3.65216064453125, 3.7811279296875, 3.91009521484375, 4.0390625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 1.0, 1.0, 4.0, 7.0, 9.0, 19.0, 27.0, 38.0, 35.0, 67.0, 111.0, 158.0, 241.0, 512.0, 1531.0, 8431.0, 804978.0, 224977.0, 5161.0, 1199.0, 407.0, 221.0, 134.0, 94.0, 67.0, 52.0, 19.0, 21.0, 9.0, 10.0, 10.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.69140625, -6.4815673828125, -6.271728515625, -6.0618896484375, -5.85205078125, -5.6422119140625, -5.432373046875, -5.2225341796875, -5.0126953125, -4.8028564453125, -4.593017578125, -4.3831787109375, -4.17333984375, -3.9635009765625, -3.753662109375, -3.5438232421875, -3.333984375, -3.1241455078125, -2.914306640625, -2.7044677734375, -2.49462890625, -2.2847900390625, -2.074951171875, -1.8651123046875, -1.6552734375, -1.4454345703125, -1.235595703125, -1.0257568359375, -0.81591796875, -0.6060791015625, -0.396240234375, -0.1864013671875, 0.0234375, 0.2332763671875, 0.443115234375, 0.6529541015625, 0.86279296875, 1.0726318359375, 1.282470703125, 1.4923095703125, 1.7021484375, 1.9119873046875, 2.121826171875, 2.3316650390625, 2.54150390625, 2.7513427734375, 2.961181640625, 3.1710205078125, 3.380859375, 3.5906982421875, 3.800537109375, 4.0103759765625, 4.22021484375, 4.4300537109375, 4.639892578125, 4.8497314453125, 5.0595703125, 5.2694091796875, 5.479248046875, 5.6890869140625, 5.89892578125, 6.1087646484375, 6.318603515625, 6.5284423828125, 6.73828125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 4.0, 4.0, 7.0, 12.0, 25.0, 36.0, 80.0, 142.0, 322.0, 187.0, 95.0, 38.0, 18.0, 18.0, 13.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008373260498046875, -0.0008081197738647461, -0.0007789134979248047, -0.0007497072219848633, -0.0007205009460449219, -0.0006912946701049805, -0.0006620883941650391, -0.0006328821182250977, -0.0006036758422851562, -0.0005744695663452148, -0.0005452632904052734, -0.000516057014465332, -0.0004868507385253906, -0.0004576444625854492, -0.0004284381866455078, -0.0003992319107055664, -0.000370025634765625, -0.0003408193588256836, -0.0003116130828857422, -0.0002824068069458008, -0.0002532005310058594, -0.00022399425506591797, -0.00019478797912597656, -0.00016558170318603516, -0.00013637542724609375, -0.00010716915130615234, -7.796287536621094e-05, -4.875659942626953e-05, -1.9550323486328125e-05, 9.655952453613281e-06, 3.886222839355469e-05, 6.80685043334961e-05, 9.72747802734375e-05, 0.0001264810562133789, 0.0001556873321533203, 0.00018489360809326172, 0.00021409988403320312, 0.00024330615997314453, 0.00027251243591308594, 0.00030171871185302734, 0.00033092498779296875, 0.00036013126373291016, 0.00038933753967285156, 0.00041854381561279297, 0.0004477500915527344, 0.0004769563674926758, 0.0005061626434326172, 0.0005353689193725586, 0.0005645751953125, 0.0005937814712524414, 0.0006229877471923828, 0.0006521940231323242, 0.0006814002990722656, 0.000710606575012207, 0.0007398128509521484, 0.0007690191268920898, 0.0007982254028320312, 0.0008274316787719727, 0.0008566379547119141, 0.0008858442306518555, 0.0009150505065917969, 0.0009442567825317383, 0.0009734630584716797, 0.001002669334411621, 0.0010318756103515625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 4.0, 14.0, 11.0, 15.0, 34.0, 53.0, 85.0, 184.0, 280.0, 605.0, 1771.0, 7599.0, 338498.0, 685510.0, 10340.0, 2104.0, 643.0, 330.0, 184.0, 110.0, 58.0, 48.0, 24.0, 12.0, 6.0, 5.0, 3.0, 0.0, 5.0, 0.0, 1.0, 4.0, 2.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.953125, -5.74835205078125, -5.5435791015625, -5.33880615234375, -5.134033203125, -4.92926025390625, -4.7244873046875, -4.51971435546875, -4.31494140625, -4.11016845703125, -3.9053955078125, -3.70062255859375, -3.495849609375, -3.29107666015625, -3.0863037109375, -2.88153076171875, -2.6767578125, -2.47198486328125, -2.2672119140625, -2.06243896484375, -1.857666015625, -1.65289306640625, -1.4481201171875, -1.24334716796875, -1.03857421875, -0.83380126953125, -0.6290283203125, -0.42425537109375, -0.219482421875, -0.01470947265625, 0.1900634765625, 0.39483642578125, 0.599609375, 0.80438232421875, 1.0091552734375, 1.21392822265625, 1.418701171875, 1.62347412109375, 1.8282470703125, 2.03302001953125, 2.23779296875, 2.44256591796875, 2.6473388671875, 2.85211181640625, 3.056884765625, 3.26165771484375, 3.4664306640625, 3.67120361328125, 3.8759765625, 4.08074951171875, 4.2855224609375, 4.49029541015625, 4.695068359375, 4.89984130859375, 5.1046142578125, 5.30938720703125, 5.51416015625, 5.71893310546875, 5.9237060546875, 6.12847900390625, 6.333251953125, 6.53802490234375, 6.7427978515625, 6.94757080078125, 7.15234375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 4.0, 1.0, 5.0, 5.0, 13.0, 22.0, 51.0, 100.0, 166.0, 227.0, 203.0, 113.0, 50.0, 20.0, 11.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.1796875, -4.04730224609375, -3.9149169921875, -3.78253173828125, -3.650146484375, -3.51776123046875, -3.3853759765625, -3.25299072265625, -3.12060546875, -2.98822021484375, -2.8558349609375, -2.72344970703125, -2.591064453125, -2.45867919921875, -2.3262939453125, -2.19390869140625, -2.0615234375, -1.92913818359375, -1.7967529296875, -1.66436767578125, -1.531982421875, -1.39959716796875, -1.2672119140625, -1.13482666015625, -1.00244140625, -0.87005615234375, -0.7376708984375, -0.60528564453125, -0.472900390625, -0.34051513671875, -0.2081298828125, -0.07574462890625, 0.056640625, 0.18902587890625, 0.3214111328125, 0.45379638671875, 0.586181640625, 0.71856689453125, 0.8509521484375, 0.98333740234375, 1.11572265625, 1.24810791015625, 1.3804931640625, 1.51287841796875, 1.645263671875, 1.77764892578125, 1.9100341796875, 2.04241943359375, 2.1748046875, 2.30718994140625, 2.4395751953125, 2.57196044921875, 2.704345703125, 2.83673095703125, 2.9691162109375, 3.10150146484375, 3.23388671875, 3.36627197265625, 3.4986572265625, 3.63104248046875, 3.763427734375, 3.89581298828125, 4.0281982421875, 4.16058349609375, 4.29296875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 16.0, 32.0, 88.0, 166.0, 225.0, 208.0, 147.0, 75.0, 30.0, 11.0, 6.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.78947448730469, -39.08312225341797, -37.376773834228516, -35.6704216003418, -33.96406936645508, -32.257720947265625, -30.551368713378906, -28.84501838684082, -27.138668060302734, -25.43231773376465, -23.72596549987793, -22.019615173339844, -20.313264846801758, -18.606914520263672, -16.900562286376953, -15.194211959838867, -13.487859725952148, -11.781508445739746, -10.07515811920166, -8.368806838989258, -6.662456035614014, -4.9561052322387695, -3.249753952026367, -1.5434036254882812, 0.1629476547241211, 1.8692985773086548, 3.5756494998931885, 5.282000541687012, 6.988351345062256, 8.6947021484375, 10.401053428649902, 12.107403755187988, 13.81375503540039, 15.520106315612793, 17.226457595825195, 18.93280792236328, 20.639158248901367, 22.345508575439453, 24.051860809326172, 25.758211135864258, 27.464561462402344, 29.17091178894043, 30.87726402282715, 32.583614349365234, 34.28996658325195, 35.996315002441406, 37.702667236328125, 39.409019470214844, 41.11537170410156, 42.82172393798828, 44.528072357177734, 46.23442459106445, 47.94077682495117, 49.647125244140625, 51.353477478027344, 53.05982971191406, 54.766178131103516, 56.472530364990234, 58.17887878417969, 59.885231018066406, 61.591583251953125, 63.29793167114258, 65.00428771972656, 66.71063232421875, 68.41698455810547]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 5.0, 3.0, 4.0, 6.0, 6.0, 7.0, 8.0, 10.0, 14.0, 18.0, 20.0, 20.0, 26.0, 38.0, 30.0, 44.0, 42.0, 46.0, 56.0, 49.0, 54.0, 54.0, 49.0, 59.0, 42.0, 45.0, 37.0, 42.0, 25.0, 24.0, 19.0, 25.0, 14.0, 12.0, 17.0, 13.0, 8.0, 3.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.121912002563477, -18.503585815429688, -17.88526153564453, -17.266935348510742, -16.648609161376953, -16.030284881591797, -15.411958694458008, -14.793633460998535, -14.175308227539062, -13.55698299407959, -12.9386568069458, -12.320331573486328, -11.702006340026855, -11.083681106567383, -10.465354919433594, -9.847029685974121, -9.228703498840332, -8.61037826538086, -7.9920525550842285, -7.373726844787598, -6.755401611328125, -6.137075901031494, -5.518750190734863, -4.900424957275391, -4.28209924697876, -3.663773775100708, -3.0454483032226562, -2.4271225929260254, -1.8087971210479736, -1.1904716491699219, -0.572145938873291, 0.04617929458618164, 0.6645050048828125, 1.2828304767608643, 1.9011560678482056, 2.519481658935547, 3.1378071308135986, 3.7561326026916504, 4.374458312988281, 4.992783546447754, 5.611109256744385, 6.229434967041016, 6.847760200500488, 7.466085910797119, 8.08441162109375, 8.702736854553223, 9.321062088012695, 9.939388275146484, 10.557713508605957, 11.17603874206543, 11.794364929199219, 12.412690162658691, 13.031015396118164, 13.649341583251953, 14.267666816711426, 14.885992050170898, 15.504318237304688, 16.122644424438477, 16.740968704223633, 17.359294891357422, 17.97762107849121, 18.595945358276367, 19.214271545410156, 19.832595825195312, 20.4509220123291]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 6.0, 12.0, 14.0, 10.0, 16.0, 24.0, 24.0, 41.0, 86.0, 93.0, 151.0, 173.0, 293.0, 453.0, 717.0, 1310.0, 2365.0, 5164.0, 12521.0, 37236.0, 161411.0, 3264287.0, 592558.0, 76852.0, 22129.0, 8092.0, 3554.0, 1825.0, 1027.0, 625.0, 365.0, 253.0, 176.0, 119.0, 78.0, 52.0, 55.0, 31.0, 15.0, 20.0, 13.0, 10.0, 5.0, 6.0, 7.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.16015625, -3.060699462890625, -2.96124267578125, -2.861785888671875, -2.7623291015625, -2.662872314453125, -2.56341552734375, -2.463958740234375, -2.364501953125, -2.265045166015625, -2.16558837890625, -2.066131591796875, -1.9666748046875, -1.867218017578125, -1.76776123046875, -1.668304443359375, -1.56884765625, -1.469390869140625, -1.36993408203125, -1.270477294921875, -1.1710205078125, -1.071563720703125, -0.97210693359375, -0.872650146484375, -0.773193359375, -0.673736572265625, -0.57427978515625, -0.474822998046875, -0.3753662109375, -0.275909423828125, -0.17645263671875, -0.076995849609375, 0.0224609375, 0.121917724609375, 0.22137451171875, 0.320831298828125, 0.4202880859375, 0.519744873046875, 0.61920166015625, 0.718658447265625, 0.818115234375, 0.917572021484375, 1.01702880859375, 1.116485595703125, 1.2159423828125, 1.315399169921875, 1.41485595703125, 1.514312744140625, 1.61376953125, 1.713226318359375, 1.81268310546875, 1.912139892578125, 2.0115966796875, 2.111053466796875, 2.21051025390625, 2.309967041015625, 2.409423828125, 2.508880615234375, 2.60833740234375, 2.707794189453125, 2.8072509765625, 2.906707763671875, 3.00616455078125, 3.105621337890625, 3.205078125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 5.0, 6.0, 8.0, 11.0, 11.0, 17.0, 28.0, 17.0, 15.0, 23.0, 33.0, 29.0, 44.0, 39.0, 44.0, 47.0, 46.0, 51.0, 48.0, 40.0, 53.0, 40.0, 50.0, 34.0, 35.0, 24.0, 24.0, 30.0, 22.0, 21.0, 16.0, 18.0, 16.0, 8.0, 9.0, 7.0, 7.0, 6.0, 3.0, 4.0, 3.0, 7.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.58349609375, -0.5645904541015625, -0.545684814453125, -0.5267791748046875, -0.50787353515625, -0.4889678955078125, -0.470062255859375, -0.4511566162109375, -0.4322509765625, -0.4133453369140625, -0.394439697265625, -0.3755340576171875, -0.35662841796875, -0.3377227783203125, -0.318817138671875, -0.2999114990234375, -0.281005859375, -0.2621002197265625, -0.243194580078125, -0.2242889404296875, -0.20538330078125, -0.1864776611328125, -0.167572021484375, -0.1486663818359375, -0.1297607421875, -0.1108551025390625, -0.091949462890625, -0.0730438232421875, -0.05413818359375, -0.0352325439453125, -0.016326904296875, 0.0025787353515625, 0.021484375, 0.0403900146484375, 0.059295654296875, 0.0782012939453125, 0.09710693359375, 0.1160125732421875, 0.134918212890625, 0.1538238525390625, 0.1727294921875, 0.1916351318359375, 0.210540771484375, 0.2294464111328125, 0.24835205078125, 0.2672576904296875, 0.286163330078125, 0.3050689697265625, 0.323974609375, 0.3428802490234375, 0.361785888671875, 0.3806915283203125, 0.39959716796875, 0.4185028076171875, 0.437408447265625, 0.4563140869140625, 0.4752197265625, 0.4941253662109375, 0.513031005859375, 0.5319366455078125, 0.55084228515625, 0.5697479248046875, 0.588653564453125, 0.6075592041015625, 0.62646484375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 3.0, 4.0, 13.0, 4.0, 12.0, 14.0, 20.0, 7.0, 20.0, 14.0, 25.0, 35.0, 42.0, 43.0, 60.0, 73.0, 117.0, 148.0, 231.0, 339.0, 582.0, 1086.0, 2689.0, 9318.0, 60883.0, 3292492.0, 778939.0, 35984.0, 6539.0, 2020.0, 887.0, 511.0, 307.0, 199.0, 139.0, 95.0, 88.0, 53.0, 50.0, 41.0, 29.0, 23.0, 12.0, 15.0, 21.0, 7.0, 12.0, 14.0, 4.0, 5.0, 10.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0], "bins": [-6.72265625, -6.5181884765625, -6.313720703125, -6.1092529296875, -5.90478515625, -5.7003173828125, -5.495849609375, -5.2913818359375, -5.0869140625, -4.8824462890625, -4.677978515625, -4.4735107421875, -4.26904296875, -4.0645751953125, -3.860107421875, -3.6556396484375, -3.451171875, -3.2467041015625, -3.042236328125, -2.8377685546875, -2.63330078125, -2.4288330078125, -2.224365234375, -2.0198974609375, -1.8154296875, -1.6109619140625, -1.406494140625, -1.2020263671875, -0.99755859375, -0.7930908203125, -0.588623046875, -0.3841552734375, -0.1796875, 0.0247802734375, 0.229248046875, 0.4337158203125, 0.63818359375, 0.8426513671875, 1.047119140625, 1.2515869140625, 1.4560546875, 1.6605224609375, 1.864990234375, 2.0694580078125, 2.27392578125, 2.4783935546875, 2.682861328125, 2.8873291015625, 3.091796875, 3.2962646484375, 3.500732421875, 3.7052001953125, 3.90966796875, 4.1141357421875, 4.318603515625, 4.5230712890625, 4.7275390625, 4.9320068359375, 5.136474609375, 5.3409423828125, 5.54541015625, 5.7498779296875, 5.954345703125, 6.1588134765625, 6.36328125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 10.0, 30.0, 42.0, 130.0, 552.0, 2775.0, 390.0, 88.0, 31.0, 15.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.68359375, -5.51348876953125, -5.3433837890625, -5.17327880859375, -5.003173828125, -4.83306884765625, -4.6629638671875, -4.49285888671875, -4.32275390625, -4.15264892578125, -3.9825439453125, -3.81243896484375, -3.642333984375, -3.47222900390625, -3.3021240234375, -3.13201904296875, -2.9619140625, -2.79180908203125, -2.6217041015625, -2.45159912109375, -2.281494140625, -2.11138916015625, -1.9412841796875, -1.77117919921875, -1.60107421875, -1.43096923828125, -1.2608642578125, -1.09075927734375, -0.920654296875, -0.75054931640625, -0.5804443359375, -0.41033935546875, -0.240234375, -0.07012939453125, 0.0999755859375, 0.27008056640625, 0.440185546875, 0.61029052734375, 0.7803955078125, 0.95050048828125, 1.12060546875, 1.29071044921875, 1.4608154296875, 1.63092041015625, 1.801025390625, 1.97113037109375, 2.1412353515625, 2.31134033203125, 2.4814453125, 2.65155029296875, 2.8216552734375, 2.99176025390625, 3.161865234375, 3.33197021484375, 3.5020751953125, 3.67218017578125, 3.84228515625, 4.01239013671875, 4.1824951171875, 4.35260009765625, 4.522705078125, 4.69281005859375, 4.8629150390625, 5.03302001953125, 5.203125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 6.0, 2.0, 7.0, 3.0, 8.0, 7.0, 22.0, 15.0, 22.0, 52.0, 64.0, 69.0, 85.0, 116.0, 115.0, 118.0, 72.0, 58.0, 54.0, 32.0, 27.0, 18.0, 14.0, 8.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-13.988187789916992, -13.596678733825684, -13.205168724060059, -12.81365966796875, -12.422149658203125, -12.030640602111816, -11.639131546020508, -11.247621536254883, -10.856112480163574, -10.464603424072266, -10.07309341430664, -9.681584358215332, -9.290075302124023, -8.898565292358398, -8.50705623626709, -8.115547180175781, -7.724037170410156, -7.3325276374816895, -6.941018104553223, -6.549509048461914, -6.157999515533447, -5.7664899826049805, -5.374980926513672, -4.983471393585205, -4.591961860656738, -4.2004523277282715, -3.808943033218384, -3.417433738708496, -3.0259242057800293, -2.6344146728515625, -2.242905378341675, -1.851396083831787, -1.4598865509033203, -1.068377137184143, -0.6768677234649658, -0.2853583097457886, 0.10615110397338867, 0.4976605176925659, 0.8891699314117432, 1.2806792259216309, 1.6721887588500977, 2.0636982917785645, 2.455207586288452, 2.84671688079834, 3.2382264137268066, 3.6297359466552734, 4.021245002746582, 4.412754535675049, 4.804264068603516, 5.195773601531982, 5.587283134460449, 5.978792190551758, 6.370301723480225, 6.761811256408691, 7.1533203125, 7.544829845428467, 7.936339378356934, 8.327848434448242, 8.719358444213867, 9.110867500305176, 9.502376556396484, 9.89388656616211, 10.285395622253418, 10.676904678344727, 11.068414688110352]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 1.0, 2.0, 8.0, 10.0, 9.0, 8.0, 13.0, 18.0, 14.0, 22.0, 20.0, 19.0, 25.0, 24.0, 30.0, 36.0, 22.0, 49.0, 38.0, 35.0, 44.0, 44.0, 49.0, 37.0, 36.0, 40.0, 43.0, 30.0, 36.0, 23.0, 28.0, 36.0, 26.0, 14.0, 18.0, 18.0, 15.0, 13.0, 7.0, 4.0, 10.0, 6.0, 3.0, 10.0, 3.0, 0.0, 2.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.623883247375488, -7.372845649719238, -7.121808052062988, -6.870770454406738, -6.619732856750488, -6.368695259094238, -6.11765718460083, -5.86661958694458, -5.61558198928833, -5.36454439163208, -5.11350679397583, -4.86246919631958, -4.611431121826172, -4.360393524169922, -4.109355926513672, -3.858318328857422, -3.607280731201172, -3.356243133544922, -3.105205535888672, -2.8541676998138428, -2.6031301021575928, -2.3520925045013428, -2.1010546684265137, -1.8500170707702637, -1.5989794731140137, -1.3479418754577637, -1.0969041585922241, -0.8458665013313293, -0.5948288440704346, -0.34379124641418457, -0.09275352954864502, 0.15828418731689453, 0.4093208312988281, 0.6603584885597229, 0.9113961458206177, 1.1624338626861572, 1.4134714603424072, 1.6645090579986572, 1.9155467748641968, 2.1665844917297363, 2.4176220893859863, 2.6686596870422363, 2.9196972846984863, 3.1707351207733154, 3.4217727184295654, 3.6728103160858154, 3.9238481521606445, 4.1748857498168945, 4.4259233474731445, 4.6769609451293945, 4.9279985427856445, 5.1790361404418945, 5.4300737380981445, 5.6811113357543945, 5.932149410247803, 6.183187007904053, 6.434224605560303, 6.685262203216553, 6.936299800872803, 7.187337398529053, 7.438375473022461, 7.689413070678711, 7.940450668334961, 8.191488265991211, 8.442525863647461]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 4.0, 0.0, 1.0, 4.0, 3.0, 9.0, 10.0, 10.0, 20.0, 30.0, 36.0, 56.0, 90.0, 97.0, 184.0, 295.0, 397.0, 603.0, 871.0, 1311.0, 2135.0, 3395.0, 5772.0, 10103.0, 18158.0, 34473.0, 67679.0, 133636.0, 233656.0, 240235.0, 141545.0, 71689.0, 35958.0, 19213.0, 10837.0, 6051.0, 3619.0, 2256.0, 1414.0, 859.0, 644.0, 388.0, 251.0, 180.0, 122.0, 78.0, 60.0, 34.0, 30.0, 23.0, 14.0, 14.0, 8.0, 0.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.6025390625, -1.5491943359375, -1.495849609375, -1.4425048828125, -1.38916015625, -1.3358154296875, -1.282470703125, -1.2291259765625, -1.17578125, -1.1224365234375, -1.069091796875, -1.0157470703125, -0.96240234375, -0.9090576171875, -0.855712890625, -0.8023681640625, -0.7490234375, -0.6956787109375, -0.642333984375, -0.5889892578125, -0.53564453125, -0.4822998046875, -0.428955078125, -0.3756103515625, -0.322265625, -0.2689208984375, -0.215576171875, -0.1622314453125, -0.10888671875, -0.0555419921875, -0.002197265625, 0.0511474609375, 0.1044921875, 0.1578369140625, 0.211181640625, 0.2645263671875, 0.31787109375, 0.3712158203125, 0.424560546875, 0.4779052734375, 0.53125, 0.5845947265625, 0.637939453125, 0.6912841796875, 0.74462890625, 0.7979736328125, 0.851318359375, 0.9046630859375, 0.9580078125, 1.0113525390625, 1.064697265625, 1.1180419921875, 1.17138671875, 1.2247314453125, 1.278076171875, 1.3314208984375, 1.384765625, 1.4381103515625, 1.491455078125, 1.5447998046875, 1.59814453125, 1.6514892578125, 1.704833984375, 1.7581787109375, 1.8115234375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 7.0, 5.0, 6.0, 14.0, 16.0, 9.0, 22.0, 33.0, 22.0, 34.0, 42.0, 42.0, 45.0, 49.0, 36.0, 41.0, 45.0, 45.0, 42.0, 52.0, 40.0, 47.0, 45.0, 53.0, 27.0, 26.0, 21.0, 27.0, 19.0, 10.0, 12.0, 15.0, 12.0, 10.0, 13.0, 8.0, 3.0, 3.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.85546875, -0.8300399780273438, -0.8046112060546875, -0.7791824340820312, -0.753753662109375, -0.7283248901367188, -0.7028961181640625, -0.6774673461914062, -0.65203857421875, -0.6266098022460938, -0.6011810302734375, -0.5757522583007812, -0.550323486328125, -0.5248947143554688, -0.4994659423828125, -0.47403717041015625, -0.4486083984375, -0.42317962646484375, -0.3977508544921875, -0.37232208251953125, -0.346893310546875, -0.32146453857421875, -0.2960357666015625, -0.27060699462890625, -0.24517822265625, -0.21974945068359375, -0.1943206787109375, -0.16889190673828125, -0.143463134765625, -0.11803436279296875, -0.0926055908203125, -0.06717681884765625, -0.041748046875, -0.01631927490234375, 0.0091094970703125, 0.03453826904296875, 0.059967041015625, 0.08539581298828125, 0.1108245849609375, 0.13625335693359375, 0.16168212890625, 0.18711090087890625, 0.2125396728515625, 0.23796844482421875, 0.263397216796875, 0.28882598876953125, 0.3142547607421875, 0.33968353271484375, 0.3651123046875, 0.39054107666015625, 0.4159698486328125, 0.44139862060546875, 0.466827392578125, 0.49225616455078125, 0.5176849365234375, 0.5431137084960938, 0.56854248046875, 0.5939712524414062, 0.6194000244140625, 0.6448287963867188, 0.670257568359375, 0.6956863403320312, 0.7211151123046875, 0.7465438842773438, 0.77197265625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 6.0, 5.0, 2.0, 8.0, 15.0, 11.0, 21.0, 28.0, 31.0, 44.0, 60.0, 82.0, 120.0, 178.0, 259.0, 346.0, 575.0, 944.0, 1773.0, 3943.0, 13190.0, 74908.0, 612130.0, 291708.0, 34148.0, 7761.0, 2673.0, 1310.0, 752.0, 482.0, 296.0, 214.0, 144.0, 101.0, 68.0, 52.0, 40.0, 44.0, 22.0, 12.0, 15.0, 11.0, 6.0, 3.0, 8.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-5.51953125, -5.345947265625, -5.17236328125, -4.998779296875, -4.8251953125, -4.651611328125, -4.47802734375, -4.304443359375, -4.130859375, -3.957275390625, -3.78369140625, -3.610107421875, -3.4365234375, -3.262939453125, -3.08935546875, -2.915771484375, -2.7421875, -2.568603515625, -2.39501953125, -2.221435546875, -2.0478515625, -1.874267578125, -1.70068359375, -1.527099609375, -1.353515625, -1.179931640625, -1.00634765625, -0.832763671875, -0.6591796875, -0.485595703125, -0.31201171875, -0.138427734375, 0.03515625, 0.208740234375, 0.38232421875, 0.555908203125, 0.7294921875, 0.903076171875, 1.07666015625, 1.250244140625, 1.423828125, 1.597412109375, 1.77099609375, 1.944580078125, 2.1181640625, 2.291748046875, 2.46533203125, 2.638916015625, 2.8125, 2.986083984375, 3.15966796875, 3.333251953125, 3.5068359375, 3.680419921875, 3.85400390625, 4.027587890625, 4.201171875, 4.374755859375, 4.54833984375, 4.721923828125, 4.8955078125, 5.069091796875, 5.24267578125, 5.416259765625, 5.58984375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 5.0, 1.0, 2.0, 2.0, 2.0, 7.0, 10.0, 8.0, 12.0, 6.0, 14.0, 15.0, 24.0, 31.0, 24.0, 38.0, 27.0, 36.0, 31.0, 36.0, 42.0, 53.0, 45.0, 45.0, 41.0, 56.0, 46.0, 53.0, 35.0, 29.0, 39.0, 34.0, 32.0, 17.0, 20.0, 22.0, 15.0, 15.0, 3.0, 3.0, 4.0, 8.0, 7.0, 4.0, 2.0, 4.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5625, -4.4266357421875, -4.290771484375, -4.1549072265625, -4.01904296875, -3.8831787109375, -3.747314453125, -3.6114501953125, -3.4755859375, -3.3397216796875, -3.203857421875, -3.0679931640625, -2.93212890625, -2.7962646484375, -2.660400390625, -2.5245361328125, -2.388671875, -2.2528076171875, -2.116943359375, -1.9810791015625, -1.84521484375, -1.7093505859375, -1.573486328125, -1.4376220703125, -1.3017578125, -1.1658935546875, -1.030029296875, -0.8941650390625, -0.75830078125, -0.6224365234375, -0.486572265625, -0.3507080078125, -0.21484375, -0.0789794921875, 0.056884765625, 0.1927490234375, 0.32861328125, 0.4644775390625, 0.600341796875, 0.7362060546875, 0.8720703125, 1.0079345703125, 1.143798828125, 1.2796630859375, 1.41552734375, 1.5513916015625, 1.687255859375, 1.8231201171875, 1.958984375, 2.0948486328125, 2.230712890625, 2.3665771484375, 2.50244140625, 2.6383056640625, 2.774169921875, 2.9100341796875, 3.0458984375, 3.1817626953125, 3.317626953125, 3.4534912109375, 3.58935546875, 3.7252197265625, 3.861083984375, 3.9969482421875, 4.1328125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 6.0, 11.0, 14.0, 17.0, 17.0, 29.0, 31.0, 43.0, 79.0, 102.0, 149.0, 243.0, 421.0, 719.0, 1397.0, 3045.0, 7301.0, 22651.0, 101635.0, 498763.0, 327246.0, 59088.0, 15185.0, 5235.0, 2353.0, 1127.0, 639.0, 375.0, 212.0, 143.0, 90.0, 64.0, 31.0, 29.0, 21.0, 16.0, 7.0, 9.0, 6.0, 4.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.091796875, -2.0280914306640625, -1.964385986328125, -1.9006805419921875, -1.83697509765625, -1.7732696533203125, -1.709564208984375, -1.6458587646484375, -1.5821533203125, -1.5184478759765625, -1.454742431640625, -1.3910369873046875, -1.32733154296875, -1.2636260986328125, -1.199920654296875, -1.1362152099609375, -1.072509765625, -1.0088043212890625, -0.945098876953125, -0.8813934326171875, -0.81768798828125, -0.7539825439453125, -0.690277099609375, -0.6265716552734375, -0.5628662109375, -0.4991607666015625, -0.435455322265625, -0.3717498779296875, -0.30804443359375, -0.2443389892578125, -0.180633544921875, -0.1169281005859375, -0.05322265625, 0.0104827880859375, 0.074188232421875, 0.1378936767578125, 0.20159912109375, 0.2653045654296875, 0.329010009765625, 0.3927154541015625, 0.4564208984375, 0.5201263427734375, 0.583831787109375, 0.6475372314453125, 0.71124267578125, 0.7749481201171875, 0.838653564453125, 0.9023590087890625, 0.966064453125, 1.0297698974609375, 1.093475341796875, 1.1571807861328125, 1.22088623046875, 1.2845916748046875, 1.348297119140625, 1.4120025634765625, 1.4757080078125, 1.5394134521484375, 1.603118896484375, 1.6668243408203125, 1.73052978515625, 1.7942352294921875, 1.857940673828125, 1.9216461181640625, 1.9853515625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 7.0, 4.0, 16.0, 16.0, 31.0, 41.0, 73.0, 143.0, 165.0, 139.0, 136.0, 88.0, 51.0, 42.0, 15.0, 13.0, 11.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0], "bins": [-0.0010499954223632812, -0.0010276660323143005, -0.0010053366422653198, -0.0009830072522163391, -0.0009606778621673584, -0.0009383484721183777, -0.000916019082069397, -0.0008936896920204163, -0.0008713603019714355, -0.0008490309119224548, -0.0008267015218734741, -0.0008043721318244934, -0.0007820427417755127, -0.000759713351726532, -0.0007373839616775513, -0.0007150545716285706, -0.0006927251815795898, -0.0006703957915306091, -0.0006480664014816284, -0.0006257370114326477, -0.000603407621383667, -0.0005810782313346863, -0.0005587488412857056, -0.0005364194512367249, -0.0005140900611877441, -0.0004917606711387634, -0.0004694312810897827, -0.000447101891040802, -0.0004247725009918213, -0.0004024431109428406, -0.00038011372089385986, -0.00035778433084487915, -0.00033545494079589844, -0.0003131255507469177, -0.000290796160697937, -0.0002684667706489563, -0.0002461373805999756, -0.00022380799055099487, -0.00020147860050201416, -0.00017914921045303345, -0.00015681982040405273, -0.00013449043035507202, -0.00011216104030609131, -8.98316502571106e-05, -6.750226020812988e-05, -4.517287015914917e-05, -2.2843480110168457e-05, -5.140900611877441e-07, 2.181529998779297e-05, 4.414469003677368e-05, 6.64740800857544e-05, 8.880347013473511e-05, 0.00011113286018371582, 0.00013346225023269653, 0.00015579164028167725, 0.00017812103033065796, 0.00020045042037963867, 0.00022277981042861938, 0.0002451092004776001, 0.0002674385905265808, 0.0002897679805755615, 0.00031209737062454224, 0.00033442676067352295, 0.00035675615072250366, 0.0003790855407714844]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 2.0, 4.0, 4.0, 9.0, 5.0, 10.0, 10.0, 19.0, 28.0, 30.0, 41.0, 65.0, 94.0, 125.0, 193.0, 370.0, 664.0, 1450.0, 3424.0, 10779.0, 52051.0, 423520.0, 476197.0, 60251.0, 11994.0, 3787.0, 1622.0, 704.0, 412.0, 229.0, 150.0, 80.0, 69.0, 42.0, 33.0, 22.0, 16.0, 14.0, 10.0, 5.0, 7.0, 2.0, 3.0, 6.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6015625, -2.520355224609375, -2.43914794921875, -2.357940673828125, -2.2767333984375, -2.195526123046875, -2.11431884765625, -2.033111572265625, -1.951904296875, -1.870697021484375, -1.78948974609375, -1.708282470703125, -1.6270751953125, -1.545867919921875, -1.46466064453125, -1.383453369140625, -1.30224609375, -1.221038818359375, -1.13983154296875, -1.058624267578125, -0.9774169921875, -0.896209716796875, -0.81500244140625, -0.733795166015625, -0.652587890625, -0.571380615234375, -0.49017333984375, -0.408966064453125, -0.3277587890625, -0.246551513671875, -0.16534423828125, -0.084136962890625, -0.0029296875, 0.078277587890625, 0.15948486328125, 0.240692138671875, 0.3218994140625, 0.403106689453125, 0.48431396484375, 0.565521240234375, 0.646728515625, 0.727935791015625, 0.80914306640625, 0.890350341796875, 0.9715576171875, 1.052764892578125, 1.13397216796875, 1.215179443359375, 1.29638671875, 1.377593994140625, 1.45880126953125, 1.540008544921875, 1.6212158203125, 1.702423095703125, 1.78363037109375, 1.864837646484375, 1.946044921875, 2.027252197265625, 2.10845947265625, 2.189666748046875, 2.2708740234375, 2.352081298828125, 2.43328857421875, 2.514495849609375, 2.595703125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 8.0, 7.0, 4.0, 10.0, 13.0, 22.0, 26.0, 43.0, 52.0, 55.0, 81.0, 89.0, 73.0, 85.0, 71.0, 72.0, 49.0, 59.0, 38.0, 42.0, 15.0, 21.0, 12.0, 15.0, 10.0, 1.0, 8.0, 6.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.85546875, -1.799468994140625, -1.74346923828125, -1.687469482421875, -1.6314697265625, -1.575469970703125, -1.51947021484375, -1.463470458984375, -1.407470703125, -1.351470947265625, -1.29547119140625, -1.239471435546875, -1.1834716796875, -1.127471923828125, -1.07147216796875, -1.015472412109375, -0.95947265625, -0.903472900390625, -0.84747314453125, -0.791473388671875, -0.7354736328125, -0.679473876953125, -0.62347412109375, -0.567474365234375, -0.511474609375, -0.455474853515625, -0.39947509765625, -0.343475341796875, -0.2874755859375, -0.231475830078125, -0.17547607421875, -0.119476318359375, -0.0634765625, -0.007476806640625, 0.04852294921875, 0.104522705078125, 0.1605224609375, 0.216522216796875, 0.27252197265625, 0.328521728515625, 0.384521484375, 0.440521240234375, 0.49652099609375, 0.552520751953125, 0.6085205078125, 0.664520263671875, 0.72052001953125, 0.776519775390625, 0.83251953125, 0.888519287109375, 0.94451904296875, 1.000518798828125, 1.0565185546875, 1.112518310546875, 1.16851806640625, 1.224517822265625, 1.280517578125, 1.336517333984375, 1.39251708984375, 1.448516845703125, 1.5045166015625, 1.560516357421875, 1.61651611328125, 1.672515869140625, 1.728515625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 8.0, 23.0, 40.0, 51.0, 92.0, 156.0, 148.0, 172.0, 116.0, 75.0, 56.0, 30.0, 17.0, 14.0, 7.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.966819763183594, -46.69770812988281, -45.42859649658203, -44.15948486328125, -42.89037322998047, -41.62126159667969, -40.352149963378906, -39.083038330078125, -37.813926696777344, -36.54481506347656, -35.27570343017578, -34.006591796875, -32.73748016357422, -31.468368530273438, -30.199256896972656, -28.930145263671875, -27.661035537719727, -26.391923904418945, -25.122812271118164, -23.853700637817383, -22.5845890045166, -21.31547737121582, -20.046367645263672, -18.77725601196289, -17.50814437866211, -16.239032745361328, -14.969921112060547, -13.700809478759766, -12.431697845458984, -11.162586212158203, -9.893475532531738, -8.624363899230957, -7.355251312255859, -6.086139678955078, -4.817028045654297, -3.547916889190674, -2.2788052558898926, -1.0096936225891113, 0.2594175338745117, 1.528529167175293, 2.797640800476074, 4.0667524337768555, 5.335864067077637, 6.60497522354126, 7.874086856842041, 9.143198013305664, 10.412309646606445, 11.681421279907227, 12.950532913208008, 14.219644546508789, 15.48875617980957, 16.75786781311035, 18.026979446411133, 19.296091079711914, 20.565200805664062, 21.834312438964844, 23.103424072265625, 24.372535705566406, 25.641647338867188, 26.91075897216797, 28.17987060546875, 29.44898223876953, 30.718093872070312, 31.987205505371094, 33.256317138671875]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 4.0, 4.0, 5.0, 4.0, 7.0, 12.0, 11.0, 12.0, 10.0, 26.0, 30.0, 18.0, 22.0, 30.0, 39.0, 43.0, 33.0, 43.0, 52.0, 68.0, 70.0, 40.0, 50.0, 36.0, 49.0, 35.0, 39.0, 37.0, 24.0, 20.0, 20.0, 16.0, 18.0, 14.0, 12.0, 16.0, 13.0, 11.0, 1.0, 6.0, 5.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.56783676147461, -23.820573806762695, -23.073312759399414, -22.3260498046875, -21.57878875732422, -20.831525802612305, -20.084264755249023, -19.33700180053711, -18.589740753173828, -17.842477798461914, -17.095216751098633, -16.34795379638672, -15.600692749023438, -14.85343074798584, -14.106168746948242, -13.358905792236328, -12.61164379119873, -11.864381790161133, -11.117119789123535, -10.369857788085938, -9.62259578704834, -8.875333786010742, -8.128070831298828, -7.380809307098389, -6.633547306060791, -5.886285305023193, -5.139023303985596, -4.39176082611084, -3.6444990634918213, -2.8972370624542236, -2.149974822998047, -1.4027128219604492, -0.6554508209228516, 0.09181123971939087, 0.8390733003616333, 1.5863354206085205, 2.333597421646118, 3.080859422683716, 3.8281216621398926, 4.57538366317749, 5.322645664215088, 6.0699076652526855, 6.817169666290283, 7.564432144165039, 8.311694145202637, 9.058956146240234, 9.806218147277832, 10.55348014831543, 11.300742149353027, 12.048004150390625, 12.795266151428223, 13.54252815246582, 14.289790153503418, 15.037052154541016, 15.78431510925293, 16.53157615661621, 17.278839111328125, 18.02610206604004, 18.77336311340332, 19.520626068115234, 20.267887115478516, 21.01515007019043, 21.76241111755371, 22.509674072265625, 23.256935119628906]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 3.0, 6.0, 7.0, 6.0, 5.0, 12.0, 19.0, 26.0, 22.0, 26.0, 51.0, 69.0, 79.0, 120.0, 188.0, 404.0, 572.0, 1205.0, 2340.0, 5074.0, 13532.0, 71545.0, 4018309.0, 58714.0, 12347.0, 4761.0, 2193.0, 1046.0, 615.0, 329.0, 189.0, 126.0, 90.0, 52.0, 53.0, 38.0, 31.0, 22.0, 12.0, 12.0, 6.0, 8.0, 8.0, 3.0, 3.0, 1.0, 6.0, 4.0, 0.0, 0.0, 1.0, 2.0], "bins": [-4.98046875, -4.8359375, -4.69140625, -4.546875, -4.40234375, -4.2578125, -4.11328125, -3.96875, -3.82421875, -3.6796875, -3.53515625, -3.390625, -3.24609375, -3.1015625, -2.95703125, -2.8125, -2.66796875, -2.5234375, -2.37890625, -2.234375, -2.08984375, -1.9453125, -1.80078125, -1.65625, -1.51171875, -1.3671875, -1.22265625, -1.078125, -0.93359375, -0.7890625, -0.64453125, -0.5, -0.35546875, -0.2109375, -0.06640625, 0.078125, 0.22265625, 0.3671875, 0.51171875, 0.65625, 0.80078125, 0.9453125, 1.08984375, 1.234375, 1.37890625, 1.5234375, 1.66796875, 1.8125, 1.95703125, 2.1015625, 2.24609375, 2.390625, 2.53515625, 2.6796875, 2.82421875, 2.96875, 3.11328125, 3.2578125, 3.40234375, 3.546875, 3.69140625, 3.8359375, 3.98046875, 4.125, 4.26953125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 6.0, 3.0, 9.0, 15.0, 18.0, 15.0, 24.0, 34.0, 42.0, 40.0, 51.0, 54.0, 55.0, 54.0, 55.0, 61.0, 67.0, 57.0, 58.0, 47.0, 43.0, 31.0, 32.0, 29.0, 26.0, 16.0, 21.0, 11.0, 8.0, 10.0, 6.0, 7.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.138671875, -1.1036376953125, -1.068603515625, -1.0335693359375, -0.99853515625, -0.9635009765625, -0.928466796875, -0.8934326171875, -0.8583984375, -0.8233642578125, -0.788330078125, -0.7532958984375, -0.71826171875, -0.6832275390625, -0.648193359375, -0.6131591796875, -0.578125, -0.5430908203125, -0.508056640625, -0.4730224609375, -0.43798828125, -0.4029541015625, -0.367919921875, -0.3328857421875, -0.2978515625, -0.2628173828125, -0.227783203125, -0.1927490234375, -0.15771484375, -0.1226806640625, -0.087646484375, -0.0526123046875, -0.017578125, 0.0174560546875, 0.052490234375, 0.0875244140625, 0.12255859375, 0.1575927734375, 0.192626953125, 0.2276611328125, 0.2626953125, 0.2977294921875, 0.332763671875, 0.3677978515625, 0.40283203125, 0.4378662109375, 0.472900390625, 0.5079345703125, 0.54296875, 0.5780029296875, 0.613037109375, 0.6480712890625, 0.68310546875, 0.7181396484375, 0.753173828125, 0.7882080078125, 0.8232421875, 0.8582763671875, 0.893310546875, 0.9283447265625, 0.96337890625, 0.9984130859375, 1.033447265625, 1.0684814453125, 1.103515625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 4.0, 10.0, 14.0, 19.0, 23.0, 25.0, 37.0, 50.0, 74.0, 99.0, 114.0, 243.0, 550.0, 1889.0, 16630.0, 4153609.0, 17727.0, 1896.0, 562.0, 226.0, 122.0, 89.0, 76.0, 41.0, 37.0, 25.0, 29.0, 27.0, 11.0, 7.0, 4.0, 9.0, 0.0, 2.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.6484375, -14.1346435546875, -13.620849609375, -13.1070556640625, -12.59326171875, -12.0794677734375, -11.565673828125, -11.0518798828125, -10.5380859375, -10.0242919921875, -9.510498046875, -8.9967041015625, -8.48291015625, -7.9691162109375, -7.455322265625, -6.9415283203125, -6.427734375, -5.9139404296875, -5.400146484375, -4.8863525390625, -4.37255859375, -3.8587646484375, -3.344970703125, -2.8311767578125, -2.3173828125, -1.8035888671875, -1.289794921875, -0.7760009765625, -0.26220703125, 0.2515869140625, 0.765380859375, 1.2791748046875, 1.79296875, 2.3067626953125, 2.820556640625, 3.3343505859375, 3.84814453125, 4.3619384765625, 4.875732421875, 5.3895263671875, 5.9033203125, 6.4171142578125, 6.930908203125, 7.4447021484375, 7.95849609375, 8.4722900390625, 8.986083984375, 9.4998779296875, 10.013671875, 10.5274658203125, 11.041259765625, 11.5550537109375, 12.06884765625, 12.5826416015625, 13.096435546875, 13.6102294921875, 14.1240234375, 14.6378173828125, 15.151611328125, 15.6654052734375, 16.17919921875, 16.6929931640625, 17.206787109375, 17.7205810546875, 18.234375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 5.0, 4.0, 11.0, 14.0, 62.0, 3745.0, 198.0, 31.0, 11.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.58203125, -2.481536865234375, -2.38104248046875, -2.280548095703125, -2.1800537109375, -2.079559326171875, -1.97906494140625, -1.878570556640625, -1.778076171875, -1.677581787109375, -1.57708740234375, -1.476593017578125, -1.3760986328125, -1.275604248046875, -1.17510986328125, -1.074615478515625, -0.97412109375, -0.873626708984375, -0.77313232421875, -0.672637939453125, -0.5721435546875, -0.471649169921875, -0.37115478515625, -0.270660400390625, -0.170166015625, -0.069671630859375, 0.03082275390625, 0.131317138671875, 0.2318115234375, 0.332305908203125, 0.43280029296875, 0.533294677734375, 0.6337890625, 0.734283447265625, 0.83477783203125, 0.935272216796875, 1.0357666015625, 1.136260986328125, 1.23675537109375, 1.337249755859375, 1.437744140625, 1.538238525390625, 1.63873291015625, 1.739227294921875, 1.8397216796875, 1.940216064453125, 2.04071044921875, 2.141204833984375, 2.24169921875, 2.342193603515625, 2.44268798828125, 2.543182373046875, 2.6436767578125, 2.744171142578125, 2.84466552734375, 2.945159912109375, 3.045654296875, 3.146148681640625, 3.24664306640625, 3.347137451171875, 3.4476318359375, 3.548126220703125, 3.64862060546875, 3.749114990234375, 3.849609375]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 5.0, 9.0, 23.0, 29.0, 49.0, 74.0, 135.0, 157.0, 168.0, 131.0, 97.0, 52.0, 24.0, 23.0, 6.0, 8.0, 4.0, 3.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0812177658081055, -4.885937213897705, -4.690656661987305, -4.495375633239746, -4.300095081329346, -4.104814529418945, -3.909533977508545, -3.7142531871795654, -3.518972396850586, -3.3236918449401855, -3.128411054611206, -2.9331305027008057, -2.737849712371826, -2.542569160461426, -2.3472886085510254, -2.152007818222046, -1.9567272663116455, -1.7614465951919556, -1.5661659240722656, -1.3708853721618652, -1.1756045818328857, -0.9803239703178406, -0.7850433588027954, -0.5897626876831055, -0.3944820165634155, -0.19920136034488678, -0.003920704126358032, 0.19135993719100952, 0.38664060831069946, 0.5819212794303894, 0.7772018909454346, 0.9724825620651245, 1.1677632331848145, 1.3630439043045044, 1.5583245754241943, 1.7536051273345947, 1.9488859176635742, 2.1441664695739746, 2.339447021484375, 2.5347278118133545, 2.730008602142334, 2.9252891540527344, 3.120569944381714, 3.3158504962921143, 3.5111312866210938, 3.706411838531494, 3.9016923904418945, 4.096973419189453, 4.292253494262695, 4.487534046173096, 4.682814598083496, 4.878095626831055, 5.073376178741455, 5.2686567306518555, 5.463937282562256, 5.659217834472656, 5.854498863220215, 6.049779415130615, 6.245059967041016, 6.440340995788574, 6.635621547698975, 6.830902099609375, 7.026182651519775, 7.221463203430176, 7.416744232177734]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 5.0, 7.0, 8.0, 6.0, 16.0, 7.0, 12.0, 19.0, 30.0, 25.0, 26.0, 25.0, 27.0, 31.0, 47.0, 32.0, 28.0, 45.0, 47.0, 35.0, 41.0, 41.0, 32.0, 45.0, 47.0, 30.0, 32.0, 21.0, 36.0, 26.0, 21.0, 19.0, 27.0, 11.0, 10.0, 20.0, 10.0, 10.0, 14.0, 8.0, 5.0, 6.0, 5.0, 7.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-2.757889986038208, -2.6786556243896484, -2.599421262741089, -2.52018666267395, -2.4409523010253906, -2.361717939376831, -2.2824835777282715, -2.203249216079712, -2.1240148544311523, -2.0447804927825928, -1.9655460119247437, -1.886311650276184, -1.807077169418335, -1.7278428077697754, -1.6486084461212158, -1.5693740844726562, -1.4901394844055176, -1.410905122756958, -1.3316706418991089, -1.2524362802505493, -1.1732017993927002, -1.0939674377441406, -1.014733076095581, -0.9354986548423767, -0.8562642335891724, -0.777029812335968, -0.6977953910827637, -0.6185610294342041, -0.5393266081809998, -0.4600921869277954, -0.38085779547691345, -0.3016234040260315, -0.22238874435424805, -0.1431543380022049, -0.06391993165016174, 0.015314474701881409, 0.09454888105392456, 0.1737833023071289, 0.25301769375801086, 0.3322520852088928, 0.41148650646209717, 0.4907209277153015, 0.5699553489685059, 0.6491897106170654, 0.7284241318702698, 0.8076585531234741, 0.8868929147720337, 0.966127336025238, 1.0453617572784424, 1.124596118927002, 1.203830599784851, 1.2830649614334106, 1.3622994422912598, 1.4415338039398193, 1.520768165588379, 1.6000025272369385, 1.6792370080947876, 1.7584713697433472, 1.8377058506011963, 1.9169402122497559, 1.9961745738983154, 2.075408935546875, 2.1546435356140137, 2.2338778972625732, 2.313112258911133]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 4.0, 0.0, 2.0, 6.0, 4.0, 11.0, 17.0, 20.0, 32.0, 52.0, 57.0, 115.0, 152.0, 230.0, 378.0, 650.0, 1117.0, 1809.0, 3340.0, 6482.0, 12868.0, 26653.0, 59480.0, 141172.0, 297525.0, 273348.0, 123079.0, 51667.0, 23828.0, 11269.0, 5824.0, 3090.0, 1717.0, 970.0, 610.0, 347.0, 217.0, 118.0, 106.0, 60.0, 44.0, 30.0, 20.0, 14.0, 10.0, 6.0, 11.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.181640625, -2.106201171875, -2.03076171875, -1.955322265625, -1.8798828125, -1.804443359375, -1.72900390625, -1.653564453125, -1.578125, -1.502685546875, -1.42724609375, -1.351806640625, -1.2763671875, -1.200927734375, -1.12548828125, -1.050048828125, -0.974609375, -0.899169921875, -0.82373046875, -0.748291015625, -0.6728515625, -0.597412109375, -0.52197265625, -0.446533203125, -0.37109375, -0.295654296875, -0.22021484375, -0.144775390625, -0.0693359375, 0.006103515625, 0.08154296875, 0.156982421875, 0.232421875, 0.307861328125, 0.38330078125, 0.458740234375, 0.5341796875, 0.609619140625, 0.68505859375, 0.760498046875, 0.8359375, 0.911376953125, 0.98681640625, 1.062255859375, 1.1376953125, 1.213134765625, 1.28857421875, 1.364013671875, 1.439453125, 1.514892578125, 1.59033203125, 1.665771484375, 1.7412109375, 1.816650390625, 1.89208984375, 1.967529296875, 2.04296875, 2.118408203125, 2.19384765625, 2.269287109375, 2.3447265625, 2.420166015625, 2.49560546875, 2.571044921875, 2.646484375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 4.0, 6.0, 6.0, 10.0, 8.0, 10.0, 14.0, 12.0, 19.0, 19.0, 29.0, 24.0, 31.0, 40.0, 42.0, 37.0, 47.0, 50.0, 43.0, 50.0, 55.0, 52.0, 43.0, 48.0, 48.0, 33.0, 26.0, 21.0, 36.0, 23.0, 15.0, 16.0, 13.0, 18.0, 8.0, 12.0, 7.0, 6.0, 5.0, 3.0, 5.0, 1.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.94921875, -0.916351318359375, -0.88348388671875, -0.850616455078125, -0.8177490234375, -0.784881591796875, -0.75201416015625, -0.719146728515625, -0.686279296875, -0.653411865234375, -0.62054443359375, -0.587677001953125, -0.5548095703125, -0.521942138671875, -0.48907470703125, -0.456207275390625, -0.42333984375, -0.390472412109375, -0.35760498046875, -0.324737548828125, -0.2918701171875, -0.259002685546875, -0.22613525390625, -0.193267822265625, -0.160400390625, -0.127532958984375, -0.09466552734375, -0.061798095703125, -0.0289306640625, 0.003936767578125, 0.03680419921875, 0.069671630859375, 0.1025390625, 0.135406494140625, 0.16827392578125, 0.201141357421875, 0.2340087890625, 0.266876220703125, 0.29974365234375, 0.332611083984375, 0.365478515625, 0.398345947265625, 0.43121337890625, 0.464080810546875, 0.4969482421875, 0.529815673828125, 0.56268310546875, 0.595550537109375, 0.62841796875, 0.661285400390625, 0.69415283203125, 0.727020263671875, 0.7598876953125, 0.792755126953125, 0.82562255859375, 0.858489990234375, 0.891357421875, 0.924224853515625, 0.95709228515625, 0.989959716796875, 1.0228271484375, 1.055694580078125, 1.08856201171875, 1.121429443359375, 1.154296875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 10.0, 5.0, 5.0, 8.0, 13.0, 16.0, 15.0, 25.0, 21.0, 38.0, 52.0, 65.0, 80.0, 113.0, 113.0, 173.0, 269.0, 346.0, 522.0, 824.0, 1358.0, 2834.0, 6937.0, 23660.0, 131535.0, 651259.0, 182301.0, 30242.0, 8201.0, 3184.0, 1497.0, 867.0, 540.0, 384.0, 280.0, 174.0, 131.0, 111.0, 86.0, 68.0, 49.0, 33.0, 24.0, 24.0, 16.0, 15.0, 6.0, 8.0, 7.0, 7.0, 5.0, 3.0, 3.0, 2.0, 1.0], "bins": [-5.83984375, -5.67095947265625, -5.5020751953125, -5.33319091796875, -5.164306640625, -4.99542236328125, -4.8265380859375, -4.65765380859375, -4.48876953125, -4.31988525390625, -4.1510009765625, -3.98211669921875, -3.813232421875, -3.64434814453125, -3.4754638671875, -3.30657958984375, -3.1376953125, -2.96881103515625, -2.7999267578125, -2.63104248046875, -2.462158203125, -2.29327392578125, -2.1243896484375, -1.95550537109375, -1.78662109375, -1.61773681640625, -1.4488525390625, -1.27996826171875, -1.111083984375, -0.94219970703125, -0.7733154296875, -0.60443115234375, -0.435546875, -0.26666259765625, -0.0977783203125, 0.07110595703125, 0.239990234375, 0.40887451171875, 0.5777587890625, 0.74664306640625, 0.91552734375, 1.08441162109375, 1.2532958984375, 1.42218017578125, 1.591064453125, 1.75994873046875, 1.9288330078125, 2.09771728515625, 2.2666015625, 2.43548583984375, 2.6043701171875, 2.77325439453125, 2.942138671875, 3.11102294921875, 3.2799072265625, 3.44879150390625, 3.61767578125, 3.78656005859375, 3.9554443359375, 4.12432861328125, 4.293212890625, 4.46209716796875, 4.6309814453125, 4.79986572265625, 4.96875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 4.0, 7.0, 7.0, 6.0, 10.0, 15.0, 21.0, 20.0, 19.0, 24.0, 32.0, 25.0, 42.0, 44.0, 55.0, 45.0, 46.0, 50.0, 48.0, 47.0, 43.0, 30.0, 44.0, 49.0, 36.0, 24.0, 38.0, 25.0, 25.0, 23.0, 12.0, 22.0, 17.0, 7.0, 7.0, 7.0, 8.0, 2.0, 7.0, 0.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.32421875, -5.1402587890625, -4.956298828125, -4.7723388671875, -4.58837890625, -4.4044189453125, -4.220458984375, -4.0364990234375, -3.8525390625, -3.6685791015625, -3.484619140625, -3.3006591796875, -3.11669921875, -2.9327392578125, -2.748779296875, -2.5648193359375, -2.380859375, -2.1968994140625, -2.012939453125, -1.8289794921875, -1.64501953125, -1.4610595703125, -1.277099609375, -1.0931396484375, -0.9091796875, -0.7252197265625, -0.541259765625, -0.3572998046875, -0.17333984375, 0.0106201171875, 0.194580078125, 0.3785400390625, 0.5625, 0.7464599609375, 0.930419921875, 1.1143798828125, 1.29833984375, 1.4822998046875, 1.666259765625, 1.8502197265625, 2.0341796875, 2.2181396484375, 2.402099609375, 2.5860595703125, 2.77001953125, 2.9539794921875, 3.137939453125, 3.3218994140625, 3.505859375, 3.6898193359375, 3.873779296875, 4.0577392578125, 4.24169921875, 4.4256591796875, 4.609619140625, 4.7935791015625, 4.9775390625, 5.1614990234375, 5.345458984375, 5.5294189453125, 5.71337890625, 5.8973388671875, 6.081298828125, 6.2652587890625, 6.44921875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 3.0, 7.0, 5.0, 7.0, 8.0, 23.0, 25.0, 30.0, 45.0, 48.0, 86.0, 126.0, 224.0, 393.0, 646.0, 1232.0, 2560.0, 5686.0, 15380.0, 65084.0, 471466.0, 404412.0, 56560.0, 14093.0, 5236.0, 2402.0, 1144.0, 620.0, 362.0, 221.0, 145.0, 90.0, 52.0, 37.0, 23.0, 11.0, 14.0, 14.0, 9.0, 5.0, 4.0, 3.0, 2.0, 3.0, 1.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.34375, -2.270416259765625, -2.19708251953125, -2.123748779296875, -2.0504150390625, -1.977081298828125, -1.90374755859375, -1.830413818359375, -1.757080078125, -1.683746337890625, -1.61041259765625, -1.537078857421875, -1.4637451171875, -1.390411376953125, -1.31707763671875, -1.243743896484375, -1.17041015625, -1.097076416015625, -1.02374267578125, -0.950408935546875, -0.8770751953125, -0.803741455078125, -0.73040771484375, -0.657073974609375, -0.583740234375, -0.510406494140625, -0.43707275390625, -0.363739013671875, -0.2904052734375, -0.217071533203125, -0.14373779296875, -0.070404052734375, 0.0029296875, 0.076263427734375, 0.14959716796875, 0.222930908203125, 0.2962646484375, 0.369598388671875, 0.44293212890625, 0.516265869140625, 0.589599609375, 0.662933349609375, 0.73626708984375, 0.809600830078125, 0.8829345703125, 0.956268310546875, 1.02960205078125, 1.102935791015625, 1.17626953125, 1.249603271484375, 1.32293701171875, 1.396270751953125, 1.4696044921875, 1.542938232421875, 1.61627197265625, 1.689605712890625, 1.762939453125, 1.836273193359375, 1.90960693359375, 1.982940673828125, 2.0562744140625, 2.129608154296875, 2.20294189453125, 2.276275634765625, 2.349609375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 4.0, 5.0, 11.0, 16.0, 25.0, 34.0, 71.0, 122.0, 188.0, 172.0, 136.0, 98.0, 46.0, 31.0, 7.0, 11.0, 5.0, 6.0, 6.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007476806640625, -0.0007229968905448914, -0.0006983131170272827, -0.0006736293435096741, -0.0006489455699920654, -0.0006242617964744568, -0.0005995780229568481, -0.0005748942494392395, -0.0005502104759216309, -0.0005255267024040222, -0.0005008429288864136, -0.00047615915536880493, -0.0004514753818511963, -0.00042679160833358765, -0.000402107834815979, -0.00037742406129837036, -0.0003527402877807617, -0.0003280565142631531, -0.00030337274074554443, -0.0002786889672279358, -0.00025400519371032715, -0.0002293214201927185, -0.00020463764667510986, -0.00017995387315750122, -0.00015527009963989258, -0.00013058632612228394, -0.00010590255260467529, -8.121877908706665e-05, -5.653500556945801e-05, -3.1851232051849365e-05, -7.167458534240723e-06, 1.751631498336792e-05, 4.220008850097656e-05, 6.68838620185852e-05, 9.156763553619385e-05, 0.00011625140905380249, 0.00014093518257141113, 0.00016561895608901978, 0.00019030272960662842, 0.00021498650312423706, 0.0002396702766418457, 0.00026435405015945435, 0.000289037823677063, 0.00031372159719467163, 0.0003384053707122803, 0.0003630891442298889, 0.00038777291774749756, 0.0004124566912651062, 0.00043714046478271484, 0.0004618242383003235, 0.00048650801181793213, 0.0005111917853355408, 0.0005358755588531494, 0.0005605593323707581, 0.0005852431058883667, 0.0006099268794059753, 0.000634610652923584, 0.0006592944264411926, 0.0006839781999588013, 0.0007086619734764099, 0.0007333457469940186, 0.0007580295205116272, 0.0007827132940292358, 0.0008073970675468445, 0.0008320808410644531]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 4.0, 5.0, 9.0, 15.0, 33.0, 46.0, 63.0, 125.0, 217.0, 453.0, 954.0, 2788.0, 13010.0, 177479.0, 789238.0, 53967.0, 6852.0, 1824.0, 706.0, 327.0, 184.0, 108.0, 65.0, 23.0, 27.0, 12.0, 7.0, 5.0, 4.0, 1.0, 1.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.701171875, -3.579071044921875, -3.45697021484375, -3.334869384765625, -3.2127685546875, -3.090667724609375, -2.96856689453125, -2.846466064453125, -2.724365234375, -2.602264404296875, -2.48016357421875, -2.358062744140625, -2.2359619140625, -2.113861083984375, -1.99176025390625, -1.869659423828125, -1.74755859375, -1.625457763671875, -1.50335693359375, -1.381256103515625, -1.2591552734375, -1.137054443359375, -1.01495361328125, -0.892852783203125, -0.770751953125, -0.648651123046875, -0.52655029296875, -0.404449462890625, -0.2823486328125, -0.160247802734375, -0.03814697265625, 0.083953857421875, 0.2060546875, 0.328155517578125, 0.45025634765625, 0.572357177734375, 0.6944580078125, 0.816558837890625, 0.93865966796875, 1.060760498046875, 1.182861328125, 1.304962158203125, 1.42706298828125, 1.549163818359375, 1.6712646484375, 1.793365478515625, 1.91546630859375, 2.037567138671875, 2.15966796875, 2.281768798828125, 2.40386962890625, 2.525970458984375, 2.6480712890625, 2.770172119140625, 2.89227294921875, 3.014373779296875, 3.136474609375, 3.258575439453125, 3.38067626953125, 3.502777099609375, 3.6248779296875, 3.746978759765625, 3.86907958984375, 3.991180419921875, 4.11328125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 10.0, 10.0, 10.0, 19.0, 19.0, 18.0, 39.0, 48.0, 53.0, 88.0, 75.0, 90.0, 101.0, 86.0, 77.0, 60.0, 47.0, 31.0, 37.0, 21.0, 14.0, 9.0, 12.0, 3.0, 6.0, 10.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7353515625, -1.6604461669921875, -1.585540771484375, -1.5106353759765625, -1.43572998046875, -1.3608245849609375, -1.285919189453125, -1.2110137939453125, -1.1361083984375, -1.0612030029296875, -0.986297607421875, -0.9113922119140625, -0.83648681640625, -0.7615814208984375, -0.686676025390625, -0.6117706298828125, -0.536865234375, -0.4619598388671875, -0.387054443359375, -0.3121490478515625, -0.23724365234375, -0.1623382568359375, -0.087432861328125, -0.0125274658203125, 0.0623779296875, 0.1372833251953125, 0.212188720703125, 0.2870941162109375, 0.36199951171875, 0.4369049072265625, 0.511810302734375, 0.5867156982421875, 0.66162109375, 0.7365264892578125, 0.811431884765625, 0.8863372802734375, 0.96124267578125, 1.0361480712890625, 1.111053466796875, 1.1859588623046875, 1.2608642578125, 1.3357696533203125, 1.410675048828125, 1.4855804443359375, 1.56048583984375, 1.6353912353515625, 1.710296630859375, 1.7852020263671875, 1.860107421875, 1.9350128173828125, 2.009918212890625, 2.0848236083984375, 2.15972900390625, 2.2346343994140625, 2.309539794921875, 2.3844451904296875, 2.4593505859375, 2.5342559814453125, 2.609161376953125, 2.6840667724609375, 2.75897216796875, 2.8338775634765625, 2.908782958984375, 2.9836883544921875, 3.05859375]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 10.0, 18.0, 67.0, 151.0, 298.0, 296.0, 118.0, 36.0, 13.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.30361557006836, -59.33602523803711, -56.36843490600586, -53.400848388671875, -50.433258056640625, -47.465667724609375, -44.498077392578125, -41.530487060546875, -38.562896728515625, -35.595306396484375, -32.627716064453125, -29.660127639770508, -26.692537307739258, -23.724946975708008, -20.75735855102539, -17.78976821899414, -14.82217788696289, -11.85458755493164, -8.886998176574707, -5.919408798217773, -2.9518184661865234, 0.015771865844726562, 2.9833602905273438, 5.950950622558594, 8.918540954589844, 11.886131286621094, 14.853720664978027, 17.82131004333496, 20.78890037536621, 23.75649070739746, 26.724079132080078, 29.691669464111328, 32.65925598144531, 35.62684631347656, 38.59443664550781, 41.56202697753906, 44.52961730957031, 47.49720764160156, 50.46479415893555, 53.4323844909668, 56.39997482299805, 59.3675651550293, 62.33515548706055, 65.30274200439453, 68.27033233642578, 71.23792266845703, 74.20551300048828, 77.17310333251953, 80.14069366455078, 83.10828399658203, 86.07587432861328, 89.04346466064453, 92.01105499267578, 94.97864532470703, 97.94622802734375, 100.913818359375, 103.88140869140625, 106.8489990234375, 109.81658935546875, 112.7841796875, 115.75177001953125, 118.7193603515625, 121.68695068359375, 124.654541015625, 127.62213134765625]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 3.0, 4.0, 1.0, 2.0, 10.0, 5.0, 12.0, 15.0, 19.0, 22.0, 22.0, 22.0, 28.0, 29.0, 37.0, 41.0, 32.0, 41.0, 48.0, 51.0, 47.0, 55.0, 41.0, 50.0, 43.0, 39.0, 39.0, 36.0, 25.0, 24.0, 20.0, 28.0, 16.0, 19.0, 17.0, 14.0, 6.0, 8.0, 3.0, 12.0, 4.0, 3.0, 4.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-28.79395294189453, -27.920385360717773, -27.046817779541016, -26.17325210571289, -25.299684524536133, -24.426116943359375, -23.552549362182617, -22.67898178100586, -21.805416107177734, -20.931848526000977, -20.05828094482422, -19.184715270996094, -18.311147689819336, -17.437580108642578, -16.56401252746582, -15.690444946289062, -14.816877365112305, -13.943309783935547, -13.069743156433105, -12.196175575256348, -11.322608947753906, -10.449041366577148, -9.57547378540039, -8.701906204223633, -7.828339576721191, -6.954772472381592, -6.081205368041992, -5.207637786865234, -4.334070682525635, -3.460503578186035, -2.5869359970092773, -1.7133688926696777, -0.8398036956787109, 0.03376352787017822, 0.9073307514190674, 1.780898094177246, 2.6544651985168457, 3.5280323028564453, 4.401599884033203, 5.275166988372803, 6.148734092712402, 7.022301197052002, 7.895868301391602, 8.76943588256836, 9.643003463745117, 10.516570091247559, 11.390137672424316, 12.263704299926758, 13.137271881103516, 14.010839462280273, 14.884406089782715, 15.757973670959473, 16.631540298461914, 17.505107879638672, 18.37867546081543, 19.252243041992188, 20.125808715820312, 20.99937629699707, 21.872943878173828, 22.746509552001953, 23.62007713317871, 24.49364471435547, 25.367212295532227, 26.240779876708984, 27.114347457885742]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 6.0, 6.0, 9.0, 10.0, 9.0, 18.0, 23.0, 26.0, 35.0, 39.0, 50.0, 80.0, 91.0, 129.0, 167.0, 266.0, 420.0, 723.0, 1412.0, 3587.0, 12503.0, 181411.0, 3963912.0, 20343.0, 4724.0, 1820.0, 872.0, 516.0, 308.0, 183.0, 135.0, 92.0, 81.0, 53.0, 50.0, 43.0, 27.0, 18.0, 18.0, 14.0, 11.0, 14.0, 5.0, 5.0, 5.0, 6.0, 1.0, 5.0, 1.0, 3.0, 2.0, 3.0], "bins": [-7.30078125, -7.0869140625, -6.873046875, -6.6591796875, -6.4453125, -6.2314453125, -6.017578125, -5.8037109375, -5.58984375, -5.3759765625, -5.162109375, -4.9482421875, -4.734375, -4.5205078125, -4.306640625, -4.0927734375, -3.87890625, -3.6650390625, -3.451171875, -3.2373046875, -3.0234375, -2.8095703125, -2.595703125, -2.3818359375, -2.16796875, -1.9541015625, -1.740234375, -1.5263671875, -1.3125, -1.0986328125, -0.884765625, -0.6708984375, -0.45703125, -0.2431640625, -0.029296875, 0.1845703125, 0.3984375, 0.6123046875, 0.826171875, 1.0400390625, 1.25390625, 1.4677734375, 1.681640625, 1.8955078125, 2.109375, 2.3232421875, 2.537109375, 2.7509765625, 2.96484375, 3.1787109375, 3.392578125, 3.6064453125, 3.8203125, 4.0341796875, 4.248046875, 4.4619140625, 4.67578125, 4.8896484375, 5.103515625, 5.3173828125, 5.53125, 5.7451171875, 5.958984375, 6.1728515625, 6.38671875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 4.0, 11.0, 15.0, 15.0, 20.0, 40.0, 23.0, 42.0, 55.0, 49.0, 76.0, 63.0, 65.0, 78.0, 69.0, 81.0, 56.0, 42.0, 41.0, 32.0, 26.0, 21.0, 25.0, 13.0, 7.0, 11.0, 7.0, 7.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.77734375, -1.7282257080078125, -1.679107666015625, -1.6299896240234375, -1.58087158203125, -1.5317535400390625, -1.482635498046875, -1.4335174560546875, -1.3843994140625, -1.3352813720703125, -1.286163330078125, -1.2370452880859375, -1.18792724609375, -1.1388092041015625, -1.089691162109375, -1.0405731201171875, -0.991455078125, -0.9423370361328125, -0.893218994140625, -0.8441009521484375, -0.79498291015625, -0.7458648681640625, -0.696746826171875, -0.6476287841796875, -0.5985107421875, -0.5493927001953125, -0.500274658203125, -0.4511566162109375, -0.40203857421875, -0.3529205322265625, -0.303802490234375, -0.2546844482421875, -0.20556640625, -0.1564483642578125, -0.107330322265625, -0.0582122802734375, -0.00909423828125, 0.0400238037109375, 0.089141845703125, 0.1382598876953125, 0.1873779296875, 0.2364959716796875, 0.285614013671875, 0.3347320556640625, 0.38385009765625, 0.4329681396484375, 0.482086181640625, 0.5312042236328125, 0.580322265625, 0.6294403076171875, 0.678558349609375, 0.7276763916015625, 0.77679443359375, 0.8259124755859375, 0.875030517578125, 0.9241485595703125, 0.9732666015625, 1.0223846435546875, 1.071502685546875, 1.1206207275390625, 1.16973876953125, 1.2188568115234375, 1.267974853515625, 1.3170928955078125, 1.3662109375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 6.0, 5.0, 4.0, 2.0, 13.0, 9.0, 14.0, 29.0, 14.0, 36.0, 22.0, 37.0, 43.0, 68.0, 77.0, 102.0, 165.0, 254.0, 560.0, 1179.0, 3311.0, 13290.0, 3795873.0, 363195.0, 10640.0, 2917.0, 1104.0, 477.0, 238.0, 150.0, 95.0, 69.0, 54.0, 40.0, 48.0, 35.0, 32.0, 17.0, 17.0, 12.0, 5.0, 6.0, 10.0, 4.0, 2.0, 6.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.796875, -9.5164794921875, -9.236083984375, -8.9556884765625, -8.67529296875, -8.3948974609375, -8.114501953125, -7.8341064453125, -7.5537109375, -7.2733154296875, -6.992919921875, -6.7125244140625, -6.43212890625, -6.1517333984375, -5.871337890625, -5.5909423828125, -5.310546875, -5.0301513671875, -4.749755859375, -4.4693603515625, -4.18896484375, -3.9085693359375, -3.628173828125, -3.3477783203125, -3.0673828125, -2.7869873046875, -2.506591796875, -2.2261962890625, -1.94580078125, -1.6654052734375, -1.385009765625, -1.1046142578125, -0.82421875, -0.5438232421875, -0.263427734375, 0.0169677734375, 0.29736328125, 0.5777587890625, 0.858154296875, 1.1385498046875, 1.4189453125, 1.6993408203125, 1.979736328125, 2.2601318359375, 2.54052734375, 2.8209228515625, 3.101318359375, 3.3817138671875, 3.662109375, 3.9425048828125, 4.222900390625, 4.5032958984375, 4.78369140625, 5.0640869140625, 5.344482421875, 5.6248779296875, 5.9052734375, 6.1856689453125, 6.466064453125, 6.7464599609375, 7.02685546875, 7.3072509765625, 7.587646484375, 7.8680419921875, 8.1484375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 5.0, 8.0, 6.0, 17.0, 82.0, 3595.0, 307.0, 40.0, 12.0, 6.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.73828125, -4.6369781494140625, -4.535675048828125, -4.4343719482421875, -4.33306884765625, -4.2317657470703125, -4.130462646484375, -4.0291595458984375, -3.9278564453125, -3.8265533447265625, -3.725250244140625, -3.6239471435546875, -3.52264404296875, -3.4213409423828125, -3.320037841796875, -3.2187347412109375, -3.117431640625, -3.0161285400390625, -2.914825439453125, -2.8135223388671875, -2.71221923828125, -2.6109161376953125, -2.509613037109375, -2.4083099365234375, -2.3070068359375, -2.2057037353515625, -2.104400634765625, -2.0030975341796875, -1.90179443359375, -1.8004913330078125, -1.699188232421875, -1.5978851318359375, -1.49658203125, -1.3952789306640625, -1.293975830078125, -1.1926727294921875, -1.09136962890625, -0.9900665283203125, -0.888763427734375, -0.7874603271484375, -0.6861572265625, -0.5848541259765625, -0.483551025390625, -0.3822479248046875, -0.28094482421875, -0.1796417236328125, -0.078338623046875, 0.0229644775390625, 0.124267578125, 0.2255706787109375, 0.326873779296875, 0.4281768798828125, 0.52947998046875, 0.6307830810546875, 0.732086181640625, 0.8333892822265625, 0.9346923828125, 1.0359954833984375, 1.137298583984375, 1.2386016845703125, 1.33990478515625, 1.4412078857421875, 1.542510986328125, 1.6438140869140625, 1.7451171875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 11.0, 17.0, 24.0, 37.0, 62.0, 101.0, 137.0, 170.0, 159.0, 105.0, 72.0, 44.0, 23.0, 19.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.453943252563477, -7.235770225524902, -7.017597198486328, -6.799424171447754, -6.58125114440918, -6.3630781173706055, -6.144905090332031, -5.926731586456299, -5.708558559417725, -5.49038553237915, -5.272212505340576, -5.054039478302002, -4.835866451263428, -4.617692947387695, -4.399519920349121, -4.181346893310547, -3.9631741046905518, -3.7450010776519775, -3.5268280506134033, -3.30865478515625, -3.090481758117676, -2.8723087310791016, -2.6541357040405273, -2.435962677001953, -2.217789649963379, -1.9996166229248047, -1.781443476676941, -1.5632704496383667, -1.345097303390503, -1.1269242763519287, -0.9087512493133545, -0.6905781030654907, -0.47240495681762695, -0.25423187017440796, -0.03605881333351135, 0.18211424350738525, 0.40028733015060425, 0.6184604167938232, 0.8366334438323975, 1.0548065900802612, 1.2729796171188354, 1.4911526441574097, 1.7093257904052734, 1.9274988174438477, 2.145671844482422, 2.363844871520996, 2.5820178985595703, 2.8001911640167236, 3.018364191055298, 3.236537218093872, 3.4547102451324463, 3.6728835105895996, 3.891056537628174, 4.109229564666748, 4.327402591705322, 4.5455756187438965, 4.763748645782471, 4.981921672821045, 5.200094699859619, 5.418267726898193, 5.636440753936768, 5.8546142578125, 6.072787284851074, 6.290960311889648, 6.509133338928223]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 4.0, 1.0, 5.0, 8.0, 7.0, 13.0, 22.0, 15.0, 16.0, 15.0, 24.0, 33.0, 17.0, 40.0, 22.0, 35.0, 41.0, 51.0, 29.0, 36.0, 54.0, 41.0, 49.0, 54.0, 39.0, 36.0, 40.0, 26.0, 34.0, 28.0, 17.0, 26.0, 16.0, 10.0, 14.0, 14.0, 9.0, 11.0, 15.0, 7.0, 8.0, 5.0, 7.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.5316474437713623, -3.425902843475342, -3.320158004760742, -3.2144134044647217, -3.108668804168701, -3.0029239654541016, -2.897179365158081, -2.7914347648620605, -2.685689926147461, -2.5799453258514404, -2.474200487136841, -2.3684558868408203, -2.2627110481262207, -2.1569664478302, -2.0512218475341797, -1.9454771280288696, -1.8397324085235596, -1.7339876890182495, -1.6282429695129395, -1.522498369216919, -1.4167536497116089, -1.3110089302062988, -1.2052643299102783, -1.0995196104049683, -0.9937748908996582, -0.8880301713943481, -0.7822855114936829, -0.6765408515930176, -0.5707961320877075, -0.46505141258239746, -0.3593067526817322, -0.2535620927810669, -0.14781761169433594, -0.04207292199134827, 0.0636717677116394, 0.16941645741462708, 0.27516114711761475, 0.3809058666229248, 0.4866505265235901, 0.5923951864242554, 0.6981399059295654, 0.8038846254348755, 0.9096292853355408, 1.015373945236206, 1.1211186647415161, 1.2268633842468262, 1.3326079845428467, 1.4383527040481567, 1.5440974235534668, 1.6498421430587769, 1.755586862564087, 1.8613314628601074, 1.9670761823654175, 2.0728209018707275, 2.178565502166748, 2.2843103408813477, 2.390054941177368, 2.4957995414733887, 2.6015443801879883, 2.707288980484009, 2.8130335807800293, 2.918778419494629, 3.0245230197906494, 3.13026762008667, 3.2360124588012695]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 9.0, 14.0, 19.0, 28.0, 42.0, 57.0, 123.0, 211.0, 358.0, 640.0, 1371.0, 2554.0, 5651.0, 12539.0, 30668.0, 85512.0, 268921.0, 403931.0, 150538.0, 49772.0, 19427.0, 8379.0, 3891.0, 1909.0, 949.0, 474.0, 258.0, 129.0, 81.0, 35.0, 27.0, 9.0, 15.0, 6.0, 7.0, 6.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.33984375, -2.24334716796875, -2.1468505859375, -2.05035400390625, -1.953857421875, -1.85736083984375, -1.7608642578125, -1.66436767578125, -1.56787109375, -1.47137451171875, -1.3748779296875, -1.27838134765625, -1.181884765625, -1.08538818359375, -0.9888916015625, -0.89239501953125, -0.7958984375, -0.69940185546875, -0.6029052734375, -0.50640869140625, -0.409912109375, -0.31341552734375, -0.2169189453125, -0.12042236328125, -0.02392578125, 0.07257080078125, 0.1690673828125, 0.26556396484375, 0.362060546875, 0.45855712890625, 0.5550537109375, 0.65155029296875, 0.748046875, 0.84454345703125, 0.9410400390625, 1.03753662109375, 1.134033203125, 1.23052978515625, 1.3270263671875, 1.42352294921875, 1.52001953125, 1.61651611328125, 1.7130126953125, 1.80950927734375, 1.906005859375, 2.00250244140625, 2.0989990234375, 2.19549560546875, 2.2919921875, 2.38848876953125, 2.4849853515625, 2.58148193359375, 2.677978515625, 2.77447509765625, 2.8709716796875, 2.96746826171875, 3.06396484375, 3.16046142578125, 3.2569580078125, 3.35345458984375, 3.449951171875, 3.54644775390625, 3.6429443359375, 3.73944091796875, 3.8359375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 4.0, 5.0, 5.0, 9.0, 15.0, 29.0, 29.0, 36.0, 56.0, 69.0, 61.0, 69.0, 79.0, 76.0, 71.0, 70.0, 68.0, 54.0, 57.0, 35.0, 28.0, 16.0, 22.0, 10.0, 10.0, 6.0, 3.0, 5.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.265625, -2.2052154541015625, -2.144805908203125, -2.0843963623046875, -2.02398681640625, -1.9635772705078125, -1.903167724609375, -1.8427581787109375, -1.7823486328125, -1.7219390869140625, -1.661529541015625, -1.6011199951171875, -1.54071044921875, -1.4803009033203125, -1.419891357421875, -1.3594818115234375, -1.299072265625, -1.2386627197265625, -1.178253173828125, -1.1178436279296875, -1.05743408203125, -0.9970245361328125, -0.936614990234375, -0.8762054443359375, -0.8157958984375, -0.7553863525390625, -0.694976806640625, -0.6345672607421875, -0.57415771484375, -0.5137481689453125, -0.453338623046875, -0.3929290771484375, -0.33251953125, -0.2721099853515625, -0.211700439453125, -0.1512908935546875, -0.09088134765625, -0.0304718017578125, 0.029937744140625, 0.0903472900390625, 0.1507568359375, 0.2111663818359375, 0.271575927734375, 0.3319854736328125, 0.39239501953125, 0.4528045654296875, 0.513214111328125, 0.5736236572265625, 0.634033203125, 0.6944427490234375, 0.754852294921875, 0.8152618408203125, 0.87567138671875, 0.9360809326171875, 0.996490478515625, 1.0569000244140625, 1.1173095703125, 1.1777191162109375, 1.238128662109375, 1.2985382080078125, 1.35894775390625, 1.4193572998046875, 1.479766845703125, 1.5401763916015625, 1.6005859375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 9.0, 4.0, 5.0, 7.0, 22.0, 21.0, 41.0, 66.0, 84.0, 186.0, 342.0, 727.0, 1978.0, 14792.0, 847407.0, 174972.0, 5483.0, 1294.0, 536.0, 242.0, 128.0, 74.0, 56.0, 26.0, 16.0, 16.0, 10.0, 6.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.8984375, -12.5052490234375, -12.112060546875, -11.7188720703125, -11.32568359375, -10.9324951171875, -10.539306640625, -10.1461181640625, -9.7529296875, -9.3597412109375, -8.966552734375, -8.5733642578125, -8.18017578125, -7.7869873046875, -7.393798828125, -7.0006103515625, -6.607421875, -6.2142333984375, -5.821044921875, -5.4278564453125, -5.03466796875, -4.6414794921875, -4.248291015625, -3.8551025390625, -3.4619140625, -3.0687255859375, -2.675537109375, -2.2823486328125, -1.88916015625, -1.4959716796875, -1.102783203125, -0.7095947265625, -0.31640625, 0.0767822265625, 0.469970703125, 0.8631591796875, 1.25634765625, 1.6495361328125, 2.042724609375, 2.4359130859375, 2.8291015625, 3.2222900390625, 3.615478515625, 4.0086669921875, 4.40185546875, 4.7950439453125, 5.188232421875, 5.5814208984375, 5.974609375, 6.3677978515625, 6.760986328125, 7.1541748046875, 7.54736328125, 7.9405517578125, 8.333740234375, 8.7269287109375, 9.1201171875, 9.5133056640625, 9.906494140625, 10.2996826171875, 10.69287109375, 11.0860595703125, 11.479248046875, 11.8724365234375, 12.265625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 3.0, 3.0, 4.0, 10.0, 10.0, 14.0, 11.0, 9.0, 20.0, 14.0, 27.0, 19.0, 35.0, 22.0, 34.0, 36.0, 36.0, 31.0, 33.0, 46.0, 46.0, 57.0, 43.0, 42.0, 47.0, 38.0, 39.0, 43.0, 33.0, 34.0, 19.0, 24.0, 14.0, 18.0, 14.0, 12.0, 13.0, 12.0, 5.0, 9.0, 6.0, 6.0, 1.0, 3.0, 1.0, 1.0, 4.0, 0.0, 1.0, 4.0, 2.0], "bins": [-6.34765625, -6.16265869140625, -5.9776611328125, -5.79266357421875, -5.607666015625, -5.42266845703125, -5.2376708984375, -5.05267333984375, -4.86767578125, -4.68267822265625, -4.4976806640625, -4.31268310546875, -4.127685546875, -3.94268798828125, -3.7576904296875, -3.57269287109375, -3.3876953125, -3.20269775390625, -3.0177001953125, -2.83270263671875, -2.647705078125, -2.46270751953125, -2.2777099609375, -2.09271240234375, -1.90771484375, -1.72271728515625, -1.5377197265625, -1.35272216796875, -1.167724609375, -0.98272705078125, -0.7977294921875, -0.61273193359375, -0.427734375, -0.24273681640625, -0.0577392578125, 0.12725830078125, 0.312255859375, 0.49725341796875, 0.6822509765625, 0.86724853515625, 1.05224609375, 1.23724365234375, 1.4222412109375, 1.60723876953125, 1.792236328125, 1.97723388671875, 2.1622314453125, 2.34722900390625, 2.5322265625, 2.71722412109375, 2.9022216796875, 3.08721923828125, 3.272216796875, 3.45721435546875, 3.6422119140625, 3.82720947265625, 4.01220703125, 4.19720458984375, 4.3822021484375, 4.56719970703125, 4.752197265625, 4.93719482421875, 5.1221923828125, 5.30718994140625, 5.4921875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 10.0, 4.0, 3.0, 8.0, 8.0, 18.0, 17.0, 31.0, 60.0, 104.0, 250.0, 573.0, 1661.0, 8798.0, 179251.0, 821960.0, 30629.0, 3544.0, 908.0, 323.0, 174.0, 84.0, 55.0, 40.0, 11.0, 10.0, 4.0, 4.0, 3.0, 5.0, 1.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.68359375, -4.557861328125, -4.43212890625, -4.306396484375, -4.1806640625, -4.054931640625, -3.92919921875, -3.803466796875, -3.677734375, -3.552001953125, -3.42626953125, -3.300537109375, -3.1748046875, -3.049072265625, -2.92333984375, -2.797607421875, -2.671875, -2.546142578125, -2.42041015625, -2.294677734375, -2.1689453125, -2.043212890625, -1.91748046875, -1.791748046875, -1.666015625, -1.540283203125, -1.41455078125, -1.288818359375, -1.1630859375, -1.037353515625, -0.91162109375, -0.785888671875, -0.66015625, -0.534423828125, -0.40869140625, -0.282958984375, -0.1572265625, -0.031494140625, 0.09423828125, 0.219970703125, 0.345703125, 0.471435546875, 0.59716796875, 0.722900390625, 0.8486328125, 0.974365234375, 1.10009765625, 1.225830078125, 1.3515625, 1.477294921875, 1.60302734375, 1.728759765625, 1.8544921875, 1.980224609375, 2.10595703125, 2.231689453125, 2.357421875, 2.483154296875, 2.60888671875, 2.734619140625, 2.8603515625, 2.986083984375, 3.11181640625, 3.237548828125, 3.36328125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 8.0, 10.0, 11.0, 14.0, 11.0, 22.0, 31.0, 30.0, 36.0, 57.0, 56.0, 87.0, 100.0, 93.0, 73.0, 77.0, 59.0, 54.0, 46.0, 26.0, 32.0, 15.0, 14.0, 9.0, 10.0, 5.0, 4.0, 7.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00029158592224121094, -0.00028128549456596375, -0.00027098506689071655, -0.00026068463921546936, -0.00025038421154022217, -0.00024008378386497498, -0.00022978335618972778, -0.0002194829285144806, -0.0002091825008392334, -0.0001988820731639862, -0.00018858164548873901, -0.00017828121781349182, -0.00016798079013824463, -0.00015768036246299744, -0.00014737993478775024, -0.00013707950711250305, -0.00012677907943725586, -0.00011647865176200867, -0.00010617822408676147, -9.587779641151428e-05, -8.557736873626709e-05, -7.52769410610199e-05, -6.49765133857727e-05, -5.467608571052551e-05, -4.437565803527832e-05, -3.407523036003113e-05, -2.3774802684783936e-05, -1.3474375009536743e-05, -3.1739473342895508e-06, 7.126480340957642e-06, 1.7426908016204834e-05, 2.7727335691452026e-05, 3.802776336669922e-05, 4.832819104194641e-05, 5.8628618717193604e-05, 6.89290463924408e-05, 7.922947406768799e-05, 8.952990174293518e-05, 9.983032941818237e-05, 0.00011013075709342957, 0.00012043118476867676, 0.00013073161244392395, 0.00014103204011917114, 0.00015133246779441833, 0.00016163289546966553, 0.00017193332314491272, 0.0001822337508201599, 0.0001925341784954071, 0.0002028346061706543, 0.0002131350338459015, 0.00022343546152114868, 0.00023373588919639587, 0.00024403631687164307, 0.00025433674454689026, 0.00026463717222213745, 0.00027493759989738464, 0.00028523802757263184, 0.00029553845524787903, 0.0003058388829231262, 0.0003161393105983734, 0.0003264397382736206, 0.0003367401659488678, 0.000347040593624115, 0.0003573410212993622, 0.0003676414489746094]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 7.0, 7.0, 15.0, 17.0, 24.0, 42.0, 79.0, 129.0, 233.0, 747.0, 4555.0, 138312.0, 887275.0, 14739.0, 1551.0, 430.0, 154.0, 96.0, 61.0, 31.0, 16.0, 16.0, 10.0, 2.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.10546875, -4.91796875, -4.73046875, -4.54296875, -4.35546875, -4.16796875, -3.98046875, -3.79296875, -3.60546875, -3.41796875, -3.23046875, -3.04296875, -2.85546875, -2.66796875, -2.48046875, -2.29296875, -2.10546875, -1.91796875, -1.73046875, -1.54296875, -1.35546875, -1.16796875, -0.98046875, -0.79296875, -0.60546875, -0.41796875, -0.23046875, -0.04296875, 0.14453125, 0.33203125, 0.51953125, 0.70703125, 0.89453125, 1.08203125, 1.26953125, 1.45703125, 1.64453125, 1.83203125, 2.01953125, 2.20703125, 2.39453125, 2.58203125, 2.76953125, 2.95703125, 3.14453125, 3.33203125, 3.51953125, 3.70703125, 3.89453125, 4.08203125, 4.26953125, 4.45703125, 4.64453125, 4.83203125, 5.01953125, 5.20703125, 5.39453125, 5.58203125, 5.76953125, 5.95703125, 6.14453125, 6.33203125, 6.51953125, 6.70703125, 6.89453125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 4.0, 2.0, 3.0, 12.0, 6.0, 15.0, 20.0, 36.0, 63.0, 63.0, 101.0, 94.0, 107.0, 91.0, 104.0, 80.0, 59.0, 50.0, 26.0, 23.0, 12.0, 7.0, 6.0, 2.0, 8.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.068359375, -1.990570068359375, -1.91278076171875, -1.834991455078125, -1.7572021484375, -1.679412841796875, -1.60162353515625, -1.523834228515625, -1.446044921875, -1.368255615234375, -1.29046630859375, -1.212677001953125, -1.1348876953125, -1.057098388671875, -0.97930908203125, -0.901519775390625, -0.82373046875, -0.745941162109375, -0.66815185546875, -0.590362548828125, -0.5125732421875, -0.434783935546875, -0.35699462890625, -0.279205322265625, -0.201416015625, -0.123626708984375, -0.04583740234375, 0.031951904296875, 0.1097412109375, 0.187530517578125, 0.26531982421875, 0.343109130859375, 0.4208984375, 0.498687744140625, 0.57647705078125, 0.654266357421875, 0.7320556640625, 0.809844970703125, 0.88763427734375, 0.965423583984375, 1.043212890625, 1.121002197265625, 1.19879150390625, 1.276580810546875, 1.3543701171875, 1.432159423828125, 1.50994873046875, 1.587738037109375, 1.66552734375, 1.743316650390625, 1.82110595703125, 1.898895263671875, 1.9766845703125, 2.054473876953125, 2.13226318359375, 2.210052490234375, 2.287841796875, 2.365631103515625, 2.44342041015625, 2.521209716796875, 2.5989990234375, 2.676788330078125, 2.75457763671875, 2.832366943359375, 2.91015625]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 6.0, 10.0, 24.0, 50.0, 179.0, 299.0, 249.0, 125.0, 40.0, 17.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.280296325683594, -50.846221923828125, -48.41215133666992, -45.97807693481445, -43.54400634765625, -41.10993194580078, -38.67585754394531, -36.241783142089844, -33.80771255493164, -31.373640060424805, -28.93956756591797, -26.5054931640625, -24.071420669555664, -21.637348175048828, -19.20327377319336, -16.769201278686523, -14.335128784179688, -11.901056289672852, -9.4669828414917, -7.032909870147705, -4.598836898803711, -2.164764404296875, 0.26930904388427734, 2.7033824920654297, 5.137454986572266, 7.57152795791626, 10.005600929260254, 12.439674377441406, 14.873746871948242, 17.307819366455078, 19.741893768310547, 22.175966262817383, 24.610031127929688, 27.044103622436523, 29.47817611694336, 31.912250518798828, 34.34632110595703, 36.7803955078125, 39.21446990966797, 41.64854431152344, 44.08261489868164, 46.51668930053711, 48.95075988769531, 51.38483428955078, 53.81890869140625, 56.25297927856445, 58.68705368041992, 61.121124267578125, 63.555198669433594, 65.98927307128906, 68.42334747314453, 70.85741424560547, 73.29148864746094, 75.7255630493164, 78.15963745117188, 80.59371185302734, 83.02778625488281, 85.46186065673828, 87.89593505859375, 90.33000183105469, 92.76407623291016, 95.19815063476562, 97.6322250366211, 100.06629943847656, 102.5003662109375]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 5.0, 7.0, 9.0, 13.0, 19.0, 26.0, 26.0, 20.0, 52.0, 64.0, 43.0, 53.0, 71.0, 65.0, 57.0, 76.0, 60.0, 65.0, 42.0, 55.0, 40.0, 27.0, 18.0, 18.0, 16.0, 8.0, 14.0, 11.0, 4.0, 5.0, 3.0, 4.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.59623718261719, -42.42603302001953, -41.255828857421875, -40.08562088012695, -38.9154167175293, -37.74521255493164, -36.575008392333984, -35.40480422973633, -34.234596252441406, -33.06439208984375, -31.89418601989746, -30.723981857299805, -29.553775787353516, -28.38357162475586, -27.213367462158203, -26.043163299560547, -24.87295913696289, -23.702754974365234, -22.532548904418945, -21.36234474182129, -20.192138671875, -19.021934509277344, -17.851730346679688, -16.68152618408203, -15.511320114135742, -14.34111499786377, -13.170909881591797, -12.00070571899414, -10.830500602722168, -9.660295486450195, -8.490091323852539, -7.319886207580566, -6.149684906005859, -4.979479789733887, -3.8092751502990723, -2.6390702724456787, -1.4688653945922852, -0.2986602783203125, 0.871544361114502, 2.0417490005493164, 3.211954116821289, 4.382159233093262, 5.552363872528076, 6.722568511962891, 7.892773628234863, 9.062978744506836, 10.233182907104492, 11.403388023376465, 12.573593139648438, 13.74379825592041, 14.914003372192383, 16.08420753479004, 17.254413604736328, 18.424617767333984, 19.59482192993164, 20.765026092529297, 21.935232162475586, 23.105436325073242, 24.27564239501953, 25.445846557617188, 26.616050720214844, 27.786256790161133, 28.95646095275879, 30.126667022705078, 31.296871185302734]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 4.0, 6.0, 8.0, 9.0, 11.0, 27.0, 28.0, 32.0, 56.0, 74.0, 110.0, 130.0, 165.0, 254.0, 388.0, 561.0, 992.0, 2000.0, 4952.0, 18660.0, 4075774.0, 73817.0, 9349.0, 3108.0, 1396.0, 761.0, 463.0, 300.0, 243.0, 162.0, 105.0, 86.0, 66.0, 34.0, 39.0, 35.0, 17.0, 19.0, 9.0, 8.0, 7.0, 8.0, 5.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.17578125, -6.949951171875, -6.72412109375, -6.498291015625, -6.2724609375, -6.046630859375, -5.82080078125, -5.594970703125, -5.369140625, -5.143310546875, -4.91748046875, -4.691650390625, -4.4658203125, -4.239990234375, -4.01416015625, -3.788330078125, -3.5625, -3.336669921875, -3.11083984375, -2.885009765625, -2.6591796875, -2.433349609375, -2.20751953125, -1.981689453125, -1.755859375, -1.530029296875, -1.30419921875, -1.078369140625, -0.8525390625, -0.626708984375, -0.40087890625, -0.175048828125, 0.05078125, 0.276611328125, 0.50244140625, 0.728271484375, 0.9541015625, 1.179931640625, 1.40576171875, 1.631591796875, 1.857421875, 2.083251953125, 2.30908203125, 2.534912109375, 2.7607421875, 2.986572265625, 3.21240234375, 3.438232421875, 3.6640625, 3.889892578125, 4.11572265625, 4.341552734375, 4.5673828125, 4.793212890625, 5.01904296875, 5.244873046875, 5.470703125, 5.696533203125, 5.92236328125, 6.148193359375, 6.3740234375, 6.599853515625, 6.82568359375, 7.051513671875, 7.27734375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 1.0, 2.0, 10.0, 11.0, 21.0, 21.0, 22.0, 44.0, 46.0, 64.0, 68.0, 73.0, 80.0, 73.0, 81.0, 59.0, 62.0, 57.0, 37.0, 43.0, 30.0, 24.0, 20.0, 19.0, 8.0, 8.0, 3.0, 4.0, 2.0, 3.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7236328125, -1.6636505126953125, -1.603668212890625, -1.5436859130859375, -1.48370361328125, -1.4237213134765625, -1.363739013671875, -1.3037567138671875, -1.2437744140625, -1.1837921142578125, -1.123809814453125, -1.0638275146484375, -1.00384521484375, -0.9438629150390625, -0.883880615234375, -0.8238983154296875, -0.763916015625, -0.7039337158203125, -0.643951416015625, -0.5839691162109375, -0.52398681640625, -0.4640045166015625, -0.404022216796875, -0.3440399169921875, -0.2840576171875, -0.2240753173828125, -0.164093017578125, -0.1041107177734375, -0.04412841796875, 0.0158538818359375, 0.075836181640625, 0.1358184814453125, 0.19580078125, 0.2557830810546875, 0.315765380859375, 0.3757476806640625, 0.43572998046875, 0.4957122802734375, 0.555694580078125, 0.6156768798828125, 0.6756591796875, 0.7356414794921875, 0.795623779296875, 0.8556060791015625, 0.91558837890625, 0.9755706787109375, 1.035552978515625, 1.0955352783203125, 1.155517578125, 1.2154998779296875, 1.275482177734375, 1.3354644775390625, 1.39544677734375, 1.4554290771484375, 1.515411376953125, 1.5753936767578125, 1.6353759765625, 1.6953582763671875, 1.755340576171875, 1.8153228759765625, 1.87530517578125, 1.9352874755859375, 1.995269775390625, 2.0552520751953125, 2.115234375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 3.0, 7.0, 12.0, 14.0, 17.0, 13.0, 34.0, 32.0, 40.0, 65.0, 86.0, 124.0, 203.0, 315.0, 631.0, 1318.0, 3541.0, 13872.0, 4103535.0, 59394.0, 6636.0, 2168.0, 948.0, 459.0, 263.0, 171.0, 101.0, 86.0, 64.0, 37.0, 26.0, 25.0, 14.0, 7.0, 6.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.8125, -10.482421875, -10.15234375, -9.822265625, -9.4921875, -9.162109375, -8.83203125, -8.501953125, -8.171875, -7.841796875, -7.51171875, -7.181640625, -6.8515625, -6.521484375, -6.19140625, -5.861328125, -5.53125, -5.201171875, -4.87109375, -4.541015625, -4.2109375, -3.880859375, -3.55078125, -3.220703125, -2.890625, -2.560546875, -2.23046875, -1.900390625, -1.5703125, -1.240234375, -0.91015625, -0.580078125, -0.25, 0.080078125, 0.41015625, 0.740234375, 1.0703125, 1.400390625, 1.73046875, 2.060546875, 2.390625, 2.720703125, 3.05078125, 3.380859375, 3.7109375, 4.041015625, 4.37109375, 4.701171875, 5.03125, 5.361328125, 5.69140625, 6.021484375, 6.3515625, 6.681640625, 7.01171875, 7.341796875, 7.671875, 8.001953125, 8.33203125, 8.662109375, 8.9921875, 9.322265625, 9.65234375, 9.982421875, 10.3125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 3.0, 5.0, 13.0, 48.0, 3747.0, 208.0, 27.0, 15.0, 5.0, 5.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.689453125, -3.58038330078125, -3.4713134765625, -3.36224365234375, -3.253173828125, -3.14410400390625, -3.0350341796875, -2.92596435546875, -2.81689453125, -2.70782470703125, -2.5987548828125, -2.48968505859375, -2.380615234375, -2.27154541015625, -2.1624755859375, -2.05340576171875, -1.9443359375, -1.83526611328125, -1.7261962890625, -1.61712646484375, -1.508056640625, -1.39898681640625, -1.2899169921875, -1.18084716796875, -1.07177734375, -0.96270751953125, -0.8536376953125, -0.74456787109375, -0.635498046875, -0.52642822265625, -0.4173583984375, -0.30828857421875, -0.19921875, -0.09014892578125, 0.0189208984375, 0.12799072265625, 0.237060546875, 0.34613037109375, 0.4552001953125, 0.56427001953125, 0.67333984375, 0.78240966796875, 0.8914794921875, 1.00054931640625, 1.109619140625, 1.21868896484375, 1.3277587890625, 1.43682861328125, 1.5458984375, 1.65496826171875, 1.7640380859375, 1.87310791015625, 1.982177734375, 2.09124755859375, 2.2003173828125, 2.30938720703125, 2.41845703125, 2.52752685546875, 2.6365966796875, 2.74566650390625, 2.854736328125, 2.96380615234375, 3.0728759765625, 3.18194580078125, 3.291015625]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 6.0, 10.0, 11.0, 16.0, 34.0, 58.0, 88.0, 112.0, 143.0, 132.0, 144.0, 78.0, 63.0, 45.0, 24.0, 12.0, 10.0, 5.0, 5.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-7.5110344886779785, -7.3282294273376465, -7.1454243659973145, -6.962619304656982, -6.77981424331665, -6.597009181976318, -6.414204120635986, -6.231399059295654, -6.048593997955322, -5.86578893661499, -5.682983875274658, -5.500178813934326, -5.317373752593994, -5.134568691253662, -4.95176362991333, -4.768958568572998, -4.586153507232666, -4.403348445892334, -4.220543384552002, -4.03773832321167, -3.854933261871338, -3.672128200531006, -3.489323139190674, -3.306518077850342, -3.1237130165100098, -2.9409079551696777, -2.7581028938293457, -2.5752978324890137, -2.3924927711486816, -2.2096877098083496, -2.0268826484680176, -1.8440775871276855, -1.6612720489501953, -1.4784669876098633, -1.2956619262695312, -1.1128568649291992, -0.9300518035888672, -0.7472467422485352, -0.5644416809082031, -0.3816366195678711, -0.19883155822753906, -0.01602649688720703, 0.166778564453125, 0.34958362579345703, 0.5323886871337891, 0.7151937484741211, 0.8979988098144531, 1.0808038711547852, 1.2636089324951172, 1.4464139938354492, 1.6292190551757812, 1.8120241165161133, 1.9948291778564453, 2.1776342391967773, 2.3604393005371094, 2.5432443618774414, 2.7260494232177734, 2.9088544845581055, 3.0916595458984375, 3.2744646072387695, 3.4572696685791016, 3.6400747299194336, 3.8228797912597656, 4.005684852600098, 4.18848991394043]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 5.0, 5.0, 3.0, 8.0, 10.0, 11.0, 14.0, 16.0, 20.0, 15.0, 17.0, 18.0, 28.0, 26.0, 33.0, 33.0, 31.0, 49.0, 52.0, 30.0, 48.0, 40.0, 44.0, 35.0, 42.0, 39.0, 30.0, 42.0, 36.0, 31.0, 41.0, 19.0, 19.0, 16.0, 7.0, 20.0, 14.0, 14.0, 7.0, 7.0, 7.0, 7.0, 6.0, 4.0, 5.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-3.013434648513794, -2.918721914291382, -2.824009418487549, -2.7292966842651367, -2.6345839500427246, -2.5398712158203125, -2.4451584815979004, -2.3504459857940674, -2.2557332515716553, -2.161020517349243, -2.06630802154541, -1.971595287322998, -1.876882553100586, -1.7821698188781738, -1.6874572038650513, -1.5927445888519287, -1.4980318546295166, -1.4033191204071045, -1.308606505393982, -1.2138938903808594, -1.1191811561584473, -1.0244684219360352, -0.9297558069229126, -0.8350431323051453, -0.7403304576873779, -0.6456177830696106, -0.5509051084518433, -0.4561924338340759, -0.3614797592163086, -0.26676708459854126, -0.17205440998077393, -0.07734173536300659, 0.017370939254760742, 0.11208361387252808, 0.2067962884902954, 0.30150896310806274, 0.3962216377258301, 0.4909343123435974, 0.5856469869613647, 0.6803596615791321, 0.7750723361968994, 0.8697850108146667, 0.9644976854324341, 1.0592103004455566, 1.1539230346679688, 1.2486357688903809, 1.3433483839035034, 1.438060998916626, 1.532773733139038, 1.6274864673614502, 1.7221990823745728, 1.8169116973876953, 1.9116244316101074, 2.0063371658325195, 2.1010499000549316, 2.1957623958587646, 2.2904751300811768, 2.385187864303589, 2.479900360107422, 2.574613094329834, 2.669325828552246, 2.764038562774658, 2.8587512969970703, 2.9534637928009033, 3.0481765270233154]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 9.0, 10.0, 10.0, 18.0, 29.0, 28.0, 48.0, 74.0, 115.0, 161.0, 239.0, 402.0, 698.0, 1229.0, 2298.0, 4528.0, 9365.0, 20661.0, 49789.0, 126629.0, 335840.0, 303693.0, 112100.0, 44349.0, 18582.0, 8451.0, 4118.0, 2135.0, 1173.0, 698.0, 370.0, 254.0, 137.0, 87.0, 68.0, 36.0, 35.0, 25.0, 18.0, 14.0, 9.0, 6.0, 4.0, 0.0, 1.0, 2.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.31640625, -2.236358642578125, -2.15631103515625, -2.076263427734375, -1.9962158203125, -1.916168212890625, -1.83612060546875, -1.756072998046875, -1.676025390625, -1.595977783203125, -1.51593017578125, -1.435882568359375, -1.3558349609375, -1.275787353515625, -1.19573974609375, -1.115692138671875, -1.03564453125, -0.955596923828125, -0.87554931640625, -0.795501708984375, -0.7154541015625, -0.635406494140625, -0.55535888671875, -0.475311279296875, -0.395263671875, -0.315216064453125, -0.23516845703125, -0.155120849609375, -0.0750732421875, 0.004974365234375, 0.08502197265625, 0.165069580078125, 0.2451171875, 0.325164794921875, 0.40521240234375, 0.485260009765625, 0.5653076171875, 0.645355224609375, 0.72540283203125, 0.805450439453125, 0.885498046875, 0.965545654296875, 1.04559326171875, 1.125640869140625, 1.2056884765625, 1.285736083984375, 1.36578369140625, 1.445831298828125, 1.52587890625, 1.605926513671875, 1.68597412109375, 1.766021728515625, 1.8460693359375, 1.926116943359375, 2.00616455078125, 2.086212158203125, 2.166259765625, 2.246307373046875, 2.32635498046875, 2.406402587890625, 2.4864501953125, 2.566497802734375, 2.64654541015625, 2.726593017578125, 2.806640625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 2.0, 6.0, 7.0, 11.0, 10.0, 27.0, 24.0, 30.0, 34.0, 49.0, 48.0, 69.0, 71.0, 61.0, 65.0, 68.0, 57.0, 57.0, 51.0, 49.0, 34.0, 39.0, 27.0, 17.0, 29.0, 10.0, 11.0, 9.0, 12.0, 4.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7412109375, -1.684906005859375, -1.62860107421875, -1.572296142578125, -1.5159912109375, -1.459686279296875, -1.40338134765625, -1.347076416015625, -1.290771484375, -1.234466552734375, -1.17816162109375, -1.121856689453125, -1.0655517578125, -1.009246826171875, -0.95294189453125, -0.896636962890625, -0.84033203125, -0.784027099609375, -0.72772216796875, -0.671417236328125, -0.6151123046875, -0.558807373046875, -0.50250244140625, -0.446197509765625, -0.389892578125, -0.333587646484375, -0.27728271484375, -0.220977783203125, -0.1646728515625, -0.108367919921875, -0.05206298828125, 0.004241943359375, 0.060546875, 0.116851806640625, 0.17315673828125, 0.229461669921875, 0.2857666015625, 0.342071533203125, 0.39837646484375, 0.454681396484375, 0.510986328125, 0.567291259765625, 0.62359619140625, 0.679901123046875, 0.7362060546875, 0.792510986328125, 0.84881591796875, 0.905120849609375, 0.96142578125, 1.017730712890625, 1.07403564453125, 1.130340576171875, 1.1866455078125, 1.242950439453125, 1.29925537109375, 1.355560302734375, 1.411865234375, 1.468170166015625, 1.52447509765625, 1.580780029296875, 1.6370849609375, 1.693389892578125, 1.74969482421875, 1.805999755859375, 1.8623046875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 3.0, 7.0, 8.0, 19.0, 20.0, 31.0, 34.0, 49.0, 82.0, 98.0, 168.0, 266.0, 434.0, 678.0, 1403.0, 3913.0, 21468.0, 371259.0, 610269.0, 29943.0, 4732.0, 1584.0, 769.0, 424.0, 296.0, 199.0, 126.0, 81.0, 52.0, 40.0, 27.0, 28.0, 14.0, 7.0, 9.0, 3.0, 4.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.2109375, -7.01104736328125, -6.8111572265625, -6.61126708984375, -6.411376953125, -6.21148681640625, -6.0115966796875, -5.81170654296875, -5.61181640625, -5.41192626953125, -5.2120361328125, -5.01214599609375, -4.812255859375, -4.61236572265625, -4.4124755859375, -4.21258544921875, -4.0126953125, -3.81280517578125, -3.6129150390625, -3.41302490234375, -3.213134765625, -3.01324462890625, -2.8133544921875, -2.61346435546875, -2.41357421875, -2.21368408203125, -2.0137939453125, -1.81390380859375, -1.614013671875, -1.41412353515625, -1.2142333984375, -1.01434326171875, -0.814453125, -0.61456298828125, -0.4146728515625, -0.21478271484375, -0.014892578125, 0.18499755859375, 0.3848876953125, 0.58477783203125, 0.78466796875, 0.98455810546875, 1.1844482421875, 1.38433837890625, 1.584228515625, 1.78411865234375, 1.9840087890625, 2.18389892578125, 2.3837890625, 2.58367919921875, 2.7835693359375, 2.98345947265625, 3.183349609375, 3.38323974609375, 3.5831298828125, 3.78302001953125, 3.98291015625, 4.18280029296875, 4.3826904296875, 4.58258056640625, 4.782470703125, 4.98236083984375, 5.1822509765625, 5.38214111328125, 5.58203125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 4.0, 3.0, 1.0, 6.0, 6.0, 9.0, 7.0, 10.0, 17.0, 11.0, 19.0, 27.0, 22.0, 36.0, 28.0, 28.0, 28.0, 20.0, 56.0, 47.0, 41.0, 47.0, 41.0, 47.0, 37.0, 39.0, 33.0, 37.0, 37.0, 29.0, 38.0, 34.0, 27.0, 25.0, 20.0, 18.0, 13.0, 11.0, 6.0, 10.0, 5.0, 3.0, 6.0, 7.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-5.66796875, -5.5015869140625, -5.335205078125, -5.1688232421875, -5.00244140625, -4.8360595703125, -4.669677734375, -4.5032958984375, -4.3369140625, -4.1705322265625, -4.004150390625, -3.8377685546875, -3.67138671875, -3.5050048828125, -3.338623046875, -3.1722412109375, -3.005859375, -2.8394775390625, -2.673095703125, -2.5067138671875, -2.34033203125, -2.1739501953125, -2.007568359375, -1.8411865234375, -1.6748046875, -1.5084228515625, -1.342041015625, -1.1756591796875, -1.00927734375, -0.8428955078125, -0.676513671875, -0.5101318359375, -0.34375, -0.1773681640625, -0.010986328125, 0.1553955078125, 0.32177734375, 0.4881591796875, 0.654541015625, 0.8209228515625, 0.9873046875, 1.1536865234375, 1.320068359375, 1.4864501953125, 1.65283203125, 1.8192138671875, 1.985595703125, 2.1519775390625, 2.318359375, 2.4847412109375, 2.651123046875, 2.8175048828125, 2.98388671875, 3.1502685546875, 3.316650390625, 3.4830322265625, 3.6494140625, 3.8157958984375, 3.982177734375, 4.1485595703125, 4.31494140625, 4.4813232421875, 4.647705078125, 4.8140869140625, 4.98046875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 8.0, 5.0, 11.0, 9.0, 7.0, 19.0, 22.0, 41.0, 56.0, 86.0, 114.0, 179.0, 350.0, 665.0, 1789.0, 6236.0, 36634.0, 490746.0, 466538.0, 35569.0, 6095.0, 1716.0, 726.0, 374.0, 182.0, 113.0, 73.0, 46.0, 28.0, 31.0, 21.0, 15.0, 18.0, 4.0, 3.0, 5.0, 4.0, 2.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.40234375, -2.32952880859375, -2.2567138671875, -2.18389892578125, -2.111083984375, -2.03826904296875, -1.9654541015625, -1.89263916015625, -1.81982421875, -1.74700927734375, -1.6741943359375, -1.60137939453125, -1.528564453125, -1.45574951171875, -1.3829345703125, -1.31011962890625, -1.2373046875, -1.16448974609375, -1.0916748046875, -1.01885986328125, -0.946044921875, -0.87322998046875, -0.8004150390625, -0.72760009765625, -0.65478515625, -0.58197021484375, -0.5091552734375, -0.43634033203125, -0.363525390625, -0.29071044921875, -0.2178955078125, -0.14508056640625, -0.072265625, 0.00054931640625, 0.0733642578125, 0.14617919921875, 0.218994140625, 0.29180908203125, 0.3646240234375, 0.43743896484375, 0.51025390625, 0.58306884765625, 0.6558837890625, 0.72869873046875, 0.801513671875, 0.87432861328125, 0.9471435546875, 1.01995849609375, 1.0927734375, 1.16558837890625, 1.2384033203125, 1.31121826171875, 1.384033203125, 1.45684814453125, 1.5296630859375, 1.60247802734375, 1.67529296875, 1.74810791015625, 1.8209228515625, 1.89373779296875, 1.966552734375, 2.03936767578125, 2.1121826171875, 2.18499755859375, 2.2578125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 5.0, 6.0, 6.0, 5.0, 6.0, 12.0, 15.0, 20.0, 40.0, 42.0, 69.0, 76.0, 110.0, 108.0, 125.0, 90.0, 61.0, 49.0, 35.0, 20.0, 30.0, 23.0, 18.0, 13.0, 6.0, 4.0, 5.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002491474151611328, -0.00023815035820007324, -0.00022715330123901367, -0.0002161562442779541, -0.00020515918731689453, -0.00019416213035583496, -0.0001831650733947754, -0.00017216801643371582, -0.00016117095947265625, -0.00015017390251159668, -0.0001391768455505371, -0.00012817978858947754, -0.00011718273162841797, -0.0001061856746673584, -9.518861770629883e-05, -8.419156074523926e-05, -7.319450378417969e-05, -6.219744682312012e-05, -5.120038986206055e-05, -4.0203332901000977e-05, -2.9206275939941406e-05, -1.8209218978881836e-05, -7.212162017822266e-06, 3.7848949432373047e-06, 1.4781951904296875e-05, 2.5779008865356445e-05, 3.6776065826416016e-05, 4.7773122787475586e-05, 5.8770179748535156e-05, 6.976723670959473e-05, 8.07642936706543e-05, 9.176135063171387e-05, 0.00010275840759277344, 0.00011375546455383301, 0.00012475252151489258, 0.00013574957847595215, 0.00014674663543701172, 0.0001577436923980713, 0.00016874074935913086, 0.00017973780632019043, 0.00019073486328125, 0.00020173192024230957, 0.00021272897720336914, 0.0002237260341644287, 0.00023472309112548828, 0.00024572014808654785, 0.0002567172050476074, 0.000267714262008667, 0.00027871131896972656, 0.00028970837593078613, 0.0003007054328918457, 0.0003117024898529053, 0.00032269954681396484, 0.0003336966037750244, 0.000344693660736084, 0.00035569071769714355, 0.0003666877746582031, 0.0003776848316192627, 0.00038868188858032227, 0.00039967894554138184, 0.0004106760025024414, 0.000421673059463501, 0.00043267011642456055, 0.0004436671733856201, 0.0004546642303466797]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 4.0, 3.0, 4.0, 8.0, 12.0, 23.0, 17.0, 32.0, 39.0, 48.0, 74.0, 126.0, 186.0, 313.0, 557.0, 1030.0, 2211.0, 6269.0, 26548.0, 215268.0, 679363.0, 93946.0, 14598.0, 4246.0, 1665.0, 793.0, 429.0, 270.0, 153.0, 98.0, 67.0, 37.0, 32.0, 30.0, 11.0, 13.0, 12.0, 5.0, 3.0, 2.0, 3.0, 1.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.25390625, -2.190093994140625, -2.12628173828125, -2.062469482421875, -1.9986572265625, -1.934844970703125, -1.87103271484375, -1.807220458984375, -1.743408203125, -1.679595947265625, -1.61578369140625, -1.551971435546875, -1.4881591796875, -1.424346923828125, -1.36053466796875, -1.296722412109375, -1.23291015625, -1.169097900390625, -1.10528564453125, -1.041473388671875, -0.9776611328125, -0.913848876953125, -0.85003662109375, -0.786224365234375, -0.722412109375, -0.658599853515625, -0.59478759765625, -0.530975341796875, -0.4671630859375, -0.403350830078125, -0.33953857421875, -0.275726318359375, -0.2119140625, -0.148101806640625, -0.08428955078125, -0.020477294921875, 0.0433349609375, 0.107147216796875, 0.17095947265625, 0.234771728515625, 0.298583984375, 0.362396240234375, 0.42620849609375, 0.490020751953125, 0.5538330078125, 0.617645263671875, 0.68145751953125, 0.745269775390625, 0.80908203125, 0.872894287109375, 0.93670654296875, 1.000518798828125, 1.0643310546875, 1.128143310546875, 1.19195556640625, 1.255767822265625, 1.319580078125, 1.383392333984375, 1.44720458984375, 1.511016845703125, 1.5748291015625, 1.638641357421875, 1.70245361328125, 1.766265869140625, 1.830078125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 4.0, 4.0, 9.0, 9.0, 13.0, 13.0, 26.0, 24.0, 49.0, 61.0, 69.0, 76.0, 83.0, 90.0, 87.0, 78.0, 77.0, 59.0, 48.0, 29.0, 19.0, 24.0, 11.0, 16.0, 3.0, 4.0, 4.0, 5.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-2.0, -1.9425048828125, -1.885009765625, -1.8275146484375, -1.77001953125, -1.7125244140625, -1.655029296875, -1.5975341796875, -1.5400390625, -1.4825439453125, -1.425048828125, -1.3675537109375, -1.31005859375, -1.2525634765625, -1.195068359375, -1.1375732421875, -1.080078125, -1.0225830078125, -0.965087890625, -0.9075927734375, -0.85009765625, -0.7926025390625, -0.735107421875, -0.6776123046875, -0.6201171875, -0.5626220703125, -0.505126953125, -0.4476318359375, -0.39013671875, -0.3326416015625, -0.275146484375, -0.2176513671875, -0.16015625, -0.1026611328125, -0.045166015625, 0.0123291015625, 0.06982421875, 0.1273193359375, 0.184814453125, 0.2423095703125, 0.2998046875, 0.3572998046875, 0.414794921875, 0.4722900390625, 0.52978515625, 0.5872802734375, 0.644775390625, 0.7022705078125, 0.759765625, 0.8172607421875, 0.874755859375, 0.9322509765625, 0.98974609375, 1.0472412109375, 1.104736328125, 1.1622314453125, 1.2197265625, 1.2772216796875, 1.334716796875, 1.3922119140625, 1.44970703125, 1.5072021484375, 1.564697265625, 1.6221923828125, 1.6796875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 8.0, 20.0, 50.0, 128.0, 280.0, 312.0, 144.0, 46.0, 11.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-104.4658432006836, -102.20612335205078, -99.94640350341797, -97.68668365478516, -95.42696380615234, -93.16724395751953, -90.90752410888672, -88.6478042602539, -86.3880844116211, -84.12836456298828, -81.86864471435547, -79.60892486572266, -77.34920501708984, -75.08948516845703, -72.82976531982422, -70.5700454711914, -68.31031799316406, -66.05059814453125, -63.79087829589844, -61.531158447265625, -59.27143859863281, -57.01171875, -54.75199890136719, -52.492279052734375, -50.23255920410156, -47.97283935546875, -45.71311950683594, -43.453399658203125, -41.19367980957031, -38.9339599609375, -36.67424011230469, -34.414520263671875, -32.15480422973633, -29.895084381103516, -27.635364532470703, -25.37564468383789, -23.115924835205078, -20.856204986572266, -18.59648323059082, -16.336763381958008, -14.077043533325195, -11.817323684692383, -9.55760383605957, -7.297883033752441, -5.038163185119629, -2.7784433364868164, -0.5187225341796875, 1.740997314453125, 4.0007171630859375, 6.26043701171875, 8.520156860351562, 10.779877662658691, 13.039597511291504, 15.299317359924316, 17.559038162231445, 19.818758010864258, 22.07847785949707, 24.338197708129883, 26.597917556762695, 28.85763931274414, 31.117359161376953, 33.377079010009766, 35.63679885864258, 37.89651870727539, 40.1562385559082]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 7.0, 12.0, 5.0, 11.0, 11.0, 20.0, 30.0, 22.0, 34.0, 26.0, 38.0, 46.0, 35.0, 34.0, 46.0, 64.0, 46.0, 58.0, 42.0, 47.0, 38.0, 44.0, 37.0, 42.0, 26.0, 22.0, 23.0, 21.0, 15.0, 15.0, 18.0, 6.0, 12.0, 16.0, 4.0, 9.0, 4.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-24.51537322998047, -23.73332977294922, -22.9512882232666, -22.16924476623535, -21.387203216552734, -20.605159759521484, -19.823116302490234, -19.041074752807617, -18.259031295776367, -17.476987838745117, -16.6949462890625, -15.91290283203125, -15.130860328674316, -14.348817825317383, -13.56677532196045, -12.784732818603516, -12.002690315246582, -11.220647811889648, -10.438605308532715, -9.656562805175781, -8.874519348144531, -8.092476844787598, -7.310434341430664, -6.528391361236572, -5.746348857879639, -4.964306354522705, -4.182263374328613, -3.4002208709716797, -2.618178129196167, -1.8361353874206543, -1.0540928840637207, -0.2720499038696289, 0.5099925994873047, 1.2920353412628174, 2.07407808303833, 2.8561205863952637, 3.6381633281707764, 4.420206069946289, 5.202248573303223, 5.9842915534973145, 6.766334056854248, 7.548376560211182, 8.330419540405273, 9.112462043762207, 9.89450454711914, 10.67654800415039, 11.458589553833008, 12.240633010864258, 13.022675514221191, 13.804718017578125, 14.586760520935059, 15.368803024291992, 16.150846481323242, 16.93288803100586, 17.71493148803711, 18.49697494506836, 19.279016494750977, 20.061059951782227, 20.843101501464844, 21.625144958496094, 22.40718650817871, 23.18922996520996, 23.971271514892578, 24.753314971923828, 25.535358428955078]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 3.0, 7.0, 7.0, 4.0, 10.0, 17.0, 26.0, 28.0, 42.0, 50.0, 67.0, 102.0, 101.0, 187.0, 257.0, 341.0, 596.0, 1016.0, 1850.0, 3969.0, 10164.0, 52036.0, 4016562.0, 84223.0, 12775.0, 4636.0, 2042.0, 1158.0, 691.0, 388.0, 278.0, 179.0, 127.0, 104.0, 58.0, 39.0, 42.0, 23.0, 19.0, 21.0, 13.0, 8.0, 10.0, 2.0, 9.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-5.4765625, -5.32269287109375, -5.1688232421875, -5.01495361328125, -4.861083984375, -4.70721435546875, -4.5533447265625, -4.39947509765625, -4.24560546875, -4.09173583984375, -3.9378662109375, -3.78399658203125, -3.630126953125, -3.47625732421875, -3.3223876953125, -3.16851806640625, -3.0146484375, -2.86077880859375, -2.7069091796875, -2.55303955078125, -2.399169921875, -2.24530029296875, -2.0914306640625, -1.93756103515625, -1.78369140625, -1.62982177734375, -1.4759521484375, -1.32208251953125, -1.168212890625, -1.01434326171875, -0.8604736328125, -0.70660400390625, -0.552734375, -0.39886474609375, -0.2449951171875, -0.09112548828125, 0.062744140625, 0.21661376953125, 0.3704833984375, 0.52435302734375, 0.67822265625, 0.83209228515625, 0.9859619140625, 1.13983154296875, 1.293701171875, 1.44757080078125, 1.6014404296875, 1.75531005859375, 1.9091796875, 2.06304931640625, 2.2169189453125, 2.37078857421875, 2.524658203125, 2.67852783203125, 2.8323974609375, 2.98626708984375, 3.14013671875, 3.29400634765625, 3.4478759765625, 3.60174560546875, 3.755615234375, 3.90948486328125, 4.0633544921875, 4.21722412109375, 4.37109375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 4.0, 4.0, 14.0, 18.0, 22.0, 44.0, 54.0, 55.0, 71.0, 67.0, 76.0, 78.0, 79.0, 81.0, 62.0, 62.0, 51.0, 38.0, 33.0, 23.0, 14.0, 13.0, 12.0, 6.0, 8.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.998046875, -1.93365478515625, -1.8692626953125, -1.80487060546875, -1.740478515625, -1.67608642578125, -1.6116943359375, -1.54730224609375, -1.48291015625, -1.41851806640625, -1.3541259765625, -1.28973388671875, -1.225341796875, -1.16094970703125, -1.0965576171875, -1.03216552734375, -0.9677734375, -0.90338134765625, -0.8389892578125, -0.77459716796875, -0.710205078125, -0.64581298828125, -0.5814208984375, -0.51702880859375, -0.45263671875, -0.38824462890625, -0.3238525390625, -0.25946044921875, -0.195068359375, -0.13067626953125, -0.0662841796875, -0.00189208984375, 0.0625, 0.12689208984375, 0.1912841796875, 0.25567626953125, 0.320068359375, 0.38446044921875, 0.4488525390625, 0.51324462890625, 0.57763671875, 0.64202880859375, 0.7064208984375, 0.77081298828125, 0.835205078125, 0.89959716796875, 0.9639892578125, 1.02838134765625, 1.0927734375, 1.15716552734375, 1.2215576171875, 1.28594970703125, 1.350341796875, 1.41473388671875, 1.4791259765625, 1.54351806640625, 1.60791015625, 1.67230224609375, 1.7366943359375, 1.80108642578125, 1.865478515625, 1.92987060546875, 1.9942626953125, 2.05865478515625, 2.123046875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 4.0, 4.0, 6.0, 11.0, 12.0, 20.0, 22.0, 33.0, 44.0, 69.0, 103.0, 149.0, 248.0, 397.0, 737.0, 1445.0, 3111.0, 7910.0, 28033.0, 400747.0, 3691735.0, 41667.0, 10212.0, 3800.0, 1659.0, 855.0, 456.0, 281.0, 163.0, 113.0, 70.0, 47.0, 32.0, 22.0, 15.0, 18.0, 11.0, 6.0, 4.0, 4.0, 1.0, 6.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.12890625, -3.9962158203125, -3.863525390625, -3.7308349609375, -3.59814453125, -3.4654541015625, -3.332763671875, -3.2000732421875, -3.0673828125, -2.9346923828125, -2.802001953125, -2.6693115234375, -2.53662109375, -2.4039306640625, -2.271240234375, -2.1385498046875, -2.005859375, -1.8731689453125, -1.740478515625, -1.6077880859375, -1.47509765625, -1.3424072265625, -1.209716796875, -1.0770263671875, -0.9443359375, -0.8116455078125, -0.678955078125, -0.5462646484375, -0.41357421875, -0.2808837890625, -0.148193359375, -0.0155029296875, 0.1171875, 0.2498779296875, 0.382568359375, 0.5152587890625, 0.64794921875, 0.7806396484375, 0.913330078125, 1.0460205078125, 1.1787109375, 1.3114013671875, 1.444091796875, 1.5767822265625, 1.70947265625, 1.8421630859375, 1.974853515625, 2.1075439453125, 2.240234375, 2.3729248046875, 2.505615234375, 2.6383056640625, 2.77099609375, 2.9036865234375, 3.036376953125, 3.1690673828125, 3.3017578125, 3.4344482421875, 3.567138671875, 3.6998291015625, 3.83251953125, 3.9652099609375, 4.097900390625, 4.2305908203125, 4.36328125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 9.0, 10.0, 10.0, 12.0, 20.0, 61.0, 136.0, 2524.0, 1015.0, 127.0, 53.0, 34.0, 21.0, 11.0, 9.0, 5.0, 4.0, 3.0, 5.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.978515625, -2.9091644287109375, -2.839813232421875, -2.7704620361328125, -2.70111083984375, -2.6317596435546875, -2.562408447265625, -2.4930572509765625, -2.4237060546875, -2.3543548583984375, -2.285003662109375, -2.2156524658203125, -2.14630126953125, -2.0769500732421875, -2.007598876953125, -1.9382476806640625, -1.868896484375, -1.7995452880859375, -1.730194091796875, -1.6608428955078125, -1.59149169921875, -1.5221405029296875, -1.452789306640625, -1.3834381103515625, -1.3140869140625, -1.2447357177734375, -1.175384521484375, -1.1060333251953125, -1.03668212890625, -0.9673309326171875, -0.897979736328125, -0.8286285400390625, -0.75927734375, -0.6899261474609375, -0.620574951171875, -0.5512237548828125, -0.48187255859375, -0.4125213623046875, -0.343170166015625, -0.2738189697265625, -0.2044677734375, -0.1351165771484375, -0.065765380859375, 0.0035858154296875, 0.07293701171875, 0.1422882080078125, 0.211639404296875, 0.2809906005859375, 0.350341796875, 0.4196929931640625, 0.489044189453125, 0.5583953857421875, 0.62774658203125, 0.6970977783203125, 0.766448974609375, 0.8358001708984375, 0.9051513671875, 0.9745025634765625, 1.043853759765625, 1.1132049560546875, 1.18255615234375, 1.2519073486328125, 1.321258544921875, 1.3906097412109375, 1.4599609375]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 10.0, 15.0, 43.0, 72.0, 146.0, 195.0, 201.0, 167.0, 69.0, 45.0, 22.0, 6.0, 3.0, 6.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-16.503490447998047, -16.11924934387207, -15.73500919342041, -15.350768089294434, -14.966527938842773, -14.582286834716797, -14.19804573059082, -13.81380558013916, -13.429564476013184, -13.045323371887207, -12.661083221435547, -12.27684211730957, -11.89260196685791, -11.508360862731934, -11.124120712280273, -10.739879608154297, -10.35563850402832, -9.971397399902344, -9.587157249450684, -9.202916145324707, -8.818675994873047, -8.43443489074707, -8.050193786621094, -7.665953636169434, -7.281713485717773, -6.897472858428955, -6.513232231140137, -6.12899112701416, -5.744750499725342, -5.360509872436523, -4.976269245147705, -4.592028617858887, -4.20778751373291, -3.823546886444092, -3.4393060207366943, -3.055065393447876, -2.6708245277404785, -2.28658390045166, -1.9023432731628418, -1.5181024074554443, -1.133861780166626, -0.7496210336685181, -0.36538034677505493, 0.018860340118408203, 0.4031010866165161, 0.787341833114624, 1.1715824604034424, 1.5558233261108398, 1.9400639533996582, 2.3243045806884766, 2.708545446395874, 3.0927860736846924, 3.47702693939209, 3.861267566680908, 4.245508193969727, 4.629749298095703, 5.013989448547363, 5.398230075836182, 5.782470703125, 6.166711807250977, 6.550952434539795, 6.935193061828613, 7.319433689117432, 7.70367431640625, 8.087915420532227]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 8.0, 4.0, 5.0, 4.0, 12.0, 10.0, 8.0, 15.0, 18.0, 19.0, 15.0, 23.0, 36.0, 33.0, 33.0, 34.0, 42.0, 28.0, 42.0, 46.0, 48.0, 49.0, 42.0, 36.0, 45.0, 41.0, 41.0, 40.0, 40.0, 17.0, 30.0, 20.0, 19.0, 12.0, 21.0, 18.0, 15.0, 7.0, 9.0, 3.0, 6.0, 4.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.228714942932129, -4.098668575286865, -3.9686222076416016, -3.838575839996338, -3.708529472351074, -3.5784831047058105, -3.448436737060547, -3.318390369415283, -3.1883440017700195, -3.058297634124756, -2.928251266479492, -2.7982048988342285, -2.668158531188965, -2.538112163543701, -2.4080657958984375, -2.278019428253174, -2.147972822189331, -2.0179264545440674, -1.8878800868988037, -1.75783371925354, -1.6277873516082764, -1.4977409839630127, -1.3676944971084595, -1.2376481294631958, -1.1076017618179321, -0.9775553941726685, -0.8475090265274048, -0.7174625992774963, -0.5874162316322327, -0.457369863986969, -0.32732343673706055, -0.19727706909179688, -0.0672307014465332, 0.06281568109989166, 0.19286206364631653, 0.3229084610939026, 0.45295482873916626, 0.5830011963844299, 0.7130476236343384, 0.843093991279602, 0.9731403589248657, 1.1031867265701294, 1.233233094215393, 1.3632795810699463, 1.49332594871521, 1.6233723163604736, 1.7534186840057373, 1.883465051651001, 2.0135114192962646, 2.1435577869415283, 2.273604154586792, 2.4036505222320557, 2.5336968898773193, 2.663743257522583, 2.793789863586426, 2.9238362312316895, 3.053882598876953, 3.183928966522217, 3.3139753341674805, 3.444021701812744, 3.574068069458008, 3.7041144371032715, 3.834160804748535, 3.964207172393799, 4.0942535400390625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 3.0, 3.0, 7.0, 8.0, 11.0, 18.0, 30.0, 33.0, 48.0, 70.0, 108.0, 221.0, 355.0, 591.0, 976.0, 1759.0, 3355.0, 6415.0, 13716.0, 31468.0, 79753.0, 224976.0, 424897.0, 156253.0, 57886.0, 23747.0, 10609.0, 5075.0, 2602.0, 1428.0, 847.0, 459.0, 291.0, 208.0, 113.0, 70.0, 53.0, 32.0, 23.0, 10.0, 11.0, 7.0, 2.0, 5.0, 8.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.70703125, -2.61474609375, -2.5224609375, -2.43017578125, -2.337890625, -2.24560546875, -2.1533203125, -2.06103515625, -1.96875, -1.87646484375, -1.7841796875, -1.69189453125, -1.599609375, -1.50732421875, -1.4150390625, -1.32275390625, -1.23046875, -1.13818359375, -1.0458984375, -0.95361328125, -0.861328125, -0.76904296875, -0.6767578125, -0.58447265625, -0.4921875, -0.39990234375, -0.3076171875, -0.21533203125, -0.123046875, -0.03076171875, 0.0615234375, 0.15380859375, 0.24609375, 0.33837890625, 0.4306640625, 0.52294921875, 0.615234375, 0.70751953125, 0.7998046875, 0.89208984375, 0.984375, 1.07666015625, 1.1689453125, 1.26123046875, 1.353515625, 1.44580078125, 1.5380859375, 1.63037109375, 1.72265625, 1.81494140625, 1.9072265625, 1.99951171875, 2.091796875, 2.18408203125, 2.2763671875, 2.36865234375, 2.4609375, 2.55322265625, 2.6455078125, 2.73779296875, 2.830078125, 2.92236328125, 3.0146484375, 3.10693359375, 3.19921875]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 3.0, 7.0, 6.0, 17.0, 19.0, 25.0, 21.0, 43.0, 51.0, 53.0, 51.0, 56.0, 74.0, 74.0, 67.0, 74.0, 67.0, 56.0, 37.0, 38.0, 36.0, 40.0, 15.0, 15.0, 11.0, 6.0, 7.0, 12.0, 10.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.705078125, -1.6466064453125, -1.588134765625, -1.5296630859375, -1.47119140625, -1.4127197265625, -1.354248046875, -1.2957763671875, -1.2373046875, -1.1788330078125, -1.120361328125, -1.0618896484375, -1.00341796875, -0.9449462890625, -0.886474609375, -0.8280029296875, -0.76953125, -0.7110595703125, -0.652587890625, -0.5941162109375, -0.53564453125, -0.4771728515625, -0.418701171875, -0.3602294921875, -0.3017578125, -0.2432861328125, -0.184814453125, -0.1263427734375, -0.06787109375, -0.0093994140625, 0.049072265625, 0.1075439453125, 0.166015625, 0.2244873046875, 0.282958984375, 0.3414306640625, 0.39990234375, 0.4583740234375, 0.516845703125, 0.5753173828125, 0.6337890625, 0.6922607421875, 0.750732421875, 0.8092041015625, 0.86767578125, 0.9261474609375, 0.984619140625, 1.0430908203125, 1.1015625, 1.1600341796875, 1.218505859375, 1.2769775390625, 1.33544921875, 1.3939208984375, 1.452392578125, 1.5108642578125, 1.5693359375, 1.6278076171875, 1.686279296875, 1.7447509765625, 1.80322265625, 1.8616943359375, 1.920166015625, 1.9786376953125, 2.037109375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 6.0, 8.0, 9.0, 12.0, 11.0, 24.0, 17.0, 49.0, 55.0, 79.0, 117.0, 160.0, 238.0, 428.0, 663.0, 1205.0, 2944.0, 11402.0, 98454.0, 798007.0, 115577.0, 12638.0, 3149.0, 1306.0, 727.0, 412.0, 259.0, 178.0, 122.0, 90.0, 55.0, 36.0, 34.0, 30.0, 18.0, 6.0, 11.0, 7.0, 8.0, 0.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-6.796875, -6.60003662109375, -6.4031982421875, -6.20635986328125, -6.009521484375, -5.81268310546875, -5.6158447265625, -5.41900634765625, -5.22216796875, -5.02532958984375, -4.8284912109375, -4.63165283203125, -4.434814453125, -4.23797607421875, -4.0411376953125, -3.84429931640625, -3.6474609375, -3.45062255859375, -3.2537841796875, -3.05694580078125, -2.860107421875, -2.66326904296875, -2.4664306640625, -2.26959228515625, -2.07275390625, -1.87591552734375, -1.6790771484375, -1.48223876953125, -1.285400390625, -1.08856201171875, -0.8917236328125, -0.69488525390625, -0.498046875, -0.30120849609375, -0.1043701171875, 0.09246826171875, 0.289306640625, 0.48614501953125, 0.6829833984375, 0.87982177734375, 1.07666015625, 1.27349853515625, 1.4703369140625, 1.66717529296875, 1.864013671875, 2.06085205078125, 2.2576904296875, 2.45452880859375, 2.6513671875, 2.84820556640625, 3.0450439453125, 3.24188232421875, 3.438720703125, 3.63555908203125, 3.8323974609375, 4.02923583984375, 4.22607421875, 4.42291259765625, 4.6197509765625, 4.81658935546875, 5.013427734375, 5.21026611328125, 5.4071044921875, 5.60394287109375, 5.80078125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 5.0, 4.0, 6.0, 3.0, 8.0, 8.0, 7.0, 7.0, 8.0, 11.0, 20.0, 17.0, 25.0, 26.0, 21.0, 29.0, 30.0, 30.0, 40.0, 38.0, 31.0, 36.0, 30.0, 44.0, 45.0, 47.0, 33.0, 34.0, 39.0, 34.0, 24.0, 40.0, 37.0, 27.0, 26.0, 20.0, 14.0, 14.0, 17.0, 16.0, 16.0, 11.0, 6.0, 6.0, 3.0, 6.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-5.0703125, -4.91455078125, -4.7587890625, -4.60302734375, -4.447265625, -4.29150390625, -4.1357421875, -3.97998046875, -3.82421875, -3.66845703125, -3.5126953125, -3.35693359375, -3.201171875, -3.04541015625, -2.8896484375, -2.73388671875, -2.578125, -2.42236328125, -2.2666015625, -2.11083984375, -1.955078125, -1.79931640625, -1.6435546875, -1.48779296875, -1.33203125, -1.17626953125, -1.0205078125, -0.86474609375, -0.708984375, -0.55322265625, -0.3974609375, -0.24169921875, -0.0859375, 0.06982421875, 0.2255859375, 0.38134765625, 0.537109375, 0.69287109375, 0.8486328125, 1.00439453125, 1.16015625, 1.31591796875, 1.4716796875, 1.62744140625, 1.783203125, 1.93896484375, 2.0947265625, 2.25048828125, 2.40625, 2.56201171875, 2.7177734375, 2.87353515625, 3.029296875, 3.18505859375, 3.3408203125, 3.49658203125, 3.65234375, 3.80810546875, 3.9638671875, 4.11962890625, 4.275390625, 4.43115234375, 4.5869140625, 4.74267578125, 4.8984375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 3.0, 8.0, 6.0, 13.0, 10.0, 16.0, 31.0, 73.0, 183.0, 454.0, 1313.0, 5458.0, 45657.0, 762871.0, 213872.0, 14773.0, 2641.0, 675.0, 257.0, 102.0, 58.0, 34.0, 16.0, 10.0, 7.0, 4.0, 2.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.78515625, -2.707275390625, -2.62939453125, -2.551513671875, -2.4736328125, -2.395751953125, -2.31787109375, -2.239990234375, -2.162109375, -2.084228515625, -2.00634765625, -1.928466796875, -1.8505859375, -1.772705078125, -1.69482421875, -1.616943359375, -1.5390625, -1.461181640625, -1.38330078125, -1.305419921875, -1.2275390625, -1.149658203125, -1.07177734375, -0.993896484375, -0.916015625, -0.838134765625, -0.76025390625, -0.682373046875, -0.6044921875, -0.526611328125, -0.44873046875, -0.370849609375, -0.29296875, -0.215087890625, -0.13720703125, -0.059326171875, 0.0185546875, 0.096435546875, 0.17431640625, 0.252197265625, 0.330078125, 0.407958984375, 0.48583984375, 0.563720703125, 0.6416015625, 0.719482421875, 0.79736328125, 0.875244140625, 0.953125, 1.031005859375, 1.10888671875, 1.186767578125, 1.2646484375, 1.342529296875, 1.42041015625, 1.498291015625, 1.576171875, 1.654052734375, 1.73193359375, 1.809814453125, 1.8876953125, 1.965576171875, 2.04345703125, 2.121337890625, 2.19921875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 2.0, 6.0, 5.0, 6.0, 14.0, 15.0, 12.0, 15.0, 22.0, 24.0, 24.0, 25.0, 31.0, 44.0, 54.0, 75.0, 106.0, 109.0, 75.0, 65.0, 46.0, 41.0, 26.0, 22.0, 21.0, 32.0, 18.0, 13.0, 9.0, 14.0, 6.0, 4.0, 7.0, 3.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0003502368927001953, -0.0003407709300518036, -0.00033130496740341187, -0.00032183900475502014, -0.0003123730421066284, -0.0003029070794582367, -0.00029344111680984497, -0.00028397515416145325, -0.0002745091915130615, -0.0002650432288646698, -0.0002555772662162781, -0.00024611130356788635, -0.00023664534091949463, -0.0002271793782711029, -0.00021771341562271118, -0.00020824745297431946, -0.00019878149032592773, -0.000189315527677536, -0.0001798495650291443, -0.00017038360238075256, -0.00016091763973236084, -0.00015145167708396912, -0.0001419857144355774, -0.00013251975178718567, -0.00012305378913879395, -0.00011358782649040222, -0.0001041218638420105, -9.465590119361877e-05, -8.518993854522705e-05, -7.572397589683533e-05, -6.62580132484436e-05, -5.679205060005188e-05, -4.7326087951660156e-05, -3.786012530326843e-05, -2.839416265487671e-05, -1.8928200006484985e-05, -9.462237358093262e-06, 3.725290298461914e-09, 9.469687938690186e-06, 1.893565058708191e-05, 2.8401613235473633e-05, 3.7867575883865356e-05, 4.733353853225708e-05, 5.6799501180648804e-05, 6.626546382904053e-05, 7.573142647743225e-05, 8.519738912582397e-05, 9.46633517742157e-05, 0.00010412931442260742, 0.00011359527707099915, 0.00012306123971939087, 0.0001325272023677826, 0.00014199316501617432, 0.00015145912766456604, 0.00016092509031295776, 0.0001703910529613495, 0.0001798570156097412, 0.00018932297825813293, 0.00019878894090652466, 0.00020825490355491638, 0.0002177208662033081, 0.00022718682885169983, 0.00023665279150009155, 0.0002461187541484833, 0.000255584716796875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 10.0, 11.0, 14.0, 24.0, 23.0, 37.0, 65.0, 115.0, 179.0, 288.0, 585.0, 1245.0, 3262.0, 11563.0, 84024.0, 746160.0, 174910.0, 18438.0, 4441.0, 1560.0, 697.0, 354.0, 193.0, 127.0, 87.0, 52.0, 29.0, 19.0, 15.0, 7.0, 9.0, 4.0, 2.0, 1.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.19140625, -2.128143310546875, -2.06488037109375, -2.001617431640625, -1.9383544921875, -1.875091552734375, -1.81182861328125, -1.748565673828125, -1.685302734375, -1.622039794921875, -1.55877685546875, -1.495513916015625, -1.4322509765625, -1.368988037109375, -1.30572509765625, -1.242462158203125, -1.17919921875, -1.115936279296875, -1.05267333984375, -0.989410400390625, -0.9261474609375, -0.862884521484375, -0.79962158203125, -0.736358642578125, -0.673095703125, -0.609832763671875, -0.54656982421875, -0.483306884765625, -0.4200439453125, -0.356781005859375, -0.29351806640625, -0.230255126953125, -0.1669921875, -0.103729248046875, -0.04046630859375, 0.022796630859375, 0.0860595703125, 0.149322509765625, 0.21258544921875, 0.275848388671875, 0.339111328125, 0.402374267578125, 0.46563720703125, 0.528900146484375, 0.5921630859375, 0.655426025390625, 0.71868896484375, 0.781951904296875, 0.84521484375, 0.908477783203125, 0.97174072265625, 1.035003662109375, 1.0982666015625, 1.161529541015625, 1.22479248046875, 1.288055419921875, 1.351318359375, 1.414581298828125, 1.47784423828125, 1.541107177734375, 1.6043701171875, 1.667633056640625, 1.73089599609375, 1.794158935546875, 1.857421875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 4.0, 6.0, 5.0, 5.0, 7.0, 7.0, 4.0, 6.0, 15.0, 17.0, 17.0, 24.0, 26.0, 24.0, 40.0, 55.0, 54.0, 61.0, 50.0, 62.0, 64.0, 64.0, 61.0, 44.0, 41.0, 32.0, 38.0, 26.0, 20.0, 24.0, 17.0, 13.0, 12.0, 10.0, 11.0, 7.0, 10.0, 8.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.14453125, -1.1098785400390625, -1.075225830078125, -1.0405731201171875, -1.00592041015625, -0.9712677001953125, -0.936614990234375, -0.9019622802734375, -0.8673095703125, -0.8326568603515625, -0.798004150390625, -0.7633514404296875, -0.72869873046875, -0.6940460205078125, -0.659393310546875, -0.6247406005859375, -0.590087890625, -0.5554351806640625, -0.520782470703125, -0.4861297607421875, -0.45147705078125, -0.4168243408203125, -0.382171630859375, -0.3475189208984375, -0.3128662109375, -0.2782135009765625, -0.243560791015625, -0.2089080810546875, -0.17425537109375, -0.1396026611328125, -0.104949951171875, -0.0702972412109375, -0.03564453125, -0.0009918212890625, 0.033660888671875, 0.0683135986328125, 0.10296630859375, 0.1376190185546875, 0.172271728515625, 0.2069244384765625, 0.2415771484375, 0.2762298583984375, 0.310882568359375, 0.3455352783203125, 0.38018798828125, 0.4148406982421875, 0.449493408203125, 0.4841461181640625, 0.518798828125, 0.5534515380859375, 0.588104248046875, 0.6227569580078125, 0.65740966796875, 0.6920623779296875, 0.726715087890625, 0.7613677978515625, 0.7960205078125, 0.8306732177734375, 0.865325927734375, 0.8999786376953125, 0.93463134765625, 0.9692840576171875, 1.003936767578125, 1.0385894775390625, 1.0732421875]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 12.0, 11.0, 37.0, 91.0, 159.0, 228.0, 225.0, 118.0, 62.0, 32.0, 14.0, 7.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.107818603515625, -35.557586669921875, -34.007354736328125, -32.457122802734375, -30.906890869140625, -29.356658935546875, -27.806425094604492, -26.256193161010742, -24.705961227416992, -23.155729293823242, -21.605497360229492, -20.05526351928711, -18.50503158569336, -16.95479965209961, -15.40456771850586, -13.85433578491211, -12.30410385131836, -10.75387191772461, -9.20363998413086, -7.653407096862793, -6.103175163269043, -4.552943229675293, -3.0027103424072266, -1.4524784088134766, 0.09775352478027344, 1.6479856967926025, 3.1982178688049316, 4.74845027923584, 6.29868221282959, 7.84891414642334, 9.399147033691406, 10.949378967285156, 12.49960708618164, 14.04983901977539, 15.60007095336914, 17.15030288696289, 18.70053482055664, 20.25076675415039, 21.801000595092773, 23.351232528686523, 24.901464462280273, 26.451696395874023, 28.001928329467773, 29.552162170410156, 31.102394104003906, 32.652626037597656, 34.202857971191406, 35.753089904785156, 37.303321838378906, 38.853553771972656, 40.403785705566406, 41.954017639160156, 43.504249572753906, 45.054481506347656, 46.604713439941406, 48.154945373535156, 49.705177307128906, 51.255409240722656, 52.805641174316406, 54.355873107910156, 55.906105041503906, 57.456336975097656, 59.006568908691406, 60.556800842285156, 62.10703659057617]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0, 7.0, 6.0, 11.0, 14.0, 14.0, 32.0, 25.0, 24.0, 33.0, 37.0, 50.0, 41.0, 69.0, 56.0, 55.0, 54.0, 55.0, 65.0, 44.0, 49.0, 45.0, 39.0, 30.0, 21.0, 37.0, 17.0, 15.0, 18.0, 7.0, 7.0, 7.0, 7.0, 5.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-30.744510650634766, -29.82948875427246, -28.914466857910156, -27.99944496154785, -27.084423065185547, -26.169401168823242, -25.254379272460938, -24.33935546875, -23.424335479736328, -22.509313583374023, -21.59429168701172, -20.679269790649414, -19.76424789428711, -18.849225997924805, -17.9342041015625, -17.019180297851562, -16.104158401489258, -15.189136505126953, -14.274114608764648, -13.359092712402344, -12.444070816040039, -11.529048919677734, -10.614026069641113, -9.699004173278809, -8.783982276916504, -7.868960380554199, -6.9539384841918945, -6.038916110992432, -5.123894214630127, -4.208872318267822, -3.2938499450683594, -2.3788280487060547, -1.46380615234375, -0.5487841367721558, 0.3662378787994385, 1.2812600135803223, 2.196281909942627, 3.1113038063049316, 4.0263261795043945, 4.941348075866699, 5.856369972229004, 6.771391868591309, 7.686413764953613, 8.601436614990234, 9.516458511352539, 10.431480407714844, 11.346502304077148, 12.261524200439453, 13.176546096801758, 14.091567993164062, 15.006589889526367, 15.921611785888672, 16.836633682250977, 17.75165557861328, 18.66667938232422, 19.58169937133789, 20.496723175048828, 21.411745071411133, 22.326766967773438, 23.241788864135742, 24.156810760498047, 25.07183265686035, 25.986854553222656, 26.901878356933594, 27.816898345947266]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 5.0, 3.0, 11.0, 22.0, 19.0, 45.0, 60.0, 83.0, 134.0, 192.0, 295.0, 473.0, 767.0, 1135.0, 1712.0, 2875.0, 4836.0, 8577.0, 16363.0, 35123.0, 99739.0, 475176.0, 2458741.0, 847771.0, 148448.0, 46418.0, 20208.0, 10399.0, 5769.0, 3290.0, 2041.0, 1265.0, 783.0, 532.0, 345.0, 204.0, 135.0, 84.0, 73.0, 40.0, 30.0, 22.0, 20.0, 7.0, 7.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5869140625, -1.5351409912109375, -1.483367919921875, -1.4315948486328125, -1.37982177734375, -1.3280487060546875, -1.276275634765625, -1.2245025634765625, -1.1727294921875, -1.1209564208984375, -1.069183349609375, -1.0174102783203125, -0.96563720703125, -0.9138641357421875, -0.862091064453125, -0.8103179931640625, -0.758544921875, -0.7067718505859375, -0.654998779296875, -0.6032257080078125, -0.55145263671875, -0.4996795654296875, -0.447906494140625, -0.3961334228515625, -0.3443603515625, -0.2925872802734375, -0.240814208984375, -0.1890411376953125, -0.13726806640625, -0.0854949951171875, -0.033721923828125, 0.0180511474609375, 0.06982421875, 0.1215972900390625, 0.173370361328125, 0.2251434326171875, 0.27691650390625, 0.3286895751953125, 0.380462646484375, 0.4322357177734375, 0.4840087890625, 0.5357818603515625, 0.587554931640625, 0.6393280029296875, 0.69110107421875, 0.7428741455078125, 0.794647216796875, 0.8464202880859375, 0.898193359375, 0.9499664306640625, 1.001739501953125, 1.0535125732421875, 1.10528564453125, 1.1570587158203125, 1.208831787109375, 1.2606048583984375, 1.3123779296875, 1.3641510009765625, 1.415924072265625, 1.4676971435546875, 1.51947021484375, 1.5712432861328125, 1.623016357421875, 1.6747894287109375, 1.7265625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 4.0, 8.0, 8.0, 17.0, 16.0, 14.0, 26.0, 29.0, 31.0, 36.0, 48.0, 36.0, 49.0, 55.0, 43.0, 58.0, 43.0, 51.0, 52.0, 57.0, 53.0, 50.0, 35.0, 37.0, 22.0, 26.0, 21.0, 12.0, 13.0, 17.0, 12.0, 7.0, 6.0, 5.0, 3.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.130859375, -1.0881805419921875, -1.045501708984375, -1.0028228759765625, -0.96014404296875, -0.9174652099609375, -0.874786376953125, -0.8321075439453125, -0.7894287109375, -0.7467498779296875, -0.704071044921875, -0.6613922119140625, -0.61871337890625, -0.5760345458984375, -0.533355712890625, -0.4906768798828125, -0.447998046875, -0.4053192138671875, -0.362640380859375, -0.3199615478515625, -0.27728271484375, -0.2346038818359375, -0.191925048828125, -0.1492462158203125, -0.1065673828125, -0.0638885498046875, -0.021209716796875, 0.0214691162109375, 0.06414794921875, 0.1068267822265625, 0.149505615234375, 0.1921844482421875, 0.23486328125, 0.2775421142578125, 0.320220947265625, 0.3628997802734375, 0.40557861328125, 0.4482574462890625, 0.490936279296875, 0.5336151123046875, 0.5762939453125, 0.6189727783203125, 0.661651611328125, 0.7043304443359375, 0.74700927734375, 0.7896881103515625, 0.832366943359375, 0.8750457763671875, 0.917724609375, 0.9604034423828125, 1.003082275390625, 1.0457611083984375, 1.08843994140625, 1.1311187744140625, 1.173797607421875, 1.2164764404296875, 1.2591552734375, 1.3018341064453125, 1.344512939453125, 1.3871917724609375, 1.42987060546875, 1.4725494384765625, 1.515228271484375, 1.5579071044921875, 1.6005859375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 7.0, 3.0, 3.0, 8.0, 10.0, 18.0, 11.0, 24.0, 34.0, 46.0, 71.0, 136.0, 207.0, 423.0, 877.0, 2178.0, 6154.0, 19651.0, 81422.0, 1141323.0, 2773436.0, 127945.0, 27276.0, 7965.0, 2745.0, 1123.0, 541.0, 242.0, 122.0, 80.0, 61.0, 41.0, 21.0, 25.0, 11.0, 16.0, 9.0, 7.0, 8.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-4.03515625, -3.92645263671875, -3.8177490234375, -3.70904541015625, -3.600341796875, -3.49163818359375, -3.3829345703125, -3.27423095703125, -3.16552734375, -3.05682373046875, -2.9481201171875, -2.83941650390625, -2.730712890625, -2.62200927734375, -2.5133056640625, -2.40460205078125, -2.2958984375, -2.18719482421875, -2.0784912109375, -1.96978759765625, -1.861083984375, -1.75238037109375, -1.6436767578125, -1.53497314453125, -1.42626953125, -1.31756591796875, -1.2088623046875, -1.10015869140625, -0.991455078125, -0.88275146484375, -0.7740478515625, -0.66534423828125, -0.556640625, -0.44793701171875, -0.3392333984375, -0.23052978515625, -0.121826171875, -0.01312255859375, 0.0955810546875, 0.20428466796875, 0.31298828125, 0.42169189453125, 0.5303955078125, 0.63909912109375, 0.747802734375, 0.85650634765625, 0.9652099609375, 1.07391357421875, 1.1826171875, 1.29132080078125, 1.4000244140625, 1.50872802734375, 1.617431640625, 1.72613525390625, 1.8348388671875, 1.94354248046875, 2.05224609375, 2.16094970703125, 2.2696533203125, 2.37835693359375, 2.487060546875, 2.59576416015625, 2.7044677734375, 2.81317138671875, 2.921875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 9.0, 12.0, 13.0, 11.0, 14.0, 17.0, 17.0, 22.0, 50.0, 80.0, 124.0, 267.0, 581.0, 1038.0, 874.0, 372.0, 195.0, 112.0, 69.0, 49.0, 41.0, 27.0, 18.0, 20.0, 9.0, 7.0, 10.0, 6.0, 7.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.470703125, -3.346099853515625, -3.22149658203125, -3.096893310546875, -2.9722900390625, -2.847686767578125, -2.72308349609375, -2.598480224609375, -2.473876953125, -2.349273681640625, -2.22467041015625, -2.100067138671875, -1.9754638671875, -1.850860595703125, -1.72625732421875, -1.601654052734375, -1.47705078125, -1.352447509765625, -1.22784423828125, -1.103240966796875, -0.9786376953125, -0.854034423828125, -0.72943115234375, -0.604827880859375, -0.480224609375, -0.355621337890625, -0.23101806640625, -0.106414794921875, 0.0181884765625, 0.142791748046875, 0.26739501953125, 0.391998291015625, 0.5166015625, 0.641204833984375, 0.76580810546875, 0.890411376953125, 1.0150146484375, 1.139617919921875, 1.26422119140625, 1.388824462890625, 1.513427734375, 1.638031005859375, 1.76263427734375, 1.887237548828125, 2.0118408203125, 2.136444091796875, 2.26104736328125, 2.385650634765625, 2.51025390625, 2.634857177734375, 2.75946044921875, 2.884063720703125, 3.0086669921875, 3.133270263671875, 3.25787353515625, 3.382476806640625, 3.507080078125, 3.631683349609375, 3.75628662109375, 3.880889892578125, 4.0054931640625, 4.130096435546875, 4.25469970703125, 4.379302978515625, 4.50390625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 7.0, 7.0, 23.0, 77.0, 219.0, 320.0, 215.0, 72.0, 34.0, 12.0, 5.0, 4.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.67559814453125, -75.95823669433594, -74.24087524414062, -72.52352142333984, -70.80615997314453, -69.08879852294922, -67.37144470214844, -65.65408325195312, -63.93672180175781, -62.2193603515625, -60.50200271606445, -58.784645080566406, -57.067283630371094, -55.34992218017578, -53.632564544677734, -51.91520690917969, -50.197845458984375, -48.48048400878906, -46.763126373291016, -45.04576873779297, -43.328407287597656, -41.611045837402344, -39.8936882019043, -38.17633056640625, -36.45896911621094, -34.741607666015625, -33.02425003051758, -31.3068904876709, -29.58953094482422, -27.87217140197754, -26.15481185913086, -24.43745231628418, -22.720088958740234, -21.002729415893555, -19.285369873046875, -17.568010330200195, -15.850650787353516, -14.133291244506836, -12.415931701660156, -10.698572158813477, -8.981212615966797, -7.263853073120117, -5.5464935302734375, -3.829133987426758, -2.111774444580078, -0.39441490173339844, 1.3229446411132812, 3.040304183959961, 4.757663726806641, 6.47502326965332, 8.1923828125, 9.90974235534668, 11.62710189819336, 13.344461441040039, 15.061820983886719, 16.7791805267334, 18.496540069580078, 20.213899612426758, 21.931259155273438, 23.648618698120117, 25.365978240966797, 27.083337783813477, 28.800697326660156, 30.518056869506836, 32.235416412353516]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 7.0, 6.0, 6.0, 5.0, 11.0, 10.0, 16.0, 23.0, 19.0, 29.0, 29.0, 40.0, 29.0, 37.0, 37.0, 57.0, 50.0, 47.0, 61.0, 42.0, 40.0, 40.0, 53.0, 44.0, 34.0, 38.0, 30.0, 25.0, 22.0, 22.0, 15.0, 11.0, 14.0, 13.0, 7.0, 4.0, 7.0, 8.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-18.093931198120117, -17.575700759887695, -17.057470321655273, -16.53923988342285, -16.021011352539062, -15.502779960632324, -14.984550476074219, -14.466320037841797, -13.948089599609375, -13.429859161376953, -12.911628723144531, -12.393399238586426, -11.875168800354004, -11.356938362121582, -10.838708877563477, -10.320478439331055, -9.802248001098633, -9.284017562866211, -8.765787124633789, -8.247557640075684, -7.729327201843262, -7.21109676361084, -6.692866802215576, -6.1746368408203125, -5.656406402587891, -5.138175964355469, -4.619946002960205, -4.101716041564941, -3.5834856033325195, -3.0652554035186768, -2.547025203704834, -2.028795003890991, -1.5105648040771484, -0.9923346042633057, -0.4741044044494629, 0.04412579536437988, 0.5623559951782227, 1.0805861949920654, 1.5988163948059082, 2.117046594619751, 2.6352767944335938, 3.1535069942474365, 3.6717371940612793, 4.189967155456543, 4.708197593688965, 5.226428031921387, 5.74465799331665, 6.262887954711914, 6.781118392944336, 7.299348831176758, 7.8175787925720215, 8.335808753967285, 8.854039192199707, 9.372269630432129, 9.890499114990234, 10.408729553222656, 10.926959991455078, 11.4451904296875, 11.963420867919922, 12.481650352478027, 12.99988079071045, 13.518111228942871, 14.036340713500977, 14.554571151733398, 15.07280158996582]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 13.0, 15.0, 9.0, 15.0, 27.0, 38.0, 60.0, 72.0, 104.0, 160.0, 232.0, 298.0, 399.0, 582.0, 878.0, 1140.0, 1758.0, 2485.0, 3788.0, 5754.0, 9024.0, 14436.0, 23753.0, 41744.0, 79817.0, 179209.0, 324603.0, 174687.0, 78240.0, 40820.0, 23562.0, 14110.0, 8930.0, 5652.0, 3858.0, 2516.0, 1699.0, 1198.0, 842.0, 624.0, 401.0, 273.0, 226.0, 147.0, 106.0, 70.0, 53.0, 30.0, 42.0, 23.0, 11.0, 8.0, 9.0, 6.0, 1.0, 0.0, 5.0], "bins": [-1.8486328125, -1.793426513671875, -1.73822021484375, -1.683013916015625, -1.6278076171875, -1.572601318359375, -1.51739501953125, -1.462188720703125, -1.406982421875, -1.351776123046875, -1.29656982421875, -1.241363525390625, -1.1861572265625, -1.130950927734375, -1.07574462890625, -1.020538330078125, -0.96533203125, -0.910125732421875, -0.85491943359375, -0.799713134765625, -0.7445068359375, -0.689300537109375, -0.63409423828125, -0.578887939453125, -0.523681640625, -0.468475341796875, -0.41326904296875, -0.358062744140625, -0.3028564453125, -0.247650146484375, -0.19244384765625, -0.137237548828125, -0.08203125, -0.026824951171875, 0.02838134765625, 0.083587646484375, 0.1387939453125, 0.194000244140625, 0.24920654296875, 0.304412841796875, 0.359619140625, 0.414825439453125, 0.47003173828125, 0.525238037109375, 0.5804443359375, 0.635650634765625, 0.69085693359375, 0.746063232421875, 0.80126953125, 0.856475830078125, 0.91168212890625, 0.966888427734375, 1.0220947265625, 1.077301025390625, 1.13250732421875, 1.187713623046875, 1.242919921875, 1.298126220703125, 1.35333251953125, 1.408538818359375, 1.4637451171875, 1.518951416015625, 1.57415771484375, 1.629364013671875, 1.6845703125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 5.0, 2.0, 1.0, 5.0, 5.0, 5.0, 8.0, 12.0, 13.0, 15.0, 18.0, 20.0, 21.0, 19.0, 33.0, 15.0, 36.0, 24.0, 34.0, 33.0, 41.0, 27.0, 38.0, 47.0, 48.0, 39.0, 38.0, 43.0, 46.0, 29.0, 31.0, 29.0, 31.0, 24.0, 28.0, 16.0, 19.0, 27.0, 13.0, 12.0, 15.0, 7.0, 8.0, 3.0, 3.0, 4.0, 3.0, 7.0, 3.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0498046875, -1.016357421875, -0.98291015625, -0.949462890625, -0.916015625, -0.882568359375, -0.84912109375, -0.815673828125, -0.7822265625, -0.748779296875, -0.71533203125, -0.681884765625, -0.6484375, -0.614990234375, -0.58154296875, -0.548095703125, -0.5146484375, -0.481201171875, -0.44775390625, -0.414306640625, -0.380859375, -0.347412109375, -0.31396484375, -0.280517578125, -0.2470703125, -0.213623046875, -0.18017578125, -0.146728515625, -0.11328125, -0.079833984375, -0.04638671875, -0.012939453125, 0.0205078125, 0.053955078125, 0.08740234375, 0.120849609375, 0.154296875, 0.187744140625, 0.22119140625, 0.254638671875, 0.2880859375, 0.321533203125, 0.35498046875, 0.388427734375, 0.421875, 0.455322265625, 0.48876953125, 0.522216796875, 0.5556640625, 0.589111328125, 0.62255859375, 0.656005859375, 0.689453125, 0.722900390625, 0.75634765625, 0.789794921875, 0.8232421875, 0.856689453125, 0.89013671875, 0.923583984375, 0.95703125, 0.990478515625, 1.02392578125, 1.057373046875, 1.0908203125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 2.0, 4.0, 3.0, 8.0, 10.0, 14.0, 20.0, 28.0, 32.0, 52.0, 60.0, 94.0, 134.0, 199.0, 330.0, 498.0, 1040.0, 2233.0, 6248.0, 28877.0, 659312.0, 317935.0, 21697.0, 5279.0, 2045.0, 974.0, 503.0, 311.0, 194.0, 107.0, 89.0, 61.0, 34.0, 35.0, 23.0, 14.0, 15.0, 12.0, 6.0, 6.0, 2.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-8.0625, -7.8248291015625, -7.587158203125, -7.3494873046875, -7.11181640625, -6.8741455078125, -6.636474609375, -6.3988037109375, -6.1611328125, -5.9234619140625, -5.685791015625, -5.4481201171875, -5.21044921875, -4.9727783203125, -4.735107421875, -4.4974365234375, -4.259765625, -4.0220947265625, -3.784423828125, -3.5467529296875, -3.30908203125, -3.0714111328125, -2.833740234375, -2.5960693359375, -2.3583984375, -2.1207275390625, -1.883056640625, -1.6453857421875, -1.40771484375, -1.1700439453125, -0.932373046875, -0.6947021484375, -0.45703125, -0.2193603515625, 0.018310546875, 0.2559814453125, 0.49365234375, 0.7313232421875, 0.968994140625, 1.2066650390625, 1.4443359375, 1.6820068359375, 1.919677734375, 2.1573486328125, 2.39501953125, 2.6326904296875, 2.870361328125, 3.1080322265625, 3.345703125, 3.5833740234375, 3.821044921875, 4.0587158203125, 4.29638671875, 4.5340576171875, 4.771728515625, 5.0093994140625, 5.2470703125, 5.4847412109375, 5.722412109375, 5.9600830078125, 6.19775390625, 6.4354248046875, 6.673095703125, 6.9107666015625, 7.1484375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 5.0, 0.0, 3.0, 8.0, 1.0, 4.0, 8.0, 13.0, 29.0, 17.0, 27.0, 33.0, 30.0, 45.0, 64.0, 58.0, 53.0, 78.0, 67.0, 70.0, 54.0, 55.0, 51.0, 62.0, 39.0, 27.0, 19.0, 21.0, 15.0, 15.0, 13.0, 4.0, 6.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0], "bins": [-10.4375, -10.18902587890625, -9.9405517578125, -9.69207763671875, -9.443603515625, -9.19512939453125, -8.9466552734375, -8.69818115234375, -8.44970703125, -8.20123291015625, -7.9527587890625, -7.70428466796875, -7.455810546875, -7.20733642578125, -6.9588623046875, -6.71038818359375, -6.4619140625, -6.21343994140625, -5.9649658203125, -5.71649169921875, -5.468017578125, -5.21954345703125, -4.9710693359375, -4.72259521484375, -4.47412109375, -4.22564697265625, -3.9771728515625, -3.72869873046875, -3.480224609375, -3.23175048828125, -2.9832763671875, -2.73480224609375, -2.486328125, -2.23785400390625, -1.9893798828125, -1.74090576171875, -1.492431640625, -1.24395751953125, -0.9954833984375, -0.74700927734375, -0.49853515625, -0.25006103515625, -0.0015869140625, 0.24688720703125, 0.495361328125, 0.74383544921875, 0.9923095703125, 1.24078369140625, 1.4892578125, 1.73773193359375, 1.9862060546875, 2.23468017578125, 2.483154296875, 2.73162841796875, 2.9801025390625, 3.22857666015625, 3.47705078125, 3.72552490234375, 3.9739990234375, 4.22247314453125, 4.470947265625, 4.71942138671875, 4.9678955078125, 5.21636962890625, 5.46484375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 8.0, 5.0, 12.0, 6.0, 15.0, 26.0, 26.0, 31.0, 66.0, 81.0, 119.0, 201.0, 272.0, 494.0, 880.0, 1518.0, 2940.0, 6568.0, 18152.0, 78460.0, 685466.0, 201793.0, 32453.0, 9967.0, 4148.0, 2033.0, 1086.0, 648.0, 383.0, 225.0, 149.0, 94.0, 74.0, 51.0, 16.0, 26.0, 17.0, 12.0, 12.0, 5.0, 5.0, 4.0, 2.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.95703125, -1.8990020751953125, -1.840972900390625, -1.7829437255859375, -1.72491455078125, -1.6668853759765625, -1.608856201171875, -1.5508270263671875, -1.4927978515625, -1.4347686767578125, -1.376739501953125, -1.3187103271484375, -1.26068115234375, -1.2026519775390625, -1.144622802734375, -1.0865936279296875, -1.028564453125, -0.9705352783203125, -0.912506103515625, -0.8544769287109375, -0.79644775390625, -0.7384185791015625, -0.680389404296875, -0.6223602294921875, -0.5643310546875, -0.5063018798828125, -0.448272705078125, -0.3902435302734375, -0.33221435546875, -0.2741851806640625, -0.216156005859375, -0.1581268310546875, -0.10009765625, -0.0420684814453125, 0.015960693359375, 0.0739898681640625, 0.13201904296875, 0.1900482177734375, 0.248077392578125, 0.3061065673828125, 0.3641357421875, 0.4221649169921875, 0.480194091796875, 0.5382232666015625, 0.59625244140625, 0.6542816162109375, 0.712310791015625, 0.7703399658203125, 0.828369140625, 0.8863983154296875, 0.944427490234375, 1.0024566650390625, 1.06048583984375, 1.1185150146484375, 1.176544189453125, 1.2345733642578125, 1.2926025390625, 1.3506317138671875, 1.408660888671875, 1.4666900634765625, 1.52471923828125, 1.5827484130859375, 1.640777587890625, 1.6988067626953125, 1.7568359375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 7.0, 6.0, 16.0, 24.0, 34.0, 83.0, 206.0, 364.0, 129.0, 55.0, 19.0, 12.0, 14.0, 8.0, 6.0, 1.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0011920928955078125, -0.001151353120803833, -0.0011106133460998535, -0.001069873571395874, -0.0010291337966918945, -0.000988394021987915, -0.0009476542472839355, -0.0009069144725799561, -0.0008661746978759766, -0.0008254349231719971, -0.0007846951484680176, -0.0007439553737640381, -0.0007032155990600586, -0.0006624758243560791, -0.0006217360496520996, -0.0005809962749481201, -0.0005402565002441406, -0.0004995167255401611, -0.00045877695083618164, -0.00041803717613220215, -0.00037729740142822266, -0.00033655762672424316, -0.00029581785202026367, -0.0002550780773162842, -0.0002143383026123047, -0.0001735985279083252, -0.0001328587532043457, -9.211897850036621e-05, -5.137920379638672e-05, -1.0639429092407227e-05, 3.0100345611572266e-05, 7.084012031555176e-05, 0.00011157989501953125, 0.00015231966972351074, 0.00019305944442749023, 0.00023379921913146973, 0.0002745389938354492, 0.0003152787685394287, 0.0003560185432434082, 0.0003967583179473877, 0.0004374980926513672, 0.0004782378673553467, 0.0005189776420593262, 0.0005597174167633057, 0.0006004571914672852, 0.0006411969661712646, 0.0006819367408752441, 0.0007226765155792236, 0.0007634162902832031, 0.0008041560649871826, 0.0008448958396911621, 0.0008856356143951416, 0.0009263753890991211, 0.0009671151638031006, 0.00100785493850708, 0.0010485947132110596, 0.001089334487915039, 0.0011300742626190186, 0.001170814037322998, 0.0012115538120269775, 0.001252293586730957, 0.0012930333614349365, 0.001333773136138916, 0.0013745129108428955, 0.001415252685546875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 0.0, 2.0, 5.0, 6.0, 1.0, 15.0, 14.0, 16.0, 21.0, 39.0, 47.0, 64.0, 114.0, 194.0, 267.0, 460.0, 850.0, 1736.0, 4378.0, 14108.0, 83214.0, 729579.0, 179558.0, 22883.0, 6002.0, 2378.0, 1034.0, 599.0, 348.0, 204.0, 124.0, 86.0, 78.0, 44.0, 28.0, 14.0, 14.0, 10.0, 10.0, 8.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.146484375, -2.0827178955078125, -2.018951416015625, -1.9551849365234375, -1.89141845703125, -1.8276519775390625, -1.763885498046875, -1.7001190185546875, -1.6363525390625, -1.5725860595703125, -1.508819580078125, -1.4450531005859375, -1.38128662109375, -1.3175201416015625, -1.253753662109375, -1.1899871826171875, -1.126220703125, -1.0624542236328125, -0.998687744140625, -0.9349212646484375, -0.87115478515625, -0.8073883056640625, -0.743621826171875, -0.6798553466796875, -0.6160888671875, -0.5523223876953125, -0.488555908203125, -0.4247894287109375, -0.36102294921875, -0.2972564697265625, -0.233489990234375, -0.1697235107421875, -0.10595703125, -0.0421905517578125, 0.021575927734375, 0.0853424072265625, 0.14910888671875, 0.2128753662109375, 0.276641845703125, 0.3404083251953125, 0.4041748046875, 0.4679412841796875, 0.531707763671875, 0.5954742431640625, 0.65924072265625, 0.7230072021484375, 0.786773681640625, 0.8505401611328125, 0.914306640625, 0.9780731201171875, 1.041839599609375, 1.1056060791015625, 1.16937255859375, 1.2331390380859375, 1.296905517578125, 1.3606719970703125, 1.4244384765625, 1.4882049560546875, 1.551971435546875, 1.6157379150390625, 1.67950439453125, 1.7432708740234375, 1.807037353515625, 1.8708038330078125, 1.9345703125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 4.0, 1.0, 1.0, 4.0, 3.0, 7.0, 6.0, 6.0, 11.0, 13.0, 14.0, 12.0, 14.0, 22.0, 29.0, 35.0, 37.0, 48.0, 51.0, 57.0, 70.0, 71.0, 74.0, 70.0, 55.0, 51.0, 45.0, 32.0, 33.0, 17.0, 14.0, 18.0, 11.0, 10.0, 10.0, 8.0, 13.0, 5.0, 4.0, 4.0, 4.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3505859375, -1.3050384521484375, -1.259490966796875, -1.2139434814453125, -1.16839599609375, -1.1228485107421875, -1.077301025390625, -1.0317535400390625, -0.9862060546875, -0.9406585693359375, -0.895111083984375, -0.8495635986328125, -0.80401611328125, -0.7584686279296875, -0.712921142578125, -0.6673736572265625, -0.621826171875, -0.5762786865234375, -0.530731201171875, -0.4851837158203125, -0.43963623046875, -0.3940887451171875, -0.348541259765625, -0.3029937744140625, -0.2574462890625, -0.2118988037109375, -0.166351318359375, -0.1208038330078125, -0.07525634765625, -0.0297088623046875, 0.015838623046875, 0.0613861083984375, 0.10693359375, 0.1524810791015625, 0.198028564453125, 0.2435760498046875, 0.28912353515625, 0.3346710205078125, 0.380218505859375, 0.4257659912109375, 0.4713134765625, 0.5168609619140625, 0.562408447265625, 0.6079559326171875, 0.65350341796875, 0.6990509033203125, 0.744598388671875, 0.7901458740234375, 0.835693359375, 0.8812408447265625, 0.926788330078125, 0.9723358154296875, 1.01788330078125, 1.0634307861328125, 1.108978271484375, 1.1545257568359375, 1.2000732421875, 1.2456207275390625, 1.291168212890625, 1.3367156982421875, 1.38226318359375, 1.4278106689453125, 1.473358154296875, 1.5189056396484375, 1.564453125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 8.0, 18.0, 23.0, 49.0, 131.0, 214.0, 235.0, 128.0, 97.0, 39.0, 25.0, 11.0, 5.0, 4.0, 6.0, 2.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-66.17965698242188, -64.53168487548828, -62.88371276855469, -61.235740661621094, -59.587764739990234, -57.93979263305664, -56.29182052612305, -54.64384841918945, -52.99587631225586, -51.347904205322266, -49.69993209838867, -48.05195617675781, -46.40398406982422, -44.756011962890625, -43.10803985595703, -41.46006774902344, -39.812095642089844, -38.16412353515625, -36.516151428222656, -34.86817932128906, -33.2202033996582, -31.57223129272461, -29.924259185791016, -28.276287078857422, -26.628311157226562, -24.98033905029297, -23.332365036010742, -21.68439292907715, -20.036420822143555, -18.388446807861328, -16.740474700927734, -15.09250259399414, -13.444530487060547, -11.796557426452637, -10.148585319519043, -8.500612258911133, -6.852639675140381, -5.204667091369629, -3.5566940307617188, -1.908721923828125, -0.26074886322021484, 1.3872238397598267, 3.035196542739868, 4.683169364929199, 6.331141948699951, 7.979114532470703, 9.627087593078613, 11.275059700012207, 12.923032760620117, 14.571005821228027, 16.218978881835938, 17.86695098876953, 19.514923095703125, 21.16289520263672, 22.810869216918945, 24.45884132385254, 26.106815338134766, 27.75478744506836, 29.402761459350586, 31.05073356628418, 32.698707580566406, 34.3466796875, 35.994651794433594, 37.64262390136719, 39.29059600830078]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 3.0, 0.0, 6.0, 4.0, 3.0, 2.0, 5.0, 6.0, 9.0, 12.0, 13.0, 19.0, 12.0, 10.0, 21.0, 19.0, 29.0, 24.0, 35.0, 40.0, 33.0, 33.0, 65.0, 44.0, 56.0, 53.0, 47.0, 34.0, 51.0, 33.0, 35.0, 24.0, 23.0, 21.0, 19.0, 27.0, 17.0, 14.0, 25.0, 15.0, 6.0, 11.0, 10.0, 8.0, 3.0, 12.0, 5.0, 5.0, 1.0, 4.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.765743255615234, -18.12302017211914, -17.480297088623047, -16.837574005126953, -16.19485092163086, -15.552127838134766, -14.909404754638672, -14.266681671142578, -13.623958587646484, -12.98123550415039, -12.338512420654297, -11.695789337158203, -11.05306625366211, -10.410343170166016, -9.767620086669922, -9.124897003173828, -8.482172966003418, -7.839449882507324, -7.1967267990112305, -6.554003715515137, -5.911280632019043, -5.268557548522949, -4.625833988189697, -3.9831109046936035, -3.3403878211975098, -2.697664737701416, -2.0549416542053223, -1.4122183322906494, -0.7694952487945557, -0.12677216529846191, 0.5159511566162109, 1.1586742401123047, 1.8013973236083984, 2.444120407104492, 3.086843490600586, 3.729566812515259, 4.372289657592773, 5.015012741088867, 5.657736301422119, 6.300459384918213, 6.943182468414307, 7.5859055519104, 8.228629112243652, 8.871352195739746, 9.51407527923584, 10.156798362731934, 10.799521446228027, 11.442244529724121, 12.084967613220215, 12.727690696716309, 13.370413780212402, 14.013136863708496, 14.65585994720459, 15.298583030700684, 15.941307067871094, 16.584030151367188, 17.22675323486328, 17.869476318359375, 18.51219940185547, 19.154922485351562, 19.797645568847656, 20.44036865234375, 21.083091735839844, 21.725814819335938, 22.36853790283203]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 3.0, 6.0, 5.0, 4.0, 3.0, 12.0, 14.0, 26.0, 18.0, 13.0, 22.0, 35.0, 51.0, 55.0, 86.0, 126.0, 197.0, 575.0, 5587.0, 3199142.0, 983234.0, 3989.0, 469.0, 181.0, 103.0, 83.0, 55.0, 44.0, 41.0, 25.0, 19.0, 12.0, 13.0, 10.0, 10.0, 4.0, 4.0, 3.0, 1.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.984375, -10.6175537109375, -10.250732421875, -9.8839111328125, -9.51708984375, -9.1502685546875, -8.783447265625, -8.4166259765625, -8.0498046875, -7.6829833984375, -7.316162109375, -6.9493408203125, -6.58251953125, -6.2156982421875, -5.848876953125, -5.4820556640625, -5.115234375, -4.7484130859375, -4.381591796875, -4.0147705078125, -3.64794921875, -3.2811279296875, -2.914306640625, -2.5474853515625, -2.1806640625, -1.8138427734375, -1.447021484375, -1.0802001953125, -0.71337890625, -0.3465576171875, 0.020263671875, 0.3870849609375, 0.75390625, 1.1207275390625, 1.487548828125, 1.8543701171875, 2.22119140625, 2.5880126953125, 2.954833984375, 3.3216552734375, 3.6884765625, 4.0552978515625, 4.422119140625, 4.7889404296875, 5.15576171875, 5.5225830078125, 5.889404296875, 6.2562255859375, 6.623046875, 6.9898681640625, 7.356689453125, 7.7235107421875, 8.09033203125, 8.4571533203125, 8.823974609375, 9.1907958984375, 9.5576171875, 9.9244384765625, 10.291259765625, 10.6580810546875, 11.02490234375, 11.3917236328125, 11.758544921875, 12.1253662109375, 12.4921875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 8.0, 9.0, 17.0, 17.0, 16.0, 21.0, 36.0, 34.0, 41.0, 53.0, 45.0, 72.0, 61.0, 49.0, 57.0, 57.0, 55.0, 65.0, 51.0, 52.0, 32.0, 29.0, 28.0, 31.0, 9.0, 16.0, 8.0, 10.0, 7.0, 6.0, 8.0, 1.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5263671875, -1.4760894775390625, -1.425811767578125, -1.3755340576171875, -1.32525634765625, -1.2749786376953125, -1.224700927734375, -1.1744232177734375, -1.1241455078125, -1.0738677978515625, -1.023590087890625, -0.9733123779296875, -0.92303466796875, -0.8727569580078125, -0.822479248046875, -0.7722015380859375, -0.721923828125, -0.6716461181640625, -0.621368408203125, -0.5710906982421875, -0.52081298828125, -0.4705352783203125, -0.420257568359375, -0.3699798583984375, -0.3197021484375, -0.2694244384765625, -0.219146728515625, -0.1688690185546875, -0.11859130859375, -0.0683135986328125, -0.018035888671875, 0.0322418212890625, 0.08251953125, 0.1327972412109375, 0.183074951171875, 0.2333526611328125, 0.28363037109375, 0.3339080810546875, 0.384185791015625, 0.4344635009765625, 0.4847412109375, 0.5350189208984375, 0.585296630859375, 0.6355743408203125, 0.68585205078125, 0.7361297607421875, 0.786407470703125, 0.8366851806640625, 0.886962890625, 0.9372406005859375, 0.987518310546875, 1.0377960205078125, 1.08807373046875, 1.1383514404296875, 1.188629150390625, 1.2389068603515625, 1.2891845703125, 1.3394622802734375, 1.389739990234375, 1.4400177001953125, 1.49029541015625, 1.5405731201171875, 1.590850830078125, 1.6411285400390625, 1.69140625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 5.0, 10.0, 21.0, 21.0, 41.0, 60.0, 109.0, 144.0, 237.0, 357.0, 575.0, 1034.0, 1838.0, 3635.0, 7745.0, 18653.0, 55857.0, 311423.0, 3188316.0, 492516.0, 70999.0, 22196.0, 8970.0, 4240.0, 2122.0, 1192.0, 723.0, 412.0, 280.0, 180.0, 102.0, 82.0, 63.0, 49.0, 16.0, 12.0, 11.0, 11.0, 8.0, 5.0, 7.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.390625, -3.2896728515625, -3.188720703125, -3.0877685546875, -2.98681640625, -2.8858642578125, -2.784912109375, -2.6839599609375, -2.5830078125, -2.4820556640625, -2.381103515625, -2.2801513671875, -2.17919921875, -2.0782470703125, -1.977294921875, -1.8763427734375, -1.775390625, -1.6744384765625, -1.573486328125, -1.4725341796875, -1.37158203125, -1.2706298828125, -1.169677734375, -1.0687255859375, -0.9677734375, -0.8668212890625, -0.765869140625, -0.6649169921875, -0.56396484375, -0.4630126953125, -0.362060546875, -0.2611083984375, -0.16015625, -0.0592041015625, 0.041748046875, 0.1427001953125, 0.24365234375, 0.3446044921875, 0.445556640625, 0.5465087890625, 0.6474609375, 0.7484130859375, 0.849365234375, 0.9503173828125, 1.05126953125, 1.1522216796875, 1.253173828125, 1.3541259765625, 1.455078125, 1.5560302734375, 1.656982421875, 1.7579345703125, 1.85888671875, 1.9598388671875, 2.060791015625, 2.1617431640625, 2.2626953125, 2.3636474609375, 2.464599609375, 2.5655517578125, 2.66650390625, 2.7674560546875, 2.868408203125, 2.9693603515625, 3.0703125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 11.0, 9.0, 8.0, 9.0, 12.0, 14.0, 23.0, 29.0, 63.0, 85.0, 136.0, 317.0, 702.0, 1152.0, 739.0, 319.0, 157.0, 97.0, 50.0, 38.0, 25.0, 16.0, 14.0, 17.0, 5.0, 5.0, 5.0, 6.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.3046875, -4.15887451171875, -4.0130615234375, -3.86724853515625, -3.721435546875, -3.57562255859375, -3.4298095703125, -3.28399658203125, -3.13818359375, -2.99237060546875, -2.8465576171875, -2.70074462890625, -2.554931640625, -2.40911865234375, -2.2633056640625, -2.11749267578125, -1.9716796875, -1.82586669921875, -1.6800537109375, -1.53424072265625, -1.388427734375, -1.24261474609375, -1.0968017578125, -0.95098876953125, -0.80517578125, -0.65936279296875, -0.5135498046875, -0.36773681640625, -0.221923828125, -0.07611083984375, 0.0697021484375, 0.21551513671875, 0.361328125, 0.50714111328125, 0.6529541015625, 0.79876708984375, 0.944580078125, 1.09039306640625, 1.2362060546875, 1.38201904296875, 1.52783203125, 1.67364501953125, 1.8194580078125, 1.96527099609375, 2.111083984375, 2.25689697265625, 2.4027099609375, 2.54852294921875, 2.6943359375, 2.84014892578125, 2.9859619140625, 3.13177490234375, 3.277587890625, 3.42340087890625, 3.5692138671875, 3.71502685546875, 3.86083984375, 4.00665283203125, 4.1524658203125, 4.29827880859375, 4.444091796875, 4.58990478515625, 4.7357177734375, 4.88153076171875, 5.02734375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 3.0, 8.0, 15.0, 36.0, 86.0, 177.0, 256.0, 212.0, 106.0, 45.0, 23.0, 16.0, 12.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.385852813720703, -20.845966339111328, -19.306079864501953, -17.766191482543945, -16.22630500793457, -14.686418533325195, -13.146531105041504, -11.606643676757812, -10.066757202148438, -8.526870727539062, -6.986983299255371, -5.447096347808838, -3.9072093963623047, -2.3673224449157715, -0.8274354934692383, 0.7124519348144531, 2.252338409423828, 3.7922253608703613, 5.3321123123168945, 6.871999263763428, 8.411886215209961, 9.951772689819336, 11.491660118103027, 13.031547546386719, 14.571434020996094, 16.11132049560547, 17.651206970214844, 19.19109535217285, 20.730981826782227, 22.2708683013916, 23.81075668334961, 25.350643157958984, 26.890533447265625, 28.430419921875, 29.970306396484375, 31.510194778442383, 33.050079345703125, 34.589969635009766, 36.12985610961914, 37.669742584228516, 39.20962905883789, 40.749515533447266, 42.28940200805664, 43.829288482666016, 45.369178771972656, 46.90906524658203, 48.448951721191406, 49.98883819580078, 51.528724670410156, 53.06861114501953, 54.608497619628906, 56.14838409423828, 57.688270568847656, 59.2281608581543, 60.76804733276367, 62.30793380737305, 63.84782028198242, 65.38771057128906, 66.92759704589844, 68.46748352050781, 70.00736999511719, 71.54725646972656, 73.08714294433594, 74.62702941894531, 76.16691589355469]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 3.0, 2.0, 7.0, 4.0, 10.0, 11.0, 8.0, 14.0, 16.0, 26.0, 13.0, 28.0, 41.0, 24.0, 36.0, 38.0, 31.0, 46.0, 52.0, 44.0, 44.0, 42.0, 51.0, 55.0, 38.0, 49.0, 33.0, 37.0, 34.0, 28.0, 22.0, 28.0, 15.0, 14.0, 19.0, 13.0, 11.0, 6.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.111093521118164, -15.549979209899902, -14.98886489868164, -14.427750587463379, -13.866636276245117, -13.305522918701172, -12.74440860748291, -12.183294296264648, -11.622179985046387, -11.061065673828125, -10.499951362609863, -9.938837051391602, -9.377723693847656, -8.816608428955078, -8.255495071411133, -7.694380760192871, -7.133266448974609, -6.572152137756348, -6.011037826538086, -5.449923992156982, -4.888809680938721, -4.327695369720459, -3.7665812969207764, -3.2054672241210938, -2.644352912902832, -2.0832386016845703, -1.5221245288848877, -0.9610103368759155, -0.39989614486694336, 0.16121816635131836, 0.722332239151001, 1.2834463119506836, 1.8445625305175781, 2.40567684173584, 2.9667909145355225, 3.527904987335205, 4.089019298553467, 4.6501336097717285, 5.211247444152832, 5.772361755371094, 6.3334760665893555, 6.894590377807617, 7.455704689025879, 8.01681900024414, 8.577932357788086, 9.139047622680664, 9.70016098022461, 10.261275291442871, 10.822389602661133, 11.383503913879395, 11.944618225097656, 12.505732536315918, 13.06684684753418, 13.627960205078125, 14.189074516296387, 14.750188827514648, 15.31130313873291, 15.872417449951172, 16.433530807495117, 16.994646072387695, 17.55575942993164, 18.11687469482422, 18.677988052368164, 19.23910140991211, 19.800216674804688]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 6.0, 6.0, 5.0, 6.0, 10.0, 22.0, 30.0, 52.0, 55.0, 87.0, 138.0, 216.0, 387.0, 597.0, 1046.0, 1781.0, 3101.0, 5704.0, 11377.0, 24563.0, 63904.0, 222277.0, 470969.0, 153130.0, 48450.0, 20002.0, 9383.0, 4831.0, 2643.0, 1495.0, 879.0, 555.0, 303.0, 203.0, 131.0, 74.0, 40.0, 31.0, 24.0, 19.0, 11.0, 8.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-2.923828125, -2.8387451171875, -2.753662109375, -2.6685791015625, -2.58349609375, -2.4984130859375, -2.413330078125, -2.3282470703125, -2.2431640625, -2.1580810546875, -2.072998046875, -1.9879150390625, -1.90283203125, -1.8177490234375, -1.732666015625, -1.6475830078125, -1.5625, -1.4774169921875, -1.392333984375, -1.3072509765625, -1.22216796875, -1.1370849609375, -1.052001953125, -0.9669189453125, -0.8818359375, -0.7967529296875, -0.711669921875, -0.6265869140625, -0.54150390625, -0.4564208984375, -0.371337890625, -0.2862548828125, -0.201171875, -0.1160888671875, -0.031005859375, 0.0540771484375, 0.13916015625, 0.2242431640625, 0.309326171875, 0.3944091796875, 0.4794921875, 0.5645751953125, 0.649658203125, 0.7347412109375, 0.81982421875, 0.9049072265625, 0.989990234375, 1.0750732421875, 1.16015625, 1.2452392578125, 1.330322265625, 1.4154052734375, 1.50048828125, 1.5855712890625, 1.670654296875, 1.7557373046875, 1.8408203125, 1.9259033203125, 2.010986328125, 2.0960693359375, 2.18115234375, 2.2662353515625, 2.351318359375, 2.4364013671875, 2.521484375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 7.0, 7.0, 13.0, 17.0, 11.0, 17.0, 27.0, 30.0, 26.0, 37.0, 37.0, 54.0, 49.0, 46.0, 49.0, 59.0, 41.0, 56.0, 57.0, 46.0, 40.0, 58.0, 38.0, 39.0, 22.0, 16.0, 33.0, 16.0, 17.0, 8.0, 14.0, 3.0, 5.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.095703125, -1.046844482421875, -0.99798583984375, -0.949127197265625, -0.9002685546875, -0.851409912109375, -0.80255126953125, -0.753692626953125, -0.704833984375, -0.655975341796875, -0.60711669921875, -0.558258056640625, -0.5093994140625, -0.460540771484375, -0.41168212890625, -0.362823486328125, -0.31396484375, -0.265106201171875, -0.21624755859375, -0.167388916015625, -0.1185302734375, -0.069671630859375, -0.02081298828125, 0.028045654296875, 0.076904296875, 0.125762939453125, 0.17462158203125, 0.223480224609375, 0.2723388671875, 0.321197509765625, 0.37005615234375, 0.418914794921875, 0.4677734375, 0.516632080078125, 0.56549072265625, 0.614349365234375, 0.6632080078125, 0.712066650390625, 0.76092529296875, 0.809783935546875, 0.858642578125, 0.907501220703125, 0.95635986328125, 1.005218505859375, 1.0540771484375, 1.102935791015625, 1.15179443359375, 1.200653076171875, 1.24951171875, 1.298370361328125, 1.34722900390625, 1.396087646484375, 1.4449462890625, 1.493804931640625, 1.54266357421875, 1.591522216796875, 1.640380859375, 1.689239501953125, 1.73809814453125, 1.786956787109375, 1.8358154296875, 1.884674072265625, 1.93353271484375, 1.982391357421875, 2.03125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 2.0, 5.0, 2.0, 5.0, 10.0, 9.0, 24.0, 27.0, 46.0, 42.0, 79.0, 100.0, 169.0, 229.0, 396.0, 753.0, 1524.0, 3672.0, 11665.0, 53397.0, 699518.0, 235929.0, 28377.0, 7293.0, 2566.0, 1102.0, 612.0, 337.0, 209.0, 139.0, 93.0, 53.0, 44.0, 35.0, 24.0, 18.0, 13.0, 13.0, 8.0, 8.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.140625, -5.95904541015625, -5.7774658203125, -5.59588623046875, -5.414306640625, -5.23272705078125, -5.0511474609375, -4.86956787109375, -4.68798828125, -4.50640869140625, -4.3248291015625, -4.14324951171875, -3.961669921875, -3.78009033203125, -3.5985107421875, -3.41693115234375, -3.2353515625, -3.05377197265625, -2.8721923828125, -2.69061279296875, -2.509033203125, -2.32745361328125, -2.1458740234375, -1.96429443359375, -1.78271484375, -1.60113525390625, -1.4195556640625, -1.23797607421875, -1.056396484375, -0.87481689453125, -0.6932373046875, -0.51165771484375, -0.330078125, -0.14849853515625, 0.0330810546875, 0.21466064453125, 0.396240234375, 0.57781982421875, 0.7593994140625, 0.94097900390625, 1.12255859375, 1.30413818359375, 1.4857177734375, 1.66729736328125, 1.848876953125, 2.03045654296875, 2.2120361328125, 2.39361572265625, 2.5751953125, 2.75677490234375, 2.9383544921875, 3.11993408203125, 3.301513671875, 3.48309326171875, 3.6646728515625, 3.84625244140625, 4.02783203125, 4.20941162109375, 4.3909912109375, 4.57257080078125, 4.754150390625, 4.93572998046875, 5.1173095703125, 5.29888916015625, 5.48046875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 5.0, 3.0, 2.0, 2.0, 7.0, 6.0, 14.0, 13.0, 15.0, 25.0, 16.0, 32.0, 50.0, 33.0, 52.0, 57.0, 53.0, 60.0, 58.0, 62.0, 71.0, 50.0, 49.0, 45.0, 49.0, 32.0, 32.0, 19.0, 19.0, 17.0, 13.0, 6.0, 10.0, 7.0, 1.0, 5.0, 2.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.12109375, -6.8922119140625, -6.663330078125, -6.4344482421875, -6.20556640625, -5.9766845703125, -5.747802734375, -5.5189208984375, -5.2900390625, -5.0611572265625, -4.832275390625, -4.6033935546875, -4.37451171875, -4.1456298828125, -3.916748046875, -3.6878662109375, -3.458984375, -3.2301025390625, -3.001220703125, -2.7723388671875, -2.54345703125, -2.3145751953125, -2.085693359375, -1.8568115234375, -1.6279296875, -1.3990478515625, -1.170166015625, -0.9412841796875, -0.71240234375, -0.4835205078125, -0.254638671875, -0.0257568359375, 0.203125, 0.4320068359375, 0.660888671875, 0.8897705078125, 1.11865234375, 1.3475341796875, 1.576416015625, 1.8052978515625, 2.0341796875, 2.2630615234375, 2.491943359375, 2.7208251953125, 2.94970703125, 3.1785888671875, 3.407470703125, 3.6363525390625, 3.865234375, 4.0941162109375, 4.322998046875, 4.5518798828125, 4.78076171875, 5.0096435546875, 5.238525390625, 5.4674072265625, 5.6962890625, 5.9251708984375, 6.154052734375, 6.3829345703125, 6.61181640625, 6.8406982421875, 7.069580078125, 7.2984619140625, 7.52734375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 14.0, 10.0, 16.0, 26.0, 39.0, 45.0, 81.0, 157.0, 319.0, 645.0, 1825.0, 6706.0, 36717.0, 556489.0, 403622.0, 32648.0, 6104.0, 1739.0, 666.0, 261.0, 170.0, 91.0, 55.0, 36.0, 26.0, 12.0, 8.0, 2.0, 4.0, 6.0, 3.0, 4.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.02734375, -2.940765380859375, -2.85418701171875, -2.767608642578125, -2.6810302734375, -2.594451904296875, -2.50787353515625, -2.421295166015625, -2.334716796875, -2.248138427734375, -2.16156005859375, -2.074981689453125, -1.9884033203125, -1.901824951171875, -1.81524658203125, -1.728668212890625, -1.64208984375, -1.555511474609375, -1.46893310546875, -1.382354736328125, -1.2957763671875, -1.209197998046875, -1.12261962890625, -1.036041259765625, -0.949462890625, -0.862884521484375, -0.77630615234375, -0.689727783203125, -0.6031494140625, -0.516571044921875, -0.42999267578125, -0.343414306640625, -0.2568359375, -0.170257568359375, -0.08367919921875, 0.002899169921875, 0.0894775390625, 0.176055908203125, 0.26263427734375, 0.349212646484375, 0.435791015625, 0.522369384765625, 0.60894775390625, 0.695526123046875, 0.7821044921875, 0.868682861328125, 0.95526123046875, 1.041839599609375, 1.12841796875, 1.214996337890625, 1.30157470703125, 1.388153076171875, 1.4747314453125, 1.561309814453125, 1.64788818359375, 1.734466552734375, 1.821044921875, 1.907623291015625, 1.99420166015625, 2.080780029296875, 2.1673583984375, 2.253936767578125, 2.34051513671875, 2.427093505859375, 2.513671875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 4.0, 6.0, 2.0, 9.0, 10.0, 6.0, 14.0, 14.0, 17.0, 20.0, 41.0, 49.0, 60.0, 105.0, 126.0, 125.0, 111.0, 63.0, 38.0, 37.0, 25.0, 20.0, 16.0, 20.0, 14.0, 8.0, 6.0, 8.0, 3.0, 4.0, 0.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003972053527832031, -0.00038359686732292175, -0.0003699883818626404, -0.000356379896402359, -0.00034277141094207764, -0.00032916292548179626, -0.0003155544400215149, -0.0003019459545612335, -0.00028833746910095215, -0.0002747289836406708, -0.0002611204981803894, -0.00024751201272010803, -0.00023390352725982666, -0.0002202950417995453, -0.00020668655633926392, -0.00019307807087898254, -0.00017946958541870117, -0.0001658610999584198, -0.00015225261449813843, -0.00013864412903785706, -0.00012503564357757568, -0.00011142715811729431, -9.781867265701294e-05, -8.421018719673157e-05, -7.06017017364502e-05, -5.699321627616882e-05, -4.338473081588745e-05, -2.977624535560608e-05, -1.6167759895324707e-05, -2.559274435043335e-06, 1.1049211025238037e-05, 2.465769648551941e-05, 3.826618194580078e-05, 5.187466740608215e-05, 6.548315286636353e-05, 7.90916383266449e-05, 9.270012378692627e-05, 0.00010630860924720764, 0.00011991709470748901, 0.00013352558016777039, 0.00014713406562805176, 0.00016074255108833313, 0.0001743510365486145, 0.00018795952200889587, 0.00020156800746917725, 0.00021517649292945862, 0.00022878497838974, 0.00024239346385002136, 0.00025600194931030273, 0.0002696104347705841, 0.0002832189202308655, 0.00029682740569114685, 0.0003104358911514282, 0.0003240443766117096, 0.00033765286207199097, 0.00035126134753227234, 0.0003648698329925537, 0.0003784783184528351, 0.00039208680391311646, 0.00040569528937339783, 0.0004193037748336792, 0.00043291226029396057, 0.00044652074575424194, 0.0004601292312145233, 0.0004737377166748047]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 3.0, 11.0, 7.0, 10.0, 18.0, 18.0, 26.0, 49.0, 81.0, 114.0, 167.0, 251.0, 389.0, 666.0, 1119.0, 2227.0, 4733.0, 12359.0, 41078.0, 193636.0, 606639.0, 135305.0, 31085.0, 10000.0, 4059.0, 1901.0, 1016.0, 555.0, 352.0, 206.0, 154.0, 93.0, 53.0, 51.0, 34.0, 23.0, 21.0, 7.0, 13.0, 8.0, 5.0, 2.0, 1.0, 6.0, 6.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.7109375, -1.66259765625, -1.6142578125, -1.56591796875, -1.517578125, -1.46923828125, -1.4208984375, -1.37255859375, -1.32421875, -1.27587890625, -1.2275390625, -1.17919921875, -1.130859375, -1.08251953125, -1.0341796875, -0.98583984375, -0.9375, -0.88916015625, -0.8408203125, -0.79248046875, -0.744140625, -0.69580078125, -0.6474609375, -0.59912109375, -0.55078125, -0.50244140625, -0.4541015625, -0.40576171875, -0.357421875, -0.30908203125, -0.2607421875, -0.21240234375, -0.1640625, -0.11572265625, -0.0673828125, -0.01904296875, 0.029296875, 0.07763671875, 0.1259765625, 0.17431640625, 0.22265625, 0.27099609375, 0.3193359375, 0.36767578125, 0.416015625, 0.46435546875, 0.5126953125, 0.56103515625, 0.609375, 0.65771484375, 0.7060546875, 0.75439453125, 0.802734375, 0.85107421875, 0.8994140625, 0.94775390625, 0.99609375, 1.04443359375, 1.0927734375, 1.14111328125, 1.189453125, 1.23779296875, 1.2861328125, 1.33447265625, 1.3828125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 11.0, 16.0, 11.0, 24.0, 23.0, 40.0, 37.0, 52.0, 78.0, 91.0, 90.0, 106.0, 85.0, 75.0, 78.0, 41.0, 42.0, 28.0, 24.0, 19.0, 9.0, 8.0, 6.0, 3.0, 7.0, 2.0, 3.0, 2.0], "bins": [-3.0390625, -2.9748687744140625, -2.910675048828125, -2.8464813232421875, -2.78228759765625, -2.7180938720703125, -2.653900146484375, -2.5897064208984375, -2.5255126953125, -2.4613189697265625, -2.397125244140625, -2.3329315185546875, -2.26873779296875, -2.2045440673828125, -2.140350341796875, -2.0761566162109375, -2.011962890625, -1.9477691650390625, -1.883575439453125, -1.8193817138671875, -1.75518798828125, -1.6909942626953125, -1.626800537109375, -1.5626068115234375, -1.4984130859375, -1.4342193603515625, -1.370025634765625, -1.3058319091796875, -1.24163818359375, -1.1774444580078125, -1.113250732421875, -1.0490570068359375, -0.98486328125, -0.9206695556640625, -0.856475830078125, -0.7922821044921875, -0.72808837890625, -0.6638946533203125, -0.599700927734375, -0.5355072021484375, -0.4713134765625, -0.4071197509765625, -0.342926025390625, -0.2787322998046875, -0.21453857421875, -0.1503448486328125, -0.086151123046875, -0.0219573974609375, 0.042236328125, 0.1064300537109375, 0.170623779296875, 0.2348175048828125, 0.29901123046875, 0.3632049560546875, 0.427398681640625, 0.4915924072265625, 0.5557861328125, 0.6199798583984375, 0.684173583984375, 0.7483673095703125, 0.81256103515625, 0.8767547607421875, 0.940948486328125, 1.0051422119140625, 1.0693359375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 4.0, 8.0, 8.0, 20.0, 35.0, 76.0, 139.0, 219.0, 229.0, 145.0, 50.0, 28.0, 14.0, 10.0, 4.0, 6.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-50.80448913574219, -49.42918014526367, -48.053871154785156, -46.678558349609375, -45.30324935913086, -43.927940368652344, -42.55263137817383, -41.17732238769531, -39.80200958251953, -38.426700592041016, -37.0513916015625, -35.67607879638672, -34.3007698059082, -32.92546081542969, -31.550151824951172, -30.174842834472656, -28.79953384399414, -27.424224853515625, -26.048913955688477, -24.67360496520996, -23.298294067382812, -21.922985076904297, -20.54767608642578, -19.172367095947266, -17.797056198120117, -16.4217472076416, -15.046436309814453, -13.671127319335938, -12.295817375183105, -10.920507431030273, -9.545198440551758, -8.169888496398926, -6.794574737548828, -5.419264793395996, -4.043955326080322, -2.6686458587646484, -1.2933359146118164, 0.08197402954101562, 1.4572830200195312, 2.8325929641723633, 4.207902908325195, 5.583212852478027, 6.958522319793701, 8.333831787109375, 9.709141731262207, 11.084451675415039, 12.459760665893555, 13.835070610046387, 15.210380554199219, 16.585689544677734, 17.961000442504883, 19.3363094329834, 20.711620330810547, 22.086929321289062, 23.462238311767578, 24.837547302246094, 26.212858200073242, 27.588167190551758, 28.963478088378906, 30.338787078857422, 31.714096069335938, 33.08940887451172, 34.46471405029297, 35.84002685546875, 37.215335845947266]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 5.0, 8.0, 7.0, 10.0, 17.0, 31.0, 31.0, 37.0, 53.0, 48.0, 62.0, 78.0, 112.0, 98.0, 81.0, 68.0, 61.0, 61.0, 46.0, 31.0, 19.0, 11.0, 14.0, 13.0, 4.0, 4.0, 1.0, 3.0, 3.0, 1.0], "bins": [-63.39222717285156, -62.04682159423828, -60.701416015625, -59.35601043701172, -58.01060104370117, -56.66519546508789, -55.31978988647461, -53.97438430786133, -52.62897491455078, -51.2835693359375, -49.93816375732422, -48.59275817871094, -47.24734878540039, -45.90194320678711, -44.55653762817383, -43.21113204956055, -41.865726470947266, -40.520320892333984, -39.1749153137207, -37.829505920410156, -36.484100341796875, -35.138694763183594, -33.79328918457031, -32.44788360595703, -31.102476119995117, -29.757070541381836, -28.411663055419922, -27.06625747680664, -25.72085189819336, -24.375444412231445, -23.030038833618164, -21.68463134765625, -20.339229583740234, -18.993824005126953, -17.64841651916504, -16.303010940551758, -14.95760440826416, -13.612197875976562, -12.266792297363281, -10.921385765075684, -9.575979232788086, -8.230572700500488, -6.885166645050049, -5.539760589599609, -4.194354057312012, -2.848947525024414, -1.5035419464111328, -0.15813541412353516, 1.1872711181640625, 2.532677412033081, 3.8780837059020996, 5.223489761352539, 6.568896293640137, 7.914302825927734, 9.259708404541016, 10.605114936828613, 11.950521469116211, 13.295928001403809, 14.641334533691406, 15.986740112304688, 17.33214569091797, 18.677553176879883, 20.022958755493164, 21.368366241455078, 22.71377182006836]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 4.0, 6.0, 5.0, 2.0, 13.0, 20.0, 24.0, 29.0, 36.0, 61.0, 88.0, 143.0, 230.0, 442.0, 693.0, 1449.0, 2949.0, 6564.0, 16707.0, 54161.0, 298295.0, 2188127.0, 1387371.0, 172610.0, 39661.0, 13788.0, 5732.0, 2539.0, 1213.0, 606.0, 310.0, 186.0, 94.0, 55.0, 35.0, 27.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.083984375, -2.01177978515625, -1.9395751953125, -1.86737060546875, -1.795166015625, -1.72296142578125, -1.6507568359375, -1.57855224609375, -1.50634765625, -1.43414306640625, -1.3619384765625, -1.28973388671875, -1.217529296875, -1.14532470703125, -1.0731201171875, -1.00091552734375, -0.9287109375, -0.85650634765625, -0.7843017578125, -0.71209716796875, -0.639892578125, -0.56768798828125, -0.4954833984375, -0.42327880859375, -0.35107421875, -0.27886962890625, -0.2066650390625, -0.13446044921875, -0.062255859375, 0.00994873046875, 0.0821533203125, 0.15435791015625, 0.2265625, 0.29876708984375, 0.3709716796875, 0.44317626953125, 0.515380859375, 0.58758544921875, 0.6597900390625, 0.73199462890625, 0.80419921875, 0.87640380859375, 0.9486083984375, 1.02081298828125, 1.093017578125, 1.16522216796875, 1.2374267578125, 1.30963134765625, 1.3818359375, 1.45404052734375, 1.5262451171875, 1.59844970703125, 1.670654296875, 1.74285888671875, 1.8150634765625, 1.88726806640625, 1.95947265625, 2.03167724609375, 2.1038818359375, 2.17608642578125, 2.248291015625, 2.32049560546875, 2.3927001953125, 2.46490478515625, 2.537109375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 8.0, 10.0, 24.0, 59.0, 56.0, 81.0, 106.0, 110.0, 104.0, 117.0, 99.0, 92.0, 47.0, 32.0, 29.0, 19.0, 9.0, 2.0, 5.0, 2.0, 1.0], "bins": [-5.0703125, -4.9716339111328125, -4.872955322265625, -4.7742767333984375, -4.67559814453125, -4.5769195556640625, -4.478240966796875, -4.3795623779296875, -4.2808837890625, -4.1822052001953125, -4.083526611328125, -3.9848480224609375, -3.88616943359375, -3.7874908447265625, -3.688812255859375, -3.5901336669921875, -3.491455078125, -3.3927764892578125, -3.294097900390625, -3.1954193115234375, -3.09674072265625, -2.9980621337890625, -2.899383544921875, -2.8007049560546875, -2.7020263671875, -2.6033477783203125, -2.504669189453125, -2.4059906005859375, -2.30731201171875, -2.2086334228515625, -2.109954833984375, -2.0112762451171875, -1.91259765625, -1.8139190673828125, -1.715240478515625, -1.6165618896484375, -1.51788330078125, -1.4192047119140625, -1.320526123046875, -1.2218475341796875, -1.1231689453125, -1.0244903564453125, -0.925811767578125, -0.8271331787109375, -0.72845458984375, -0.6297760009765625, -0.531097412109375, -0.4324188232421875, -0.333740234375, -0.2350616455078125, -0.136383056640625, -0.0377044677734375, 0.06097412109375, 0.1596527099609375, 0.258331298828125, 0.3570098876953125, 0.4556884765625, 0.5543670654296875, 0.653045654296875, 0.7517242431640625, 0.85040283203125, 0.9490814208984375, 1.047760009765625, 1.1464385986328125, 1.2451171875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 5.0, 10.0, 12.0, 9.0, 14.0, 10.0, 20.0, 30.0, 49.0, 70.0, 131.0, 208.0, 307.0, 466.0, 720.0, 1374.0, 2637.0, 5499.0, 12949.0, 36490.0, 147112.0, 1612788.0, 2125215.0, 180844.0, 41834.0, 13739.0, 5650.0, 2720.0, 1395.0, 701.0, 459.0, 279.0, 162.0, 122.0, 74.0, 55.0, 27.0, 26.0, 22.0, 9.0, 13.0, 6.0, 10.0, 4.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.150390625, -3.045562744140625, -2.94073486328125, -2.835906982421875, -2.7310791015625, -2.626251220703125, -2.52142333984375, -2.416595458984375, -2.311767578125, -2.206939697265625, -2.10211181640625, -1.997283935546875, -1.8924560546875, -1.787628173828125, -1.68280029296875, -1.577972412109375, -1.47314453125, -1.368316650390625, -1.26348876953125, -1.158660888671875, -1.0538330078125, -0.949005126953125, -0.84417724609375, -0.739349365234375, -0.634521484375, -0.529693603515625, -0.42486572265625, -0.320037841796875, -0.2152099609375, -0.110382080078125, -0.00555419921875, 0.099273681640625, 0.2041015625, 0.308929443359375, 0.41375732421875, 0.518585205078125, 0.6234130859375, 0.728240966796875, 0.83306884765625, 0.937896728515625, 1.042724609375, 1.147552490234375, 1.25238037109375, 1.357208251953125, 1.4620361328125, 1.566864013671875, 1.67169189453125, 1.776519775390625, 1.88134765625, 1.986175537109375, 2.09100341796875, 2.195831298828125, 2.3006591796875, 2.405487060546875, 2.51031494140625, 2.615142822265625, 2.719970703125, 2.824798583984375, 2.92962646484375, 3.034454345703125, 3.1392822265625, 3.244110107421875, 3.34893798828125, 3.453765869140625, 3.55859375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 12.0, 7.0, 10.0, 13.0, 14.0, 17.0, 25.0, 39.0, 53.0, 53.0, 95.0, 173.0, 267.0, 480.0, 735.0, 752.0, 516.0, 279.0, 153.0, 134.0, 70.0, 44.0, 27.0, 29.0, 16.0, 12.0, 8.0, 10.0, 4.0, 7.0, 6.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.58984375, -4.441650390625, -4.29345703125, -4.145263671875, -3.9970703125, -3.848876953125, -3.70068359375, -3.552490234375, -3.404296875, -3.256103515625, -3.10791015625, -2.959716796875, -2.8115234375, -2.663330078125, -2.51513671875, -2.366943359375, -2.21875, -2.070556640625, -1.92236328125, -1.774169921875, -1.6259765625, -1.477783203125, -1.32958984375, -1.181396484375, -1.033203125, -0.885009765625, -0.73681640625, -0.588623046875, -0.4404296875, -0.292236328125, -0.14404296875, 0.004150390625, 0.15234375, 0.300537109375, 0.44873046875, 0.596923828125, 0.7451171875, 0.893310546875, 1.04150390625, 1.189697265625, 1.337890625, 1.486083984375, 1.63427734375, 1.782470703125, 1.9306640625, 2.078857421875, 2.22705078125, 2.375244140625, 2.5234375, 2.671630859375, 2.81982421875, 2.968017578125, 3.1162109375, 3.264404296875, 3.41259765625, 3.560791015625, 3.708984375, 3.857177734375, 4.00537109375, 4.153564453125, 4.3017578125, 4.449951171875, 4.59814453125, 4.746337890625, 4.89453125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 7.0, 11.0, 22.0, 43.0, 116.0, 224.0, 313.0, 167.0, 58.0, 23.0, 5.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-97.81341552734375, -95.54957580566406, -93.28572845458984, -91.02188873291016, -88.75804901123047, -86.49420166015625, -84.23036193847656, -81.96652221679688, -79.70267486572266, -77.43883514404297, -75.17498779296875, -72.91114807128906, -70.64730834960938, -68.38346099853516, -66.11962127685547, -63.855777740478516, -61.59193801879883, -59.328094482421875, -57.06425476074219, -54.800411224365234, -52.53656768798828, -50.272727966308594, -48.00888442993164, -45.74504089355469, -43.481201171875, -41.21735763549805, -38.95351791381836, -36.689674377441406, -34.42583084106445, -32.1619873046875, -29.898147583007812, -27.63430404663086, -25.370460510253906, -23.106618881225586, -20.842775344848633, -18.578933715820312, -16.31509017944336, -14.051248550415039, -11.787406921386719, -9.523564338684082, -7.259721755981445, -4.995879173278809, -2.73203706741333, -0.46819496154785156, 1.7956476211547852, 4.059490203857422, 6.323331832885742, 8.587174415588379, 10.851016998291016, 13.114859580993652, 15.378702163696289, 17.64254379272461, 19.906387329101562, 22.170228958129883, 24.434070587158203, 26.697914123535156, 28.961755752563477, 31.225597381591797, 33.48944091796875, 35.75328063964844, 38.01712417602539, 40.280967712402344, 42.54480743408203, 44.808650970458984, 47.07249450683594]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 4.0, 7.0, 6.0, 11.0, 11.0, 20.0, 25.0, 33.0, 29.0, 46.0, 45.0, 61.0, 57.0, 65.0, 57.0, 59.0, 84.0, 46.0, 60.0, 46.0, 43.0, 47.0, 29.0, 27.0, 18.0, 21.0, 14.0, 10.0, 6.0, 8.0, 6.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.395706176757812, -25.450843811035156, -24.505983352661133, -23.56112289428711, -22.616260528564453, -21.671398162841797, -20.726537704467773, -19.78167724609375, -18.836814880371094, -17.891952514648438, -16.947092056274414, -16.00223159790039, -15.057369232177734, -14.112507820129395, -13.167646408081055, -12.222784996032715, -11.277923583984375, -10.333062171936035, -9.388200759887695, -8.443339347839355, -7.498477935791016, -6.553616523742676, -5.608755111694336, -4.663893699645996, -3.7190322875976562, -2.7741708755493164, -1.8293094635009766, -0.8844480514526367, 0.060413360595703125, 1.005274772644043, 1.9501361846923828, 2.8949975967407227, 3.8398590087890625, 4.784720420837402, 5.729581832885742, 6.674443244934082, 7.619304656982422, 8.564166069030762, 9.509027481079102, 10.453888893127441, 11.398750305175781, 12.343611717224121, 13.288473129272461, 14.2333345413208, 15.17819595336914, 16.123058319091797, 17.06791877746582, 18.012779235839844, 18.9576416015625, 19.902503967285156, 20.84736442565918, 21.792224884033203, 22.73708724975586, 23.681949615478516, 24.62681007385254, 25.571670532226562, 26.51653289794922, 27.461395263671875, 28.4062557220459, 29.351116180419922, 30.295978546142578, 31.240840911865234, 32.185699462890625, 33.13056182861328, 34.07542419433594]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 7.0, 5.0, 6.0, 11.0, 18.0, 19.0, 30.0, 41.0, 77.0, 136.0, 221.0, 313.0, 609.0, 1091.0, 1969.0, 3879.0, 8109.0, 18259.0, 46004.0, 132038.0, 456561.0, 253894.0, 73540.0, 28078.0, 11955.0, 5518.0, 2760.0, 1503.0, 751.0, 441.0, 279.0, 163.0, 114.0, 55.0, 34.0, 34.0, 20.0, 6.0, 5.0, 1.0, 4.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.265625, -3.15582275390625, -3.0460205078125, -2.93621826171875, -2.826416015625, -2.71661376953125, -2.6068115234375, -2.49700927734375, -2.38720703125, -2.27740478515625, -2.1676025390625, -2.05780029296875, -1.947998046875, -1.83819580078125, -1.7283935546875, -1.61859130859375, -1.5087890625, -1.39898681640625, -1.2891845703125, -1.17938232421875, -1.069580078125, -0.95977783203125, -0.8499755859375, -0.74017333984375, -0.63037109375, -0.52056884765625, -0.4107666015625, -0.30096435546875, -0.191162109375, -0.08135986328125, 0.0284423828125, 0.13824462890625, 0.248046875, 0.35784912109375, 0.4676513671875, 0.57745361328125, 0.687255859375, 0.79705810546875, 0.9068603515625, 1.01666259765625, 1.12646484375, 1.23626708984375, 1.3460693359375, 1.45587158203125, 1.565673828125, 1.67547607421875, 1.7852783203125, 1.89508056640625, 2.0048828125, 2.11468505859375, 2.2244873046875, 2.33428955078125, 2.444091796875, 2.55389404296875, 2.6636962890625, 2.77349853515625, 2.88330078125, 2.99310302734375, 3.1029052734375, 3.21270751953125, 3.322509765625, 3.43231201171875, 3.5421142578125, 3.65191650390625, 3.76171875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 10.0, 16.0, 17.0, 20.0, 24.0, 31.0, 45.0, 43.0, 42.0, 64.0, 63.0, 73.0, 51.0, 69.0, 67.0, 67.0, 66.0, 58.0, 29.0, 36.0, 30.0, 22.0, 18.0, 13.0, 12.0, 6.0, 8.0, 0.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.39453125, -2.332794189453125, -2.27105712890625, -2.209320068359375, -2.1475830078125, -2.085845947265625, -2.02410888671875, -1.962371826171875, -1.900634765625, -1.838897705078125, -1.77716064453125, -1.715423583984375, -1.6536865234375, -1.591949462890625, -1.53021240234375, -1.468475341796875, -1.40673828125, -1.345001220703125, -1.28326416015625, -1.221527099609375, -1.1597900390625, -1.098052978515625, -1.03631591796875, -0.974578857421875, -0.912841796875, -0.851104736328125, -0.78936767578125, -0.727630615234375, -0.6658935546875, -0.604156494140625, -0.54241943359375, -0.480682373046875, -0.4189453125, -0.357208251953125, -0.29547119140625, -0.233734130859375, -0.1719970703125, -0.110260009765625, -0.04852294921875, 0.013214111328125, 0.074951171875, 0.136688232421875, 0.19842529296875, 0.260162353515625, 0.3218994140625, 0.383636474609375, 0.44537353515625, 0.507110595703125, 0.56884765625, 0.630584716796875, 0.69232177734375, 0.754058837890625, 0.8157958984375, 0.877532958984375, 0.93927001953125, 1.001007080078125, 1.062744140625, 1.124481201171875, 1.18621826171875, 1.247955322265625, 1.3096923828125, 1.371429443359375, 1.43316650390625, 1.494903564453125, 1.556640625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 2.0, 9.0, 13.0, 19.0, 21.0, 40.0, 42.0, 66.0, 92.0, 148.0, 222.0, 351.0, 627.0, 1157.0, 2577.0, 7450.0, 36652.0, 758088.0, 212446.0, 19534.0, 4928.0, 1845.0, 885.0, 490.0, 273.0, 181.0, 122.0, 76.0, 64.0, 46.0, 24.0, 18.0, 14.0, 16.0, 7.0, 2.0, 0.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.515625, -9.20703125, -8.8984375, -8.58984375, -8.28125, -7.97265625, -7.6640625, -7.35546875, -7.046875, -6.73828125, -6.4296875, -6.12109375, -5.8125, -5.50390625, -5.1953125, -4.88671875, -4.578125, -4.26953125, -3.9609375, -3.65234375, -3.34375, -3.03515625, -2.7265625, -2.41796875, -2.109375, -1.80078125, -1.4921875, -1.18359375, -0.875, -0.56640625, -0.2578125, 0.05078125, 0.359375, 0.66796875, 0.9765625, 1.28515625, 1.59375, 1.90234375, 2.2109375, 2.51953125, 2.828125, 3.13671875, 3.4453125, 3.75390625, 4.0625, 4.37109375, 4.6796875, 4.98828125, 5.296875, 5.60546875, 5.9140625, 6.22265625, 6.53125, 6.83984375, 7.1484375, 7.45703125, 7.765625, 8.07421875, 8.3828125, 8.69140625, 9.0, 9.30859375, 9.6171875, 9.92578125, 10.234375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 3.0, 2.0, 6.0, 6.0, 8.0, 8.0, 12.0, 8.0, 16.0, 12.0, 23.0, 14.0, 14.0, 21.0, 22.0, 24.0, 23.0, 25.0, 33.0, 30.0, 49.0, 40.0, 45.0, 35.0, 39.0, 54.0, 50.0, 39.0, 35.0, 38.0, 31.0, 33.0, 22.0, 21.0, 27.0, 20.0, 22.0, 12.0, 11.0, 10.0, 13.0, 11.0, 11.0, 6.0, 3.0, 7.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-6.03125, -5.847412109375, -5.66357421875, -5.479736328125, -5.2958984375, -5.112060546875, -4.92822265625, -4.744384765625, -4.560546875, -4.376708984375, -4.19287109375, -4.009033203125, -3.8251953125, -3.641357421875, -3.45751953125, -3.273681640625, -3.08984375, -2.906005859375, -2.72216796875, -2.538330078125, -2.3544921875, -2.170654296875, -1.98681640625, -1.802978515625, -1.619140625, -1.435302734375, -1.25146484375, -1.067626953125, -0.8837890625, -0.699951171875, -0.51611328125, -0.332275390625, -0.1484375, 0.035400390625, 0.21923828125, 0.403076171875, 0.5869140625, 0.770751953125, 0.95458984375, 1.138427734375, 1.322265625, 1.506103515625, 1.68994140625, 1.873779296875, 2.0576171875, 2.241455078125, 2.42529296875, 2.609130859375, 2.79296875, 2.976806640625, 3.16064453125, 3.344482421875, 3.5283203125, 3.712158203125, 3.89599609375, 4.079833984375, 4.263671875, 4.447509765625, 4.63134765625, 4.815185546875, 4.9990234375, 5.182861328125, 5.36669921875, 5.550537109375, 5.734375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 1.0, 3.0, 3.0, 11.0, 12.0, 10.0, 21.0, 35.0, 45.0, 81.0, 121.0, 180.0, 281.0, 455.0, 787.0, 1471.0, 3186.0, 7770.0, 24138.0, 113760.0, 716147.0, 136876.0, 27694.0, 8434.0, 3319.0, 1626.0, 872.0, 415.0, 249.0, 164.0, 137.0, 86.0, 50.0, 39.0, 15.0, 15.0, 11.0, 10.0, 4.0, 5.0, 6.0, 1.0, 2.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.5390625, -2.46337890625, -2.3876953125, -2.31201171875, -2.236328125, -2.16064453125, -2.0849609375, -2.00927734375, -1.93359375, -1.85791015625, -1.7822265625, -1.70654296875, -1.630859375, -1.55517578125, -1.4794921875, -1.40380859375, -1.328125, -1.25244140625, -1.1767578125, -1.10107421875, -1.025390625, -0.94970703125, -0.8740234375, -0.79833984375, -0.72265625, -0.64697265625, -0.5712890625, -0.49560546875, -0.419921875, -0.34423828125, -0.2685546875, -0.19287109375, -0.1171875, -0.04150390625, 0.0341796875, 0.10986328125, 0.185546875, 0.26123046875, 0.3369140625, 0.41259765625, 0.48828125, 0.56396484375, 0.6396484375, 0.71533203125, 0.791015625, 0.86669921875, 0.9423828125, 1.01806640625, 1.09375, 1.16943359375, 1.2451171875, 1.32080078125, 1.396484375, 1.47216796875, 1.5478515625, 1.62353515625, 1.69921875, 1.77490234375, 1.8505859375, 1.92626953125, 2.001953125, 2.07763671875, 2.1533203125, 2.22900390625, 2.3046875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 5.0, 7.0, 5.0, 3.0, 9.0, 15.0, 19.0, 21.0, 32.0, 38.0, 49.0, 102.0, 182.0, 190.0, 99.0, 50.0, 47.0, 33.0, 22.0, 20.0, 16.0, 7.0, 3.0, 8.0, 6.0, 3.0, 5.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010395050048828125, -0.0010097473859786987, -0.000979989767074585, -0.0009502321481704712, -0.0009204745292663574, -0.0008907169103622437, -0.0008609592914581299, -0.0008312016725540161, -0.0008014440536499023, -0.0007716864347457886, -0.0007419288158416748, -0.000712171196937561, -0.0006824135780334473, -0.0006526559591293335, -0.0006228983402252197, -0.000593140721321106, -0.0005633831024169922, -0.0005336254835128784, -0.0005038678646087646, -0.0004741102457046509, -0.0004443526268005371, -0.00041459500789642334, -0.00038483738899230957, -0.0003550797700881958, -0.00032532215118408203, -0.00029556453227996826, -0.0002658069133758545, -0.00023604929447174072, -0.00020629167556762695, -0.00017653405666351318, -0.00014677643775939941, -0.00011701881885528564, -8.726119995117188e-05, -5.7503581047058105e-05, -2.7745962142944336e-05, 2.0116567611694336e-06, 3.17692756652832e-05, 6.152689456939697e-05, 9.128451347351074e-05, 0.00012104213237762451, 0.00015079975128173828, 0.00018055737018585205, 0.00021031498908996582, 0.0002400726079940796, 0.00026983022689819336, 0.00029958784580230713, 0.0003293454647064209, 0.00035910308361053467, 0.00038886070251464844, 0.0004186183214187622, 0.000448375940322876, 0.00047813355922698975, 0.0005078911781311035, 0.0005376487970352173, 0.0005674064159393311, 0.0005971640348434448, 0.0006269216537475586, 0.0006566792726516724, 0.0006864368915557861, 0.0007161945104598999, 0.0007459521293640137, 0.0007757097482681274, 0.0008054673671722412, 0.000835224986076355, 0.0008649826049804688]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 2.0, 4.0, 1.0, 9.0, 9.0, 16.0, 16.0, 20.0, 18.0, 29.0, 49.0, 75.0, 107.0, 177.0, 256.0, 429.0, 806.0, 1598.0, 3567.0, 10600.0, 61154.0, 748080.0, 189246.0, 21853.0, 5769.0, 2228.0, 1013.0, 497.0, 330.0, 203.0, 111.0, 68.0, 66.0, 31.0, 29.0, 24.0, 16.0, 9.0, 13.0, 12.0, 4.0, 2.0, 0.0, 1.0, 4.0, 1.0, 3.0, 5.0], "bins": [-3.240234375, -3.15435791015625, -3.0684814453125, -2.98260498046875, -2.896728515625, -2.81085205078125, -2.7249755859375, -2.63909912109375, -2.55322265625, -2.46734619140625, -2.3814697265625, -2.29559326171875, -2.209716796875, -2.12384033203125, -2.0379638671875, -1.95208740234375, -1.8662109375, -1.78033447265625, -1.6944580078125, -1.60858154296875, -1.522705078125, -1.43682861328125, -1.3509521484375, -1.26507568359375, -1.17919921875, -1.09332275390625, -1.0074462890625, -0.92156982421875, -0.835693359375, -0.74981689453125, -0.6639404296875, -0.57806396484375, -0.4921875, -0.40631103515625, -0.3204345703125, -0.23455810546875, -0.148681640625, -0.06280517578125, 0.0230712890625, 0.10894775390625, 0.19482421875, 0.28070068359375, 0.3665771484375, 0.45245361328125, 0.538330078125, 0.62420654296875, 0.7100830078125, 0.79595947265625, 0.8818359375, 0.96771240234375, 1.0535888671875, 1.13946533203125, 1.225341796875, 1.31121826171875, 1.3970947265625, 1.48297119140625, 1.56884765625, 1.65472412109375, 1.7406005859375, 1.82647705078125, 1.912353515625, 1.99822998046875, 2.0841064453125, 2.16998291015625, 2.255859375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 7.0, 11.0, 9.0, 25.0, 14.0, 28.0, 50.0, 40.0, 53.0, 69.0, 99.0, 126.0, 110.0, 79.0, 66.0, 53.0, 35.0, 34.0, 37.0, 12.0, 19.0, 5.0, 6.0, 2.0, 5.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.42578125, -3.32989501953125, -3.2340087890625, -3.13812255859375, -3.042236328125, -2.94635009765625, -2.8504638671875, -2.75457763671875, -2.65869140625, -2.56280517578125, -2.4669189453125, -2.37103271484375, -2.275146484375, -2.17926025390625, -2.0833740234375, -1.98748779296875, -1.8916015625, -1.79571533203125, -1.6998291015625, -1.60394287109375, -1.508056640625, -1.41217041015625, -1.3162841796875, -1.22039794921875, -1.12451171875, -1.02862548828125, -0.9327392578125, -0.83685302734375, -0.740966796875, -0.64508056640625, -0.5491943359375, -0.45330810546875, -0.357421875, -0.26153564453125, -0.1656494140625, -0.06976318359375, 0.026123046875, 0.12200927734375, 0.2178955078125, 0.31378173828125, 0.40966796875, 0.50555419921875, 0.6014404296875, 0.69732666015625, 0.793212890625, 0.88909912109375, 0.9849853515625, 1.08087158203125, 1.1767578125, 1.27264404296875, 1.3685302734375, 1.46441650390625, 1.560302734375, 1.65618896484375, 1.7520751953125, 1.84796142578125, 1.94384765625, 2.03973388671875, 2.1356201171875, 2.23150634765625, 2.327392578125, 2.42327880859375, 2.5191650390625, 2.61505126953125, 2.7109375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 3.0, 1.0, 6.0, 7.0, 13.0, 45.0, 84.0, 175.0, 333.0, 180.0, 78.0, 36.0, 21.0, 9.0, 6.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.177146911621094, -38.8262939453125, -36.475440979003906, -34.12458801269531, -31.773733139038086, -29.422880172729492, -27.072025299072266, -24.721172332763672, -22.370319366455078, -20.019466400146484, -17.66861343383789, -15.317758560180664, -12.96690559387207, -10.616052627563477, -8.265198707580566, -5.914344787597656, -3.5634918212890625, -1.2126383781433105, 1.1382150650024414, 3.4890685081481934, 5.839921951293945, 8.190774917602539, 10.54162883758545, 12.89248275756836, 15.243335723876953, 17.594188690185547, 19.94504165649414, 22.295896530151367, 24.64674949645996, 26.997602462768555, 29.34845733642578, 31.699310302734375, 34.05015563964844, 36.40100860595703, 38.751861572265625, 41.10271453857422, 43.45356750488281, 45.804420471191406, 48.155277252197266, 50.50613021850586, 52.85698318481445, 55.20783615112305, 57.55868911743164, 59.909542083740234, 62.260398864746094, 64.61125183105469, 66.96210479736328, 69.31295776367188, 71.66381072998047, 74.01466369628906, 76.36551666259766, 78.71636962890625, 81.06722259521484, 83.41807556152344, 85.76892852783203, 88.11978149414062, 90.47064208984375, 92.82149505615234, 95.17234802246094, 97.52320098876953, 99.87405395507812, 102.22490692138672, 104.57575988769531, 106.92662048339844, 109.2774658203125]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 6.0, 3.0, 6.0, 10.0, 12.0, 11.0, 20.0, 29.0, 27.0, 27.0, 27.0, 27.0, 38.0, 53.0, 59.0, 62.0, 84.0, 90.0, 86.0, 53.0, 41.0, 39.0, 39.0, 30.0, 28.0, 22.0, 26.0, 20.0, 9.0, 8.0, 8.0, 1.0, 3.0, 2.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.56633758544922, -28.478527069091797, -27.390716552734375, -26.302907943725586, -25.215097427368164, -24.127286911010742, -23.039478302001953, -21.95166778564453, -20.86385726928711, -19.776046752929688, -18.688236236572266, -17.600427627563477, -16.512617111206055, -15.424806594848633, -14.336997032165527, -13.249187469482422, -12.161376953125, -11.073566436767578, -9.985756874084473, -8.897947311401367, -7.810136795043945, -6.722326755523682, -5.634516716003418, -4.546706676483154, -3.4588966369628906, -2.371086597442627, -1.2832765579223633, -0.1954665184020996, 0.8923435211181641, 1.9801535606384277, 3.0679636001586914, 4.155773639678955, 5.243583679199219, 6.331393718719482, 7.419203758239746, 8.507013320922852, 9.594823837280273, 10.682634353637695, 11.7704439163208, 12.858253479003906, 13.946063995361328, 15.03387451171875, 16.121685028076172, 17.20949363708496, 18.297304153442383, 19.385114669799805, 20.472923278808594, 21.560733795166016, 22.648544311523438, 23.73635482788086, 24.82416534423828, 25.91197395324707, 26.999784469604492, 28.087594985961914, 29.175403594970703, 30.263214111328125, 31.351024627685547, 32.43883514404297, 33.52664566040039, 34.61445617675781, 35.70226287841797, 36.79007339477539, 37.87788391113281, 38.965694427490234, 40.053504943847656]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 5.0, 9.0, 5.0, 11.0, 7.0, 13.0, 16.0, 26.0, 36.0, 59.0, 98.0, 148.0, 285.0, 588.0, 1238.0, 2739.0, 6765.0, 19978.0, 86650.0, 902183.0, 2830984.0, 280324.0, 41947.0, 12043.0, 4447.0, 1872.0, 883.0, 412.0, 215.0, 122.0, 53.0, 44.0, 32.0, 25.0, 13.0, 5.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.84375, -2.74664306640625, -2.6495361328125, -2.55242919921875, -2.455322265625, -2.35821533203125, -2.2611083984375, -2.16400146484375, -2.06689453125, -1.96978759765625, -1.8726806640625, -1.77557373046875, -1.678466796875, -1.58135986328125, -1.4842529296875, -1.38714599609375, -1.2900390625, -1.19293212890625, -1.0958251953125, -0.99871826171875, -0.901611328125, -0.80450439453125, -0.7073974609375, -0.61029052734375, -0.51318359375, -0.41607666015625, -0.3189697265625, -0.22186279296875, -0.124755859375, -0.02764892578125, 0.0694580078125, 0.16656494140625, 0.263671875, 0.36077880859375, 0.4578857421875, 0.55499267578125, 0.652099609375, 0.74920654296875, 0.8463134765625, 0.94342041015625, 1.04052734375, 1.13763427734375, 1.2347412109375, 1.33184814453125, 1.428955078125, 1.52606201171875, 1.6231689453125, 1.72027587890625, 1.8173828125, 1.91448974609375, 2.0115966796875, 2.10870361328125, 2.205810546875, 2.30291748046875, 2.4000244140625, 2.49713134765625, 2.59423828125, 2.69134521484375, 2.7884521484375, 2.88555908203125, 2.982666015625, 3.07977294921875, 3.1768798828125, 3.27398681640625, 3.37109375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 9.0, 9.0, 18.0, 21.0, 21.0, 20.0, 31.0, 39.0, 34.0, 43.0, 52.0, 58.0, 69.0, 67.0, 57.0, 66.0, 64.0, 37.0, 49.0, 45.0, 43.0, 26.0, 30.0, 21.0, 21.0, 11.0, 10.0, 6.0, 8.0, 6.0, 7.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6015625, -1.542877197265625, -1.48419189453125, -1.425506591796875, -1.3668212890625, -1.308135986328125, -1.24945068359375, -1.190765380859375, -1.132080078125, -1.073394775390625, -1.01470947265625, -0.956024169921875, -0.8973388671875, -0.838653564453125, -0.77996826171875, -0.721282958984375, -0.66259765625, -0.603912353515625, -0.54522705078125, -0.486541748046875, -0.4278564453125, -0.369171142578125, -0.31048583984375, -0.251800537109375, -0.193115234375, -0.134429931640625, -0.07574462890625, -0.017059326171875, 0.0416259765625, 0.100311279296875, 0.15899658203125, 0.217681884765625, 0.2763671875, 0.335052490234375, 0.39373779296875, 0.452423095703125, 0.5111083984375, 0.569793701171875, 0.62847900390625, 0.687164306640625, 0.745849609375, 0.804534912109375, 0.86322021484375, 0.921905517578125, 0.9805908203125, 1.039276123046875, 1.09796142578125, 1.156646728515625, 1.21533203125, 1.274017333984375, 1.33270263671875, 1.391387939453125, 1.4500732421875, 1.508758544921875, 1.56744384765625, 1.626129150390625, 1.684814453125, 1.743499755859375, 1.80218505859375, 1.860870361328125, 1.9195556640625, 1.978240966796875, 2.03692626953125, 2.095611572265625, 2.154296875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 7.0, 6.0, 6.0, 11.0, 15.0, 22.0, 25.0, 42.0, 77.0, 96.0, 121.0, 224.0, 299.0, 449.0, 709.0, 1199.0, 2050.0, 3939.0, 8138.0, 20582.0, 64456.0, 432156.0, 3208048.0, 358252.0, 60061.0, 18229.0, 7123.0, 3331.0, 1795.0, 1044.0, 594.0, 386.0, 228.0, 160.0, 124.0, 86.0, 61.0, 33.0, 21.0, 19.0, 15.0, 20.0, 2.0, 6.0, 5.0, 7.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0859375, -3.947265625, -3.80859375, -3.669921875, -3.53125, -3.392578125, -3.25390625, -3.115234375, -2.9765625, -2.837890625, -2.69921875, -2.560546875, -2.421875, -2.283203125, -2.14453125, -2.005859375, -1.8671875, -1.728515625, -1.58984375, -1.451171875, -1.3125, -1.173828125, -1.03515625, -0.896484375, -0.7578125, -0.619140625, -0.48046875, -0.341796875, -0.203125, -0.064453125, 0.07421875, 0.212890625, 0.3515625, 0.490234375, 0.62890625, 0.767578125, 0.90625, 1.044921875, 1.18359375, 1.322265625, 1.4609375, 1.599609375, 1.73828125, 1.876953125, 2.015625, 2.154296875, 2.29296875, 2.431640625, 2.5703125, 2.708984375, 2.84765625, 2.986328125, 3.125, 3.263671875, 3.40234375, 3.541015625, 3.6796875, 3.818359375, 3.95703125, 4.095703125, 4.234375, 4.373046875, 4.51171875, 4.650390625, 4.7890625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 4.0, 2.0, 7.0, 3.0, 10.0, 11.0, 8.0, 14.0, 27.0, 34.0, 49.0, 49.0, 114.0, 197.0, 373.0, 741.0, 984.0, 647.0, 315.0, 179.0, 91.0, 65.0, 42.0, 21.0, 28.0, 18.0, 12.0, 10.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.1484375, -5.94635009765625, -5.7442626953125, -5.54217529296875, -5.340087890625, -5.13800048828125, -4.9359130859375, -4.73382568359375, -4.53173828125, -4.32965087890625, -4.1275634765625, -3.92547607421875, -3.723388671875, -3.52130126953125, -3.3192138671875, -3.11712646484375, -2.9150390625, -2.71295166015625, -2.5108642578125, -2.30877685546875, -2.106689453125, -1.90460205078125, -1.7025146484375, -1.50042724609375, -1.29833984375, -1.09625244140625, -0.8941650390625, -0.69207763671875, -0.489990234375, -0.28790283203125, -0.0858154296875, 0.11627197265625, 0.318359375, 0.52044677734375, 0.7225341796875, 0.92462158203125, 1.126708984375, 1.32879638671875, 1.5308837890625, 1.73297119140625, 1.93505859375, 2.13714599609375, 2.3392333984375, 2.54132080078125, 2.743408203125, 2.94549560546875, 3.1475830078125, 3.34967041015625, 3.5517578125, 3.75384521484375, 3.9559326171875, 4.15802001953125, 4.360107421875, 4.56219482421875, 4.7642822265625, 4.96636962890625, 5.16845703125, 5.37054443359375, 5.5726318359375, 5.77471923828125, 5.976806640625, 6.17889404296875, 6.3809814453125, 6.58306884765625, 6.78515625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 2.0, 10.0, 7.0, 20.0, 34.0, 103.0, 166.0, 295.0, 200.0, 82.0, 49.0, 16.0, 7.0, 2.0, 3.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-101.16498565673828, -98.67304229736328, -96.18109130859375, -93.68914794921875, -91.19719696044922, -88.70525360107422, -86.21330261230469, -83.72135925292969, -81.22941589355469, -78.73747253417969, -76.24552154541016, -73.75357818603516, -71.26162719726562, -68.76968383789062, -66.27774047851562, -63.785789489746094, -61.29384231567383, -58.80189514160156, -56.3099479675293, -53.81800079345703, -51.32605743408203, -48.834110260009766, -46.3421630859375, -43.8502197265625, -41.35826873779297, -38.8663215637207, -36.37437438964844, -33.88243103027344, -31.390483856201172, -28.898536682128906, -26.40658950805664, -23.914644241333008, -21.42269515991211, -18.930747985839844, -16.43880271911621, -13.946855545043945, -11.454909324645996, -8.962963104248047, -6.471015930175781, -3.9790706634521484, -1.4871234893798828, 1.0048229694366455, 3.496769428253174, 5.988716125488281, 8.48066234588623, 10.97260856628418, 13.464555740356445, 15.956501007080078, 18.448448181152344, 20.94039535522461, 23.432340621948242, 25.924287796020508, 28.41623306274414, 30.908180236816406, 33.40012741088867, 35.89207458496094, 38.38401794433594, 40.8759651184082, 43.36791229248047, 45.85985565185547, 48.351802825927734, 50.84375, 53.335697174072266, 55.82764434814453, 58.3195915222168]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 7.0, 5.0, 8.0, 10.0, 15.0, 13.0, 19.0, 21.0, 24.0, 29.0, 27.0, 34.0, 37.0, 52.0, 36.0, 38.0, 39.0, 57.0, 50.0, 48.0, 43.0, 45.0, 51.0, 43.0, 40.0, 29.0, 28.0, 26.0, 19.0, 27.0, 18.0, 23.0, 13.0, 6.0, 5.0, 4.0, 3.0, 0.0, 3.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.742271423339844, -25.885761260986328, -25.029253005981445, -24.17274284362793, -23.316232681274414, -22.45972442626953, -21.603214263916016, -20.7467041015625, -19.890193939208984, -19.03368377685547, -18.177175521850586, -17.32066535949707, -16.464155197143555, -15.607645988464355, -14.751136779785156, -13.89462661743164, -13.038117408752441, -12.181608200073242, -11.325098037719727, -10.468588829040527, -9.612078666687012, -8.755569458007812, -7.899059772491455, -7.042550086975098, -6.18604040145874, -5.329530715942383, -4.473021030426025, -3.616511583328247, -2.7600018978118896, -1.9034924507141113, -1.046982765197754, -0.19047307968139648, 0.6660366058349609, 1.5225462913513184, 2.379055976867676, 3.235565423965454, 4.092075347900391, 4.94858455657959, 5.805094242095947, 6.661603927612305, 7.518113613128662, 8.37462329864502, 9.231132507324219, 10.087642669677734, 10.944151878356934, 11.800661087036133, 12.657171249389648, 13.513681411743164, 14.370190620422363, 15.226699829101562, 16.083209991455078, 16.939720153808594, 17.796228408813477, 18.652738571166992, 19.509248733520508, 20.36575698852539, 21.222267150878906, 22.078777313232422, 22.935285568237305, 23.79179573059082, 24.648305892944336, 25.50481414794922, 26.361324310302734, 27.21783447265625, 28.074344635009766]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 0.0, 4.0, 2.0, 8.0, 10.0, 9.0, 9.0, 22.0, 33.0, 35.0, 61.0, 77.0, 115.0, 188.0, 250.0, 402.0, 544.0, 804.0, 1210.0, 1900.0, 3000.0, 5286.0, 9373.0, 18722.0, 41837.0, 120305.0, 413337.0, 285334.0, 80933.0, 30874.0, 14417.0, 7595.0, 4344.0, 2635.0, 1600.0, 1051.0, 656.0, 497.0, 325.0, 227.0, 157.0, 117.0, 60.0, 54.0, 44.0, 27.0, 19.0, 13.0, 8.0, 11.0, 7.0, 5.0, 1.0, 6.0, 1.0, 0.0, 2.0, 1.0], "bins": [-3.2890625, -3.188873291015625, -3.08868408203125, -2.988494873046875, -2.8883056640625, -2.788116455078125, -2.68792724609375, -2.587738037109375, -2.487548828125, -2.387359619140625, -2.28717041015625, -2.186981201171875, -2.0867919921875, -1.986602783203125, -1.88641357421875, -1.786224365234375, -1.68603515625, -1.585845947265625, -1.48565673828125, -1.385467529296875, -1.2852783203125, -1.185089111328125, -1.08489990234375, -0.984710693359375, -0.884521484375, -0.784332275390625, -0.68414306640625, -0.583953857421875, -0.4837646484375, -0.383575439453125, -0.28338623046875, -0.183197021484375, -0.0830078125, 0.017181396484375, 0.11737060546875, 0.217559814453125, 0.3177490234375, 0.417938232421875, 0.51812744140625, 0.618316650390625, 0.718505859375, 0.818695068359375, 0.91888427734375, 1.019073486328125, 1.1192626953125, 1.219451904296875, 1.31964111328125, 1.419830322265625, 1.52001953125, 1.620208740234375, 1.72039794921875, 1.820587158203125, 1.9207763671875, 2.020965576171875, 2.12115478515625, 2.221343994140625, 2.321533203125, 2.421722412109375, 2.52191162109375, 2.622100830078125, 2.7222900390625, 2.822479248046875, 2.92266845703125, 3.022857666015625, 3.123046875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 6.0, 5.0, 12.0, 11.0, 8.0, 14.0, 15.0, 29.0, 17.0, 22.0, 30.0, 43.0, 37.0, 51.0, 44.0, 54.0, 50.0, 51.0, 45.0, 59.0, 33.0, 48.0, 42.0, 43.0, 36.0, 39.0, 29.0, 22.0, 24.0, 19.0, 12.0, 19.0, 10.0, 4.0, 8.0, 3.0, 5.0, 2.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6552734375, -1.5967254638671875, -1.538177490234375, -1.4796295166015625, -1.42108154296875, -1.3625335693359375, -1.303985595703125, -1.2454376220703125, -1.1868896484375, -1.1283416748046875, -1.069793701171875, -1.0112457275390625, -0.95269775390625, -0.8941497802734375, -0.835601806640625, -0.7770538330078125, -0.718505859375, -0.6599578857421875, -0.601409912109375, -0.5428619384765625, -0.48431396484375, -0.4257659912109375, -0.367218017578125, -0.3086700439453125, -0.2501220703125, -0.1915740966796875, -0.133026123046875, -0.0744781494140625, -0.01593017578125, 0.0426177978515625, 0.101165771484375, 0.1597137451171875, 0.21826171875, 0.2768096923828125, 0.335357666015625, 0.3939056396484375, 0.45245361328125, 0.5110015869140625, 0.569549560546875, 0.6280975341796875, 0.6866455078125, 0.7451934814453125, 0.803741455078125, 0.8622894287109375, 0.92083740234375, 0.9793853759765625, 1.037933349609375, 1.0964813232421875, 1.155029296875, 1.2135772705078125, 1.272125244140625, 1.3306732177734375, 1.38922119140625, 1.4477691650390625, 1.506317138671875, 1.5648651123046875, 1.6234130859375, 1.6819610595703125, 1.740509033203125, 1.7990570068359375, 1.85760498046875, 1.9161529541015625, 1.974700927734375, 2.0332489013671875, 2.091796875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 10.0, 11.0, 17.0, 21.0, 21.0, 45.0, 52.0, 100.0, 125.0, 199.0, 284.0, 427.0, 835.0, 1729.0, 4544.0, 16389.0, 99646.0, 819105.0, 82531.0, 14651.0, 4084.0, 1664.0, 816.0, 414.0, 287.0, 176.0, 117.0, 90.0, 54.0, 33.0, 25.0, 16.0, 15.0, 10.0, 2.0, 0.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1328125, -8.85986328125, -8.5869140625, -8.31396484375, -8.041015625, -7.76806640625, -7.4951171875, -7.22216796875, -6.94921875, -6.67626953125, -6.4033203125, -6.13037109375, -5.857421875, -5.58447265625, -5.3115234375, -5.03857421875, -4.765625, -4.49267578125, -4.2197265625, -3.94677734375, -3.673828125, -3.40087890625, -3.1279296875, -2.85498046875, -2.58203125, -2.30908203125, -2.0361328125, -1.76318359375, -1.490234375, -1.21728515625, -0.9443359375, -0.67138671875, -0.3984375, -0.12548828125, 0.1474609375, 0.42041015625, 0.693359375, 0.96630859375, 1.2392578125, 1.51220703125, 1.78515625, 2.05810546875, 2.3310546875, 2.60400390625, 2.876953125, 3.14990234375, 3.4228515625, 3.69580078125, 3.96875, 4.24169921875, 4.5146484375, 4.78759765625, 5.060546875, 5.33349609375, 5.6064453125, 5.87939453125, 6.15234375, 6.42529296875, 6.6982421875, 6.97119140625, 7.244140625, 7.51708984375, 7.7900390625, 8.06298828125, 8.3359375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 1.0, 3.0, 2.0, 9.0, 8.0, 11.0, 8.0, 11.0, 18.0, 11.0, 23.0, 30.0, 40.0, 39.0, 45.0, 45.0, 55.0, 56.0, 53.0, 56.0, 64.0, 69.0, 50.0, 54.0, 41.0, 42.0, 28.0, 25.0, 16.0, 15.0, 18.0, 9.0, 17.0, 5.0, 5.0, 8.0, 3.0, 7.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.265625, -9.983642578125, -9.70166015625, -9.419677734375, -9.1376953125, -8.855712890625, -8.57373046875, -8.291748046875, -8.009765625, -7.727783203125, -7.44580078125, -7.163818359375, -6.8818359375, -6.599853515625, -6.31787109375, -6.035888671875, -5.75390625, -5.471923828125, -5.18994140625, -4.907958984375, -4.6259765625, -4.343994140625, -4.06201171875, -3.780029296875, -3.498046875, -3.216064453125, -2.93408203125, -2.652099609375, -2.3701171875, -2.088134765625, -1.80615234375, -1.524169921875, -1.2421875, -0.960205078125, -0.67822265625, -0.396240234375, -0.1142578125, 0.167724609375, 0.44970703125, 0.731689453125, 1.013671875, 1.295654296875, 1.57763671875, 1.859619140625, 2.1416015625, 2.423583984375, 2.70556640625, 2.987548828125, 3.26953125, 3.551513671875, 3.83349609375, 4.115478515625, 4.3974609375, 4.679443359375, 4.96142578125, 5.243408203125, 5.525390625, 5.807373046875, 6.08935546875, 6.371337890625, 6.6533203125, 6.935302734375, 7.21728515625, 7.499267578125, 7.78125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 9.0, 3.0, 5.0, 17.0, 38.0, 69.0, 121.0, 236.0, 483.0, 1269.0, 4836.0, 31018.0, 655721.0, 325894.0, 22970.0, 3942.0, 1058.0, 411.0, 191.0, 120.0, 53.0, 42.0, 19.0, 11.0, 6.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.53125, -5.3814697265625, -5.231689453125, -5.0819091796875, -4.93212890625, -4.7823486328125, -4.632568359375, -4.4827880859375, -4.3330078125, -4.1832275390625, -4.033447265625, -3.8836669921875, -3.73388671875, -3.5841064453125, -3.434326171875, -3.2845458984375, -3.134765625, -2.9849853515625, -2.835205078125, -2.6854248046875, -2.53564453125, -2.3858642578125, -2.236083984375, -2.0863037109375, -1.9365234375, -1.7867431640625, -1.636962890625, -1.4871826171875, -1.33740234375, -1.1876220703125, -1.037841796875, -0.8880615234375, -0.73828125, -0.5885009765625, -0.438720703125, -0.2889404296875, -0.13916015625, 0.0106201171875, 0.160400390625, 0.3101806640625, 0.4599609375, 0.6097412109375, 0.759521484375, 0.9093017578125, 1.05908203125, 1.2088623046875, 1.358642578125, 1.5084228515625, 1.658203125, 1.8079833984375, 1.957763671875, 2.1075439453125, 2.25732421875, 2.4071044921875, 2.556884765625, 2.7066650390625, 2.8564453125, 3.0062255859375, 3.156005859375, 3.3057861328125, 3.45556640625, 3.6053466796875, 3.755126953125, 3.9049072265625, 4.0546875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 2.0, 3.0, 4.0, 1.0, 3.0, 2.0, 0.0, 3.0, 8.0, 9.0, 10.0, 16.0, 19.0, 21.0, 27.0, 43.0, 70.0, 93.0, 134.0, 161.0, 113.0, 66.0, 52.0, 28.0, 22.0, 17.0, 17.0, 17.0, 12.0, 7.0, 5.0, 8.0, 2.0, 4.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006017684936523438, -0.0005754977464675903, -0.0005492269992828369, -0.0005229562520980835, -0.0004966855049133301, -0.00047041475772857666, -0.00044414401054382324, -0.0004178732633590698, -0.0003916025161743164, -0.000365331768989563, -0.00033906102180480957, -0.00031279027462005615, -0.00028651952743530273, -0.0002602487802505493, -0.0002339780330657959, -0.00020770728588104248, -0.00018143653869628906, -0.00015516579151153564, -0.00012889504432678223, -0.00010262429714202881, -7.635354995727539e-05, -5.008280277252197e-05, -2.3812055587768555e-05, 2.4586915969848633e-06, 2.872943878173828e-05, 5.50001859664917e-05, 8.127093315124512e-05, 0.00010754168033599854, 0.00013381242752075195, 0.00016008317470550537, 0.0001863539218902588, 0.0002126246690750122, 0.00023889541625976562, 0.00026516616344451904, 0.00029143691062927246, 0.0003177076578140259, 0.0003439784049987793, 0.0003702491521835327, 0.00039651989936828613, 0.00042279064655303955, 0.00044906139373779297, 0.0004753321409225464, 0.0005016028881072998, 0.0005278736352920532, 0.0005541443824768066, 0.0005804151296615601, 0.0006066858768463135, 0.0006329566240310669, 0.0006592273712158203, 0.0006854981184005737, 0.0007117688655853271, 0.0007380396127700806, 0.000764310359954834, 0.0007905811071395874, 0.0008168518543243408, 0.0008431226015090942, 0.0008693933486938477, 0.0008956640958786011, 0.0009219348430633545, 0.0009482055902481079, 0.0009744763374328613, 0.0010007470846176147, 0.0010270178318023682, 0.0010532885789871216, 0.001079559326171875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 9.0, 13.0, 20.0, 22.0, 56.0, 82.0, 145.0, 225.0, 413.0, 843.0, 2097.0, 7184.0, 41481.0, 741568.0, 226712.0, 20444.0, 4418.0, 1475.0, 579.0, 324.0, 171.0, 93.0, 65.0, 44.0, 32.0, 14.0, 8.0, 8.0, 8.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.76953125, -4.636383056640625, -4.50323486328125, -4.370086669921875, -4.2369384765625, -4.103790283203125, -3.97064208984375, -3.837493896484375, -3.704345703125, -3.571197509765625, -3.43804931640625, -3.304901123046875, -3.1717529296875, -3.038604736328125, -2.90545654296875, -2.772308349609375, -2.63916015625, -2.506011962890625, -2.37286376953125, -2.239715576171875, -2.1065673828125, -1.973419189453125, -1.84027099609375, -1.707122802734375, -1.573974609375, -1.440826416015625, -1.30767822265625, -1.174530029296875, -1.0413818359375, -0.908233642578125, -0.77508544921875, -0.641937255859375, -0.5087890625, -0.375640869140625, -0.24249267578125, -0.109344482421875, 0.0238037109375, 0.156951904296875, 0.29010009765625, 0.423248291015625, 0.556396484375, 0.689544677734375, 0.82269287109375, 0.955841064453125, 1.0889892578125, 1.222137451171875, 1.35528564453125, 1.488433837890625, 1.62158203125, 1.754730224609375, 1.88787841796875, 2.021026611328125, 2.1541748046875, 2.287322998046875, 2.42047119140625, 2.553619384765625, 2.686767578125, 2.819915771484375, 2.95306396484375, 3.086212158203125, 3.2193603515625, 3.352508544921875, 3.48565673828125, 3.618804931640625, 3.751953125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 6.0, 3.0, 4.0, 5.0, 5.0, 6.0, 11.0, 10.0, 10.0, 18.0, 17.0, 34.0, 47.0, 48.0, 84.0, 103.0, 124.0, 112.0, 89.0, 65.0, 48.0, 48.0, 31.0, 19.0, 14.0, 13.0, 11.0, 7.0, 5.0, 1.0, 6.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.62109375, -3.52557373046875, -3.4300537109375, -3.33453369140625, -3.239013671875, -3.14349365234375, -3.0479736328125, -2.95245361328125, -2.85693359375, -2.76141357421875, -2.6658935546875, -2.57037353515625, -2.474853515625, -2.37933349609375, -2.2838134765625, -2.18829345703125, -2.0927734375, -1.99725341796875, -1.9017333984375, -1.80621337890625, -1.710693359375, -1.61517333984375, -1.5196533203125, -1.42413330078125, -1.32861328125, -1.23309326171875, -1.1375732421875, -1.04205322265625, -0.946533203125, -0.85101318359375, -0.7554931640625, -0.65997314453125, -0.564453125, -0.46893310546875, -0.3734130859375, -0.27789306640625, -0.182373046875, -0.08685302734375, 0.0086669921875, 0.10418701171875, 0.19970703125, 0.29522705078125, 0.3907470703125, 0.48626708984375, 0.581787109375, 0.67730712890625, 0.7728271484375, 0.86834716796875, 0.9638671875, 1.05938720703125, 1.1549072265625, 1.25042724609375, 1.345947265625, 1.44146728515625, 1.5369873046875, 1.63250732421875, 1.72802734375, 1.82354736328125, 1.9190673828125, 2.01458740234375, 2.110107421875, 2.20562744140625, 2.3011474609375, 2.39666748046875, 2.4921875]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 6.0, 5.0, 3.0, 2.0, 5.0, 5.0, 17.0, 29.0, 55.0, 111.0, 184.0, 262.0, 144.0, 85.0, 42.0, 18.0, 12.0, 12.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-62.494224548339844, -60.66911697387695, -58.84400939941406, -57.01890182495117, -55.19379425048828, -53.36868667602539, -51.5435791015625, -49.718475341796875, -47.89336395263672, -46.06825637817383, -44.24314880371094, -42.41804122924805, -40.592933654785156, -38.767826080322266, -36.942718505859375, -35.11761474609375, -33.29250717163086, -31.46739959716797, -29.642292022705078, -27.817184448242188, -25.992076873779297, -24.166969299316406, -22.34186363220215, -20.516756057739258, -18.691648483276367, -16.866540908813477, -15.041433334350586, -13.216326713562012, -11.391219139099121, -9.56611156463623, -7.741004943847656, -5.915897369384766, -4.090785980224609, -2.265678644180298, -0.44057130813598633, 1.384535789489746, 3.2096433639526367, 5.034750938415527, 6.859857559204102, 8.684965133666992, 10.510072708129883, 12.335180282592773, 14.160287857055664, 15.985394477844238, 17.810501098632812, 19.635608673095703, 21.460716247558594, 23.285823822021484, 25.110931396484375, 26.936038970947266, 28.761146545410156, 30.586254119873047, 32.41136169433594, 34.23646926879883, 36.06157684326172, 37.886680603027344, 39.7117919921875, 41.53689956665039, 43.36200714111328, 45.18711471557617, 47.01222229003906, 48.83732986450195, 50.662437438964844, 52.48754119873047, 54.31264877319336]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 7.0, 7.0, 8.0, 3.0, 5.0, 12.0, 12.0, 29.0, 21.0, 23.0, 22.0, 29.0, 32.0, 42.0, 52.0, 52.0, 75.0, 100.0, 72.0, 60.0, 55.0, 41.0, 42.0, 35.0, 33.0, 24.0, 24.0, 23.0, 12.0, 16.0, 11.0, 10.0, 3.0, 4.0, 6.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.252498626708984, -32.011741638183594, -30.770984649658203, -29.530227661132812, -28.289470672607422, -27.04871368408203, -25.807958602905273, -24.567201614379883, -23.326444625854492, -22.0856876373291, -20.84493064880371, -19.60417366027832, -18.363418579101562, -17.122661590576172, -15.881904602050781, -14.64114761352539, -13.400390625, -12.15963363647461, -10.918876647949219, -9.678120613098145, -8.437363624572754, -7.196606636047363, -5.955850124359131, -4.715093612670898, -3.474336624145508, -2.2335798740386963, -0.9928231239318848, 0.24793362617492676, 1.4886903762817383, 2.729447364807129, 3.9702038764953613, 5.210960388183594, 6.451717376708984, 7.692474365234375, 8.933231353759766, 10.17398738861084, 11.41474437713623, 12.655501365661621, 13.896257400512695, 15.137014389038086, 16.377771377563477, 17.618528366088867, 18.859285354614258, 20.10004234313965, 21.340797424316406, 22.581554412841797, 23.822311401367188, 25.063068389892578, 26.30382537841797, 27.54458236694336, 28.78533935546875, 30.02609634399414, 31.26685333251953, 32.50761032104492, 33.74836730957031, 34.98912048339844, 36.229881286621094, 37.470638275146484, 38.711395263671875, 39.952152252197266, 41.192909240722656, 42.43366622924805, 43.67442321777344, 44.91517639160156, 46.15593338012695]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 6.0, 2.0, 7.0, 12.0, 10.0, 19.0, 21.0, 36.0, 39.0, 60.0, 102.0, 168.0, 236.0, 398.0, 814.0, 1558.0, 3334.0, 8152.0, 24974.0, 160329.0, 2623438.0, 1260224.0, 82396.0, 16733.0, 5778.0, 2524.0, 1206.0, 655.0, 371.0, 239.0, 140.0, 100.0, 51.0, 44.0, 26.0, 21.0, 16.0, 10.0, 13.0, 11.0, 5.0, 5.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.04296875, -3.92352294921875, -3.8040771484375, -3.68463134765625, -3.565185546875, -3.44573974609375, -3.3262939453125, -3.20684814453125, -3.08740234375, -2.96795654296875, -2.8485107421875, -2.72906494140625, -2.609619140625, -2.49017333984375, -2.3707275390625, -2.25128173828125, -2.1318359375, -2.01239013671875, -1.8929443359375, -1.77349853515625, -1.654052734375, -1.53460693359375, -1.4151611328125, -1.29571533203125, -1.17626953125, -1.05682373046875, -0.9373779296875, -0.81793212890625, -0.698486328125, -0.57904052734375, -0.4595947265625, -0.34014892578125, -0.220703125, -0.10125732421875, 0.0181884765625, 0.13763427734375, 0.257080078125, 0.37652587890625, 0.4959716796875, 0.61541748046875, 0.73486328125, 0.85430908203125, 0.9737548828125, 1.09320068359375, 1.212646484375, 1.33209228515625, 1.4515380859375, 1.57098388671875, 1.6904296875, 1.80987548828125, 1.9293212890625, 2.04876708984375, 2.168212890625, 2.28765869140625, 2.4071044921875, 2.52655029296875, 2.64599609375, 2.76544189453125, 2.8848876953125, 3.00433349609375, 3.123779296875, 3.24322509765625, 3.3626708984375, 3.48211669921875, 3.6015625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 4.0, 4.0, 6.0, 3.0, 3.0, 6.0, 7.0, 4.0, 6.0, 8.0, 12.0, 18.0, 25.0, 19.0, 25.0, 34.0, 32.0, 28.0, 27.0, 29.0, 50.0, 40.0, 38.0, 36.0, 54.0, 42.0, 38.0, 45.0, 41.0, 50.0, 44.0, 31.0, 27.0, 24.0, 20.0, 21.0, 20.0, 12.0, 9.0, 13.0, 5.0, 12.0, 5.0, 6.0, 7.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0], "bins": [-1.63671875, -1.5878448486328125, -1.538970947265625, -1.4900970458984375, -1.44122314453125, -1.3923492431640625, -1.343475341796875, -1.2946014404296875, -1.2457275390625, -1.1968536376953125, -1.147979736328125, -1.0991058349609375, -1.05023193359375, -1.0013580322265625, -0.952484130859375, -0.9036102294921875, -0.854736328125, -0.8058624267578125, -0.756988525390625, -0.7081146240234375, -0.65924072265625, -0.6103668212890625, -0.561492919921875, -0.5126190185546875, -0.4637451171875, -0.4148712158203125, -0.365997314453125, -0.3171234130859375, -0.26824951171875, -0.2193756103515625, -0.170501708984375, -0.1216278076171875, -0.07275390625, -0.0238800048828125, 0.024993896484375, 0.0738677978515625, 0.12274169921875, 0.1716156005859375, 0.220489501953125, 0.2693634033203125, 0.3182373046875, 0.3671112060546875, 0.415985107421875, 0.4648590087890625, 0.51373291015625, 0.5626068115234375, 0.611480712890625, 0.6603546142578125, 0.709228515625, 0.7581024169921875, 0.806976318359375, 0.8558502197265625, 0.90472412109375, 0.9535980224609375, 1.002471923828125, 1.0513458251953125, 1.1002197265625, 1.1490936279296875, 1.197967529296875, 1.2468414306640625, 1.29571533203125, 1.3445892333984375, 1.393463134765625, 1.4423370361328125, 1.4912109375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 9.0, 5.0, 8.0, 25.0, 25.0, 54.0, 94.0, 164.0, 283.0, 590.0, 1400.0, 3827.0, 12768.0, 69236.0, 3343091.0, 710208.0, 38434.0, 8774.0, 2815.0, 1200.0, 565.0, 273.0, 160.0, 89.0, 63.0, 35.0, 32.0, 12.0, 20.0, 7.0, 5.0, 5.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.7734375, -9.484619140625, -9.19580078125, -8.906982421875, -8.6181640625, -8.329345703125, -8.04052734375, -7.751708984375, -7.462890625, -7.174072265625, -6.88525390625, -6.596435546875, -6.3076171875, -6.018798828125, -5.72998046875, -5.441162109375, -5.15234375, -4.863525390625, -4.57470703125, -4.285888671875, -3.9970703125, -3.708251953125, -3.41943359375, -3.130615234375, -2.841796875, -2.552978515625, -2.26416015625, -1.975341796875, -1.6865234375, -1.397705078125, -1.10888671875, -0.820068359375, -0.53125, -0.242431640625, 0.04638671875, 0.335205078125, 0.6240234375, 0.912841796875, 1.20166015625, 1.490478515625, 1.779296875, 2.068115234375, 2.35693359375, 2.645751953125, 2.9345703125, 3.223388671875, 3.51220703125, 3.801025390625, 4.08984375, 4.378662109375, 4.66748046875, 4.956298828125, 5.2451171875, 5.533935546875, 5.82275390625, 6.111572265625, 6.400390625, 6.689208984375, 6.97802734375, 7.266845703125, 7.5556640625, 7.844482421875, 8.13330078125, 8.422119140625, 8.7109375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 2.0, 4.0, 5.0, 5.0, 6.0, 8.0, 14.0, 20.0, 33.0, 48.0, 74.0, 116.0, 369.0, 972.0, 1285.0, 605.0, 224.0, 100.0, 52.0, 47.0, 18.0, 19.0, 14.0, 12.0, 13.0, 4.0, 5.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.390625, -7.0980224609375, -6.805419921875, -6.5128173828125, -6.22021484375, -5.9276123046875, -5.635009765625, -5.3424072265625, -5.0498046875, -4.7572021484375, -4.464599609375, -4.1719970703125, -3.87939453125, -3.5867919921875, -3.294189453125, -3.0015869140625, -2.708984375, -2.4163818359375, -2.123779296875, -1.8311767578125, -1.53857421875, -1.2459716796875, -0.953369140625, -0.6607666015625, -0.3681640625, -0.0755615234375, 0.217041015625, 0.5096435546875, 0.80224609375, 1.0948486328125, 1.387451171875, 1.6800537109375, 1.97265625, 2.2652587890625, 2.557861328125, 2.8504638671875, 3.14306640625, 3.4356689453125, 3.728271484375, 4.0208740234375, 4.3134765625, 4.6060791015625, 4.898681640625, 5.1912841796875, 5.48388671875, 5.7764892578125, 6.069091796875, 6.3616943359375, 6.654296875, 6.9468994140625, 7.239501953125, 7.5321044921875, 7.82470703125, 8.1173095703125, 8.409912109375, 8.7025146484375, 8.9951171875, 9.2877197265625, 9.580322265625, 9.8729248046875, 10.16552734375, 10.4581298828125, 10.750732421875, 11.0433349609375, 11.3359375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 11.0, 26.0, 76.0, 223.0, 322.0, 189.0, 79.0, 31.0, 19.0, 10.0, 5.0, 2.0, 4.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.85055541992188, -74.6424331665039, -71.43431091308594, -68.2261962890625, -65.01807403564453, -61.80995178222656, -58.601829528808594, -55.393707275390625, -52.18558883666992, -48.97746658325195, -45.76934814453125, -42.56122589111328, -39.35310363769531, -36.14498519897461, -32.93686294555664, -29.728742599487305, -26.52062225341797, -23.312501907348633, -20.104381561279297, -16.896259307861328, -13.688138961791992, -10.480018615722656, -7.2718963623046875, -4.063776016235352, -0.8556556701660156, 2.3524651527404785, 5.560585975646973, 8.768707275390625, 11.976827621459961, 15.184947967529297, 18.393070220947266, 21.6011905670166, 24.809310913085938, 28.017431259155273, 31.22555160522461, 34.43367385864258, 37.64179229736328, 40.84991455078125, 44.05803680419922, 47.26615905761719, 50.47427749633789, 53.68239974975586, 56.89051818847656, 60.09864044189453, 63.3067626953125, 66.51487731933594, 69.72300720214844, 72.93112182617188, 76.13924407958984, 79.34736633300781, 82.55548858642578, 85.76361083984375, 88.97172546386719, 92.17984771728516, 95.38796997070312, 98.5960922241211, 101.80421447753906, 105.01233673095703, 108.220458984375, 111.42857360839844, 114.6366958618164, 117.84481811523438, 121.05294036865234, 124.26106262207031, 127.46917724609375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 7.0, 3.0, 6.0, 6.0, 12.0, 9.0, 10.0, 14.0, 20.0, 17.0, 10.0, 18.0, 26.0, 31.0, 45.0, 29.0, 30.0, 40.0, 47.0, 47.0, 40.0, 47.0, 34.0, 55.0, 42.0, 50.0, 42.0, 34.0, 32.0, 31.0, 32.0, 23.0, 25.0, 17.0, 15.0, 8.0, 9.0, 9.0, 7.0, 6.0, 2.0, 7.0, 2.0, 5.0, 5.0, 2.0, 3.0], "bins": [-33.93211364746094, -33.05696487426758, -32.181819915771484, -31.306671142578125, -30.4315242767334, -29.556377410888672, -28.681228637695312, -27.806081771850586, -26.93093490600586, -26.055788040161133, -25.180641174316406, -24.305492401123047, -23.43034553527832, -22.555198669433594, -21.680049896240234, -20.804903030395508, -19.92975616455078, -19.054609298706055, -18.179462432861328, -17.30431365966797, -16.429166793823242, -15.554019927978516, -14.678872108459473, -13.80372428894043, -12.928577423095703, -12.053430557250977, -11.178282737731934, -10.30313491821289, -9.427988052368164, -8.552841186523438, -7.6776933670043945, -6.80254602432251, -5.927398681640625, -5.05225133895874, -4.1771039962768555, -3.3019566535949707, -2.426809310913086, -1.5516619682312012, -0.6765146255493164, 0.19863271713256836, 1.0737800598144531, 1.948927402496338, 2.8240747451782227, 3.6992220878601074, 4.574369430541992, 5.449516773223877, 6.324664115905762, 7.1998114585876465, 8.074958801269531, 8.950105667114258, 9.8252534866333, 10.700401306152344, 11.57554817199707, 12.450695037841797, 13.32584285736084, 14.200990676879883, 15.07613754272461, 15.951284408569336, 16.826431274414062, 17.701580047607422, 18.57672691345215, 19.451873779296875, 20.327022552490234, 21.20216941833496, 22.077316284179688]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 3.0, 6.0, 11.0, 11.0, 13.0, 24.0, 22.0, 30.0, 38.0, 76.0, 72.0, 121.0, 206.0, 302.0, 476.0, 879.0, 1460.0, 2942.0, 6413.0, 18682.0, 73995.0, 378615.0, 438871.0, 89290.0, 21569.0, 7274.0, 3141.0, 1627.0, 881.0, 541.0, 312.0, 210.0, 125.0, 95.0, 65.0, 34.0, 38.0, 32.0, 12.0, 10.0, 10.0, 10.0, 2.0, 6.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-4.1640625, -4.0452880859375, -3.926513671875, -3.8077392578125, -3.68896484375, -3.5701904296875, -3.451416015625, -3.3326416015625, -3.2138671875, -3.0950927734375, -2.976318359375, -2.8575439453125, -2.73876953125, -2.6199951171875, -2.501220703125, -2.3824462890625, -2.263671875, -2.1448974609375, -2.026123046875, -1.9073486328125, -1.78857421875, -1.6697998046875, -1.551025390625, -1.4322509765625, -1.3134765625, -1.1947021484375, -1.075927734375, -0.9571533203125, -0.83837890625, -0.7196044921875, -0.600830078125, -0.4820556640625, -0.36328125, -0.2445068359375, -0.125732421875, -0.0069580078125, 0.11181640625, 0.2305908203125, 0.349365234375, 0.4681396484375, 0.5869140625, 0.7056884765625, 0.824462890625, 0.9432373046875, 1.06201171875, 1.1807861328125, 1.299560546875, 1.4183349609375, 1.537109375, 1.6558837890625, 1.774658203125, 1.8934326171875, 2.01220703125, 2.1309814453125, 2.249755859375, 2.3685302734375, 2.4873046875, 2.6060791015625, 2.724853515625, 2.8436279296875, 2.96240234375, 3.0811767578125, 3.199951171875, 3.3187255859375, 3.4375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 5.0, 3.0, 4.0, 3.0, 7.0, 4.0, 9.0, 11.0, 9.0, 6.0, 17.0, 15.0, 29.0, 28.0, 26.0, 27.0, 31.0, 38.0, 38.0, 36.0, 49.0, 34.0, 32.0, 39.0, 55.0, 44.0, 46.0, 33.0, 44.0, 36.0, 34.0, 30.0, 30.0, 17.0, 25.0, 12.0, 22.0, 10.0, 10.0, 11.0, 15.0, 6.0, 9.0, 10.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0], "bins": [-2.01953125, -1.9594879150390625, -1.899444580078125, -1.8394012451171875, -1.77935791015625, -1.7193145751953125, -1.659271240234375, -1.5992279052734375, -1.5391845703125, -1.4791412353515625, -1.419097900390625, -1.3590545654296875, -1.29901123046875, -1.2389678955078125, -1.178924560546875, -1.1188812255859375, -1.058837890625, -0.9987945556640625, -0.938751220703125, -0.8787078857421875, -0.81866455078125, -0.7586212158203125, -0.698577880859375, -0.6385345458984375, -0.5784912109375, -0.5184478759765625, -0.458404541015625, -0.3983612060546875, -0.33831787109375, -0.2782745361328125, -0.218231201171875, -0.1581878662109375, -0.09814453125, -0.0381011962890625, 0.021942138671875, 0.0819854736328125, 0.14202880859375, 0.2020721435546875, 0.262115478515625, 0.3221588134765625, 0.3822021484375, 0.4422454833984375, 0.502288818359375, 0.5623321533203125, 0.62237548828125, 0.6824188232421875, 0.742462158203125, 0.8025054931640625, 0.862548828125, 0.9225921630859375, 0.982635498046875, 1.0426788330078125, 1.10272216796875, 1.1627655029296875, 1.222808837890625, 1.2828521728515625, 1.3428955078125, 1.4029388427734375, 1.462982177734375, 1.5230255126953125, 1.58306884765625, 1.6431121826171875, 1.703155517578125, 1.7631988525390625, 1.8232421875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 3.0, 5.0, 4.0, 10.0, 19.0, 22.0, 42.0, 59.0, 106.0, 168.0, 303.0, 633.0, 1431.0, 4547.0, 23896.0, 362233.0, 618527.0, 28428.0, 5067.0, 1609.0, 683.0, 335.0, 171.0, 109.0, 52.0, 31.0, 21.0, 15.0, 8.0, 5.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.4375, -7.18994140625, -6.9423828125, -6.69482421875, -6.447265625, -6.19970703125, -5.9521484375, -5.70458984375, -5.45703125, -5.20947265625, -4.9619140625, -4.71435546875, -4.466796875, -4.21923828125, -3.9716796875, -3.72412109375, -3.4765625, -3.22900390625, -2.9814453125, -2.73388671875, -2.486328125, -2.23876953125, -1.9912109375, -1.74365234375, -1.49609375, -1.24853515625, -1.0009765625, -0.75341796875, -0.505859375, -0.25830078125, -0.0107421875, 0.23681640625, 0.484375, 0.73193359375, 0.9794921875, 1.22705078125, 1.474609375, 1.72216796875, 1.9697265625, 2.21728515625, 2.46484375, 2.71240234375, 2.9599609375, 3.20751953125, 3.455078125, 3.70263671875, 3.9501953125, 4.19775390625, 4.4453125, 4.69287109375, 4.9404296875, 5.18798828125, 5.435546875, 5.68310546875, 5.9306640625, 6.17822265625, 6.42578125, 6.67333984375, 6.9208984375, 7.16845703125, 7.416015625, 7.66357421875, 7.9111328125, 8.15869140625, 8.40625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 7.0, 9.0, 8.0, 9.0, 14.0, 11.0, 19.0, 32.0, 35.0, 30.0, 37.0, 55.0, 56.0, 64.0, 46.0, 58.0, 46.0, 63.0, 59.0, 66.0, 51.0, 42.0, 30.0, 43.0, 26.0, 20.0, 19.0, 12.0, 8.0, 7.0, 4.0, 6.0, 2.0, 4.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.953125, -10.6243896484375, -10.295654296875, -9.9669189453125, -9.63818359375, -9.3094482421875, -8.980712890625, -8.6519775390625, -8.3232421875, -7.9945068359375, -7.665771484375, -7.3370361328125, -7.00830078125, -6.6795654296875, -6.350830078125, -6.0220947265625, -5.693359375, -5.3646240234375, -5.035888671875, -4.7071533203125, -4.37841796875, -4.0496826171875, -3.720947265625, -3.3922119140625, -3.0634765625, -2.7347412109375, -2.406005859375, -2.0772705078125, -1.74853515625, -1.4197998046875, -1.091064453125, -0.7623291015625, -0.43359375, -0.1048583984375, 0.223876953125, 0.5526123046875, 0.88134765625, 1.2100830078125, 1.538818359375, 1.8675537109375, 2.1962890625, 2.5250244140625, 2.853759765625, 3.1824951171875, 3.51123046875, 3.8399658203125, 4.168701171875, 4.4974365234375, 4.826171875, 5.1549072265625, 5.483642578125, 5.8123779296875, 6.14111328125, 6.4698486328125, 6.798583984375, 7.1273193359375, 7.4560546875, 7.7847900390625, 8.113525390625, 8.4422607421875, 8.77099609375, 9.0997314453125, 9.428466796875, 9.7572021484375, 10.0859375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 4.0, 7.0, 6.0, 4.0, 22.0, 45.0, 85.0, 198.0, 505.0, 1840.0, 11688.0, 223499.0, 781087.0, 25217.0, 3138.0, 750.0, 241.0, 98.0, 41.0, 30.0, 16.0, 8.0, 6.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.83203125, -4.67181396484375, -4.5115966796875, -4.35137939453125, -4.191162109375, -4.03094482421875, -3.8707275390625, -3.71051025390625, -3.55029296875, -3.39007568359375, -3.2298583984375, -3.06964111328125, -2.909423828125, -2.74920654296875, -2.5889892578125, -2.42877197265625, -2.2685546875, -2.10833740234375, -1.9481201171875, -1.78790283203125, -1.627685546875, -1.46746826171875, -1.3072509765625, -1.14703369140625, -0.98681640625, -0.82659912109375, -0.6663818359375, -0.50616455078125, -0.345947265625, -0.18572998046875, -0.0255126953125, 0.13470458984375, 0.294921875, 0.45513916015625, 0.6153564453125, 0.77557373046875, 0.935791015625, 1.09600830078125, 1.2562255859375, 1.41644287109375, 1.57666015625, 1.73687744140625, 1.8970947265625, 2.05731201171875, 2.217529296875, 2.37774658203125, 2.5379638671875, 2.69818115234375, 2.8583984375, 3.01861572265625, 3.1788330078125, 3.33905029296875, 3.499267578125, 3.65948486328125, 3.8197021484375, 3.97991943359375, 4.14013671875, 4.30035400390625, 4.4605712890625, 4.62078857421875, 4.781005859375, 4.94122314453125, 5.1014404296875, 5.26165771484375, 5.421875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 4.0, 3.0, 7.0, 13.0, 13.0, 8.0, 25.0, 31.0, 48.0, 55.0, 98.0, 129.0, 166.0, 99.0, 80.0, 82.0, 40.0, 30.0, 21.0, 13.0, 7.0, 9.0, 10.0, 4.0, 1.0, 3.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0007100105285644531, -0.0006868019700050354, -0.0006635934114456177, -0.0006403848528862, -0.0006171762943267822, -0.0005939677357673645, -0.0005707591772079468, -0.000547550618648529, -0.0005243420600891113, -0.0005011335015296936, -0.0004779249429702759, -0.00045471638441085815, -0.00043150782585144043, -0.0004082992672920227, -0.000385090708732605, -0.00036188215017318726, -0.00033867359161376953, -0.0003154650330543518, -0.0002922564744949341, -0.00026904791593551636, -0.00024583935737609863, -0.0002226307988166809, -0.00019942224025726318, -0.00017621368169784546, -0.00015300512313842773, -0.00012979656457901, -0.00010658800601959229, -8.337944746017456e-05, -6.0170888900756836e-05, -3.696233034133911e-05, -1.3753771781921387e-05, 9.454786777496338e-06, 3.266334533691406e-05, 5.587190389633179e-05, 7.908046245574951e-05, 0.00010228902101516724, 0.00012549757957458496, 0.00014870613813400269, 0.0001719146966934204, 0.00019512325525283813, 0.00021833181381225586, 0.00024154037237167358, 0.0002647489309310913, 0.00028795748949050903, 0.00031116604804992676, 0.0003343746066093445, 0.0003575831651687622, 0.00038079172372817993, 0.00040400028228759766, 0.0004272088408470154, 0.0004504173994064331, 0.00047362595796585083, 0.0004968345165252686, 0.0005200430750846863, 0.000543251633644104, 0.0005664601922035217, 0.0005896687507629395, 0.0006128773093223572, 0.0006360858678817749, 0.0006592944264411926, 0.0006825029850006104, 0.0007057115435600281, 0.0007289201021194458, 0.0007521286606788635, 0.0007753372192382812]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 3.0, 2.0, 8.0, 9.0, 15.0, 26.0, 46.0, 65.0, 115.0, 195.0, 414.0, 858.0, 2058.0, 6435.0, 28989.0, 278135.0, 669260.0, 47975.0, 9087.0, 2729.0, 1092.0, 473.0, 227.0, 140.0, 74.0, 39.0, 25.0, 13.0, 15.0, 11.0, 6.0, 8.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.41015625, -4.29449462890625, -4.1788330078125, -4.06317138671875, -3.947509765625, -3.83184814453125, -3.7161865234375, -3.60052490234375, -3.48486328125, -3.36920166015625, -3.2535400390625, -3.13787841796875, -3.022216796875, -2.90655517578125, -2.7908935546875, -2.67523193359375, -2.5595703125, -2.44390869140625, -2.3282470703125, -2.21258544921875, -2.096923828125, -1.98126220703125, -1.8656005859375, -1.74993896484375, -1.63427734375, -1.51861572265625, -1.4029541015625, -1.28729248046875, -1.171630859375, -1.05596923828125, -0.9403076171875, -0.82464599609375, -0.708984375, -0.59332275390625, -0.4776611328125, -0.36199951171875, -0.246337890625, -0.13067626953125, -0.0150146484375, 0.10064697265625, 0.21630859375, 0.33197021484375, 0.4476318359375, 0.56329345703125, 0.678955078125, 0.79461669921875, 0.9102783203125, 1.02593994140625, 1.1416015625, 1.25726318359375, 1.3729248046875, 1.48858642578125, 1.604248046875, 1.71990966796875, 1.8355712890625, 1.95123291015625, 2.06689453125, 2.18255615234375, 2.2982177734375, 2.41387939453125, 2.529541015625, 2.64520263671875, 2.7608642578125, 2.87652587890625, 2.9921875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 5.0, 7.0, 13.0, 8.0, 12.0, 24.0, 27.0, 43.0, 69.0, 87.0, 132.0, 127.0, 128.0, 87.0, 49.0, 56.0, 48.0, 28.0, 23.0, 10.0, 6.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.23828125, -4.131439208984375, -4.02459716796875, -3.917755126953125, -3.8109130859375, -3.704071044921875, -3.59722900390625, -3.490386962890625, -3.383544921875, -3.276702880859375, -3.16986083984375, -3.063018798828125, -2.9561767578125, -2.849334716796875, -2.74249267578125, -2.635650634765625, -2.52880859375, -2.421966552734375, -2.31512451171875, -2.208282470703125, -2.1014404296875, -1.994598388671875, -1.88775634765625, -1.780914306640625, -1.674072265625, -1.567230224609375, -1.46038818359375, -1.353546142578125, -1.2467041015625, -1.139862060546875, -1.03302001953125, -0.926177978515625, -0.8193359375, -0.712493896484375, -0.60565185546875, -0.498809814453125, -0.3919677734375, -0.285125732421875, -0.17828369140625, -0.071441650390625, 0.035400390625, 0.142242431640625, 0.24908447265625, 0.355926513671875, 0.4627685546875, 0.569610595703125, 0.67645263671875, 0.783294677734375, 0.89013671875, 0.996978759765625, 1.10382080078125, 1.210662841796875, 1.3175048828125, 1.424346923828125, 1.53118896484375, 1.638031005859375, 1.744873046875, 1.851715087890625, 1.95855712890625, 2.065399169921875, 2.1722412109375, 2.279083251953125, 2.38592529296875, 2.492767333984375, 2.599609375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 7.0, 15.0, 20.0, 55.0, 80.0, 158.0, 340.0, 172.0, 75.0, 40.0, 23.0, 7.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-50.26711654663086, -48.28437805175781, -46.30164337158203, -44.31890869140625, -42.3361701965332, -40.353431701660156, -38.370697021484375, -36.387962341308594, -34.40522384643555, -32.4224853515625, -30.43975067138672, -28.457014083862305, -26.47427749633789, -24.491540908813477, -22.508804321289062, -20.52606773376465, -18.543331146240234, -16.56059455871582, -14.577857971191406, -12.595121383666992, -10.612384796142578, -8.629648208618164, -6.64691162109375, -4.664175033569336, -2.681438446044922, -0.6987018585205078, 1.2840347290039062, 3.2667713165283203, 5.249507904052734, 7.232244491577148, 9.214981079101562, 11.197717666625977, 13.180450439453125, 15.163187026977539, 17.145923614501953, 19.128660202026367, 21.11139678955078, 23.094133377075195, 25.07686996459961, 27.059606552124023, 29.042343139648438, 31.02507972717285, 33.007816314697266, 34.99055480957031, 36.973289489746094, 38.956024169921875, 40.93876266479492, 42.92150115966797, 44.90423583984375, 46.88697052001953, 48.86970901489258, 50.852447509765625, 52.835182189941406, 54.81791687011719, 56.800655364990234, 58.78339385986328, 60.76612854003906, 62.748863220214844, 64.73159790039062, 66.71434020996094, 68.69707489013672, 70.6798095703125, 72.66255187988281, 74.6452865600586, 76.62802124023438]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 9.0, 3.0, 6.0, 4.0, 7.0, 11.0, 12.0, 24.0, 20.0, 30.0, 41.0, 35.0, 43.0, 42.0, 47.0, 58.0, 77.0, 113.0, 84.0, 56.0, 34.0, 44.0, 37.0, 31.0, 30.0, 28.0, 18.0, 17.0, 10.0, 9.0, 7.0, 5.0, 10.0, 2.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.804588317871094, -44.3445930480957, -42.88459777832031, -41.424598693847656, -39.964603424072266, -38.504608154296875, -37.044612884521484, -35.584617614746094, -34.12461853027344, -32.66462326049805, -31.204626083374023, -29.744630813598633, -28.28463363647461, -26.82463836669922, -25.364643096923828, -23.904647827148438, -22.444652557373047, -20.984657287597656, -19.524660110473633, -18.064664840698242, -16.60466766357422, -15.144672393798828, -13.684677124023438, -12.22468090057373, -10.764684677124023, -9.304688453674316, -7.844692707061768, -6.384696960449219, -4.924700736999512, -3.4647045135498047, -2.004709243774414, -0.544713020324707, 0.915283203125, 2.375279188156128, 3.835275173187256, 5.295270919799805, 6.755267143249512, 8.215263366699219, 9.67525863647461, 11.135254859924316, 12.595251083374023, 14.05524730682373, 15.515243530273438, 16.975238800048828, 18.43523406982422, 19.895231246948242, 21.355226516723633, 22.815223693847656, 24.275218963623047, 25.735214233398438, 27.19521141052246, 28.65520668029785, 30.115203857421875, 31.575199127197266, 33.035194396972656, 34.49518966674805, 35.95518493652344, 37.41518020629883, 38.87517547607422, 40.335174560546875, 41.795169830322266, 43.255165100097656, 44.71516036987305, 46.17515563964844, 47.635154724121094]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 6.0, 4.0, 3.0, 9.0, 8.0, 7.0, 18.0, 28.0, 31.0, 27.0, 59.0, 82.0, 114.0, 151.0, 247.0, 368.0, 573.0, 977.0, 1587.0, 3244.0, 7836.0, 28929.0, 348732.0, 3312009.0, 439451.0, 33688.0, 8246.0, 3477.0, 1805.0, 887.0, 553.0, 379.0, 208.0, 152.0, 114.0, 63.0, 60.0, 48.0, 30.0, 19.0, 17.0, 10.0, 9.0, 9.0, 8.0, 1.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.25, -4.1060791015625, -3.962158203125, -3.8182373046875, -3.67431640625, -3.5303955078125, -3.386474609375, -3.2425537109375, -3.0986328125, -2.9547119140625, -2.810791015625, -2.6668701171875, -2.52294921875, -2.3790283203125, -2.235107421875, -2.0911865234375, -1.947265625, -1.8033447265625, -1.659423828125, -1.5155029296875, -1.37158203125, -1.2276611328125, -1.083740234375, -0.9398193359375, -0.7958984375, -0.6519775390625, -0.508056640625, -0.3641357421875, -0.22021484375, -0.0762939453125, 0.067626953125, 0.2115478515625, 0.35546875, 0.4993896484375, 0.643310546875, 0.7872314453125, 0.93115234375, 1.0750732421875, 1.218994140625, 1.3629150390625, 1.5068359375, 1.6507568359375, 1.794677734375, 1.9385986328125, 2.08251953125, 2.2264404296875, 2.370361328125, 2.5142822265625, 2.658203125, 2.8021240234375, 2.946044921875, 3.0899658203125, 3.23388671875, 3.3778076171875, 3.521728515625, 3.6656494140625, 3.8095703125, 3.9534912109375, 4.097412109375, 4.2413330078125, 4.38525390625, 4.5291748046875, 4.673095703125, 4.8170166015625, 4.9609375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 3.0, 6.0, 6.0, 7.0, 10.0, 15.0, 15.0, 27.0, 30.0, 40.0, 39.0, 49.0, 38.0, 52.0, 50.0, 51.0, 54.0, 62.0, 73.0, 58.0, 52.0, 53.0, 39.0, 27.0, 28.0, 24.0, 22.0, 17.0, 13.0, 14.0, 9.0, 6.0, 3.0, 7.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.876953125, -2.798919677734375, -2.72088623046875, -2.642852783203125, -2.5648193359375, -2.486785888671875, -2.40875244140625, -2.330718994140625, -2.252685546875, -2.174652099609375, -2.09661865234375, -2.018585205078125, -1.9405517578125, -1.862518310546875, -1.78448486328125, -1.706451416015625, -1.62841796875, -1.550384521484375, -1.47235107421875, -1.394317626953125, -1.3162841796875, -1.238250732421875, -1.16021728515625, -1.082183837890625, -1.004150390625, -0.926116943359375, -0.84808349609375, -0.770050048828125, -0.6920166015625, -0.613983154296875, -0.53594970703125, -0.457916259765625, -0.3798828125, -0.301849365234375, -0.22381591796875, -0.145782470703125, -0.0677490234375, 0.010284423828125, 0.08831787109375, 0.166351318359375, 0.244384765625, 0.322418212890625, 0.40045166015625, 0.478485107421875, 0.5565185546875, 0.634552001953125, 0.71258544921875, 0.790618896484375, 0.86865234375, 0.946685791015625, 1.02471923828125, 1.102752685546875, 1.1807861328125, 1.258819580078125, 1.33685302734375, 1.414886474609375, 1.492919921875, 1.570953369140625, 1.64898681640625, 1.727020263671875, 1.8050537109375, 1.883087158203125, 1.96112060546875, 2.039154052734375, 2.1171875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 5.0, 3.0, 7.0, 14.0, 27.0, 49.0, 88.0, 167.0, 357.0, 1010.0, 4416.0, 38769.0, 4007949.0, 130953.0, 8014.0, 1495.0, 504.0, 221.0, 114.0, 61.0, 23.0, 13.0, 9.0, 4.0, 6.0, 4.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.9296875, -15.4420166015625, -14.954345703125, -14.4666748046875, -13.97900390625, -13.4913330078125, -13.003662109375, -12.5159912109375, -12.0283203125, -11.5406494140625, -11.052978515625, -10.5653076171875, -10.07763671875, -9.5899658203125, -9.102294921875, -8.6146240234375, -8.126953125, -7.6392822265625, -7.151611328125, -6.6639404296875, -6.17626953125, -5.6885986328125, -5.200927734375, -4.7132568359375, -4.2255859375, -3.7379150390625, -3.250244140625, -2.7625732421875, -2.27490234375, -1.7872314453125, -1.299560546875, -0.8118896484375, -0.32421875, 0.1634521484375, 0.651123046875, 1.1387939453125, 1.62646484375, 2.1141357421875, 2.601806640625, 3.0894775390625, 3.5771484375, 4.0648193359375, 4.552490234375, 5.0401611328125, 5.52783203125, 6.0155029296875, 6.503173828125, 6.9908447265625, 7.478515625, 7.9661865234375, 8.453857421875, 8.9415283203125, 9.42919921875, 9.9168701171875, 10.404541015625, 10.8922119140625, 11.3798828125, 11.8675537109375, 12.355224609375, 12.8428955078125, 13.33056640625, 13.8182373046875, 14.305908203125, 14.7935791015625, 15.28125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 3.0, 5.0, 4.0, 5.0, 7.0, 27.0, 32.0, 70.0, 127.0, 363.0, 1120.0, 1451.0, 515.0, 162.0, 62.0, 45.0, 24.0, 16.0, 12.0, 7.0, 2.0, 5.0, 0.0, 1.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.3671875, -11.0245361328125, -10.681884765625, -10.3392333984375, -9.99658203125, -9.6539306640625, -9.311279296875, -8.9686279296875, -8.6259765625, -8.2833251953125, -7.940673828125, -7.5980224609375, -7.25537109375, -6.9127197265625, -6.570068359375, -6.2274169921875, -5.884765625, -5.5421142578125, -5.199462890625, -4.8568115234375, -4.51416015625, -4.1715087890625, -3.828857421875, -3.4862060546875, -3.1435546875, -2.8009033203125, -2.458251953125, -2.1156005859375, -1.77294921875, -1.4302978515625, -1.087646484375, -0.7449951171875, -0.40234375, -0.0596923828125, 0.282958984375, 0.6256103515625, 0.96826171875, 1.3109130859375, 1.653564453125, 1.9962158203125, 2.3388671875, 2.6815185546875, 3.024169921875, 3.3668212890625, 3.70947265625, 4.0521240234375, 4.394775390625, 4.7374267578125, 5.080078125, 5.4227294921875, 5.765380859375, 6.1080322265625, 6.45068359375, 6.7933349609375, 7.135986328125, 7.4786376953125, 7.8212890625, 8.1639404296875, 8.506591796875, 8.8492431640625, 9.19189453125, 9.5345458984375, 9.877197265625, 10.2198486328125, 10.5625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 11.0, 32.0, 189.0, 493.0, 220.0, 49.0, 7.0, 5.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-206.47402954101562, -201.50881958007812, -196.5436248779297, -191.5784149169922, -186.6132049560547, -181.64801025390625, -176.68280029296875, -171.71759033203125, -166.75238037109375, -161.78717041015625, -156.8219757080078, -151.8567657470703, -146.8915557861328, -141.92636108398438, -136.96115112304688, -131.99594116210938, -127.03074645996094, -122.06554412841797, -117.10033416748047, -112.1351318359375, -107.169921875, -102.20471954345703, -97.23951721191406, -92.27430725097656, -87.3091049194336, -82.34390258789062, -77.37869262695312, -72.41349029541016, -67.44828796386719, -62.48307800292969, -57.51787567138672, -52.552669525146484, -47.58747863769531, -42.62227249145508, -37.657066345214844, -32.691864013671875, -27.72665786743164, -22.761451721191406, -17.796247482299805, -12.831043243408203, -7.865837097167969, -2.900631904602051, 2.064573287963867, 7.029778480529785, 11.994983673095703, 16.960189819335938, 21.92539405822754, 26.89059829711914, 31.855804443359375, 36.82101058959961, 41.786216735839844, 46.75141906738281, 51.71662521362305, 56.68183135986328, 61.64703369140625, 66.61224365234375, 71.57744598388672, 76.54264831542969, 81.50785827636719, 86.47306060791016, 91.43826293945312, 96.40347290039062, 101.3686752319336, 106.33387756347656, 111.29908752441406]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 2.0, 7.0, 7.0, 16.0, 12.0, 14.0, 14.0, 20.0, 24.0, 27.0, 39.0, 46.0, 45.0, 56.0, 54.0, 61.0, 56.0, 73.0, 70.0, 46.0, 41.0, 38.0, 43.0, 43.0, 40.0, 27.0, 23.0, 19.0, 12.0, 10.0, 6.0, 8.0, 3.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.374725341796875, -20.35686492919922, -19.339004516601562, -18.321144104003906, -17.30328369140625, -16.285423278808594, -15.267560958862305, -14.249700546264648, -13.231840133666992, -12.213979721069336, -11.19611930847168, -10.178257942199707, -9.16039752960205, -8.142537117004395, -7.12467622756958, -6.106815338134766, -5.088954925537109, -4.071094512939453, -3.0532336235046387, -2.0353729724884033, -1.017512321472168, 0.00034809112548828125, 1.0182089805603027, 2.036069869995117, 3.0539302825927734, 4.07179069519043, 5.089651584625244, 6.107512474060059, 7.125372886657715, 8.143233299255371, 9.161094665527344, 10.178955078125, 11.196815490722656, 12.214675903320312, 13.232536315917969, 14.250397682189941, 15.268258094787598, 16.286117553710938, 17.303979873657227, 18.321840286254883, 19.33970069885254, 20.357561111450195, 21.37542152404785, 22.393281936645508, 23.411144256591797, 24.429004669189453, 25.44686508178711, 26.464725494384766, 27.482585906982422, 28.500446319580078, 29.518306732177734, 30.53616714477539, 31.554027557373047, 32.5718879699707, 33.58974838256836, 34.60761260986328, 35.62547302246094, 36.643333435058594, 37.66119384765625, 38.679054260253906, 39.69691467285156, 40.71477508544922, 41.732635498046875, 42.75049591064453, 43.76835632324219]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 4.0, 6.0, 2.0, 8.0, 12.0, 12.0, 22.0, 29.0, 39.0, 60.0, 100.0, 138.0, 228.0, 411.0, 677.0, 1333.0, 2705.0, 6410.0, 17673.0, 71842.0, 470170.0, 389863.0, 60092.0, 15644.0, 5661.0, 2487.0, 1207.0, 684.0, 386.0, 238.0, 144.0, 88.0, 56.0, 43.0, 24.0, 18.0, 12.0, 14.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.41015625, -4.26287841796875, -4.1156005859375, -3.96832275390625, -3.821044921875, -3.67376708984375, -3.5264892578125, -3.37921142578125, -3.23193359375, -3.08465576171875, -2.9373779296875, -2.79010009765625, -2.642822265625, -2.49554443359375, -2.3482666015625, -2.20098876953125, -2.0537109375, -1.90643310546875, -1.7591552734375, -1.61187744140625, -1.464599609375, -1.31732177734375, -1.1700439453125, -1.02276611328125, -0.87548828125, -0.72821044921875, -0.5809326171875, -0.43365478515625, -0.286376953125, -0.13909912109375, 0.0081787109375, 0.15545654296875, 0.302734375, 0.45001220703125, 0.5972900390625, 0.74456787109375, 0.891845703125, 1.03912353515625, 1.1864013671875, 1.33367919921875, 1.48095703125, 1.62823486328125, 1.7755126953125, 1.92279052734375, 2.070068359375, 2.21734619140625, 2.3646240234375, 2.51190185546875, 2.6591796875, 2.80645751953125, 2.9537353515625, 3.10101318359375, 3.248291015625, 3.39556884765625, 3.5428466796875, 3.69012451171875, 3.83740234375, 3.98468017578125, 4.1319580078125, 4.27923583984375, 4.426513671875, 4.57379150390625, 4.7210693359375, 4.86834716796875, 5.015625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 1.0, 5.0, 13.0, 14.0, 7.0, 12.0, 11.0, 19.0, 19.0, 24.0, 34.0, 40.0, 41.0, 46.0, 45.0, 38.0, 61.0, 52.0, 60.0, 55.0, 54.0, 41.0, 48.0, 44.0, 33.0, 29.0, 24.0, 29.0, 28.0, 12.0, 11.0, 12.0, 8.0, 10.0, 4.0, 3.0, 5.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.728515625, -2.645965576171875, -2.56341552734375, -2.480865478515625, -2.3983154296875, -2.315765380859375, -2.23321533203125, -2.150665283203125, -2.068115234375, -1.985565185546875, -1.90301513671875, -1.820465087890625, -1.7379150390625, -1.655364990234375, -1.57281494140625, -1.490264892578125, -1.40771484375, -1.325164794921875, -1.24261474609375, -1.160064697265625, -1.0775146484375, -0.994964599609375, -0.91241455078125, -0.829864501953125, -0.747314453125, -0.664764404296875, -0.58221435546875, -0.499664306640625, -0.4171142578125, -0.334564208984375, -0.25201416015625, -0.169464111328125, -0.0869140625, -0.004364013671875, 0.07818603515625, 0.160736083984375, 0.2432861328125, 0.325836181640625, 0.40838623046875, 0.490936279296875, 0.573486328125, 0.656036376953125, 0.73858642578125, 0.821136474609375, 0.9036865234375, 0.986236572265625, 1.06878662109375, 1.151336669921875, 1.23388671875, 1.316436767578125, 1.39898681640625, 1.481536865234375, 1.5640869140625, 1.646636962890625, 1.72918701171875, 1.811737060546875, 1.894287109375, 1.976837158203125, 2.05938720703125, 2.141937255859375, 2.2244873046875, 2.307037353515625, 2.38958740234375, 2.472137451171875, 2.5546875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 8.0, 3.0, 4.0, 15.0, 14.0, 28.0, 44.0, 95.0, 174.0, 376.0, 1357.0, 7256.0, 150878.0, 865799.0, 19039.0, 2300.0, 645.0, 241.0, 122.0, 58.0, 42.0, 22.0, 15.0, 9.0, 2.0, 8.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.765625, -15.3529052734375, -14.940185546875, -14.5274658203125, -14.11474609375, -13.7020263671875, -13.289306640625, -12.8765869140625, -12.4638671875, -12.0511474609375, -11.638427734375, -11.2257080078125, -10.81298828125, -10.4002685546875, -9.987548828125, -9.5748291015625, -9.162109375, -8.7493896484375, -8.336669921875, -7.9239501953125, -7.51123046875, -7.0985107421875, -6.685791015625, -6.2730712890625, -5.8603515625, -5.4476318359375, -5.034912109375, -4.6221923828125, -4.20947265625, -3.7967529296875, -3.384033203125, -2.9713134765625, -2.55859375, -2.1458740234375, -1.733154296875, -1.3204345703125, -0.90771484375, -0.4949951171875, -0.082275390625, 0.3304443359375, 0.7431640625, 1.1558837890625, 1.568603515625, 1.9813232421875, 2.39404296875, 2.8067626953125, 3.219482421875, 3.6322021484375, 4.044921875, 4.4576416015625, 4.870361328125, 5.2830810546875, 5.69580078125, 6.1085205078125, 6.521240234375, 6.9339599609375, 7.3466796875, 7.7593994140625, 8.172119140625, 8.5848388671875, 8.99755859375, 9.4102783203125, 9.822998046875, 10.2357177734375, 10.6484375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 6.0, 6.0, 5.0, 6.0, 7.0, 9.0, 10.0, 10.0, 13.0, 11.0, 11.0, 22.0, 30.0, 34.0, 51.0, 45.0, 49.0, 56.0, 60.0, 64.0, 44.0, 82.0, 46.0, 49.0, 37.0, 25.0, 31.0, 43.0, 34.0, 27.0, 11.0, 12.0, 11.0, 13.0, 13.0, 7.0, 4.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.328125, -9.9840087890625, -9.639892578125, -9.2957763671875, -8.95166015625, -8.6075439453125, -8.263427734375, -7.9193115234375, -7.5751953125, -7.2310791015625, -6.886962890625, -6.5428466796875, -6.19873046875, -5.8546142578125, -5.510498046875, -5.1663818359375, -4.822265625, -4.4781494140625, -4.134033203125, -3.7899169921875, -3.44580078125, -3.1016845703125, -2.757568359375, -2.4134521484375, -2.0693359375, -1.7252197265625, -1.381103515625, -1.0369873046875, -0.69287109375, -0.3487548828125, -0.004638671875, 0.3394775390625, 0.68359375, 1.0277099609375, 1.371826171875, 1.7159423828125, 2.06005859375, 2.4041748046875, 2.748291015625, 3.0924072265625, 3.4365234375, 3.7806396484375, 4.124755859375, 4.4688720703125, 4.81298828125, 5.1571044921875, 5.501220703125, 5.8453369140625, 6.189453125, 6.5335693359375, 6.877685546875, 7.2218017578125, 7.56591796875, 7.9100341796875, 8.254150390625, 8.5982666015625, 8.9423828125, 9.2864990234375, 9.630615234375, 9.9747314453125, 10.31884765625, 10.6629638671875, 11.007080078125, 11.3511962890625, 11.6953125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 6.0, 8.0, 6.0, 10.0, 9.0, 39.0, 56.0, 123.0, 293.0, 745.0, 2308.0, 10126.0, 101846.0, 875341.0, 48387.0, 6483.0, 1725.0, 554.0, 261.0, 86.0, 56.0, 37.0, 22.0, 10.0, 8.0, 3.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.546875, -4.39715576171875, -4.2474365234375, -4.09771728515625, -3.947998046875, -3.79827880859375, -3.6485595703125, -3.49884033203125, -3.34912109375, -3.19940185546875, -3.0496826171875, -2.89996337890625, -2.750244140625, -2.60052490234375, -2.4508056640625, -2.30108642578125, -2.1513671875, -2.00164794921875, -1.8519287109375, -1.70220947265625, -1.552490234375, -1.40277099609375, -1.2530517578125, -1.10333251953125, -0.95361328125, -0.80389404296875, -0.6541748046875, -0.50445556640625, -0.354736328125, -0.20501708984375, -0.0552978515625, 0.09442138671875, 0.244140625, 0.39385986328125, 0.5435791015625, 0.69329833984375, 0.843017578125, 0.99273681640625, 1.1424560546875, 1.29217529296875, 1.44189453125, 1.59161376953125, 1.7413330078125, 1.89105224609375, 2.040771484375, 2.19049072265625, 2.3402099609375, 2.48992919921875, 2.6396484375, 2.78936767578125, 2.9390869140625, 3.08880615234375, 3.238525390625, 3.38824462890625, 3.5379638671875, 3.68768310546875, 3.83740234375, 3.98712158203125, 4.1368408203125, 4.28656005859375, 4.436279296875, 4.58599853515625, 4.7357177734375, 4.88543701171875, 5.03515625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 3.0, 4.0, 5.0, 8.0, 6.0, 11.0, 11.0, 20.0, 36.0, 67.0, 88.0, 179.0, 200.0, 136.0, 78.0, 52.0, 22.0, 20.0, 11.0, 17.0, 10.0, 5.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0010595321655273438, -0.0010268092155456543, -0.0009940862655639648, -0.0009613633155822754, -0.0009286403656005859, -0.0008959174156188965, -0.000863194465637207, -0.0008304715156555176, -0.0007977485656738281, -0.0007650256156921387, -0.0007323026657104492, -0.0006995797157287598, -0.0006668567657470703, -0.0006341338157653809, -0.0006014108657836914, -0.000568687915802002, -0.0005359649658203125, -0.000503242015838623, -0.0004705190658569336, -0.00043779611587524414, -0.0004050731658935547, -0.00037235021591186523, -0.0003396272659301758, -0.00030690431594848633, -0.0002741813659667969, -0.00024145841598510742, -0.00020873546600341797, -0.00017601251602172852, -0.00014328956604003906, -0.00011056661605834961, -7.784366607666016e-05, -4.51207160949707e-05, -1.239776611328125e-05, 2.0325183868408203e-05, 5.3048133850097656e-05, 8.577108383178711e-05, 0.00011849403381347656, 0.00015121698379516602, 0.00018393993377685547, 0.00021666288375854492, 0.0002493858337402344, 0.00028210878372192383, 0.0003148317337036133, 0.00034755468368530273, 0.0003802776336669922, 0.00041300058364868164, 0.0004457235336303711, 0.00047844648361206055, 0.00051116943359375, 0.0005438923835754395, 0.0005766153335571289, 0.0006093382835388184, 0.0006420612335205078, 0.0006747841835021973, 0.0007075071334838867, 0.0007402300834655762, 0.0007729530334472656, 0.0008056759834289551, 0.0008383989334106445, 0.000871121883392334, 0.0009038448333740234, 0.0009365677833557129, 0.0009692907333374023, 0.0010020136833190918, 0.0010347366333007812]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 3.0, 7.0, 10.0, 11.0, 16.0, 24.0, 38.0, 66.0, 98.0, 202.0, 342.0, 742.0, 1761.0, 5455.0, 23868.0, 207546.0, 743464.0, 50768.0, 9338.0, 2698.0, 1049.0, 465.0, 221.0, 124.0, 75.0, 50.0, 29.0, 30.0, 13.0, 10.0, 14.0, 2.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.05078125, -3.94189453125, -3.8330078125, -3.72412109375, -3.615234375, -3.50634765625, -3.3974609375, -3.28857421875, -3.1796875, -3.07080078125, -2.9619140625, -2.85302734375, -2.744140625, -2.63525390625, -2.5263671875, -2.41748046875, -2.30859375, -2.19970703125, -2.0908203125, -1.98193359375, -1.873046875, -1.76416015625, -1.6552734375, -1.54638671875, -1.4375, -1.32861328125, -1.2197265625, -1.11083984375, -1.001953125, -0.89306640625, -0.7841796875, -0.67529296875, -0.56640625, -0.45751953125, -0.3486328125, -0.23974609375, -0.130859375, -0.02197265625, 0.0869140625, 0.19580078125, 0.3046875, 0.41357421875, 0.5224609375, 0.63134765625, 0.740234375, 0.84912109375, 0.9580078125, 1.06689453125, 1.17578125, 1.28466796875, 1.3935546875, 1.50244140625, 1.611328125, 1.72021484375, 1.8291015625, 1.93798828125, 2.046875, 2.15576171875, 2.2646484375, 2.37353515625, 2.482421875, 2.59130859375, 2.7001953125, 2.80908203125, 2.91796875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 6.0, 6.0, 8.0, 9.0, 10.0, 10.0, 20.0, 24.0, 32.0, 51.0, 49.0, 73.0, 103.0, 108.0, 111.0, 90.0, 80.0, 55.0, 42.0, 29.0, 15.0, 13.0, 10.0, 11.0, 5.0, 8.0, 12.0, 4.0, 6.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.609375, -2.532257080078125, -2.45513916015625, -2.378021240234375, -2.3009033203125, -2.223785400390625, -2.14666748046875, -2.069549560546875, -1.992431640625, -1.915313720703125, -1.83819580078125, -1.761077880859375, -1.6839599609375, -1.606842041015625, -1.52972412109375, -1.452606201171875, -1.37548828125, -1.298370361328125, -1.22125244140625, -1.144134521484375, -1.0670166015625, -0.989898681640625, -0.91278076171875, -0.835662841796875, -0.758544921875, -0.681427001953125, -0.60430908203125, -0.527191162109375, -0.4500732421875, -0.372955322265625, -0.29583740234375, -0.218719482421875, -0.1416015625, -0.064483642578125, 0.01263427734375, 0.089752197265625, 0.1668701171875, 0.243988037109375, 0.32110595703125, 0.398223876953125, 0.475341796875, 0.552459716796875, 0.62957763671875, 0.706695556640625, 0.7838134765625, 0.860931396484375, 0.93804931640625, 1.015167236328125, 1.09228515625, 1.169403076171875, 1.24652099609375, 1.323638916015625, 1.4007568359375, 1.477874755859375, 1.55499267578125, 1.632110595703125, 1.709228515625, 1.786346435546875, 1.86346435546875, 1.940582275390625, 2.0177001953125, 2.094818115234375, 2.17193603515625, 2.249053955078125, 2.326171875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 3.0, 5.0, 13.0, 41.0, 121.0, 299.0, 294.0, 122.0, 55.0, 18.0, 16.0, 8.0, 5.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.32205963134766, -67.7159423828125, -65.10982513427734, -62.50370788574219, -59.89759063720703, -57.291473388671875, -54.685359954833984, -52.07924270629883, -49.47312545776367, -46.867008209228516, -44.26089096069336, -41.6547737121582, -39.04866027832031, -36.442543029785156, -33.83642578125, -31.230308532714844, -28.624191284179688, -26.01807403564453, -23.411956787109375, -20.80584144592285, -18.199724197387695, -15.593606948852539, -12.9874906539917, -10.38137435913086, -7.775257110595703, -5.169140338897705, -2.563023567199707, 0.043093204498291016, 2.649209976196289, 5.255327224731445, 7.861443519592285, 10.467559814453125, 13.073684692382812, 15.679801940917969, 18.285919189453125, 20.89203453063965, 23.498151779174805, 26.10426902770996, 28.710384368896484, 31.31650161743164, 33.9226188659668, 36.52873611450195, 39.13485336303711, 41.740970611572266, 44.347084045410156, 46.95320129394531, 49.55931854248047, 52.165435791015625, 54.77155303955078, 57.37767028808594, 59.983787536621094, 62.58990478515625, 65.1960220336914, 67.80213928222656, 70.40825653076172, 73.01437377929688, 75.6204833984375, 78.22660064697266, 80.83271789550781, 83.43883514404297, 86.04495239257812, 88.65106964111328, 91.25718688964844, 93.86329650878906, 96.46942138671875]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 5.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 8.0, 5.0, 5.0, 4.0, 5.0, 11.0, 7.0, 7.0, 11.0, 9.0, 19.0, 17.0, 16.0, 13.0, 22.0, 16.0, 24.0, 27.0, 34.0, 32.0, 51.0, 71.0, 96.0, 73.0, 56.0, 39.0, 33.0, 26.0, 36.0, 30.0, 18.0, 22.0, 21.0, 14.0, 23.0, 8.0, 12.0, 16.0, 7.0, 10.0, 10.0, 10.0, 7.0, 3.0, 2.0, 3.0, 3.0, 0.0, 5.0, 3.0, 1.0, 0.0, 2.0, 2.0], "bins": [-33.65734100341797, -32.637664794921875, -31.61798858642578, -30.598312377929688, -29.578636169433594, -28.5589599609375, -27.539281845092773, -26.51960563659668, -25.499929428100586, -24.480253219604492, -23.4605770111084, -22.440900802612305, -21.421222686767578, -20.401546478271484, -19.38187026977539, -18.362194061279297, -17.342517852783203, -16.32284164428711, -15.303165435791016, -14.283488273620605, -13.263812065124512, -12.244135856628418, -11.224458694458008, -10.204782485961914, -9.18510627746582, -8.165430068969727, -7.145753383636475, -6.126076698303223, -5.106400489807129, -4.086724281311035, -3.067047595977783, -2.0473709106445312, -1.0276908874511719, -0.008014440536499023, 1.0116620063781738, 2.0313384532928467, 3.0510149002075195, 4.070691108703613, 5.090367794036865, 6.110044479370117, 7.129720687866211, 8.149396896362305, 9.169073104858398, 10.188750267028809, 11.208426475524902, 12.228102684020996, 13.247779846191406, 14.2674560546875, 15.287132263183594, 16.306808471679688, 17.32648468017578, 18.346160888671875, 19.36583709716797, 20.385513305664062, 21.40519142150879, 22.424867630004883, 23.444543838500977, 24.46422004699707, 25.483896255493164, 26.503572463989258, 27.523250579833984, 28.542926788330078, 29.562602996826172, 30.582279205322266, 31.60195541381836]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 4.0, 6.0, 8.0, 8.0, 17.0, 22.0, 37.0, 48.0, 74.0, 140.0, 157.0, 317.0, 615.0, 1122.0, 2211.0, 5557.0, 20850.0, 261504.0, 3398386.0, 461030.0, 29802.0, 6726.0, 2609.0, 1322.0, 678.0, 398.0, 207.0, 150.0, 88.0, 76.0, 28.0, 28.0, 13.0, 21.0, 7.0, 6.0, 5.0, 5.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.6640625, -5.4788818359375, -5.293701171875, -5.1085205078125, -4.92333984375, -4.7381591796875, -4.552978515625, -4.3677978515625, -4.1826171875, -3.9974365234375, -3.812255859375, -3.6270751953125, -3.44189453125, -3.2567138671875, -3.071533203125, -2.8863525390625, -2.701171875, -2.5159912109375, -2.330810546875, -2.1456298828125, -1.96044921875, -1.7752685546875, -1.590087890625, -1.4049072265625, -1.2197265625, -1.0345458984375, -0.849365234375, -0.6641845703125, -0.47900390625, -0.2938232421875, -0.108642578125, 0.0765380859375, 0.26171875, 0.4468994140625, 0.632080078125, 0.8172607421875, 1.00244140625, 1.1876220703125, 1.372802734375, 1.5579833984375, 1.7431640625, 1.9283447265625, 2.113525390625, 2.2987060546875, 2.48388671875, 2.6690673828125, 2.854248046875, 3.0394287109375, 3.224609375, 3.4097900390625, 3.594970703125, 3.7801513671875, 3.96533203125, 4.1505126953125, 4.335693359375, 4.5208740234375, 4.7060546875, 4.8912353515625, 5.076416015625, 5.2615966796875, 5.44677734375, 5.6319580078125, 5.817138671875, 6.0023193359375, 6.1875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 5.0, 4.0, 7.0, 8.0, 17.0, 15.0, 20.0, 19.0, 41.0, 45.0, 27.0, 55.0, 56.0, 50.0, 61.0, 58.0, 71.0, 62.0, 51.0, 57.0, 54.0, 43.0, 30.0, 28.0, 25.0, 22.0, 16.0, 16.0, 14.0, 9.0, 5.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.158203125, -3.0648193359375, -2.971435546875, -2.8780517578125, -2.78466796875, -2.6912841796875, -2.597900390625, -2.5045166015625, -2.4111328125, -2.3177490234375, -2.224365234375, -2.1309814453125, -2.03759765625, -1.9442138671875, -1.850830078125, -1.7574462890625, -1.6640625, -1.5706787109375, -1.477294921875, -1.3839111328125, -1.29052734375, -1.1971435546875, -1.103759765625, -1.0103759765625, -0.9169921875, -0.8236083984375, -0.730224609375, -0.6368408203125, -0.54345703125, -0.4500732421875, -0.356689453125, -0.2633056640625, -0.169921875, -0.0765380859375, 0.016845703125, 0.1102294921875, 0.20361328125, 0.2969970703125, 0.390380859375, 0.4837646484375, 0.5771484375, 0.6705322265625, 0.763916015625, 0.8572998046875, 0.95068359375, 1.0440673828125, 1.137451171875, 1.2308349609375, 1.32421875, 1.4176025390625, 1.510986328125, 1.6043701171875, 1.69775390625, 1.7911376953125, 1.884521484375, 1.9779052734375, 2.0712890625, 2.1646728515625, 2.258056640625, 2.3514404296875, 2.44482421875, 2.5382080078125, 2.631591796875, 2.7249755859375, 2.818359375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 6.0, 6.0, 8.0, 14.0, 27.0, 40.0, 68.0, 130.0, 351.0, 1172.0, 5189.0, 49088.0, 3975226.0, 151468.0, 8923.0, 1685.0, 486.0, 169.0, 84.0, 66.0, 23.0, 22.0, 13.0, 7.0, 5.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.8984375, -14.4556884765625, -14.012939453125, -13.5701904296875, -13.12744140625, -12.6846923828125, -12.241943359375, -11.7991943359375, -11.3564453125, -10.9136962890625, -10.470947265625, -10.0281982421875, -9.58544921875, -9.1427001953125, -8.699951171875, -8.2572021484375, -7.814453125, -7.3717041015625, -6.928955078125, -6.4862060546875, -6.04345703125, -5.6007080078125, -5.157958984375, -4.7152099609375, -4.2724609375, -3.8297119140625, -3.386962890625, -2.9442138671875, -2.50146484375, -2.0587158203125, -1.615966796875, -1.1732177734375, -0.73046875, -0.2877197265625, 0.155029296875, 0.5977783203125, 1.04052734375, 1.4832763671875, 1.926025390625, 2.3687744140625, 2.8115234375, 3.2542724609375, 3.697021484375, 4.1397705078125, 4.58251953125, 5.0252685546875, 5.468017578125, 5.9107666015625, 6.353515625, 6.7962646484375, 7.239013671875, 7.6817626953125, 8.12451171875, 8.5672607421875, 9.010009765625, 9.4527587890625, 9.8955078125, 10.3382568359375, 10.781005859375, 11.2237548828125, 11.66650390625, 12.1092529296875, 12.552001953125, 12.9947509765625, 13.4375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 6.0, 6.0, 16.0, 18.0, 19.0, 36.0, 53.0, 83.0, 160.0, 355.0, 793.0, 1229.0, 684.0, 300.0, 128.0, 59.0, 39.0, 26.0, 17.0, 8.0, 10.0, 6.0, 7.0, 2.0, 4.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.1328125, -6.8402099609375, -6.547607421875, -6.2550048828125, -5.96240234375, -5.6697998046875, -5.377197265625, -5.0845947265625, -4.7919921875, -4.4993896484375, -4.206787109375, -3.9141845703125, -3.62158203125, -3.3289794921875, -3.036376953125, -2.7437744140625, -2.451171875, -2.1585693359375, -1.865966796875, -1.5733642578125, -1.28076171875, -0.9881591796875, -0.695556640625, -0.4029541015625, -0.1103515625, 0.1822509765625, 0.474853515625, 0.7674560546875, 1.06005859375, 1.3526611328125, 1.645263671875, 1.9378662109375, 2.23046875, 2.5230712890625, 2.815673828125, 3.1082763671875, 3.40087890625, 3.6934814453125, 3.986083984375, 4.2786865234375, 4.5712890625, 4.8638916015625, 5.156494140625, 5.4490966796875, 5.74169921875, 6.0343017578125, 6.326904296875, 6.6195068359375, 6.912109375, 7.2047119140625, 7.497314453125, 7.7899169921875, 8.08251953125, 8.3751220703125, 8.667724609375, 8.9603271484375, 9.2529296875, 9.5455322265625, 9.838134765625, 10.1307373046875, 10.42333984375, 10.7159423828125, 11.008544921875, 11.3011474609375, 11.59375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 2.0, 7.0, 6.0, 19.0, 15.0, 35.0, 70.0, 98.0, 165.0, 179.0, 149.0, 97.0, 63.0, 30.0, 27.0, 13.0, 10.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.25990295410156, -46.7340087890625, -45.20811462402344, -43.68222427368164, -42.15633010864258, -40.630435943603516, -39.10454559326172, -37.578651428222656, -36.052757263183594, -34.52686309814453, -33.00096893310547, -31.475078582763672, -29.94918441772461, -28.423290252685547, -26.897397994995117, -25.371505737304688, -23.845611572265625, -22.319717407226562, -20.793825149536133, -19.267932891845703, -17.74203872680664, -16.216144561767578, -14.690252304077148, -13.164359092712402, -11.638465881347656, -10.11257266998291, -8.586679458618164, -7.060786247253418, -5.534893035888672, -4.008999824523926, -2.4831066131591797, -0.9572134017944336, 0.5686798095703125, 2.0945730209350586, 3.6204662322998047, 5.146359443664551, 6.672252655029297, 8.198145866394043, 9.724039077758789, 11.249932289123535, 12.775825500488281, 14.301718711853027, 15.827611923217773, 17.353504180908203, 18.879398345947266, 20.405292510986328, 21.931184768676758, 23.457077026367188, 24.98297119140625, 26.508865356445312, 28.034757614135742, 29.560649871826172, 31.086544036865234, 32.6124382019043, 34.138328552246094, 35.664222717285156, 37.19011688232422, 38.71601104736328, 40.241905212402344, 41.76779556274414, 43.2936897277832, 44.819583892822266, 46.34547424316406, 47.871368408203125, 49.39726257324219]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 2.0, 5.0, 3.0, 5.0, 11.0, 7.0, 14.0, 4.0, 11.0, 13.0, 19.0, 27.0, 27.0, 29.0, 35.0, 44.0, 39.0, 45.0, 62.0, 55.0, 51.0, 60.0, 43.0, 54.0, 56.0, 49.0, 39.0, 29.0, 27.0, 20.0, 22.0, 20.0, 15.0, 18.0, 9.0, 12.0, 7.0, 6.0, 5.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-30.790239334106445, -29.869121551513672, -28.948001861572266, -28.026884078979492, -27.10576629638672, -26.184648513793945, -25.263530731201172, -24.342411041259766, -23.421293258666992, -22.50017547607422, -21.579055786132812, -20.65793800354004, -19.736820220947266, -18.815702438354492, -17.89458465576172, -16.973464965820312, -16.05234718322754, -15.131229400634766, -14.210110664367676, -13.288991928100586, -12.367874145507812, -11.446756362915039, -10.52563762664795, -9.60451889038086, -8.683401107788086, -7.762282848358154, -6.841164588928223, -5.920046329498291, -4.998928070068359, -4.077809810638428, -3.156691551208496, -2.2355732917785645, -1.314453125, -0.39333486557006836, 0.5277833938598633, 1.448901653289795, 2.3700199127197266, 3.291138172149658, 4.21225643157959, 5.1333746910095215, 6.054492950439453, 6.975611209869385, 7.896729469299316, 8.817848205566406, 9.73896598815918, 10.660083770751953, 11.581202507019043, 12.502321243286133, 13.423439025878906, 14.34455680847168, 15.26567554473877, 16.18679428100586, 17.107912063598633, 18.029029846191406, 18.950149536132812, 19.871267318725586, 20.79238510131836, 21.713502883911133, 22.634620666503906, 23.555740356445312, 24.476858139038086, 25.39797592163086, 26.319095611572266, 27.24021339416504, 28.161331176757812]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 9.0, 12.0, 15.0, 13.0, 27.0, 31.0, 64.0, 87.0, 129.0, 196.0, 307.0, 617.0, 1211.0, 2646.0, 6992.0, 22305.0, 94906.0, 576465.0, 273522.0, 47461.0, 13106.0, 4502.0, 1859.0, 859.0, 443.0, 273.0, 158.0, 97.0, 71.0, 44.0, 29.0, 33.0, 19.0, 16.0, 9.0, 5.0, 6.0, 5.0, 4.0, 1.0, 3.0, 1.0], "bins": [-6.65234375, -6.485107421875, -6.31787109375, -6.150634765625, -5.9833984375, -5.816162109375, -5.64892578125, -5.481689453125, -5.314453125, -5.147216796875, -4.97998046875, -4.812744140625, -4.6455078125, -4.478271484375, -4.31103515625, -4.143798828125, -3.9765625, -3.809326171875, -3.64208984375, -3.474853515625, -3.3076171875, -3.140380859375, -2.97314453125, -2.805908203125, -2.638671875, -2.471435546875, -2.30419921875, -2.136962890625, -1.9697265625, -1.802490234375, -1.63525390625, -1.468017578125, -1.30078125, -1.133544921875, -0.96630859375, -0.799072265625, -0.6318359375, -0.464599609375, -0.29736328125, -0.130126953125, 0.037109375, 0.204345703125, 0.37158203125, 0.538818359375, 0.7060546875, 0.873291015625, 1.04052734375, 1.207763671875, 1.375, 1.542236328125, 1.70947265625, 1.876708984375, 2.0439453125, 2.211181640625, 2.37841796875, 2.545654296875, 2.712890625, 2.880126953125, 3.04736328125, 3.214599609375, 3.3818359375, 3.549072265625, 3.71630859375, 3.883544921875, 4.05078125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 4.0, 6.0, 4.0, 12.0, 11.0, 13.0, 16.0, 20.0, 17.0, 26.0, 39.0, 51.0, 36.0, 56.0, 67.0, 52.0, 78.0, 66.0, 55.0, 55.0, 47.0, 45.0, 36.0, 34.0, 39.0, 24.0, 22.0, 26.0, 11.0, 9.0, 8.0, 7.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.7890625, -3.686309814453125, -3.58355712890625, -3.480804443359375, -3.3780517578125, -3.275299072265625, -3.17254638671875, -3.069793701171875, -2.967041015625, -2.864288330078125, -2.76153564453125, -2.658782958984375, -2.5560302734375, -2.453277587890625, -2.35052490234375, -2.247772216796875, -2.14501953125, -2.042266845703125, -1.93951416015625, -1.836761474609375, -1.7340087890625, -1.631256103515625, -1.52850341796875, -1.425750732421875, -1.322998046875, -1.220245361328125, -1.11749267578125, -1.014739990234375, -0.9119873046875, -0.809234619140625, -0.70648193359375, -0.603729248046875, -0.5009765625, -0.398223876953125, -0.29547119140625, -0.192718505859375, -0.0899658203125, 0.012786865234375, 0.11553955078125, 0.218292236328125, 0.321044921875, 0.423797607421875, 0.52655029296875, 0.629302978515625, 0.7320556640625, 0.834808349609375, 0.93756103515625, 1.040313720703125, 1.14306640625, 1.245819091796875, 1.34857177734375, 1.451324462890625, 1.5540771484375, 1.656829833984375, 1.75958251953125, 1.862335205078125, 1.965087890625, 2.067840576171875, 2.17059326171875, 2.273345947265625, 2.3760986328125, 2.478851318359375, 2.58160400390625, 2.684356689453125, 2.787109375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 6.0, 6.0, 8.0, 12.0, 23.0, 36.0, 50.0, 97.0, 159.0, 365.0, 829.0, 2603.0, 13076.0, 260447.0, 747481.0, 18541.0, 3128.0, 912.0, 392.0, 159.0, 95.0, 39.0, 30.0, 18.0, 13.0, 11.0, 8.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.90625, -9.5404052734375, -9.174560546875, -8.8087158203125, -8.44287109375, -8.0770263671875, -7.711181640625, -7.3453369140625, -6.9794921875, -6.6136474609375, -6.247802734375, -5.8819580078125, -5.51611328125, -5.1502685546875, -4.784423828125, -4.4185791015625, -4.052734375, -3.6868896484375, -3.321044921875, -2.9552001953125, -2.58935546875, -2.2235107421875, -1.857666015625, -1.4918212890625, -1.1259765625, -0.7601318359375, -0.394287109375, -0.0284423828125, 0.33740234375, 0.7032470703125, 1.069091796875, 1.4349365234375, 1.80078125, 2.1666259765625, 2.532470703125, 2.8983154296875, 3.26416015625, 3.6300048828125, 3.995849609375, 4.3616943359375, 4.7275390625, 5.0933837890625, 5.459228515625, 5.8250732421875, 6.19091796875, 6.5567626953125, 6.922607421875, 7.2884521484375, 7.654296875, 8.0201416015625, 8.385986328125, 8.7518310546875, 9.11767578125, 9.4835205078125, 9.849365234375, 10.2152099609375, 10.5810546875, 10.9468994140625, 11.312744140625, 11.6785888671875, 12.04443359375, 12.4102783203125, 12.776123046875, 13.1419677734375, 13.5078125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 4.0, 3.0, 8.0, 4.0, 9.0, 11.0, 18.0, 21.0, 23.0, 40.0, 59.0, 52.0, 77.0, 80.0, 83.0, 83.0, 86.0, 69.0, 76.0, 47.0, 38.0, 30.0, 24.0, 22.0, 18.0, 16.0, 7.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.6875, -16.137939453125, -15.58837890625, -15.038818359375, -14.4892578125, -13.939697265625, -13.39013671875, -12.840576171875, -12.291015625, -11.741455078125, -11.19189453125, -10.642333984375, -10.0927734375, -9.543212890625, -8.99365234375, -8.444091796875, -7.89453125, -7.344970703125, -6.79541015625, -6.245849609375, -5.6962890625, -5.146728515625, -4.59716796875, -4.047607421875, -3.498046875, -2.948486328125, -2.39892578125, -1.849365234375, -1.2998046875, -0.750244140625, -0.20068359375, 0.348876953125, 0.8984375, 1.447998046875, 1.99755859375, 2.547119140625, 3.0966796875, 3.646240234375, 4.19580078125, 4.745361328125, 5.294921875, 5.844482421875, 6.39404296875, 6.943603515625, 7.4931640625, 8.042724609375, 8.59228515625, 9.141845703125, 9.69140625, 10.240966796875, 10.79052734375, 11.340087890625, 11.8896484375, 12.439208984375, 12.98876953125, 13.538330078125, 14.087890625, 14.637451171875, 15.18701171875, 15.736572265625, 16.2861328125, 16.835693359375, 17.38525390625, 17.934814453125, 18.484375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 4.0, 2.0, 9.0, 15.0, 10.0, 17.0, 24.0, 47.0, 59.0, 60.0, 108.0, 177.0, 244.0, 430.0, 783.0, 1499.0, 3189.0, 8368.0, 33483.0, 720089.0, 244444.0, 23119.0, 6585.0, 2670.0, 1276.0, 729.0, 416.0, 232.0, 150.0, 94.0, 73.0, 44.0, 41.0, 12.0, 15.0, 13.0, 10.0, 5.0, 5.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.634765625, -2.546630859375, -2.45849609375, -2.370361328125, -2.2822265625, -2.194091796875, -2.10595703125, -2.017822265625, -1.9296875, -1.841552734375, -1.75341796875, -1.665283203125, -1.5771484375, -1.489013671875, -1.40087890625, -1.312744140625, -1.224609375, -1.136474609375, -1.04833984375, -0.960205078125, -0.8720703125, -0.783935546875, -0.69580078125, -0.607666015625, -0.51953125, -0.431396484375, -0.34326171875, -0.255126953125, -0.1669921875, -0.078857421875, 0.00927734375, 0.097412109375, 0.185546875, 0.273681640625, 0.36181640625, 0.449951171875, 0.5380859375, 0.626220703125, 0.71435546875, 0.802490234375, 0.890625, 0.978759765625, 1.06689453125, 1.155029296875, 1.2431640625, 1.331298828125, 1.41943359375, 1.507568359375, 1.595703125, 1.683837890625, 1.77197265625, 1.860107421875, 1.9482421875, 2.036376953125, 2.12451171875, 2.212646484375, 2.30078125, 2.388916015625, 2.47705078125, 2.565185546875, 2.6533203125, 2.741455078125, 2.82958984375, 2.917724609375, 3.005859375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 6.0, 3.0, 13.0, 25.0, 47.0, 71.0, 220.0, 365.0, 138.0, 49.0, 23.0, 16.0, 12.0, 3.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0017557144165039062, -0.0017045289278030396, -0.0016533434391021729, -0.0016021579504013062, -0.0015509724617004395, -0.0014997869729995728, -0.001448601484298706, -0.0013974159955978394, -0.0013462305068969727, -0.001295045018196106, -0.0012438595294952393, -0.0011926740407943726, -0.0011414885520935059, -0.0010903030633926392, -0.0010391175746917725, -0.0009879320859909058, -0.0009367465972900391, -0.0008855611085891724, -0.0008343756198883057, -0.000783190131187439, -0.0007320046424865723, -0.0006808191537857056, -0.0006296336650848389, -0.0005784481763839722, -0.0005272626876831055, -0.00047607719898223877, -0.00042489171028137207, -0.00037370622158050537, -0.00032252073287963867, -0.00027133524417877197, -0.00022014975547790527, -0.00016896426677703857, -0.00011777877807617188, -6.659328937530518e-05, -1.5407800674438477e-05, 3.577768802642822e-05, 8.696317672729492e-05, 0.00013814866542816162, 0.00018933415412902832, 0.00024051964282989502, 0.0002917051315307617, 0.0003428906202316284, 0.0003940761089324951, 0.0004452615976333618, 0.0004964470863342285, 0.0005476325750350952, 0.0005988180637359619, 0.0006500035524368286, 0.0007011890411376953, 0.000752374529838562, 0.0008035600185394287, 0.0008547455072402954, 0.0009059309959411621, 0.0009571164846420288, 0.0010083019733428955, 0.0010594874620437622, 0.001110672950744629, 0.0011618584394454956, 0.0012130439281463623, 0.001264229416847229, 0.0013154149055480957, 0.0013666003942489624, 0.001417785882949829, 0.0014689713716506958, 0.0015201568603515625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 5.0, 6.0, 11.0, 17.0, 13.0, 28.0, 52.0, 81.0, 155.0, 293.0, 660.0, 1587.0, 6692.0, 55838.0, 900323.0, 71881.0, 7724.0, 1869.0, 638.0, 290.0, 154.0, 86.0, 42.0, 35.0, 18.0, 12.0, 7.0, 9.0, 9.0, 4.0, 4.0, 5.0, 4.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.0625, -3.9337158203125, -3.804931640625, -3.6761474609375, -3.54736328125, -3.4185791015625, -3.289794921875, -3.1610107421875, -3.0322265625, -2.9034423828125, -2.774658203125, -2.6458740234375, -2.51708984375, -2.3883056640625, -2.259521484375, -2.1307373046875, -2.001953125, -1.8731689453125, -1.744384765625, -1.6156005859375, -1.48681640625, -1.3580322265625, -1.229248046875, -1.1004638671875, -0.9716796875, -0.8428955078125, -0.714111328125, -0.5853271484375, -0.45654296875, -0.3277587890625, -0.198974609375, -0.0701904296875, 0.05859375, 0.1873779296875, 0.316162109375, 0.4449462890625, 0.57373046875, 0.7025146484375, 0.831298828125, 0.9600830078125, 1.0888671875, 1.2176513671875, 1.346435546875, 1.4752197265625, 1.60400390625, 1.7327880859375, 1.861572265625, 1.9903564453125, 2.119140625, 2.2479248046875, 2.376708984375, 2.5054931640625, 2.63427734375, 2.7630615234375, 2.891845703125, 3.0206298828125, 3.1494140625, 3.2781982421875, 3.406982421875, 3.5357666015625, 3.66455078125, 3.7933349609375, 3.922119140625, 4.0509033203125, 4.1796875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 4.0, 4.0, 5.0, 6.0, 4.0, 7.0, 5.0, 7.0, 18.0, 25.0, 45.0, 71.0, 92.0, 144.0, 178.0, 120.0, 84.0, 73.0, 38.0, 23.0, 12.0, 9.0, 12.0, 5.0, 4.0, 2.0, 3.0, 5.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.7109375, -2.6043701171875, -2.497802734375, -2.3912353515625, -2.28466796875, -2.1781005859375, -2.071533203125, -1.9649658203125, -1.8583984375, -1.7518310546875, -1.645263671875, -1.5386962890625, -1.43212890625, -1.3255615234375, -1.218994140625, -1.1124267578125, -1.005859375, -0.8992919921875, -0.792724609375, -0.6861572265625, -0.57958984375, -0.4730224609375, -0.366455078125, -0.2598876953125, -0.1533203125, -0.0467529296875, 0.059814453125, 0.1663818359375, 0.27294921875, 0.3795166015625, 0.486083984375, 0.5926513671875, 0.69921875, 0.8057861328125, 0.912353515625, 1.0189208984375, 1.12548828125, 1.2320556640625, 1.338623046875, 1.4451904296875, 1.5517578125, 1.6583251953125, 1.764892578125, 1.8714599609375, 1.97802734375, 2.0845947265625, 2.191162109375, 2.2977294921875, 2.404296875, 2.5108642578125, 2.617431640625, 2.7239990234375, 2.83056640625, 2.9371337890625, 3.043701171875, 3.1502685546875, 3.2568359375, 3.3634033203125, 3.469970703125, 3.5765380859375, 3.68310546875, 3.7896728515625, 3.896240234375, 4.0028076171875, 4.109375]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 7.0, 37.0, 95.0, 539.0, 223.0, 62.0, 19.0, 6.0, 7.0, 5.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-150.8167266845703, -146.924560546875, -143.03240966796875, -139.14024353027344, -135.24807739257812, -131.35592651367188, -127.46376037597656, -123.57160186767578, -119.679443359375, -115.78728485107422, -111.89512634277344, -108.00296020507812, -104.11080169677734, -100.21864318847656, -96.32647705078125, -92.43431854248047, -88.54216003417969, -84.6500015258789, -80.75784301757812, -76.86567687988281, -72.97351837158203, -69.08135986328125, -65.18919372558594, -61.297035217285156, -57.404876708984375, -53.512718200683594, -49.62055587768555, -45.7283935546875, -41.83623504638672, -37.94407653808594, -34.05191421508789, -30.159753799438477, -26.267601013183594, -22.37544059753418, -18.483280181884766, -14.591119766235352, -10.698959350585938, -6.806798934936523, -2.9146385192871094, 0.9775218963623047, 4.869682312011719, 8.761842727661133, 12.654003143310547, 16.54616355895996, 20.438323974609375, 24.33048439025879, 28.222644805908203, 32.11480712890625, 36.00696563720703, 39.89912414550781, 43.79128646850586, 47.683448791503906, 51.57560729980469, 55.46776580810547, 59.359928131103516, 63.25209045410156, 67.14424896240234, 71.03640747070312, 74.92857360839844, 78.82073211669922, 82.712890625, 86.60504913330078, 90.49720764160156, 94.38937377929688, 98.28153228759766]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 3.0, 1.0, 3.0, 1.0, 6.0, 11.0, 13.0, 4.0, 10.0, 13.0, 12.0, 17.0, 27.0, 26.0, 26.0, 36.0, 27.0, 39.0, 46.0, 68.0, 143.0, 115.0, 67.0, 43.0, 34.0, 23.0, 23.0, 25.0, 22.0, 21.0, 17.0, 13.0, 15.0, 11.0, 5.0, 10.0, 7.0, 4.0, 6.0, 7.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-43.199832916259766, -41.7989616394043, -40.39809036254883, -38.997222900390625, -37.596351623535156, -36.19548034667969, -34.79460906982422, -33.39373779296875, -31.992868423461914, -30.591997146606445, -29.19112777709961, -27.79025650024414, -26.389385223388672, -24.988515853881836, -23.587644577026367, -22.18677520751953, -20.785903930664062, -19.385032653808594, -17.984163284301758, -16.58329200744629, -15.182421684265137, -13.781551361083984, -12.380680084228516, -10.979809761047363, -9.578939437866211, -8.178069114685059, -6.777198314666748, -5.3763275146484375, -3.975457191467285, -2.574586868286133, -1.173715591430664, 0.22715473175048828, 1.628021240234375, 3.0288918018341064, 4.429762363433838, 5.830633163452148, 7.231503486633301, 8.632373809814453, 10.033245086669922, 11.434115409851074, 12.834985733032227, 14.235856056213379, 15.636726379394531, 17.03759765625, 18.43846893310547, 19.839338302612305, 21.240209579467773, 22.64107894897461, 24.041950225830078, 25.442821502685547, 26.843690872192383, 28.24456214904785, 29.645431518554688, 31.046302795410156, 32.447174072265625, 33.848045349121094, 35.24891662597656, 36.64978790283203, 38.0506591796875, 39.45153045654297, 40.85239791870117, 42.25326919555664, 43.65414047241211, 45.05501174926758, 46.45587921142578]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 3.0, 3.0, 6.0, 6.0, 8.0, 4.0, 13.0, 16.0, 22.0, 31.0, 45.0, 43.0, 66.0, 110.0, 137.0, 221.0, 304.0, 493.0, 766.0, 1168.0, 1893.0, 3049.0, 5615.0, 11511.0, 28368.0, 98577.0, 488528.0, 1982334.0, 1222081.0, 251768.0, 57516.0, 19405.0, 8823.0, 4359.0, 2535.0, 1546.0, 962.0, 594.0, 439.0, 240.0, 220.0, 133.0, 105.0, 71.0, 52.0, 24.0, 27.0, 14.0, 10.0, 13.0, 2.0, 1.0, 3.0, 3.0, 2.0, 4.0, 3.0], "bins": [-4.515625, -4.3858642578125, -4.256103515625, -4.1263427734375, -3.99658203125, -3.8668212890625, -3.737060546875, -3.6072998046875, -3.4775390625, -3.3477783203125, -3.218017578125, -3.0882568359375, -2.95849609375, -2.8287353515625, -2.698974609375, -2.5692138671875, -2.439453125, -2.3096923828125, -2.179931640625, -2.0501708984375, -1.92041015625, -1.7906494140625, -1.660888671875, -1.5311279296875, -1.4013671875, -1.2716064453125, -1.141845703125, -1.0120849609375, -0.88232421875, -0.7525634765625, -0.622802734375, -0.4930419921875, -0.36328125, -0.2335205078125, -0.103759765625, 0.0260009765625, 0.15576171875, 0.2855224609375, 0.415283203125, 0.5450439453125, 0.6748046875, 0.8045654296875, 0.934326171875, 1.0640869140625, 1.19384765625, 1.3236083984375, 1.453369140625, 1.5831298828125, 1.712890625, 1.8426513671875, 1.972412109375, 2.1021728515625, 2.23193359375, 2.3616943359375, 2.491455078125, 2.6212158203125, 2.7509765625, 2.8807373046875, 3.010498046875, 3.1402587890625, 3.27001953125, 3.3997802734375, 3.529541015625, 3.6593017578125, 3.7890625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 1.0, 6.0, 10.0, 8.0, 12.0, 11.0, 12.0, 10.0, 15.0, 14.0, 33.0, 24.0, 30.0, 31.0, 37.0, 51.0, 45.0, 43.0, 32.0, 37.0, 43.0, 41.0, 36.0, 40.0, 47.0, 44.0, 36.0, 29.0, 29.0, 27.0, 16.0, 18.0, 18.0, 12.0, 23.0, 11.0, 10.0, 14.0, 13.0, 8.0, 8.0, 7.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.84765625, -1.779205322265625, -1.71075439453125, -1.642303466796875, -1.5738525390625, -1.505401611328125, -1.43695068359375, -1.368499755859375, -1.300048828125, -1.231597900390625, -1.16314697265625, -1.094696044921875, -1.0262451171875, -0.957794189453125, -0.88934326171875, -0.820892333984375, -0.75244140625, -0.683990478515625, -0.61553955078125, -0.547088623046875, -0.4786376953125, -0.410186767578125, -0.34173583984375, -0.273284912109375, -0.204833984375, -0.136383056640625, -0.06793212890625, 0.000518798828125, 0.0689697265625, 0.137420654296875, 0.20587158203125, 0.274322509765625, 0.3427734375, 0.411224365234375, 0.47967529296875, 0.548126220703125, 0.6165771484375, 0.685028076171875, 0.75347900390625, 0.821929931640625, 0.890380859375, 0.958831787109375, 1.02728271484375, 1.095733642578125, 1.1641845703125, 1.232635498046875, 1.30108642578125, 1.369537353515625, 1.43798828125, 1.506439208984375, 1.57489013671875, 1.643341064453125, 1.7117919921875, 1.780242919921875, 1.84869384765625, 1.917144775390625, 1.985595703125, 2.054046630859375, 2.12249755859375, 2.190948486328125, 2.2593994140625, 2.327850341796875, 2.39630126953125, 2.464752197265625, 2.533203125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 7.0, 6.0, 9.0, 12.0, 14.0, 15.0, 33.0, 61.0, 77.0, 110.0, 229.0, 392.0, 770.0, 2095.0, 8903.0, 127516.0, 3975359.0, 69120.0, 6357.0, 1664.0, 663.0, 336.0, 179.0, 119.0, 74.0, 51.0, 29.0, 30.0, 13.0, 12.0, 2.0, 7.0, 8.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-18.265625, -17.684326171875, -17.10302734375, -16.521728515625, -15.9404296875, -15.359130859375, -14.77783203125, -14.196533203125, -13.615234375, -13.033935546875, -12.45263671875, -11.871337890625, -11.2900390625, -10.708740234375, -10.12744140625, -9.546142578125, -8.96484375, -8.383544921875, -7.80224609375, -7.220947265625, -6.6396484375, -6.058349609375, -5.47705078125, -4.895751953125, -4.314453125, -3.733154296875, -3.15185546875, -2.570556640625, -1.9892578125, -1.407958984375, -0.82666015625, -0.245361328125, 0.3359375, 0.917236328125, 1.49853515625, 2.079833984375, 2.6611328125, 3.242431640625, 3.82373046875, 4.405029296875, 4.986328125, 5.567626953125, 6.14892578125, 6.730224609375, 7.3115234375, 7.892822265625, 8.47412109375, 9.055419921875, 9.63671875, 10.218017578125, 10.79931640625, 11.380615234375, 11.9619140625, 12.543212890625, 13.12451171875, 13.705810546875, 14.287109375, 14.868408203125, 15.44970703125, 16.031005859375, 16.6123046875, 17.193603515625, 17.77490234375, 18.356201171875, 18.9375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 2.0, 10.0, 12.0, 9.0, 19.0, 21.0, 40.0, 46.0, 58.0, 73.0, 104.0, 166.0, 274.0, 456.0, 686.0, 746.0, 474.0, 284.0, 160.0, 129.0, 97.0, 52.0, 44.0, 30.0, 22.0, 14.0, 9.0, 9.0, 6.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.515625, -10.19775390625, -9.8798828125, -9.56201171875, -9.244140625, -8.92626953125, -8.6083984375, -8.29052734375, -7.97265625, -7.65478515625, -7.3369140625, -7.01904296875, -6.701171875, -6.38330078125, -6.0654296875, -5.74755859375, -5.4296875, -5.11181640625, -4.7939453125, -4.47607421875, -4.158203125, -3.84033203125, -3.5224609375, -3.20458984375, -2.88671875, -2.56884765625, -2.2509765625, -1.93310546875, -1.615234375, -1.29736328125, -0.9794921875, -0.66162109375, -0.34375, -0.02587890625, 0.2919921875, 0.60986328125, 0.927734375, 1.24560546875, 1.5634765625, 1.88134765625, 2.19921875, 2.51708984375, 2.8349609375, 3.15283203125, 3.470703125, 3.78857421875, 4.1064453125, 4.42431640625, 4.7421875, 5.06005859375, 5.3779296875, 5.69580078125, 6.013671875, 6.33154296875, 6.6494140625, 6.96728515625, 7.28515625, 7.60302734375, 7.9208984375, 8.23876953125, 8.556640625, 8.87451171875, 9.1923828125, 9.51025390625, 9.828125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 8.0, 5.0, 3.0, 9.0, 15.0, 30.0, 91.0, 187.0, 278.0, 183.0, 115.0, 33.0, 27.0, 15.0, 5.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-130.67697143554688, -125.78134155273438, -120.88571166992188, -115.99007415771484, -111.09444427490234, -106.19881439208984, -101.30317687988281, -96.40754699707031, -91.51191711425781, -86.61628723144531, -81.72065734863281, -76.82501983642578, -71.92938995361328, -67.03376007080078, -62.138126373291016, -57.24249267578125, -52.34686279296875, -47.45123291015625, -42.555599212646484, -37.65996551513672, -32.76433563232422, -27.868703842163086, -22.973072052001953, -18.077438354492188, -13.181808471679688, -8.286176681518555, -3.390544891357422, 1.505086898803711, 6.400718688964844, 11.296350479125977, 16.19198226928711, 21.087615966796875, 25.983261108398438, 30.87889289855957, 35.7745246887207, 40.67015838623047, 45.56578826904297, 50.46141815185547, 55.357051849365234, 60.252685546875, 65.1483154296875, 70.0439453125, 74.9395751953125, 79.83521270751953, 84.73084259033203, 89.62647247314453, 94.52210998535156, 99.41773986816406, 104.31336975097656, 109.20899963378906, 114.10462951660156, 119.0002670288086, 123.8958969116211, 128.79153442382812, 133.68716430664062, 138.58279418945312, 143.47842407226562, 148.37405395507812, 153.26968383789062, 158.16531372070312, 163.06094360351562, 167.9565887451172, 172.8522186279297, 177.7478485107422, 182.6434783935547]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 7.0, 3.0, 2.0, 6.0, 7.0, 12.0, 4.0, 11.0, 14.0, 14.0, 27.0, 33.0, 29.0, 28.0, 34.0, 35.0, 46.0, 55.0, 48.0, 70.0, 42.0, 62.0, 55.0, 44.0, 40.0, 38.0, 30.0, 29.0, 32.0, 25.0, 24.0, 18.0, 23.0, 16.0, 9.0, 14.0, 2.0, 4.0, 3.0, 2.0, 4.0, 1.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.880672454833984, -55.204959869384766, -53.52924728393555, -51.85353469848633, -50.177818298339844, -48.502105712890625, -46.826393127441406, -45.15068054199219, -43.47496795654297, -41.79925537109375, -40.12354278564453, -38.44783020019531, -36.772117614746094, -35.096405029296875, -33.42068862915039, -31.744976043701172, -30.069263458251953, -28.393550872802734, -26.717838287353516, -25.042123794555664, -23.366411209106445, -21.690698623657227, -20.014984130859375, -18.339271545410156, -16.663558959960938, -14.987846374511719, -13.312132835388184, -11.636419296264648, -9.96070671081543, -8.284994125366211, -6.609280586242676, -4.933567047119141, -3.257854461669922, -1.582141399383545, 0.09357166290283203, 1.769284725189209, 3.444997787475586, 5.120710372924805, 6.79642391204834, 8.472137451171875, 10.147850036621094, 11.823562622070312, 13.499276161193848, 15.174989700317383, 16.8507022857666, 18.52641487121582, 20.202129364013672, 21.87784194946289, 23.55355453491211, 25.229267120361328, 26.904979705810547, 28.5806941986084, 30.256406784057617, 31.932119369506836, 33.60783386230469, 35.283546447753906, 36.959259033203125, 38.634971618652344, 40.31068420410156, 41.98639678955078, 43.662109375, 45.33782196044922, 47.0135383605957, 48.68925094604492, 50.36496353149414]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 3.0, 6.0, 5.0, 13.0, 6.0, 22.0, 16.0, 33.0, 46.0, 83.0, 115.0, 184.0, 344.0, 647.0, 1251.0, 2597.0, 6626.0, 20383.0, 86520.0, 608359.0, 256746.0, 43906.0, 12405.0, 4373.0, 1850.0, 879.0, 451.0, 251.0, 160.0, 103.0, 55.0, 36.0, 27.0, 22.0, 14.0, 6.0, 5.0, 7.0, 1.0, 5.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.33203125, -5.15301513671875, -4.9739990234375, -4.79498291015625, -4.615966796875, -4.43695068359375, -4.2579345703125, -4.07891845703125, -3.89990234375, -3.72088623046875, -3.5418701171875, -3.36285400390625, -3.183837890625, -3.00482177734375, -2.8258056640625, -2.64678955078125, -2.4677734375, -2.28875732421875, -2.1097412109375, -1.93072509765625, -1.751708984375, -1.57269287109375, -1.3936767578125, -1.21466064453125, -1.03564453125, -0.85662841796875, -0.6776123046875, -0.49859619140625, -0.319580078125, -0.14056396484375, 0.0384521484375, 0.21746826171875, 0.396484375, 0.57550048828125, 0.7545166015625, 0.93353271484375, 1.112548828125, 1.29156494140625, 1.4705810546875, 1.64959716796875, 1.82861328125, 2.00762939453125, 2.1866455078125, 2.36566162109375, 2.544677734375, 2.72369384765625, 2.9027099609375, 3.08172607421875, 3.2607421875, 3.43975830078125, 3.6187744140625, 3.79779052734375, 3.976806640625, 4.15582275390625, 4.3348388671875, 4.51385498046875, 4.69287109375, 4.87188720703125, 5.0509033203125, 5.22991943359375, 5.408935546875, 5.58795166015625, 5.7669677734375, 5.94598388671875, 6.125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 3.0, 4.0, 6.0, 8.0, 16.0, 11.0, 16.0, 28.0, 28.0, 44.0, 39.0, 56.0, 51.0, 79.0, 66.0, 77.0, 64.0, 82.0, 57.0, 62.0, 41.0, 41.0, 25.0, 21.0, 17.0, 17.0, 15.0, 6.0, 5.0, 4.0, 5.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.2265625, -6.05181884765625, -5.8770751953125, -5.70233154296875, -5.527587890625, -5.35284423828125, -5.1781005859375, -5.00335693359375, -4.82861328125, -4.65386962890625, -4.4791259765625, -4.30438232421875, -4.129638671875, -3.95489501953125, -3.7801513671875, -3.60540771484375, -3.4306640625, -3.25592041015625, -3.0811767578125, -2.90643310546875, -2.731689453125, -2.55694580078125, -2.3822021484375, -2.20745849609375, -2.03271484375, -1.85797119140625, -1.6832275390625, -1.50848388671875, -1.333740234375, -1.15899658203125, -0.9842529296875, -0.80950927734375, -0.634765625, -0.46002197265625, -0.2852783203125, -0.11053466796875, 0.064208984375, 0.23895263671875, 0.4136962890625, 0.58843994140625, 0.76318359375, 0.93792724609375, 1.1126708984375, 1.28741455078125, 1.462158203125, 1.63690185546875, 1.8116455078125, 1.98638916015625, 2.1611328125, 2.33587646484375, 2.5106201171875, 2.68536376953125, 2.860107421875, 3.03485107421875, 3.2095947265625, 3.38433837890625, 3.55908203125, 3.73382568359375, 3.9085693359375, 4.08331298828125, 4.258056640625, 4.43280029296875, 4.6075439453125, 4.78228759765625, 4.95703125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 3.0, 6.0, 9.0, 5.0, 12.0, 10.0, 27.0, 52.0, 86.0, 139.0, 211.0, 456.0, 954.0, 2650.0, 11354.0, 168601.0, 835706.0, 21531.0, 4093.0, 1356.0, 588.0, 280.0, 143.0, 88.0, 65.0, 37.0, 28.0, 17.0, 8.0, 6.0, 5.0, 6.0, 6.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.203125, -8.9168701171875, -8.630615234375, -8.3443603515625, -8.05810546875, -7.7718505859375, -7.485595703125, -7.1993408203125, -6.9130859375, -6.6268310546875, -6.340576171875, -6.0543212890625, -5.76806640625, -5.4818115234375, -5.195556640625, -4.9093017578125, -4.623046875, -4.3367919921875, -4.050537109375, -3.7642822265625, -3.47802734375, -3.1917724609375, -2.905517578125, -2.6192626953125, -2.3330078125, -2.0467529296875, -1.760498046875, -1.4742431640625, -1.18798828125, -0.9017333984375, -0.615478515625, -0.3292236328125, -0.04296875, 0.2432861328125, 0.529541015625, 0.8157958984375, 1.10205078125, 1.3883056640625, 1.674560546875, 1.9608154296875, 2.2470703125, 2.5333251953125, 2.819580078125, 3.1058349609375, 3.39208984375, 3.6783447265625, 3.964599609375, 4.2508544921875, 4.537109375, 4.8233642578125, 5.109619140625, 5.3958740234375, 5.68212890625, 5.9683837890625, 6.254638671875, 6.5408935546875, 6.8271484375, 7.1134033203125, 7.399658203125, 7.6859130859375, 7.97216796875, 8.2584228515625, 8.544677734375, 8.8309326171875, 9.1171875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 5.0, 2.0, 6.0, 9.0, 14.0, 16.0, 13.0, 21.0, 19.0, 22.0, 29.0, 37.0, 35.0, 46.0, 61.0, 67.0, 87.0, 71.0, 74.0, 63.0, 65.0, 36.0, 32.0, 25.0, 26.0, 24.0, 20.0, 9.0, 11.0, 9.0, 7.0, 9.0, 6.0, 5.0, 2.0, 7.0, 7.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-16.421875, -15.891357421875, -15.36083984375, -14.830322265625, -14.2998046875, -13.769287109375, -13.23876953125, -12.708251953125, -12.177734375, -11.647216796875, -11.11669921875, -10.586181640625, -10.0556640625, -9.525146484375, -8.99462890625, -8.464111328125, -7.93359375, -7.403076171875, -6.87255859375, -6.342041015625, -5.8115234375, -5.281005859375, -4.75048828125, -4.219970703125, -3.689453125, -3.158935546875, -2.62841796875, -2.097900390625, -1.5673828125, -1.036865234375, -0.50634765625, 0.024169921875, 0.5546875, 1.085205078125, 1.61572265625, 2.146240234375, 2.6767578125, 3.207275390625, 3.73779296875, 4.268310546875, 4.798828125, 5.329345703125, 5.85986328125, 6.390380859375, 6.9208984375, 7.451416015625, 7.98193359375, 8.512451171875, 9.04296875, 9.573486328125, 10.10400390625, 10.634521484375, 11.1650390625, 11.695556640625, 12.22607421875, 12.756591796875, 13.287109375, 13.817626953125, 14.34814453125, 14.878662109375, 15.4091796875, 15.939697265625, 16.47021484375, 17.000732421875, 17.53125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 7.0, 6.0, 9.0, 17.0, 20.0, 33.0, 68.0, 94.0, 138.0, 272.0, 486.0, 973.0, 2230.0, 6831.0, 27409.0, 278448.0, 690127.0, 29601.0, 7339.0, 2359.0, 989.0, 469.0, 238.0, 163.0, 74.0, 55.0, 35.0, 19.0, 18.0, 7.0, 7.0, 7.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0986328125, -1.0547332763671875, -1.010833740234375, -0.9669342041015625, -0.92303466796875, -0.8791351318359375, -0.835235595703125, -0.7913360595703125, -0.7474365234375, -0.7035369873046875, -0.659637451171875, -0.6157379150390625, -0.57183837890625, -0.5279388427734375, -0.484039306640625, -0.4401397705078125, -0.396240234375, -0.3523406982421875, -0.308441162109375, -0.2645416259765625, -0.22064208984375, -0.1767425537109375, -0.132843017578125, -0.0889434814453125, -0.0450439453125, -0.0011444091796875, 0.042755126953125, 0.0866546630859375, 0.13055419921875, 0.1744537353515625, 0.218353271484375, 0.2622528076171875, 0.30615234375, 0.3500518798828125, 0.393951416015625, 0.4378509521484375, 0.48175048828125, 0.5256500244140625, 0.569549560546875, 0.6134490966796875, 0.6573486328125, 0.7012481689453125, 0.745147705078125, 0.7890472412109375, 0.83294677734375, 0.8768463134765625, 0.920745849609375, 0.9646453857421875, 1.008544921875, 1.0524444580078125, 1.096343994140625, 1.1402435302734375, 1.18414306640625, 1.2280426025390625, 1.271942138671875, 1.3158416748046875, 1.3597412109375, 1.4036407470703125, 1.447540283203125, 1.4914398193359375, 1.53533935546875, 1.5792388916015625, 1.623138427734375, 1.6670379638671875, 1.7109375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 1.0, 5.0, 9.0, 7.0, 10.0, 19.0, 26.0, 39.0, 96.0, 179.0, 247.0, 168.0, 77.0, 59.0, 27.0, 15.0, 6.0, 4.0, 6.0, 6.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000244140625, -0.0002260357141494751, -0.0002079308032989502, -0.0001898258924484253, -0.0001717209815979004, -0.0001536160707473755, -0.00013551115989685059, -0.00011740624904632568, -9.930133819580078e-05, -8.119642734527588e-05, -6.309151649475098e-05, -4.4986605644226074e-05, -2.6881694793701172e-05, -8.77678394317627e-06, 9.328126907348633e-06, 2.7433037757873535e-05, 4.553794860839844e-05, 6.364285945892334e-05, 8.174777030944824e-05, 9.985268115997314e-05, 0.00011795759201049805, 0.00013606250286102295, 0.00015416741371154785, 0.00017227232456207275, 0.00019037723541259766, 0.00020848214626312256, 0.00022658705711364746, 0.00024469196796417236, 0.00026279687881469727, 0.00028090178966522217, 0.00029900670051574707, 0.00031711161136627197, 0.0003352165222167969, 0.0003533214330673218, 0.0003714263439178467, 0.0003895312547683716, 0.0004076361656188965, 0.0004257410764694214, 0.0004438459873199463, 0.0004619508981704712, 0.0004800558090209961, 0.000498160719871521, 0.0005162656307220459, 0.0005343705415725708, 0.0005524754524230957, 0.0005705803632736206, 0.0005886852741241455, 0.0006067901849746704, 0.0006248950958251953, 0.0006430000066757202, 0.0006611049175262451, 0.00067920982837677, 0.0006973147392272949, 0.0007154196500778198, 0.0007335245609283447, 0.0007516294717788696, 0.0007697343826293945, 0.0007878392934799194, 0.0008059442043304443, 0.0008240491151809692, 0.0008421540260314941, 0.000860258936882019, 0.0008783638477325439, 0.0008964687585830688, 0.0009145736694335938]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 4.0, 10.0, 12.0, 14.0, 26.0, 26.0, 52.0, 67.0, 125.0, 211.0, 376.0, 743.0, 1629.0, 3868.0, 10930.0, 44263.0, 827308.0, 126874.0, 20637.0, 6448.0, 2501.0, 1132.0, 560.0, 278.0, 154.0, 116.0, 67.0, 32.0, 24.0, 17.0, 14.0, 6.0, 6.0, 2.0, 5.0, 5.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6962890625, -1.646026611328125, -1.59576416015625, -1.545501708984375, -1.4952392578125, -1.444976806640625, -1.39471435546875, -1.344451904296875, -1.294189453125, -1.243927001953125, -1.19366455078125, -1.143402099609375, -1.0931396484375, -1.042877197265625, -0.99261474609375, -0.942352294921875, -0.89208984375, -0.841827392578125, -0.79156494140625, -0.741302490234375, -0.6910400390625, -0.640777587890625, -0.59051513671875, -0.540252685546875, -0.489990234375, -0.439727783203125, -0.38946533203125, -0.339202880859375, -0.2889404296875, -0.238677978515625, -0.18841552734375, -0.138153076171875, -0.087890625, -0.037628173828125, 0.01263427734375, 0.062896728515625, 0.1131591796875, 0.163421630859375, 0.21368408203125, 0.263946533203125, 0.314208984375, 0.364471435546875, 0.41473388671875, 0.464996337890625, 0.5152587890625, 0.565521240234375, 0.61578369140625, 0.666046142578125, 0.71630859375, 0.766571044921875, 0.81683349609375, 0.867095947265625, 0.9173583984375, 0.967620849609375, 1.01788330078125, 1.068145751953125, 1.118408203125, 1.168670654296875, 1.21893310546875, 1.269195556640625, 1.3194580078125, 1.369720458984375, 1.41998291015625, 1.470245361328125, 1.5205078125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 12.0, 3.0, 12.0, 5.0, 14.0, 16.0, 16.0, 27.0, 31.0, 48.0, 65.0, 86.0, 110.0, 112.0, 105.0, 78.0, 47.0, 47.0, 38.0, 20.0, 20.0, 11.0, 10.0, 12.0, 11.0, 7.0, 9.0, 5.0, 4.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.708984375, -1.6595001220703125, -1.610015869140625, -1.5605316162109375, -1.51104736328125, -1.4615631103515625, -1.412078857421875, -1.3625946044921875, -1.3131103515625, -1.2636260986328125, -1.214141845703125, -1.1646575927734375, -1.11517333984375, -1.0656890869140625, -1.016204833984375, -0.9667205810546875, -0.917236328125, -0.8677520751953125, -0.818267822265625, -0.7687835693359375, -0.71929931640625, -0.6698150634765625, -0.620330810546875, -0.5708465576171875, -0.5213623046875, -0.4718780517578125, -0.422393798828125, -0.3729095458984375, -0.32342529296875, -0.2739410400390625, -0.224456787109375, -0.1749725341796875, -0.12548828125, -0.0760040283203125, -0.026519775390625, 0.0229644775390625, 0.07244873046875, 0.1219329833984375, 0.171417236328125, 0.2209014892578125, 0.2703857421875, 0.3198699951171875, 0.369354248046875, 0.4188385009765625, 0.46832275390625, 0.5178070068359375, 0.567291259765625, 0.6167755126953125, 0.666259765625, 0.7157440185546875, 0.765228271484375, 0.8147125244140625, 0.86419677734375, 0.9136810302734375, 0.963165283203125, 1.0126495361328125, 1.0621337890625, 1.1116180419921875, 1.161102294921875, 1.2105865478515625, 1.26007080078125, 1.3095550537109375, 1.359039306640625, 1.4085235595703125, 1.4580078125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 7.0, 8.0, 21.0, 33.0, 48.0, 81.0, 407.0, 202.0, 58.0, 39.0, 39.0, 20.0, 9.0, 4.0, 6.0, 4.0, 9.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.11646270751953, -38.43195343017578, -36.74744415283203, -35.06293487548828, -33.3784294128418, -31.693920135498047, -30.009410858154297, -28.324901580810547, -26.64039421081543, -24.95588493347168, -23.271377563476562, -21.586868286132812, -19.902359008789062, -18.217851638793945, -16.533342361450195, -14.848834037780762, -13.164325714111328, -11.479817390441895, -9.795309066772461, -8.110799789428711, -6.426291465759277, -4.741783142089844, -3.0572738647460938, -1.3727655410766602, 0.31174278259277344, 1.9962513446807861, 3.680759906768799, 5.365268707275391, 7.049777030944824, 8.734285354614258, 10.418794631958008, 12.103302955627441, 13.787811279296875, 15.472319602966309, 17.156827926635742, 18.841337203979492, 20.52584457397461, 22.21035385131836, 23.89486312866211, 25.57937240600586, 27.263879776000977, 28.948389053344727, 30.632896423339844, 32.317405700683594, 34.001914978027344, 35.686424255371094, 37.370933532714844, 39.05543899536133, 40.73994827270508, 42.42445755004883, 44.10896682739258, 45.79347229003906, 47.47798156738281, 49.16249084472656, 50.84700012207031, 52.53150939941406, 54.21601867675781, 55.90052795410156, 57.58503723144531, 59.26954650878906, 60.95405197143555, 62.6385612487793, 64.32307434082031, 66.00757598876953, 67.69208526611328]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 4.0, 1.0, 2.0, 9.0, 6.0, 9.0, 8.0, 8.0, 7.0, 19.0, 14.0, 19.0, 17.0, 11.0, 14.0, 30.0, 27.0, 22.0, 59.0, 218.0, 187.0, 74.0, 20.0, 20.0, 28.0, 22.0, 13.0, 19.0, 17.0, 11.0, 18.0, 13.0, 12.0, 3.0, 5.0, 7.0, 5.0, 5.0, 5.0, 5.0, 0.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-42.114017486572266, -40.83651351928711, -39.55900573730469, -38.28150177001953, -37.003997802734375, -35.72649002075195, -34.4489860534668, -33.171478271484375, -31.89397430419922, -30.61646842956543, -29.33896255493164, -28.061458587646484, -26.783952713012695, -25.506446838378906, -24.22894287109375, -22.95143699645996, -21.673931121826172, -20.396425247192383, -19.118919372558594, -17.841415405273438, -16.56390953063965, -15.28640365600586, -14.008898735046387, -12.731393814086914, -11.453887939453125, -10.176382064819336, -8.898877143859863, -7.621371746063232, -6.343866348266602, -5.066360950469971, -3.78885555267334, -2.511350631713867, -1.2338409423828125, 0.04366445541381836, 1.3211698532104492, 2.59867525100708, 3.876180648803711, 5.153686046600342, 6.431191444396973, 7.708696365356445, 8.986202239990234, 10.263708114624023, 11.541213035583496, 12.818717956542969, 14.096223831176758, 15.373729705810547, 16.651233673095703, 17.928739547729492, 19.20624542236328, 20.48375129699707, 21.76125717163086, 23.038761138916016, 24.316267013549805, 25.593772888183594, 26.87127685546875, 28.14878273010254, 29.426288604736328, 30.703794479370117, 31.981300354003906, 33.25880432128906, 34.53630828857422, 35.81381607055664, 37.0913200378418, 38.36882781982422, 39.646331787109375]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 6.0, 2.0, 1.0, 6.0, 3.0, 3.0, 8.0, 4.0, 11.0, 10.0, 12.0, 9.0, 10.0, 19.0, 25.0, 35.0, 36.0, 40.0, 60.0, 206.0, 159.0, 79.0, 43.0, 38.0, 34.0, 35.0, 21.0, 21.0, 19.0, 15.0, 9.0, 4.0, 9.0, 5.0, 2.0, 1.0, 3.0, 1.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.66796875, -5.50567626953125, -5.3433837890625, -5.18109130859375, -5.018798828125, -4.85650634765625, -4.6942138671875, -4.53192138671875, -4.36962890625, -4.20733642578125, -4.0450439453125, -3.88275146484375, -3.720458984375, -3.55816650390625, -3.3958740234375, -3.23358154296875, -3.0712890625, -2.90899658203125, -2.7467041015625, -2.58441162109375, -2.422119140625, -2.25982666015625, -2.0975341796875, -1.93524169921875, -1.77294921875, -1.61065673828125, -1.4483642578125, -1.28607177734375, -1.123779296875, -0.96148681640625, -0.7991943359375, -0.63690185546875, -0.474609375, -0.31231689453125, -0.1500244140625, 0.01226806640625, 0.174560546875, 0.33685302734375, 0.4991455078125, 0.66143798828125, 0.82373046875, 0.98602294921875, 1.1483154296875, 1.31060791015625, 1.472900390625, 1.63519287109375, 1.7974853515625, 1.95977783203125, 2.1220703125, 2.28436279296875, 2.4466552734375, 2.60894775390625, 2.771240234375, 2.93353271484375, 3.0958251953125, 3.25811767578125, 3.42041015625, 3.58270263671875, 3.7449951171875, 3.90728759765625, 4.069580078125, 4.23187255859375, 4.3941650390625, 4.55645751953125, 4.71875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 6.0, 2.0, 5.0, 6.0, 4.0, 5.0, 17.0, 9.0, 9.0, 19.0, 30.0, 29.0, 62.0, 85.0, 114.0, 263.0, 569.0, 1261.0, 3507.0, 13096.0, 8211631.0, 144445.0, 8653.0, 2671.0, 1013.0, 449.0, 198.0, 126.0, 72.0, 60.0, 42.0, 37.0, 17.0, 13.0, 9.0, 12.0, 13.0, 12.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.67251968383789, -18.025653839111328, -17.378787994384766, -16.731922149658203, -16.08505630493164, -15.438190460205078, -14.791324615478516, -14.144458770751953, -13.49759292602539, -12.850727081298828, -12.203861236572266, -11.556995391845703, -10.91012954711914, -10.263263702392578, -9.616397857666016, -8.969532012939453, -8.32266616821289, -7.675800323486328, -7.028934478759766, -6.382068634033203, -5.735202789306641, -5.088336944580078, -4.441471099853516, -3.794605255126953, -3.1477394104003906, -2.500873565673828, -1.8540077209472656, -1.2071418762207031, -0.5602760314941406, 0.08658981323242188, 0.7334556579589844, 1.3803215026855469, 2.027189254760742, 2.6740550994873047, 3.320920944213867, 3.9677867889404297, 4.614652633666992, 5.261518478393555, 5.908384323120117, 6.55525016784668, 7.202116012573242, 7.848981857299805, 8.495847702026367, 9.14271354675293, 9.789579391479492, 10.436445236206055, 11.083311080932617, 11.73017692565918, 12.377042770385742, 13.023908615112305, 13.670774459838867, 14.31764030456543, 14.964506149291992, 15.611371994018555, 16.258237838745117, 16.90510368347168, 17.551969528198242, 18.198835372924805, 18.845701217651367, 19.49256706237793, 20.139432907104492, 20.786298751831055, 21.433164596557617, 22.08003044128418, 22.726896286010742]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 1.0, 4.0, 3.0, 1.0, 6.0, 4.0, 4.0, 6.0, 5.0, 2.0, 4.0, 3.0, 3.0, 9.0, 2.0, 4.0, 4.0, 3.0, 3.0, 5.0, 1.0, 1.0, 4.0, 2.0, 4.0, 3.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-29.566499710083008, -28.805587768554688, -28.044675827026367, -27.283763885498047, -26.522851943969727, -25.761940002441406, -25.001026153564453, -24.240116119384766, -23.479202270507812, -22.718290328979492, -21.957378387451172, -21.19646644592285, -20.43555450439453, -19.67464256286621, -18.91373062133789, -18.152816772460938, -17.39190673828125, -16.63099479675293, -15.87008285522461, -15.109170913696289, -14.348258972167969, -13.587347030639648, -12.826434135437012, -12.065522193908691, -11.304610252380371, -10.54369831085205, -9.78278636932373, -9.021873474121094, -8.260961532592773, -7.500050067901611, -6.739137649536133, -5.9782257080078125, -5.217315673828125, -4.456403732299805, -3.6954915523529053, -2.934579372406006, -2.1736674308776855, -1.4127554893493652, -0.6518430709838867, 0.1090688705444336, 0.8699808120727539, 1.6308928728103638, 2.3918049335479736, 3.152717113494873, 3.9136290550231934, 4.674540996551514, 5.435453414916992, 6.1963653564453125, 6.957277297973633, 7.718189239501953, 8.479101181030273, 9.240013122558594, 10.000925064086914, 10.761837005615234, 11.522749900817871, 12.283661842346191, 13.044573783874512, 13.805485725402832, 14.566397666931152, 15.327310562133789, 16.08822250366211, 16.84913444519043, 17.61004638671875, 18.37095832824707, 19.13187026977539]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 6.0, 7.0, 5.0, 6.0, 10.0, 18.0, 9.0, 11.0, 13.0, 18.0, 22.0, 31.0, 34.0, 20.0, 33.0, 47.0, 47.0, 52.0, 47.0, 59.0, 64.0, 45.0, 52.0, 41.0, 45.0, 36.0, 33.0, 30.0, 30.0, 18.0, 20.0, 13.0, 26.0, 7.0, 12.0, 6.0, 6.0, 4.0, 9.0, 5.0, 0.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.60546875, -3.497528076171875, -3.38958740234375, -3.281646728515625, -3.1737060546875, -3.065765380859375, -2.95782470703125, -2.849884033203125, -2.741943359375, -2.634002685546875, -2.52606201171875, -2.418121337890625, -2.3101806640625, -2.202239990234375, -2.09429931640625, -1.986358642578125, -1.87841796875, -1.770477294921875, -1.66253662109375, -1.554595947265625, -1.4466552734375, -1.338714599609375, -1.23077392578125, -1.122833251953125, -1.014892578125, -0.906951904296875, -0.79901123046875, -0.691070556640625, -0.5831298828125, -0.475189208984375, -0.36724853515625, -0.259307861328125, -0.1513671875, -0.043426513671875, 0.06451416015625, 0.172454833984375, 0.2803955078125, 0.388336181640625, 0.49627685546875, 0.604217529296875, 0.712158203125, 0.820098876953125, 0.92803955078125, 1.035980224609375, 1.1439208984375, 1.251861572265625, 1.35980224609375, 1.467742919921875, 1.57568359375, 1.683624267578125, 1.79156494140625, 1.899505615234375, 2.0074462890625, 2.115386962890625, 2.22332763671875, 2.331268310546875, 2.439208984375, 2.547149658203125, 2.65509033203125, 2.763031005859375, 2.8709716796875, 2.978912353515625, 3.08685302734375, 3.194793701171875, 3.302734375]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 7.0, 6.0, 7.0, 7.0, 14.0, 19.0, 33.0, 28.0, 46.0, 84.0, 122.0, 169.0, 271.0, 586.0, 1096.0, 2601.0, 7283.0, 25390.0, 108680.0, 255082.0, 89716.0, 21928.0, 6507.0, 2383.0, 1020.0, 471.0, 262.0, 158.0, 121.0, 49.0, 40.0, 30.0, 17.0, 10.0, 10.0, 11.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.96875, -32.06396484375, -31.1591796875, -30.25439453125, -29.349609375, -28.44482421875, -27.5400390625, -26.63525390625, -25.73046875, -24.82568359375, -23.9208984375, -23.01611328125, -22.111328125, -21.20654296875, -20.3017578125, -19.39697265625, -18.4921875, -17.58740234375, -16.6826171875, -15.77783203125, -14.873046875, -13.96826171875, -13.0634765625, -12.15869140625, -11.25390625, -10.34912109375, -9.4443359375, -8.53955078125, -7.634765625, -6.72998046875, -5.8251953125, -4.92041015625, -4.015625, -3.11083984375, -2.2060546875, -1.30126953125, -0.396484375, 0.50830078125, 1.4130859375, 2.31787109375, 3.22265625, 4.12744140625, 5.0322265625, 5.93701171875, 6.841796875, 7.74658203125, 8.6513671875, 9.55615234375, 10.4609375, 11.36572265625, 12.2705078125, 13.17529296875, 14.080078125, 14.98486328125, 15.8896484375, 16.79443359375, 17.69921875, 18.60400390625, 19.5087890625, 20.41357421875, 21.318359375, 22.22314453125, 23.1279296875, 24.03271484375, 24.9375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 5.0, 2.0, 7.0, 3.0, 5.0, 5.0, 8.0, 7.0, 7.0, 15.0, 20.0, 15.0, 28.0, 14.0, 38.0, 37.0, 33.0, 55.0, 52.0, 52.0, 51.0, 60.0, 45.0, 49.0, 48.0, 38.0, 45.0, 45.0, 38.0, 17.0, 24.0, 23.0, 20.0, 21.0, 15.0, 9.0, 8.0, 12.0, 6.0, 9.0, 3.0, 5.0, 3.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.32421875, -3.226531982421875, -3.12884521484375, -3.031158447265625, -2.9334716796875, -2.835784912109375, -2.73809814453125, -2.640411376953125, -2.542724609375, -2.445037841796875, -2.34735107421875, -2.249664306640625, -2.1519775390625, -2.054290771484375, -1.95660400390625, -1.858917236328125, -1.76123046875, -1.663543701171875, -1.56585693359375, -1.468170166015625, -1.3704833984375, -1.272796630859375, -1.17510986328125, -1.077423095703125, -0.979736328125, -0.882049560546875, -0.78436279296875, -0.686676025390625, -0.5889892578125, -0.491302490234375, -0.39361572265625, -0.295928955078125, -0.1982421875, -0.100555419921875, -0.00286865234375, 0.094818115234375, 0.1925048828125, 0.290191650390625, 0.38787841796875, 0.485565185546875, 0.583251953125, 0.680938720703125, 0.77862548828125, 0.876312255859375, 0.9739990234375, 1.071685791015625, 1.16937255859375, 1.267059326171875, 1.36474609375, 1.462432861328125, 1.56011962890625, 1.657806396484375, 1.7554931640625, 1.853179931640625, 1.95086669921875, 2.048553466796875, 2.146240234375, 2.243927001953125, 2.34161376953125, 2.439300537109375, 2.5369873046875, 2.634674072265625, 2.73236083984375, 2.830047607421875, 2.927734375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 7.0, 5.0, 10.0, 10.0, 11.0, 10.0, 39.0, 105.0, 128.0, 73.0, 31.0, 8.0, 7.0, 7.0, 7.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-35.47846221923828, -34.467498779296875, -33.45653533935547, -32.44557189941406, -31.434608459472656, -30.42364501953125, -29.412683486938477, -28.40172004699707, -27.390756607055664, -26.379793167114258, -25.36882972717285, -24.357866287231445, -23.346904754638672, -22.335941314697266, -21.32497787475586, -20.314014434814453, -19.303050994873047, -18.29208755493164, -17.281124114990234, -16.270160675048828, -15.259198188781738, -14.248234748840332, -13.237272262573242, -12.226308822631836, -11.21534538269043, -10.204381942749023, -9.193418502807617, -8.182456016540527, -7.171492576599121, -6.160529136657715, -5.149566173553467, -4.138603210449219, -3.127643585205078, -2.116680383682251, -1.1057171821594238, -0.09475398063659668, 0.9162092208862305, 1.9271726608276367, 2.9381356239318848, 3.949098587036133, 4.960062026977539, 5.971025466918945, 6.981988430023193, 7.992951393127441, 9.003914833068848, 10.014878273010254, 11.025840759277344, 12.03680419921875, 13.047767639160156, 14.058731079101562, 15.069694519042969, 16.080657958984375, 17.09162139892578, 18.102584838867188, 19.11354637145996, 20.124509811401367, 21.135473251342773, 22.14643669128418, 23.157400131225586, 24.168363571166992, 25.179325103759766, 26.190288543701172, 27.201251983642578, 28.212215423583984, 29.22317886352539]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 5.0, 5.0, 1.0, 1.0, 9.0, 6.0, 6.0, 4.0, 2.0, 1.0, 6.0, 16.0, 25.0, 47.0, 83.0, 88.0, 60.0, 42.0, 17.0, 12.0, 7.0, 4.0, 5.0, 5.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.257474899291992, -21.610557556152344, -20.963642120361328, -20.31672477722168, -19.669809341430664, -19.022891998291016, -18.3759765625, -17.72905921936035, -17.082141876220703, -16.435224533081055, -15.788309097290039, -15.14139175415039, -14.494475364685059, -13.847558975219727, -13.200642585754395, -12.553726196289062, -11.90680980682373, -11.259893417358398, -10.612977027893066, -9.966060638427734, -9.319143295288086, -8.672226905822754, -8.025310516357422, -7.378393650054932, -6.7314772605896, -6.084560871124268, -5.437644004821777, -4.790727615356445, -4.143811225891113, -3.496894359588623, -2.849977970123291, -2.203061103820801, -1.5561447143554688, -0.9092281460762024, -0.26231157779693604, 0.38460493087768555, 1.0315215587615967, 1.6784381866455078, 2.32535457611084, 2.97227144241333, 3.619187831878662, 4.266104221343994, 4.913021087646484, 5.559937477111816, 6.206853866577148, 6.853770732879639, 7.500687122344971, 8.147603988647461, 8.794520378112793, 9.441436767578125, 10.088353157043457, 10.735269546508789, 11.382186889648438, 12.02910327911377, 12.676019668579102, 13.32293701171875, 13.969852447509766, 14.616768836975098, 15.26368522644043, 15.910602569580078, 16.557518005371094, 17.204435348510742, 17.85135269165039, 18.498268127441406, 19.145185470581055]}} \ No newline at end of file